diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=2.0247.pt b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=2.0247.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ba85be5b1b87609964d0016715a64e02d05a9aa --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=2.0247.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea404b1a4f73402d4b9b01686c5e1a72f80b41999ec1ab1520508fcb42f622d +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-010000-epoch-00-loss=1.9681.pt b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-010000-epoch-00-loss=1.9681.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0bdffb3b9767811c58ecff9bce52151cdc85c4 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-010000-epoch-00-loss=1.9681.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1e2bef7774e234a4ca79dd73a28592a80b3dfc2e3b06236c7a710dc3624888 +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-015000-epoch-00-loss=2.0020.pt b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-015000-epoch-00-loss=2.0020.pt new file mode 100644 index 0000000000000000000000000000000000000000..de275444a08b3973af40b89094b98b62f1fd5afb --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-015000-epoch-00-loss=2.0020.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91f7a99c2b4817407e079e100cecfdc3fd5c0645f4589049dd7f805a0cfa849 +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-019073-epoch-00-loss=1.8610.pt b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-019073-epoch-00-loss=1.8610.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2f7dd11e0042c2d02b9caa0da7af74c0c8ba62 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/checkpoints/step-019073-epoch-00-loss=1.8610.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:438ec42470c1625c168c5eee3e4240d11c7968d1433bfe0a8f8260c291d866a9 +size 15336322587 diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.json b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a323f8337d1b247311abed1819c0bcad4d4e6903 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.json @@ -0,0 +1,74 @@ +{ + "dataset": { + "align_stage_components": [ + "download/llava-laion-cc-sbu-558k/chat.json", + "download/llava-laion-cc-sbu-558k" + ], + "dataset_id": "obelics", + "dataset_resampled": true, + "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/", + "finetune_stage_components": [ + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", + "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data" + ], + "max_num_images": 6, + "min_num_images": 1, + "train_num_samples": 4882814, + "type": "obelics", + "workers": 4 + }, + "model": { + "align_epochs": 1, + "align_global_batch_size": 256, + "align_learning_rate": 0.001, + "align_lr_scheduler_type": "linear-warmup+cosine-decay", + "align_max_grad_norm": 1.0, + "align_max_steps": null, + "align_per_device_batch_size": 16, + "align_train_strategy": "fsdp-shard-grad-op", + "align_warmup_ratio": 0.03, + "align_weight_decay": 0.0, + "arch_specifier": "no-align+avgpool", + "enable_gradient_checkpointing": true, + "enable_mixed_precision_training": true, + "finetune_epochs": 1, + "finetune_global_batch_size": 128, + "finetune_learning_rate": 2e-05, + "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", + "finetune_max_grad_norm": 1.0, + "finetune_max_steps": null, + "finetune_per_device_batch_size": 16, + "finetune_train_strategy": "fsdp-full-shard", + "finetune_warmup_ratio": 0.03, + "finetune_weight_decay": 0.1, + "image_resize_strategy": "resize-naive", + "llm_backbone_id": "phi3-3b", + "llm_max_length": 4096, + "model_id": "phi3-3b-continue-training-hq-20b", + "pretrain_epochs": 1, + "pretrain_global_batch_size": 256, + "pretrain_learning_rate": 5e-05, + "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", + "pretrain_max_grad_norm": 1.0, + "pretrain_max_steps": 19073, + "pretrain_per_device_batch_size": 8, + "pretrain_train_strategy": "fsdp-full-shard", + "pretrain_warmup_ratio": 0.03, + "pretrain_weight_decay": 0.01, + "reduce_in_full_precision": false, + "type": "one-stage+7b", + "vision_backbone_id": "siglip-vit-so400m-384px" + }, + "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", + "pretrained_checkpoint": null, + "run_id": "obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7", + "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints", + "seed": 7, + "stage": "pretrain", + "trackers": [ + "jsonl", + "wandb" + ], + "wandb_entity": null, + "wandb_project": "mmpretrain" +} \ No newline at end of file diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.yaml b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..5db43ffc5826f4bc209bad3f01755c390533acc6 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/config.yaml @@ -0,0 +1,67 @@ +dataset: + align_stage_components: + - download/llava-laion-cc-sbu-558k/chat.json + - download/llava-laion-cc-sbu-558k + dataset_id: obelics + dataset_resampled: true + dataset_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/ + finetune_stage_components: + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json + - /fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data + max_num_images: 6 + min_num_images: 1 + train_num_samples: 4882814 + type: obelics + workers: 4 +model: + align_epochs: 1 + align_global_batch_size: 256 + align_learning_rate: 0.001 + align_lr_scheduler_type: linear-warmup+cosine-decay + align_max_grad_norm: 1.0 + align_max_steps: null + align_per_device_batch_size: 16 + align_train_strategy: fsdp-shard-grad-op + align_warmup_ratio: 0.03 + align_weight_decay: 0.0 + arch_specifier: no-align+avgpool + enable_gradient_checkpointing: true + enable_mixed_precision_training: true + finetune_epochs: 1 + finetune_global_batch_size: 128 + finetune_learning_rate: 2.0e-05 + finetune_lr_scheduler_type: linear-warmup+cosine-decay + finetune_max_grad_norm: 1.0 + finetune_max_steps: null + finetune_per_device_batch_size: 16 + finetune_train_strategy: fsdp-full-shard + finetune_warmup_ratio: 0.03 + finetune_weight_decay: 0.1 + image_resize_strategy: resize-naive + llm_backbone_id: phi3-3b + llm_max_length: 4096 + model_id: phi3-3b-continue-training-hq-20b + pretrain_epochs: 1 + pretrain_global_batch_size: 256 + pretrain_learning_rate: 5.0e-05 + pretrain_lr_scheduler_type: linear-warmup+cosine-decay + pretrain_max_grad_norm: 1.0 + pretrain_max_steps: 19073 + pretrain_per_device_batch_size: 8 + pretrain_train_strategy: fsdp-full-shard + pretrain_warmup_ratio: 0.03 + pretrain_weight_decay: 0.01 + reduce_in_full_precision: false + type: one-stage+7b + vision_backbone_id: siglip-vit-so400m-384px +mount_path: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models +pretrained_checkpoint: null +run_id: obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7 +run_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints +seed: 7 +stage: pretrain +trackers: +- jsonl +- wandb +wandb_entity: null +wandb_project: mmpretrain diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7.jsonl b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4f008f566c206935c4fe0d6796430cebb761e366 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7.jsonl @@ -0,0 +1,19314 @@ +{"Pretrain/Learning Rate": 8.741258741258742e-08, "Pretrain/Loss": 3.9224002361297607, "Pretrain/Loss (Raw)": 3.9224002361297607, "Pretrain/Step": 1, "Pretrain/Step Time": 29.52978277206421} +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 5.028595447540283, "Pretrain/Loss (Raw)": 6.134790897369385, "Pretrain/Step": 2, "Pretrain/Step Time": 28.70302379131317} +{"Pretrain/Learning Rate": 2.622377622377623e-07, "Pretrain/Loss": 4.9587836265563965, "Pretrain/Loss (Raw)": 4.819158554077148, "Pretrain/Step": 3, "Pretrain/Step Time": 29.214937607447307} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 5.058506011962891, "Pretrain/Loss (Raw)": 5.357674598693848, "Pretrain/Step": 4, "Pretrain/Step Time": 28.742215633392334} +{"Pretrain/Learning Rate": 4.370629370629371e-07, "Pretrain/Loss": 4.961846828460693, "Pretrain/Loss (Raw)": 4.575209617614746, "Pretrain/Step": 5, "Pretrain/Step Time": 28.850903034210205} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 5.0043253898620605, "Pretrain/Loss (Raw)": 5.216718673706055, "Pretrain/Step": 6, "Pretrain/Step Time": 29.115926504135132} +{"Pretrain/Learning Rate": 6.118881118881119e-07, "Pretrain/Loss": 4.844728946685791, "Pretrain/Loss (Raw)": 3.887148857116699, "Pretrain/Step": 7, "Pretrain/Step Time": 28.887727430888585} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 4.8267364501953125, "Pretrain/Loss (Raw)": 4.700788497924805, "Pretrain/Step": 8, "Pretrain/Step Time": 28.9187373816967} +{"Pretrain/Learning Rate": 7.867132867132868e-07, "Pretrain/Loss": 4.843726634979248, "Pretrain/Loss (Raw)": 4.979649543762207, "Pretrain/Step": 9, "Pretrain/Step Time": 28.97314198811849} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 4.917479515075684, "Pretrain/Loss (Raw)": 5.5812530517578125, "Pretrain/Step": 10, "Pretrain/Step Time": 28.81627745628357} +{"Pretrain/Learning Rate": 9.615384615384617e-07, "Pretrain/Loss": 4.918389797210693, "Pretrain/Loss (Raw)": 4.927493095397949, "Pretrain/Step": 11, "Pretrain/Step Time": 29.000413699583575} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 4.963073253631592, "Pretrain/Loss (Raw)": 5.454590797424316, "Pretrain/Step": 12, "Pretrain/Step Time": 28.92355481783549} +{"Pretrain/Learning Rate": 1.1363636363636364e-06, "Pretrain/Loss": 4.853196144104004, "Pretrain/Loss (Raw)": 3.5346717834472656, "Pretrain/Step": 13, "Pretrain/Step Time": 28.820202534015362} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 4.839229106903076, "Pretrain/Loss (Raw)": 4.657661437988281, "Pretrain/Step": 14, "Pretrain/Step Time": 29.037938458578928} +{"Pretrain/Learning Rate": 1.3111888111888113e-06, "Pretrain/Loss": 4.752209663391113, "Pretrain/Loss (Raw)": 3.5339322090148926, "Pretrain/Step": 15, "Pretrain/Step Time": 28.95368962287903} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 4.819477558135986, "Pretrain/Loss (Raw)": 5.828500747680664, "Pretrain/Step": 16, "Pretrain/Step Time": 28.974414885044098} +{"Pretrain/Learning Rate": 1.4860139860139862e-06, "Pretrain/Loss": 4.767443656921387, "Pretrain/Loss (Raw)": 3.089857578277588, "Pretrain/Step": 17, "Pretrain/Step Time": 29.027586880852194} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 4.6460652351379395, "Pretrain/Loss (Raw)": 4.192737579345703, "Pretrain/Step": 18, "Pretrain/Step Time": 28.946349117490982} +{"Pretrain/Learning Rate": 1.6608391608391608e-06, "Pretrain/Loss": 4.617422103881836, "Pretrain/Loss (Raw)": 4.3608598709106445, "Pretrain/Step": 19, "Pretrain/Step Time": 29.02002155153375} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 4.5252485275268555, "Pretrain/Loss (Raw)": 3.8829007148742676, "Pretrain/Step": 20, "Pretrain/Step Time": 29.028027606010436} +{"Pretrain/Learning Rate": 1.8356643356643357e-06, "Pretrain/Loss": 4.509396553039551, "Pretrain/Loss (Raw)": 4.3215789794921875, "Pretrain/Step": 21, "Pretrain/Step Time": 29.002898772557575} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 4.408271789550781, "Pretrain/Loss (Raw)": 3.5987250804901123, "Pretrain/Step": 22, "Pretrain/Step Time": 29.087611404332247} +{"Pretrain/Learning Rate": 2.0104895104895104e-06, "Pretrain/Loss": 4.362872123718262, "Pretrain/Loss (Raw)": 3.1607580184936523, "Pretrain/Step": 23, "Pretrain/Step Time": 29.067374789196514} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 4.339448928833008, "Pretrain/Loss (Raw)": 4.3260111808776855, "Pretrain/Step": 24, "Pretrain/Step Time": 29.07484543323517} +{"Pretrain/Learning Rate": 2.1853146853146853e-06, "Pretrain/Loss": 4.244109153747559, "Pretrain/Loss (Raw)": 3.454218864440918, "Pretrain/Step": 25, "Pretrain/Step Time": 29.100589599609375} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 4.1691083908081055, "Pretrain/Loss (Raw)": 4.38123893737793, "Pretrain/Step": 26, "Pretrain/Step Time": 29.076156368622414} +{"Pretrain/Learning Rate": 2.36013986013986e-06, "Pretrain/Loss": 4.074308395385742, "Pretrain/Loss (Raw)": 3.4106857776641846, "Pretrain/Step": 27, "Pretrain/Step Time": 29.141940664362025} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.950439929962158, "Pretrain/Loss (Raw)": 3.4726994037628174, "Pretrain/Step": 28, "Pretrain/Step Time": 29.123158718858445} +{"Pretrain/Learning Rate": 2.534965034965035e-06, "Pretrain/Loss": 3.933138370513916, "Pretrain/Loss (Raw)": 3.257845401763916, "Pretrain/Step": 29, "Pretrain/Step Time": 29.10173385718773} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 3.852195978164673, "Pretrain/Loss (Raw)": 3.3625857830047607, "Pretrain/Step": 30, "Pretrain/Step Time": 29.1764718691508} +{"Pretrain/Learning Rate": 2.7097902097902096e-06, "Pretrain/Loss": 3.815816640853882, "Pretrain/Loss (Raw)": 2.9518611431121826, "Pretrain/Step": 31, "Pretrain/Step Time": 29.15601578835518} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 3.6228535175323486, "Pretrain/Loss (Raw)": 2.7410926818847656, "Pretrain/Step": 32, "Pretrain/Step Time": 29.144019320607185} +{"Pretrain/Learning Rate": 2.884615384615385e-06, "Pretrain/Loss": 3.625187635421753, "Pretrain/Loss (Raw)": 3.1272003650665283, "Pretrain/Step": 33, "Pretrain/Step Time": 29.22341009342309} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 3.566953182220459, "Pretrain/Loss (Raw)": 3.260988235473633, "Pretrain/Step": 34, "Pretrain/Step Time": 29.181303529178393} +{"Pretrain/Learning Rate": 3.0594405594405598e-06, "Pretrain/Loss": 3.4807355403900146, "Pretrain/Loss (Raw)": 2.981375217437744, "Pretrain/Step": 35, "Pretrain/Step Time": 29.197005251475744} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 3.4442849159240723, "Pretrain/Loss (Raw)": 3.2996950149536133, "Pretrain/Step": 36, "Pretrain/Step Time": 29.199343217743767} +{"Pretrain/Learning Rate": 3.2342657342657347e-06, "Pretrain/Loss": 3.3769915103912354, "Pretrain/Loss (Raw)": 3.244882106781006, "Pretrain/Step": 37, "Pretrain/Step Time": 29.18681272300514} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 3.3205981254577637, "Pretrain/Loss (Raw)": 2.696432113647461, "Pretrain/Step": 38, "Pretrain/Step Time": 29.237600583779184} +{"Pretrain/Learning Rate": 3.409090909090909e-06, "Pretrain/Loss": 3.29773211479187, "Pretrain/Loss (Raw)": 2.794900894165039, "Pretrain/Step": 39, "Pretrain/Step Time": 29.226215038544094} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 3.1968603134155273, "Pretrain/Loss (Raw)": 2.712066888809204, "Pretrain/Step": 40, "Pretrain/Step Time": 29.236094444990158} +{"Pretrain/Learning Rate": 3.583916083916084e-06, "Pretrain/Loss": 3.153980255126953, "Pretrain/Loss (Raw)": 2.7681314945220947, "Pretrain/Step": 41, "Pretrain/Step Time": 29.250012013970352} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 3.05564546585083, "Pretrain/Loss (Raw)": 2.8078839778900146, "Pretrain/Step": 42, "Pretrain/Step Time": 29.229568072727748} +{"Pretrain/Learning Rate": 3.7587412587412585e-06, "Pretrain/Loss": 2.990428924560547, "Pretrain/Loss (Raw)": 2.367224931716919, "Pretrain/Step": 43, "Pretrain/Step Time": 29.233421819154607} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 2.9541807174682617, "Pretrain/Loss (Raw)": 2.892725944519043, "Pretrain/Step": 44, "Pretrain/Step Time": 29.235542985526} +{"Pretrain/Learning Rate": 3.933566433566433e-06, "Pretrain/Loss": 2.908191680908203, "Pretrain/Loss (Raw)": 2.522021770477295, "Pretrain/Step": 45, "Pretrain/Step Time": 29.23585867881775} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 2.8618640899658203, "Pretrain/Loss (Raw)": 2.621342658996582, "Pretrain/Step": 46, "Pretrain/Step Time": 29.248927634695303} +{"Pretrain/Learning Rate": 4.108391608391608e-06, "Pretrain/Loss": 2.829981803894043, "Pretrain/Loss (Raw)": 2.4417452812194824, "Pretrain/Step": 47, "Pretrain/Step Time": 29.263043799298874} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 2.8471477031707764, "Pretrain/Loss (Raw)": 3.015747547149658, "Pretrain/Step": 48, "Pretrain/Step Time": 29.275155281027157} +{"Pretrain/Learning Rate": 4.283216783216783e-06, "Pretrain/Loss": 2.816720485687256, "Pretrain/Loss (Raw)": 2.640362501144409, "Pretrain/Step": 49, "Pretrain/Step Time": 29.29827583566004} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 2.785097599029541, "Pretrain/Loss (Raw)": 2.755023717880249, "Pretrain/Step": 50, "Pretrain/Step Time": 29.32401316165924} +{"Pretrain/Learning Rate": 4.458041958041959e-06, "Pretrain/Loss": 2.7465953826904297, "Pretrain/Loss (Raw)": 2.3653404712677, "Pretrain/Step": 51, "Pretrain/Step Time": 29.320572951260736} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 2.7038588523864746, "Pretrain/Loss (Raw)": 2.6159119606018066, "Pretrain/Step": 52, "Pretrain/Step Time": 29.350184559822083} +{"Pretrain/Learning Rate": 4.632867132867133e-06, "Pretrain/Loss": 2.680983781814575, "Pretrain/Loss (Raw)": 2.8788771629333496, "Pretrain/Step": 53, "Pretrain/Step Time": 29.356065651155866} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 2.6656606197357178, "Pretrain/Loss (Raw)": 2.451262950897217, "Pretrain/Step": 54, "Pretrain/Step Time": 29.36181695814486} +{"Pretrain/Learning Rate": 4.807692307692308e-06, "Pretrain/Loss": 2.6719672679901123, "Pretrain/Loss (Raw)": 2.895808219909668, "Pretrain/Step": 55, "Pretrain/Step Time": 29.365039270574396} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 2.6749095916748047, "Pretrain/Loss (Raw)": 2.759145975112915, "Pretrain/Step": 56, "Pretrain/Step Time": 29.386860626084463} +{"Pretrain/Learning Rate": 4.982517482517483e-06, "Pretrain/Loss": 2.6643829345703125, "Pretrain/Loss (Raw)": 2.5997045040130615, "Pretrain/Step": 57, "Pretrain/Step Time": 29.374904527998808} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 2.6530847549438477, "Pretrain/Loss (Raw)": 2.6271088123321533, "Pretrain/Step": 58, "Pretrain/Step Time": 29.396726201320515} +{"Pretrain/Learning Rate": 5.157342657342658e-06, "Pretrain/Loss": 2.6726155281066895, "Pretrain/Loss (Raw)": 2.679718494415283, "Pretrain/Step": 59, "Pretrain/Step Time": 29.413248450069105} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 2.6543519496917725, "Pretrain/Loss (Raw)": 2.6005077362060547, "Pretrain/Step": 60, "Pretrain/Step Time": 29.419821027914683} +{"Pretrain/Learning Rate": 5.3321678321678325e-06, "Pretrain/Loss": 2.670313835144043, "Pretrain/Loss (Raw)": 2.7774131298065186, "Pretrain/Step": 61, "Pretrain/Step Time": 29.443770623597942} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 2.659111499786377, "Pretrain/Loss (Raw)": 2.442106246948242, "Pretrain/Step": 62, "Pretrain/Step Time": 29.429937016579412} +{"Pretrain/Learning Rate": 5.5069930069930074e-06, "Pretrain/Loss": 2.6667394638061523, "Pretrain/Loss (Raw)": 2.563793420791626, "Pretrain/Step": 63, "Pretrain/Step Time": 29.44102578692966} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.647381544113159, "Pretrain/Loss (Raw)": 2.706019401550293, "Pretrain/Step": 64, "Pretrain/Step Time": 29.460045225918293} +{"Pretrain/Learning Rate": 5.681818181818182e-06, "Pretrain/Loss": 2.6322124004364014, "Pretrain/Loss (Raw)": 2.3976550102233887, "Pretrain/Step": 65, "Pretrain/Step Time": 29.445630029531625} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.623671770095825, "Pretrain/Loss (Raw)": 2.618375778198242, "Pretrain/Step": 66, "Pretrain/Step Time": 29.459291317246176} +{"Pretrain/Learning Rate": 5.856643356643357e-06, "Pretrain/Loss": 2.6370229721069336, "Pretrain/Loss (Raw)": 2.5789566040039062, "Pretrain/Step": 67, "Pretrain/Step Time": 29.465799619902427} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.6405344009399414, "Pretrain/Loss (Raw)": 2.672095775604248, "Pretrain/Step": 68, "Pretrain/Step Time": 29.472986606990588} +{"Pretrain/Learning Rate": 6.031468531468531e-06, "Pretrain/Loss": 2.6369855403900146, "Pretrain/Loss (Raw)": 2.8220953941345215, "Pretrain/Step": 69, "Pretrain/Step Time": 29.479962317839913} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.644449234008789, "Pretrain/Loss (Raw)": 2.570685386657715, "Pretrain/Step": 70, "Pretrain/Step Time": 29.46174430165972} +{"Pretrain/Learning Rate": 6.206293706293707e-06, "Pretrain/Loss": 2.633190870285034, "Pretrain/Loss (Raw)": 2.7156729698181152, "Pretrain/Step": 71, "Pretrain/Step Time": 29.488916548205093} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.631801128387451, "Pretrain/Loss (Raw)": 2.7369091510772705, "Pretrain/Step": 72, "Pretrain/Step Time": 29.49188142021497} +{"Pretrain/Learning Rate": 6.381118881118882e-06, "Pretrain/Loss": 2.6316323280334473, "Pretrain/Loss (Raw)": 2.59700345993042, "Pretrain/Step": 73, "Pretrain/Step Time": 29.48660135269165} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.622802257537842, "Pretrain/Loss (Raw)": 2.4858295917510986, "Pretrain/Step": 74, "Pretrain/Step Time": 29.496597534901387} +{"Pretrain/Learning Rate": 6.555944055944056e-06, "Pretrain/Loss": 2.6073012351989746, "Pretrain/Loss (Raw)": 2.4316983222961426, "Pretrain/Step": 75, "Pretrain/Step Time": 29.49738810221354} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.620945930480957, "Pretrain/Loss (Raw)": 2.8188250064849854, "Pretrain/Step": 76, "Pretrain/Step Time": 29.4927537598108} +{"Pretrain/Learning Rate": 6.730769230769231e-06, "Pretrain/Loss": 2.626570701599121, "Pretrain/Loss (Raw)": 2.867412567138672, "Pretrain/Step": 77, "Pretrain/Step Time": 29.50058005692123} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.6544737815856934, "Pretrain/Loss (Raw)": 2.888556718826294, "Pretrain/Step": 78, "Pretrain/Step Time": 29.504708962562756} +{"Pretrain/Learning Rate": 6.905594405594405e-06, "Pretrain/Loss": 2.65161395072937, "Pretrain/Loss (Raw)": 2.5180349349975586, "Pretrain/Step": 79, "Pretrain/Step Time": 29.51031024546563} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.6402816772460938, "Pretrain/Loss (Raw)": 2.524704933166504, "Pretrain/Step": 80, "Pretrain/Step Time": 29.505665910243987} +{"Pretrain/Learning Rate": 7.0804195804195815e-06, "Pretrain/Loss": 2.6479110717773438, "Pretrain/Loss (Raw)": 2.519725799560547, "Pretrain/Step": 81, "Pretrain/Step Time": 29.513708335381967} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.6603217124938965, "Pretrain/Loss (Raw)": 2.8169422149658203, "Pretrain/Step": 82, "Pretrain/Step Time": 29.521043812356343} +{"Pretrain/Learning Rate": 7.2552447552447555e-06, "Pretrain/Loss": 2.6658873558044434, "Pretrain/Loss (Raw)": 2.6680054664611816, "Pretrain/Step": 83, "Pretrain/Step Time": 29.513216136449792} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.6650609970092773, "Pretrain/Loss (Raw)": 2.65887713432312, "Pretrain/Step": 84, "Pretrain/Step Time": 29.52038319905599} +{"Pretrain/Learning Rate": 7.43006993006993e-06, "Pretrain/Loss": 2.649322032928467, "Pretrain/Loss (Raw)": 2.5702695846557617, "Pretrain/Step": 85, "Pretrain/Step Time": 29.530117093815523} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.648853302001953, "Pretrain/Loss (Raw)": 2.5631837844848633, "Pretrain/Step": 86, "Pretrain/Step Time": 29.53480003046435} +{"Pretrain/Learning Rate": 7.604895104895106e-06, "Pretrain/Loss": 2.6347851753234863, "Pretrain/Loss (Raw)": 2.4905834197998047, "Pretrain/Step": 87, "Pretrain/Step Time": 29.545942607967334} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.6071295738220215, "Pretrain/Loss (Raw)": 2.294421911239624, "Pretrain/Step": 88, "Pretrain/Step Time": 29.54721228371967} +{"Pretrain/Learning Rate": 7.77972027972028e-06, "Pretrain/Loss": 2.595658779144287, "Pretrain/Loss (Raw)": 2.41347074508667, "Pretrain/Step": 89, "Pretrain/Step Time": 29.548367674431105} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.5834834575653076, "Pretrain/Loss (Raw)": 2.2910232543945312, "Pretrain/Step": 90, "Pretrain/Step Time": 29.555707205666437} +{"Pretrain/Learning Rate": 7.954545454545455e-06, "Pretrain/Loss": 2.581355094909668, "Pretrain/Loss (Raw)": 2.3976428508758545, "Pretrain/Step": 91, "Pretrain/Step Time": 29.55588721705007} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.5617592334747314, "Pretrain/Loss (Raw)": 2.505293130874634, "Pretrain/Step": 92, "Pretrain/Step Time": 29.570115307103034} +{"Pretrain/Learning Rate": 8.12937062937063e-06, "Pretrain/Loss": 2.5567002296447754, "Pretrain/Loss (Raw)": 2.786471128463745, "Pretrain/Step": 93, "Pretrain/Step Time": 29.572135643292498} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.537234306335449, "Pretrain/Loss (Raw)": 2.5770978927612305, "Pretrain/Step": 94, "Pretrain/Step Time": 29.572851665476534} +{"Pretrain/Learning Rate": 8.304195804195805e-06, "Pretrain/Loss": 2.563526153564453, "Pretrain/Loss (Raw)": 2.9387049674987793, "Pretrain/Step": 95, "Pretrain/Step Time": 29.576632585023578} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.5669782161712646, "Pretrain/Loss (Raw)": 2.5799386501312256, "Pretrain/Step": 96, "Pretrain/Step Time": 29.58465953419606} +{"Pretrain/Learning Rate": 8.47902097902098e-06, "Pretrain/Loss": 2.5777981281280518, "Pretrain/Loss (Raw)": 2.692845344543457, "Pretrain/Step": 97, "Pretrain/Step Time": 29.594000155163794} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.5666956901550293, "Pretrain/Loss (Raw)": 2.639303684234619, "Pretrain/Step": 98, "Pretrain/Step Time": 29.594041293981125} +{"Pretrain/Learning Rate": 8.653846153846155e-06, "Pretrain/Loss": 2.5466980934143066, "Pretrain/Loss (Raw)": 2.3480443954467773, "Pretrain/Step": 99, "Pretrain/Step Time": 29.59155262359465} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.5438337326049805, "Pretrain/Loss (Raw)": 2.6130454540252686, "Pretrain/Step": 100, "Pretrain/Step Time": 29.598620645999908} +{"Pretrain/Learning Rate": 8.828671328671328e-06, "Pretrain/Loss": 2.5432658195495605, "Pretrain/Loss (Raw)": 2.561185359954834, "Pretrain/Step": 101, "Pretrain/Step Time": 29.607076071276524} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.5408992767333984, "Pretrain/Loss (Raw)": 2.525315284729004, "Pretrain/Step": 102, "Pretrain/Step Time": 29.603713694740744} +{"Pretrain/Learning Rate": 9.003496503496504e-06, "Pretrain/Loss": 2.5428466796875, "Pretrain/Loss (Raw)": 2.5217461585998535, "Pretrain/Step": 103, "Pretrain/Step Time": 29.60518400414476} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.5715131759643555, "Pretrain/Loss (Raw)": 2.753086566925049, "Pretrain/Step": 104, "Pretrain/Step Time": 29.609023814017956} +{"Pretrain/Learning Rate": 9.17832167832168e-06, "Pretrain/Loss": 2.5778770446777344, "Pretrain/Loss (Raw)": 2.5152854919433594, "Pretrain/Step": 105, "Pretrain/Step Time": 29.61988443647112} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.5831315517425537, "Pretrain/Loss (Raw)": 2.3750991821289062, "Pretrain/Step": 106, "Pretrain/Step Time": 29.626370729140515} +{"Pretrain/Learning Rate": 9.353146853146853e-06, "Pretrain/Loss": 2.5877392292022705, "Pretrain/Loss (Raw)": 2.4713635444641113, "Pretrain/Step": 107, "Pretrain/Step Time": 29.626199530663893} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.5935111045837402, "Pretrain/Loss (Raw)": 2.5976459980010986, "Pretrain/Step": 108, "Pretrain/Step Time": 29.631033394071792} +{"Pretrain/Learning Rate": 9.527972027972027e-06, "Pretrain/Loss": 2.576785087585449, "Pretrain/Loss (Raw)": 2.5188519954681396, "Pretrain/Step": 109, "Pretrain/Step Time": 29.641010120374347} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.5529778003692627, "Pretrain/Loss (Raw)": 2.19618558883667, "Pretrain/Step": 110, "Pretrain/Step Time": 29.637810124050485} +{"Pretrain/Learning Rate": 9.702797202797204e-06, "Pretrain/Loss": 2.517961263656616, "Pretrain/Loss (Raw)": 2.3784399032592773, "Pretrain/Step": 111, "Pretrain/Step Time": 29.639863368627186} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.5273523330688477, "Pretrain/Loss (Raw)": 2.7301931381225586, "Pretrain/Step": 112, "Pretrain/Step Time": 29.634600268942968} +{"Pretrain/Learning Rate": 9.877622377622379e-06, "Pretrain/Loss": 2.5006542205810547, "Pretrain/Loss (Raw)": 2.2656760215759277, "Pretrain/Step": 113, "Pretrain/Step Time": 29.640847090071283} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.495417594909668, "Pretrain/Loss (Raw)": 2.5555200576782227, "Pretrain/Step": 114, "Pretrain/Step Time": 29.645945143281367} +{"Pretrain/Learning Rate": 1.0052447552447552e-05, "Pretrain/Loss": 2.4985806941986084, "Pretrain/Loss (Raw)": 2.3986496925354004, "Pretrain/Step": 115, "Pretrain/Step Time": 29.637685359042624} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.482457160949707, "Pretrain/Loss (Raw)": 2.3550686836242676, "Pretrain/Step": 116, "Pretrain/Step Time": 29.638106502335646} +{"Pretrain/Learning Rate": 1.0227272727272729e-05, "Pretrain/Loss": 2.4832561016082764, "Pretrain/Loss (Raw)": 2.5739669799804688, "Pretrain/Step": 117, "Pretrain/Step Time": 29.64195790250077} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.4785823822021484, "Pretrain/Loss (Raw)": 2.4505386352539062, "Pretrain/Step": 118, "Pretrain/Step Time": 29.64513587547561} +{"Pretrain/Learning Rate": 1.0402097902097904e-05, "Pretrain/Loss": 2.476123094558716, "Pretrain/Loss (Raw)": 2.4823977947235107, "Pretrain/Step": 119, "Pretrain/Step Time": 29.652525244640703} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.462099075317383, "Pretrain/Loss (Raw)": 2.5286989212036133, "Pretrain/Step": 120, "Pretrain/Step Time": 29.648204561074575} +{"Pretrain/Learning Rate": 1.0576923076923077e-05, "Pretrain/Loss": 2.452901840209961, "Pretrain/Loss (Raw)": 2.3681321144104004, "Pretrain/Step": 121, "Pretrain/Step Time": 29.64192296453744} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.4325337409973145, "Pretrain/Loss (Raw)": 2.049207925796509, "Pretrain/Step": 122, "Pretrain/Step Time": 29.645907232018768} +{"Pretrain/Learning Rate": 1.0751748251748252e-05, "Pretrain/Loss": 2.4299607276916504, "Pretrain/Loss (Raw)": 2.430198907852173, "Pretrain/Step": 123, "Pretrain/Step Time": 29.645173850098278} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.4269514083862305, "Pretrain/Loss (Raw)": 2.5494930744171143, "Pretrain/Step": 124, "Pretrain/Step Time": 29.65025337665312} +{"Pretrain/Learning Rate": 1.0926573426573428e-05, "Pretrain/Loss": 2.418780565261841, "Pretrain/Loss (Raw)": 2.388120412826538, "Pretrain/Step": 125, "Pretrain/Step Time": 29.647310972213745} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.438143253326416, "Pretrain/Loss (Raw)": 2.5059890747070312, "Pretrain/Step": 126, "Pretrain/Step Time": 29.643762980188644} +{"Pretrain/Learning Rate": 1.1101398601398601e-05, "Pretrain/Loss": 2.4463443756103516, "Pretrain/Loss (Raw)": 2.5096564292907715, "Pretrain/Step": 127, "Pretrain/Step Time": 29.64649667890053} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.423840045928955, "Pretrain/Loss (Raw)": 2.370126247406006, "Pretrain/Step": 128, "Pretrain/Step Time": 29.64452796243131} +{"Pretrain/Learning Rate": 1.1276223776223776e-05, "Pretrain/Loss": 2.4386258125305176, "Pretrain/Loss (Raw)": 2.5022449493408203, "Pretrain/Step": 129, "Pretrain/Step Time": 29.645716348662972} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.4289917945861816, "Pretrain/Loss (Raw)": 2.4013772010803223, "Pretrain/Step": 130, "Pretrain/Step Time": 29.663855727761984} +{"Pretrain/Learning Rate": 1.1451048951048951e-05, "Pretrain/Loss": 2.4189577102661133, "Pretrain/Loss (Raw)": 2.238107681274414, "Pretrain/Step": 131, "Pretrain/Step Time": 29.654603281989694} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.4090797901153564, "Pretrain/Loss (Raw)": 2.197021245956421, "Pretrain/Step": 132, "Pretrain/Step Time": 29.672420017421246} +{"Pretrain/Learning Rate": 1.1625874125874126e-05, "Pretrain/Loss": 2.386538028717041, "Pretrain/Loss (Raw)": 2.2132961750030518, "Pretrain/Step": 133, "Pretrain/Step Time": 29.673221232369542} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.3750576972961426, "Pretrain/Loss (Raw)": 2.2668519020080566, "Pretrain/Step": 134, "Pretrain/Step Time": 29.669508380815387} +{"Pretrain/Learning Rate": 1.1800699300699301e-05, "Pretrain/Loss": 2.359199047088623, "Pretrain/Loss (Raw)": 2.2286601066589355, "Pretrain/Step": 135, "Pretrain/Step Time": 29.689225209876895} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.354126453399658, "Pretrain/Loss (Raw)": 2.447537899017334, "Pretrain/Step": 136, "Pretrain/Step Time": 29.684569243341684} +{"Pretrain/Learning Rate": 1.1975524475524476e-05, "Pretrain/Loss": 2.379413604736328, "Pretrain/Loss (Raw)": 2.7727270126342773, "Pretrain/Step": 137, "Pretrain/Step Time": 29.688114166259766} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.4171011447906494, "Pretrain/Loss (Raw)": 2.6522092819213867, "Pretrain/Step": 138, "Pretrain/Step Time": 29.704200834035873} +{"Pretrain/Learning Rate": 1.215034965034965e-05, "Pretrain/Loss": 2.4390454292297363, "Pretrain/Loss (Raw)": 2.781308650970459, "Pretrain/Step": 139, "Pretrain/Step Time": 29.691995920613408} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.4246411323547363, "Pretrain/Loss (Raw)": 2.319023609161377, "Pretrain/Step": 140, "Pretrain/Step Time": 29.705658869817853} +{"Pretrain/Learning Rate": 1.2325174825174826e-05, "Pretrain/Loss": 2.4389753341674805, "Pretrain/Loss (Raw)": 2.617465019226074, "Pretrain/Step": 141, "Pretrain/Step Time": 29.725726766511798} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.432730197906494, "Pretrain/Loss (Raw)": 2.406069755554199, "Pretrain/Step": 142, "Pretrain/Step Time": 29.71704138442874} +{"Pretrain/Learning Rate": 1.25e-05, "Pretrain/Loss": 2.434103488922119, "Pretrain/Loss (Raw)": 2.531625270843506, "Pretrain/Step": 143, "Pretrain/Step Time": 29.738039387390018} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.4285151958465576, "Pretrain/Loss (Raw)": 2.280717372894287, "Pretrain/Step": 144, "Pretrain/Step Time": 29.739434134215117} +{"Pretrain/Learning Rate": 1.2674825174825175e-05, "Pretrain/Loss": 2.408717393875122, "Pretrain/Loss (Raw)": 2.1854782104492188, "Pretrain/Step": 145, "Pretrain/Step Time": 29.743684194982052} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.408168077468872, "Pretrain/Loss (Raw)": 2.392590045928955, "Pretrain/Step": 146, "Pretrain/Step Time": 29.762978522107005} +{"Pretrain/Learning Rate": 1.2849650349650349e-05, "Pretrain/Loss": 2.4263322353363037, "Pretrain/Loss (Raw)": 2.5287346839904785, "Pretrain/Step": 147, "Pretrain/Step Time": 29.75226343423128} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.4360744953155518, "Pretrain/Loss (Raw)": 2.3528971672058105, "Pretrain/Step": 148, "Pretrain/Step Time": 29.759689999744296} +{"Pretrain/Learning Rate": 1.3024475524475524e-05, "Pretrain/Loss": 2.4467177391052246, "Pretrain/Loss (Raw)": 2.3835864067077637, "Pretrain/Step": 149, "Pretrain/Step Time": 29.766596609726548} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.4445860385894775, "Pretrain/Loss (Raw)": 2.232746124267578, "Pretrain/Step": 150, "Pretrain/Step Time": 29.761016441509128} +{"Pretrain/Learning Rate": 1.3199300699300702e-05, "Pretrain/Loss": 2.4546186923980713, "Pretrain/Loss (Raw)": 2.389180898666382, "Pretrain/Step": 151, "Pretrain/Step Time": 29.771972209215164} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.4589927196502686, "Pretrain/Loss (Raw)": 2.5175223350524902, "Pretrain/Step": 152, "Pretrain/Step Time": 29.77385846339166} +{"Pretrain/Learning Rate": 1.3374125874125875e-05, "Pretrain/Loss": 2.4283127784729004, "Pretrain/Loss (Raw)": 2.2818503379821777, "Pretrain/Step": 153, "Pretrain/Step Time": 29.77502593398094} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.4130396842956543, "Pretrain/Loss (Raw)": 2.407837390899658, "Pretrain/Step": 154, "Pretrain/Step Time": 29.790833784267306} +{"Pretrain/Learning Rate": 1.354895104895105e-05, "Pretrain/Loss": 2.3919837474823, "Pretrain/Loss (Raw)": 2.4444146156311035, "Pretrain/Step": 155, "Pretrain/Step Time": 29.782927494496107} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.372002363204956, "Pretrain/Loss (Raw)": 1.9993226528167725, "Pretrain/Step": 156, "Pretrain/Step Time": 29.801797879859805} +{"Pretrain/Learning Rate": 1.3723776223776225e-05, "Pretrain/Loss": 2.361788034439087, "Pretrain/Loss (Raw)": 2.454036235809326, "Pretrain/Step": 157, "Pretrain/Step Time": 29.81173306889832} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.3628692626953125, "Pretrain/Loss (Raw)": 2.423367500305176, "Pretrain/Step": 158, "Pretrain/Step Time": 29.796109937131405} +{"Pretrain/Learning Rate": 1.38986013986014e-05, "Pretrain/Loss": 2.3494434356689453, "Pretrain/Loss (Raw)": 2.316812515258789, "Pretrain/Step": 159, "Pretrain/Step Time": 29.812038274481893} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.353003978729248, "Pretrain/Loss (Raw)": 2.337684154510498, "Pretrain/Step": 160, "Pretrain/Step Time": 29.812212048098445} +{"Pretrain/Learning Rate": 1.4073426573426573e-05, "Pretrain/Loss": 2.362980365753174, "Pretrain/Loss (Raw)": 2.345102071762085, "Pretrain/Step": 161, "Pretrain/Step Time": 29.800487466156483} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.357649087905884, "Pretrain/Loss (Raw)": 2.3072898387908936, "Pretrain/Step": 162, "Pretrain/Step Time": 29.81836893223226} +{"Pretrain/Learning Rate": 1.4248251748251748e-05, "Pretrain/Loss": 2.3763985633850098, "Pretrain/Loss (Raw)": 2.8287301063537598, "Pretrain/Step": 163, "Pretrain/Step Time": 29.825166700407863} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.3886940479278564, "Pretrain/Loss (Raw)": 2.54962158203125, "Pretrain/Step": 164, "Pretrain/Step Time": 29.832998171448708} +{"Pretrain/Learning Rate": 1.4423076923076923e-05, "Pretrain/Loss": 2.381537437438965, "Pretrain/Loss (Raw)": 2.2690820693969727, "Pretrain/Step": 165, "Pretrain/Step Time": 29.840286998078227} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.3879833221435547, "Pretrain/Loss (Raw)": 2.3358778953552246, "Pretrain/Step": 166, "Pretrain/Step Time": 29.83376694098115} +{"Pretrain/Learning Rate": 1.45979020979021e-05, "Pretrain/Loss": 2.399078369140625, "Pretrain/Loss (Raw)": 2.5667009353637695, "Pretrain/Step": 167, "Pretrain/Step Time": 29.849400497972965} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.3903183937072754, "Pretrain/Loss (Raw)": 2.377363681793213, "Pretrain/Step": 168, "Pretrain/Step Time": 29.844614872708917} +{"Pretrain/Learning Rate": 1.4772727272727274e-05, "Pretrain/Loss": 2.3981215953826904, "Pretrain/Loss (Raw)": 2.40670108795166, "Pretrain/Step": 169, "Pretrain/Step Time": 29.850801130756736} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.3976941108703613, "Pretrain/Loss (Raw)": 2.400998592376709, "Pretrain/Step": 170, "Pretrain/Step Time": 29.863849548622966} +{"Pretrain/Learning Rate": 1.4947552447552449e-05, "Pretrain/Loss": 2.3816497325897217, "Pretrain/Loss (Raw)": 2.1877048015594482, "Pretrain/Step": 171, "Pretrain/Step Time": 29.85898326151073} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.389908790588379, "Pretrain/Loss (Raw)": 2.1314687728881836, "Pretrain/Step": 172, "Pretrain/Step Time": 29.867229379713535} +{"Pretrain/Learning Rate": 1.5122377622377622e-05, "Pretrain/Loss": 2.3863039016723633, "Pretrain/Loss (Raw)": 2.3963589668273926, "Pretrain/Step": 173, "Pretrain/Step Time": 29.868428748100996} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.392556667327881, "Pretrain/Loss (Raw)": 2.523411273956299, "Pretrain/Step": 174, "Pretrain/Step Time": 29.865499632433057} +{"Pretrain/Learning Rate": 1.5297202797202797e-05, "Pretrain/Loss": 2.3929381370544434, "Pretrain/Loss (Raw)": 2.3229169845581055, "Pretrain/Step": 175, "Pretrain/Step Time": 29.86544527299702} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.3995919227600098, "Pretrain/Loss (Raw)": 2.444141387939453, "Pretrain/Step": 176, "Pretrain/Step Time": 29.855695025995374} +{"Pretrain/Learning Rate": 1.547202797202797e-05, "Pretrain/Loss": 2.389159917831421, "Pretrain/Loss (Raw)": 2.178191661834717, "Pretrain/Step": 177, "Pretrain/Step Time": 29.856352919712663} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.3801016807556152, "Pretrain/Loss (Raw)": 2.1623544692993164, "Pretrain/Step": 178, "Pretrain/Step Time": 29.84860661625862} +{"Pretrain/Learning Rate": 1.5646853146853147e-05, "Pretrain/Loss": 2.3536620140075684, "Pretrain/Loss (Raw)": 2.405696392059326, "Pretrain/Step": 179, "Pretrain/Step Time": 29.853629868477583} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.3481414318084717, "Pretrain/Loss (Raw)": 2.461292028427124, "Pretrain/Step": 180, "Pretrain/Step Time": 29.849054409191012} +{"Pretrain/Learning Rate": 1.5821678321678324e-05, "Pretrain/Loss": 2.3511581420898438, "Pretrain/Loss (Raw)": 2.3173532485961914, "Pretrain/Step": 181, "Pretrain/Step Time": 29.851126926019788} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.368518590927124, "Pretrain/Loss (Raw)": 2.6136412620544434, "Pretrain/Step": 182, "Pretrain/Step Time": 29.846639716997743} +{"Pretrain/Learning Rate": 1.5996503496503497e-05, "Pretrain/Loss": 2.349752902984619, "Pretrain/Loss (Raw)": 2.2664525508880615, "Pretrain/Step": 183, "Pretrain/Step Time": 29.853759514167905} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.342717170715332, "Pretrain/Loss (Raw)": 2.2647886276245117, "Pretrain/Step": 184, "Pretrain/Step Time": 29.843115486204624} +{"Pretrain/Learning Rate": 1.6171328671328673e-05, "Pretrain/Loss": 2.3394980430603027, "Pretrain/Loss (Raw)": 2.355194091796875, "Pretrain/Step": 185, "Pretrain/Step Time": 29.85528147779405} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.336886405944824, "Pretrain/Loss (Raw)": 2.35921311378479, "Pretrain/Step": 186, "Pretrain/Step Time": 29.84757181815803} +{"Pretrain/Learning Rate": 1.6346153846153847e-05, "Pretrain/Loss": 2.3668107986450195, "Pretrain/Loss (Raw)": 2.666494607925415, "Pretrain/Step": 187, "Pretrain/Step Time": 29.83855313807726} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.3801865577697754, "Pretrain/Loss (Raw)": 2.3454840183258057, "Pretrain/Step": 188, "Pretrain/Step Time": 29.847731854766607} +{"Pretrain/Learning Rate": 1.6520979020979023e-05, "Pretrain/Loss": 2.3729004859924316, "Pretrain/Loss (Raw)": 2.279784917831421, "Pretrain/Step": 189, "Pretrain/Step Time": 29.834730880334973} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.3570730686187744, "Pretrain/Loss (Raw)": 2.2701709270477295, "Pretrain/Step": 190, "Pretrain/Step Time": 29.845079557970166} +{"Pretrain/Learning Rate": 1.6695804195804196e-05, "Pretrain/Loss": 2.3490161895751953, "Pretrain/Loss (Raw)": 2.1940083503723145, "Pretrain/Step": 191, "Pretrain/Step Time": 29.84333704598248} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.341010570526123, "Pretrain/Loss (Raw)": 2.316049575805664, "Pretrain/Step": 192, "Pretrain/Step Time": 29.832383319735527} +{"Pretrain/Learning Rate": 1.687062937062937e-05, "Pretrain/Loss": 2.3718605041503906, "Pretrain/Loss (Raw)": 2.6717867851257324, "Pretrain/Step": 193, "Pretrain/Step Time": 29.848536793142557} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.3768012523651123, "Pretrain/Loss (Raw)": 2.2414114475250244, "Pretrain/Step": 194, "Pretrain/Step Time": 29.845946272835135} +{"Pretrain/Learning Rate": 1.7045454545454546e-05, "Pretrain/Loss": 2.3660895824432373, "Pretrain/Loss (Raw)": 2.2343063354492188, "Pretrain/Step": 195, "Pretrain/Step Time": 29.843428030610085} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.3534505367279053, "Pretrain/Loss (Raw)": 2.2590689659118652, "Pretrain/Step": 196, "Pretrain/Step Time": 29.84639992378652} +{"Pretrain/Learning Rate": 1.7220279720279723e-05, "Pretrain/Loss": 2.3480961322784424, "Pretrain/Loss (Raw)": 2.231680393218994, "Pretrain/Step": 197, "Pretrain/Step Time": 29.852932818233967} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.3257761001586914, "Pretrain/Loss (Raw)": 2.256520986557007, "Pretrain/Step": 198, "Pretrain/Step Time": 29.86750515550375} +{"Pretrain/Learning Rate": 1.7395104895104896e-05, "Pretrain/Loss": 2.322561502456665, "Pretrain/Loss (Raw)": 2.2150189876556396, "Pretrain/Step": 199, "Pretrain/Step Time": 29.857237063348293} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.3342247009277344, "Pretrain/Loss (Raw)": 2.4514026641845703, "Pretrain/Step": 200, "Pretrain/Step Time": 29.85004996880889} +{"Pretrain/Learning Rate": 1.7569930069930072e-05, "Pretrain/Loss": 2.3340163230895996, "Pretrain/Loss (Raw)": 2.3518590927124023, "Pretrain/Step": 201, "Pretrain/Step Time": 29.85600669682026} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.324047088623047, "Pretrain/Loss (Raw)": 2.1997079849243164, "Pretrain/Step": 202, "Pretrain/Step Time": 29.851580755785108} +{"Pretrain/Learning Rate": 1.7744755244755246e-05, "Pretrain/Loss": 2.3123111724853516, "Pretrain/Loss (Raw)": 2.4787163734436035, "Pretrain/Step": 203, "Pretrain/Step Time": 29.851437870413065} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.3111581802368164, "Pretrain/Loss (Raw)": 2.327035903930664, "Pretrain/Step": 204, "Pretrain/Step Time": 29.868909679353237} +{"Pretrain/Learning Rate": 1.791958041958042e-05, "Pretrain/Loss": 2.3081071376800537, "Pretrain/Loss (Raw)": 2.2309677600860596, "Pretrain/Step": 205, "Pretrain/Step Time": 29.866672676056623} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.3127126693725586, "Pretrain/Loss (Raw)": 2.3438596725463867, "Pretrain/Step": 206, "Pretrain/Step Time": 29.86483523249626} +{"Pretrain/Learning Rate": 1.8094405594405595e-05, "Pretrain/Loss": 2.3210458755493164, "Pretrain/Loss (Raw)": 2.327342987060547, "Pretrain/Step": 207, "Pretrain/Step Time": 29.871724909171462} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.3488173484802246, "Pretrain/Loss (Raw)": 2.760389804840088, "Pretrain/Step": 208, "Pretrain/Step Time": 29.873920425772667} +{"Pretrain/Learning Rate": 1.826923076923077e-05, "Pretrain/Loss": 2.337130546569824, "Pretrain/Loss (Raw)": 2.484801769256592, "Pretrain/Step": 209, "Pretrain/Step Time": 29.86683394946158} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.334214210510254, "Pretrain/Loss (Raw)": 2.194748878479004, "Pretrain/Step": 210, "Pretrain/Step Time": 29.873073779046535} +{"Pretrain/Learning Rate": 1.8444055944055945e-05, "Pretrain/Loss": 2.343928337097168, "Pretrain/Loss (Raw)": 2.389730930328369, "Pretrain/Step": 211, "Pretrain/Step Time": 29.879184063524008} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.341834545135498, "Pretrain/Loss (Raw)": 2.2255682945251465, "Pretrain/Step": 212, "Pretrain/Step Time": 29.88328205049038} +{"Pretrain/Learning Rate": 1.8618881118881122e-05, "Pretrain/Loss": 2.3407158851623535, "Pretrain/Loss (Raw)": 2.2137789726257324, "Pretrain/Step": 213, "Pretrain/Step Time": 29.87964617088437} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.3490207195281982, "Pretrain/Loss (Raw)": 2.3894009590148926, "Pretrain/Step": 214, "Pretrain/Step Time": 29.87802980840206} +{"Pretrain/Learning Rate": 1.8793706293706295e-05, "Pretrain/Loss": 2.342487335205078, "Pretrain/Loss (Raw)": 2.110483169555664, "Pretrain/Step": 215, "Pretrain/Step Time": 29.885501923039556} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.332685947418213, "Pretrain/Loss (Raw)": 2.294581890106201, "Pretrain/Step": 216, "Pretrain/Step Time": 29.880962312221527} +{"Pretrain/Learning Rate": 1.8968531468531468e-05, "Pretrain/Loss": 2.331557035446167, "Pretrain/Loss (Raw)": 2.333796501159668, "Pretrain/Step": 217, "Pretrain/Step Time": 29.878343764692545} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.3302173614501953, "Pretrain/Loss (Raw)": 2.1782760620117188, "Pretrain/Step": 218, "Pretrain/Step Time": 29.884180538356304} +{"Pretrain/Learning Rate": 1.9143356643356645e-05, "Pretrain/Loss": 2.317436456680298, "Pretrain/Loss (Raw)": 2.274219036102295, "Pretrain/Step": 219, "Pretrain/Step Time": 29.876259431242943} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.3290843963623047, "Pretrain/Loss (Raw)": 2.51340389251709, "Pretrain/Step": 220, "Pretrain/Step Time": 29.875000217929482} +{"Pretrain/Learning Rate": 1.9318181818181818e-05, "Pretrain/Loss": 2.340285301208496, "Pretrain/Loss (Raw)": 2.4101834297180176, "Pretrain/Step": 221, "Pretrain/Step Time": 29.875845247879624} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.331179618835449, "Pretrain/Loss (Raw)": 2.1981656551361084, "Pretrain/Step": 222, "Pretrain/Step Time": 29.87131712399423} +{"Pretrain/Learning Rate": 1.9493006993006995e-05, "Pretrain/Loss": 2.318652868270874, "Pretrain/Loss (Raw)": 2.1269173622131348, "Pretrain/Step": 223, "Pretrain/Step Time": 29.884240217506886} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.2907752990722656, "Pretrain/Loss (Raw)": 2.3143463134765625, "Pretrain/Step": 224, "Pretrain/Step Time": 29.871525641530752} +{"Pretrain/Learning Rate": 1.9667832167832168e-05, "Pretrain/Loss": 2.3038887977600098, "Pretrain/Loss (Raw)": 2.6946210861206055, "Pretrain/Step": 225, "Pretrain/Step Time": 29.86088940128684} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.303861618041992, "Pretrain/Loss (Raw)": 2.194312810897827, "Pretrain/Step": 226, "Pretrain/Step Time": 29.873813780024648} +{"Pretrain/Learning Rate": 1.9842657342657344e-05, "Pretrain/Loss": 2.3006162643432617, "Pretrain/Loss (Raw)": 2.3378024101257324, "Pretrain/Step": 227, "Pretrain/Step Time": 29.866858687251806} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.31221342086792, "Pretrain/Loss (Raw)": 2.4111244678497314, "Pretrain/Step": 228, "Pretrain/Step Time": 29.87641842290759} +{"Pretrain/Learning Rate": 2.0017482517482518e-05, "Pretrain/Loss": 2.309652805328369, "Pretrain/Loss (Raw)": 2.172807455062866, "Pretrain/Step": 229, "Pretrain/Step Time": 29.87059411406517} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.300765037536621, "Pretrain/Loss (Raw)": 2.2471981048583984, "Pretrain/Step": 230, "Pretrain/Step Time": 29.866276867687702} +{"Pretrain/Learning Rate": 2.0192307692307694e-05, "Pretrain/Loss": 2.321364402770996, "Pretrain/Loss (Raw)": 2.4400739669799805, "Pretrain/Step": 231, "Pretrain/Step Time": 29.870181201025844} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.3242907524108887, "Pretrain/Loss (Raw)": 2.341402530670166, "Pretrain/Step": 232, "Pretrain/Step Time": 29.86999449878931} +{"Pretrain/Learning Rate": 2.0367132867132867e-05, "Pretrain/Loss": 2.3152573108673096, "Pretrain/Loss (Raw)": 2.189260482788086, "Pretrain/Step": 233, "Pretrain/Step Time": 29.861678240820765} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.323896884918213, "Pretrain/Loss (Raw)": 2.3165111541748047, "Pretrain/Step": 234, "Pretrain/Step Time": 29.860762597993016} +{"Pretrain/Learning Rate": 2.0541958041958044e-05, "Pretrain/Loss": 2.3310387134552, "Pretrain/Loss (Raw)": 2.3884878158569336, "Pretrain/Step": 235, "Pretrain/Step Time": 29.85189849883318} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.305908203125, "Pretrain/Loss (Raw)": 2.111314058303833, "Pretrain/Step": 236, "Pretrain/Step Time": 29.85796906799078} +{"Pretrain/Learning Rate": 2.0716783216783217e-05, "Pretrain/Loss": 2.299576759338379, "Pretrain/Loss (Raw)": 2.308882713317871, "Pretrain/Step": 237, "Pretrain/Step Time": 29.851032162085176} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.307786464691162, "Pretrain/Loss (Raw)": 2.3295211791992188, "Pretrain/Step": 238, "Pretrain/Step Time": 29.851947333663702} +{"Pretrain/Learning Rate": 2.089160839160839e-05, "Pretrain/Loss": 2.32517147064209, "Pretrain/Loss (Raw)": 2.4050750732421875, "Pretrain/Step": 239, "Pretrain/Step Time": 29.85805074684322} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.3122622966766357, "Pretrain/Loss (Raw)": 2.1078009605407715, "Pretrain/Step": 240, "Pretrain/Step Time": 29.870028423145413} +{"Pretrain/Learning Rate": 2.106643356643357e-05, "Pretrain/Loss": 2.2771239280700684, "Pretrain/Loss (Raw)": 2.1324057579040527, "Pretrain/Step": 241, "Pretrain/Step Time": 29.86306118965149} +{"Pretrain/Learning Rate": 8.741258741258742e-08, "Pretrain/Loss": 2.863297462463379, "Pretrain/Loss (Raw)": 2.863297462463379, "Pretrain/Step": 1, "Pretrain/Step Time": 12.41039752960205} +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 4.046108245849609, "Pretrain/Loss (Raw)": 5.228918552398682, "Pretrain/Step": 2, "Pretrain/Step Time": 10.479020714759827} +{"Pretrain/Learning Rate": 2.622377622377623e-07, "Pretrain/Loss": 3.815037488937378, "Pretrain/Loss (Raw)": 3.352896213531494, "Pretrain/Step": 3, "Pretrain/Step Time": 9.71382506688436} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 3.7597692012786865, "Pretrain/Loss (Raw)": 3.5939643383026123, "Pretrain/Step": 4, "Pretrain/Step Time": 9.308871984481812} +{"Pretrain/Learning Rate": 4.370629370629371e-07, "Pretrain/Loss": 3.627333164215088, "Pretrain/Loss (Raw)": 3.097588539123535, "Pretrain/Step": 5, "Pretrain/Step Time": 9.072826242446899} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.6489455699920654, "Pretrain/Loss (Raw)": 3.7570090293884277, "Pretrain/Step": 6, "Pretrain/Step Time": 8.900511940320333} +{"Pretrain/Learning Rate": 6.118881118881119e-07, "Pretrain/Loss": 3.639660596847534, "Pretrain/Loss (Raw)": 3.5839481353759766, "Pretrain/Step": 7, "Pretrain/Step Time": 8.824113232748848} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.5437331199645996, "Pretrain/Loss (Raw)": 2.872241497039795, "Pretrain/Step": 8, "Pretrain/Step Time": 8.722468227148056} +{"Pretrain/Learning Rate": 7.867132867132868e-07, "Pretrain/Loss": 3.4924697875976562, "Pretrain/Loss (Raw)": 3.0823655128479004, "Pretrain/Step": 9, "Pretrain/Step Time": 8.663914839426676} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.550689697265625, "Pretrain/Loss (Raw)": 4.0746684074401855, "Pretrain/Step": 10, "Pretrain/Step Time": 8.583510088920594} +{"Pretrain/Learning Rate": 9.615384615384617e-07, "Pretrain/Loss": 3.563692808151245, "Pretrain/Loss (Raw)": 3.6937215328216553, "Pretrain/Step": 11, "Pretrain/Step Time": 8.55236005783081} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.6316840648651123, "Pretrain/Loss (Raw)": 4.379590034484863, "Pretrain/Step": 12, "Pretrain/Step Time": 8.509673615296682} +{"Pretrain/Learning Rate": 1.1363636363636364e-06, "Pretrain/Loss": 3.563687324523926, "Pretrain/Loss (Raw)": 2.747722625732422, "Pretrain/Step": 13, "Pretrain/Step Time": 8.508776683073778} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.5536906719207764, "Pretrain/Loss (Raw)": 3.423734426498413, "Pretrain/Step": 14, "Pretrain/Step Time": 8.541461110115051} +{"Pretrain/Learning Rate": 1.3111888111888113e-06, "Pretrain/Loss": 3.4862725734710693, "Pretrain/Loss (Raw)": 2.54241943359375, "Pretrain/Step": 15, "Pretrain/Step Time": 8.562514511744181} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.538222074508667, "Pretrain/Loss (Raw)": 4.317466735839844, "Pretrain/Step": 16, "Pretrain/Step Time": 8.568438529968262} +{"Pretrain/Learning Rate": 1.4860139860139862e-06, "Pretrain/Loss": 3.481513023376465, "Pretrain/Loss (Raw)": 2.5741703510284424, "Pretrain/Step": 17, "Pretrain/Step Time": 8.562853995491476} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.4532008171081543, "Pretrain/Loss (Raw)": 2.971893787384033, "Pretrain/Step": 18, "Pretrain/Step Time": 8.537972476747301} +{"Pretrain/Learning Rate": 1.6608391608391608e-06, "Pretrain/Loss": 3.4290273189544678, "Pretrain/Loss (Raw)": 2.9939029216766357, "Pretrain/Step": 19, "Pretrain/Step Time": 8.520243920777974} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.399686574935913, "Pretrain/Loss (Raw)": 2.842209577560425, "Pretrain/Step": 20, "Pretrain/Step Time": 8.497618234157562} +{"Pretrain/Learning Rate": 1.8356643356643357e-06, "Pretrain/Loss": 3.375455617904663, "Pretrain/Loss (Raw)": 2.8908398151397705, "Pretrain/Step": 21, "Pretrain/Step Time": 8.476123673575264} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.3390614986419678, "Pretrain/Loss (Raw)": 2.5747833251953125, "Pretrain/Step": 22, "Pretrain/Step Time": 8.463101603768088} +{"Pretrain/Learning Rate": 2.0104895104895104e-06, "Pretrain/Loss": 3.3066413402557373, "Pretrain/Loss (Raw)": 2.593402147293091, "Pretrain/Step": 23, "Pretrain/Step Time": 8.445370404616646} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.3026721477508545, "Pretrain/Loss (Raw)": 3.2113797664642334, "Pretrain/Step": 24, "Pretrain/Step Time": 8.442641834417978} +{"Pretrain/Learning Rate": 2.1853146853146853e-06, "Pretrain/Loss": 3.276503801345825, "Pretrain/Loss (Raw)": 2.648465394973755, "Pretrain/Step": 25, "Pretrain/Step Time": 8.430367336273193} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.28037691116333, "Pretrain/Loss (Raw)": 3.377192497253418, "Pretrain/Step": 26, "Pretrain/Step Time": 8.416308072897104} +{"Pretrain/Learning Rate": 2.36013986013986e-06, "Pretrain/Loss": 3.258544921875, "Pretrain/Loss (Raw)": 2.690924882888794, "Pretrain/Step": 27, "Pretrain/Step Time": 8.398577531178793} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.2299463748931885, "Pretrain/Loss (Raw)": 2.457780599594116, "Pretrain/Step": 28, "Pretrain/Step Time": 8.387683306421552} +{"Pretrain/Learning Rate": 2.534965034965035e-06, "Pretrain/Loss": 3.2198359966278076, "Pretrain/Loss (Raw)": 2.936751365661621, "Pretrain/Step": 29, "Pretrain/Step Time": 8.388870995620202} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 3.1994707584381104, "Pretrain/Loss (Raw)": 2.60886812210083, "Pretrain/Step": 30, "Pretrain/Step Time": 8.405467613538105} +{"Pretrain/Learning Rate": 2.7097902097902096e-06, "Pretrain/Loss": 3.1765410900115967, "Pretrain/Loss (Raw)": 2.4886608123779297, "Pretrain/Step": 31, "Pretrain/Step Time": 8.409232124205559} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 3.1490368843078613, "Pretrain/Loss (Raw)": 2.2964072227478027, "Pretrain/Step": 32, "Pretrain/Step Time": 8.413749560713768} +{"Pretrain/Learning Rate": 2.884615384615385e-06, "Pretrain/Loss": 3.131903886795044, "Pretrain/Loss (Raw)": 2.583639144897461, "Pretrain/Step": 33, "Pretrain/Step Time": 8.416753833944147} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 3.119558811187744, "Pretrain/Loss (Raw)": 2.7121834754943848, "Pretrain/Step": 34, "Pretrain/Step Time": 8.40871768839219} +{"Pretrain/Learning Rate": 3.0594405594405598e-06, "Pretrain/Loss": 3.100386619567871, "Pretrain/Loss (Raw)": 2.448526620864868, "Pretrain/Step": 35, "Pretrain/Step Time": 8.400700732639857} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 3.0882256031036377, "Pretrain/Loss (Raw)": 2.6625940799713135, "Pretrain/Step": 36, "Pretrain/Step Time": 8.394349171055687} +{"Pretrain/Learning Rate": 3.2342657342657347e-06, "Pretrain/Loss": 3.0728304386138916, "Pretrain/Loss (Raw)": 2.5185959339141846, "Pretrain/Step": 37, "Pretrain/Step Time": 8.384655546497655} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 3.0508086681365967, "Pretrain/Loss (Raw)": 2.2360024452209473, "Pretrain/Step": 38, "Pretrain/Step Time": 8.382026164155258} +{"Pretrain/Learning Rate": 3.409090909090909e-06, "Pretrain/Loss": 3.034578800201416, "Pretrain/Loss (Raw)": 2.417849540710449, "Pretrain/Step": 39, "Pretrain/Step Time": 8.374476053775885} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 3.015434980392456, "Pretrain/Loss (Raw)": 2.268820285797119, "Pretrain/Step": 40, "Pretrain/Step Time": 8.365331131219865} +{"Pretrain/Learning Rate": 3.583916083916084e-06, "Pretrain/Loss": 2.995863914489746, "Pretrain/Loss (Raw)": 2.21303653717041, "Pretrain/Step": 41, "Pretrain/Step Time": 8.363665836613352} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 2.9807255268096924, "Pretrain/Loss (Raw)": 2.3600356578826904, "Pretrain/Step": 42, "Pretrain/Step Time": 8.359530954133897} +{"Pretrain/Learning Rate": 3.7587412587412585e-06, "Pretrain/Loss": 2.9637460708618164, "Pretrain/Loss (Raw)": 2.250614643096924, "Pretrain/Step": 43, "Pretrain/Step Time": 8.355951020883959} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 2.9538702964782715, "Pretrain/Loss (Raw)": 2.529210090637207, "Pretrain/Step": 44, "Pretrain/Step Time": 8.35506257685748} +{"Pretrain/Learning Rate": 3.933566433566433e-06, "Pretrain/Loss": 2.9419426918029785, "Pretrain/Loss (Raw)": 2.4171245098114014, "Pretrain/Step": 45, "Pretrain/Step Time": 8.35142633120219} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 2.93088698387146, "Pretrain/Loss (Raw)": 2.4333925247192383, "Pretrain/Step": 46, "Pretrain/Step Time": 8.36077370332635} +{"Pretrain/Learning Rate": 4.108391608391608e-06, "Pretrain/Loss": 2.914802312850952, "Pretrain/Loss (Raw)": 2.174906015396118, "Pretrain/Step": 47, "Pretrain/Step Time": 8.373031808974895} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 2.913299083709717, "Pretrain/Loss (Raw)": 2.842644453048706, "Pretrain/Step": 48, "Pretrain/Step Time": 8.395674154162407} +{"Pretrain/Learning Rate": 4.283216783216783e-06, "Pretrain/Loss": 2.903684616088867, "Pretrain/Loss (Raw)": 2.4421980381011963, "Pretrain/Step": 49, "Pretrain/Step Time": 8.389631655751442} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 2.892085552215576, "Pretrain/Loss (Raw)": 2.3237133026123047, "Pretrain/Step": 50, "Pretrain/Step Time": 8.386999731063844} +{"Pretrain/Learning Rate": 4.458041958041959e-06, "Pretrain/Loss": 2.8783674240112305, "Pretrain/Loss (Raw)": 2.1924684047698975, "Pretrain/Step": 51, "Pretrain/Step Time": 8.383375401590385} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 2.8667995929718018, "Pretrain/Loss (Raw)": 2.276832103729248, "Pretrain/Step": 52, "Pretrain/Step Time": 8.381153505582075} +{"Pretrain/Learning Rate": 4.632867132867133e-06, "Pretrain/Loss": 2.8612706661224365, "Pretrain/Loss (Raw)": 2.5737788677215576, "Pretrain/Step": 53, "Pretrain/Step Time": 8.378669252935445} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 2.8531689643859863, "Pretrain/Loss (Raw)": 2.4237775802612305, "Pretrain/Step": 54, "Pretrain/Step Time": 8.371503631273905} +{"Pretrain/Learning Rate": 4.807692307692308e-06, "Pretrain/Loss": 2.8457915782928467, "Pretrain/Loss (Raw)": 2.447415351867676, "Pretrain/Step": 55, "Pretrain/Step Time": 8.365837196870284} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 2.838097333908081, "Pretrain/Loss (Raw)": 2.4149019718170166, "Pretrain/Step": 56, "Pretrain/Step Time": 8.36000828232084} +{"Pretrain/Learning Rate": 4.982517482517483e-06, "Pretrain/Loss": 2.828528642654419, "Pretrain/Loss (Raw)": 2.292686700820923, "Pretrain/Step": 57, "Pretrain/Step Time": 8.362451055593658} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 2.82002592086792, "Pretrain/Loss (Raw)": 2.335378408432007, "Pretrain/Step": 58, "Pretrain/Step Time": 8.360179374957907} +{"Pretrain/Learning Rate": 5.157342657342658e-06, "Pretrain/Loss": 2.811284065246582, "Pretrain/Loss (Raw)": 2.3042385578155518, "Pretrain/Step": 59, "Pretrain/Step Time": 8.354625681699332} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 2.804405450820923, "Pretrain/Loss (Raw)": 2.398566246032715, "Pretrain/Step": 60, "Pretrain/Step Time": 8.352203238010407} +{"Pretrain/Learning Rate": 5.3321678321678325e-06, "Pretrain/Loss": 2.8010027408599854, "Pretrain/Loss (Raw)": 2.596872091293335, "Pretrain/Step": 61, "Pretrain/Step Time": 8.34976496461962} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 2.7927653789520264, "Pretrain/Loss (Raw)": 2.2902772426605225, "Pretrain/Step": 62, "Pretrain/Step Time": 8.350752749750692} +{"Pretrain/Learning Rate": 5.5069930069930074e-06, "Pretrain/Loss": 2.785282850265503, "Pretrain/Loss (Raw)": 2.3213577270507812, "Pretrain/Step": 63, "Pretrain/Step Time": 8.356286370565021} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 2.779874801635742, "Pretrain/Loss (Raw)": 2.439173936843872, "Pretrain/Step": 64, "Pretrain/Step Time": 8.36966297402978} +{"Pretrain/Learning Rate": 5.681818181818182e-06, "Pretrain/Loss": 2.7702879905700684, "Pretrain/Loss (Raw)": 2.1567344665527344, "Pretrain/Step": 65, "Pretrain/Step Time": 8.3698241013747} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 2.765523672103882, "Pretrain/Loss (Raw)": 2.4558217525482178, "Pretrain/Step": 66, "Pretrain/Step Time": 8.366713148174863} +{"Pretrain/Learning Rate": 5.856643356643357e-06, "Pretrain/Loss": 2.7589871883392334, "Pretrain/Loss (Raw)": 2.3275904655456543, "Pretrain/Step": 67, "Pretrain/Step Time": 8.365857334279303} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 2.752962350845337, "Pretrain/Loss (Raw)": 2.349292755126953, "Pretrain/Step": 68, "Pretrain/Step Time": 8.366186832680421} +{"Pretrain/Learning Rate": 6.031468531468531e-06, "Pretrain/Loss": 2.749072551727295, "Pretrain/Loss (Raw)": 2.4845783710479736, "Pretrain/Step": 69, "Pretrain/Step Time": 8.362720119780388} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 2.7418177127838135, "Pretrain/Loss (Raw)": 2.241227388381958, "Pretrain/Step": 70, "Pretrain/Step Time": 8.358160764830453} +{"Pretrain/Learning Rate": 6.206293706293707e-06, "Pretrain/Loss": 2.737514019012451, "Pretrain/Loss (Raw)": 2.4362547397613525, "Pretrain/Step": 71, "Pretrain/Step Time": 8.356947848494624} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 2.7337563037872314, "Pretrain/Loss (Raw)": 2.46696138381958, "Pretrain/Step": 72, "Pretrain/Step Time": 8.35299700167444} +{"Pretrain/Learning Rate": 6.381118881118882e-06, "Pretrain/Loss": 2.7263426780700684, "Pretrain/Loss (Raw)": 2.192565441131592, "Pretrain/Step": 73, "Pretrain/Step Time": 8.352879259684315} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 2.7212793827056885, "Pretrain/Loss (Raw)": 2.3516294956207275, "Pretrain/Step": 74, "Pretrain/Step Time": 8.359036970782924} +{"Pretrain/Learning Rate": 6.555944055944056e-06, "Pretrain/Loss": 2.7138586044311523, "Pretrain/Loss (Raw)": 2.16473388671875, "Pretrain/Step": 75, "Pretrain/Step Time": 8.354044036865234} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 2.711749792098999, "Pretrain/Loss (Raw)": 2.5536036491394043, "Pretrain/Step": 76, "Pretrain/Step Time": 8.357166224404386} +{"Pretrain/Learning Rate": 6.730769230769231e-06, "Pretrain/Loss": 2.710066318511963, "Pretrain/Loss (Raw)": 2.582103729248047, "Pretrain/Step": 77, "Pretrain/Step Time": 8.35689058241906} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 2.709954261779785, "Pretrain/Loss (Raw)": 2.7013280391693115, "Pretrain/Step": 78, "Pretrain/Step Time": 8.362256557513506} +{"Pretrain/Learning Rate": 6.905594405594405e-06, "Pretrain/Loss": 2.7050890922546387, "Pretrain/Loss (Raw)": 2.3256208896636963, "Pretrain/Step": 79, "Pretrain/Step Time": 8.361159436310395} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 2.699794054031372, "Pretrain/Loss (Raw)": 2.281466007232666, "Pretrain/Step": 80, "Pretrain/Step Time": 8.36881245970726} +{"Pretrain/Learning Rate": 7.0804195804195815e-06, "Pretrain/Loss": 2.694150924682617, "Pretrain/Loss (Raw)": 2.242711305618286, "Pretrain/Step": 81, "Pretrain/Step Time": 8.368508400740447} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 2.6952412128448486, "Pretrain/Loss (Raw)": 2.7835693359375, "Pretrain/Step": 82, "Pretrain/Step Time": 8.369937268699088} +{"Pretrain/Learning Rate": 7.2552447552447555e-06, "Pretrain/Loss": 2.6923341751098633, "Pretrain/Loss (Raw)": 2.453939437866211, "Pretrain/Step": 83, "Pretrain/Step Time": 8.369156754160501} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 2.6871228218078613, "Pretrain/Loss (Raw)": 2.2545745372772217, "Pretrain/Step": 84, "Pretrain/Step Time": 8.376257394041334} +{"Pretrain/Learning Rate": 7.43006993006993e-06, "Pretrain/Loss": 2.6830973625183105, "Pretrain/Loss (Raw)": 2.3449671268463135, "Pretrain/Step": 85, "Pretrain/Step Time": 8.376308247622323} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 2.6785080432891846, "Pretrain/Loss (Raw)": 2.288416624069214, "Pretrain/Step": 86, "Pretrain/Step Time": 8.3739947025166} +{"Pretrain/Learning Rate": 7.604895104895106e-06, "Pretrain/Loss": 2.671813488006592, "Pretrain/Loss (Raw)": 2.0960707664489746, "Pretrain/Step": 87, "Pretrain/Step Time": 8.374280408881177} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 2.6652932167053223, "Pretrain/Loss (Raw)": 2.0980212688446045, "Pretrain/Step": 88, "Pretrain/Step Time": 8.373201023448598} +{"Pretrain/Learning Rate": 7.77972027972028e-06, "Pretrain/Loss": 2.660959005355835, "Pretrain/Loss (Raw)": 2.2795603275299072, "Pretrain/Step": 89, "Pretrain/Step Time": 8.369996978995506} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 2.6554172039031982, "Pretrain/Loss (Raw)": 2.162182569503784, "Pretrain/Step": 90, "Pretrain/Step Time": 8.367987169159782} +{"Pretrain/Learning Rate": 7.954545454545455e-06, "Pretrain/Loss": 2.651263952255249, "Pretrain/Loss (Raw)": 2.277491331100464, "Pretrain/Step": 91, "Pretrain/Step Time": 8.36593883902162} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 2.6480984687805176, "Pretrain/Loss (Raw)": 2.3600218296051025, "Pretrain/Step": 92, "Pretrain/Step Time": 8.36345548733421} +{"Pretrain/Learning Rate": 8.12937062937063e-06, "Pretrain/Loss": 2.6482625007629395, "Pretrain/Loss (Raw)": 2.663362979888916, "Pretrain/Step": 93, "Pretrain/Step Time": 8.368457509625342} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 2.6451003551483154, "Pretrain/Loss (Raw)": 2.351041555404663, "Pretrain/Step": 94, "Pretrain/Step Time": 8.368332279489396} +{"Pretrain/Learning Rate": 8.304195804195805e-06, "Pretrain/Loss": 2.6472859382629395, "Pretrain/Loss (Raw)": 2.8527157306671143, "Pretrain/Step": 95, "Pretrain/Step Time": 8.380070342515644} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 2.644087314605713, "Pretrain/Loss (Raw)": 2.3402023315429688, "Pretrain/Step": 96, "Pretrain/Step Time": 8.383996891478697} +{"Pretrain/Learning Rate": 8.47902097902098e-06, "Pretrain/Loss": 2.6433589458465576, "Pretrain/Loss (Raw)": 2.5734634399414062, "Pretrain/Step": 97, "Pretrain/Step Time": 8.385895013809204} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 2.641983985900879, "Pretrain/Loss (Raw)": 2.5085842609405518, "Pretrain/Step": 98, "Pretrain/Step Time": 8.391486985342842} +{"Pretrain/Learning Rate": 8.653846153846155e-06, "Pretrain/Loss": 2.6367945671081543, "Pretrain/Loss (Raw)": 2.128248691558838, "Pretrain/Step": 99, "Pretrain/Step Time": 8.389275382263492} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 2.6361706256866455, "Pretrain/Loss (Raw)": 2.574382781982422, "Pretrain/Step": 100, "Pretrain/Step Time": 8.393364233970642} +{"Pretrain/Learning Rate": 8.828671328671328e-06, "Pretrain/Loss": 2.632490396499634, "Pretrain/Loss (Raw)": 2.264465808868408, "Pretrain/Step": 101, "Pretrain/Step Time": 8.389282606615879} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 2.6298506259918213, "Pretrain/Loss (Raw)": 2.3632702827453613, "Pretrain/Step": 102, "Pretrain/Step Time": 8.388022822492262} +{"Pretrain/Learning Rate": 9.003496503496504e-06, "Pretrain/Loss": 2.6261863708496094, "Pretrain/Loss (Raw)": 2.2524378299713135, "Pretrain/Step": 103, "Pretrain/Step Time": 8.385409561175745} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 2.6255717277526855, "Pretrain/Loss (Raw)": 2.5622479915618896, "Pretrain/Step": 104, "Pretrain/Step Time": 8.38414221085035} +{"Pretrain/Learning Rate": 9.17832167832168e-06, "Pretrain/Loss": 2.623220682144165, "Pretrain/Loss (Raw)": 2.3787221908569336, "Pretrain/Step": 105, "Pretrain/Step Time": 8.381141063145229} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 2.6188135147094727, "Pretrain/Loss (Raw)": 2.156039237976074, "Pretrain/Step": 106, "Pretrain/Step Time": 8.379983791765177} +{"Pretrain/Learning Rate": 9.353146853146853e-06, "Pretrain/Loss": 2.615917444229126, "Pretrain/Loss (Raw)": 2.308943271636963, "Pretrain/Step": 107, "Pretrain/Step Time": 8.381948136837684} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 2.6132118701934814, "Pretrain/Loss (Raw)": 2.323727607727051, "Pretrain/Step": 108, "Pretrain/Step Time": 8.383036703975112} +{"Pretrain/Learning Rate": 9.527972027972027e-06, "Pretrain/Loss": 2.609353542327881, "Pretrain/Loss (Raw)": 2.192647933959961, "Pretrain/Step": 109, "Pretrain/Step Time": 8.3840964037344} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 2.6047611236572266, "Pretrain/Loss (Raw)": 2.1041743755340576, "Pretrain/Step": 110, "Pretrain/Step Time": 8.383405017852784} +{"Pretrain/Learning Rate": 9.702797202797204e-06, "Pretrain/Loss": 2.6011006832122803, "Pretrain/Loss (Raw)": 2.1984260082244873, "Pretrain/Step": 111, "Pretrain/Step Time": 8.38650113612682} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.6004228591918945, "Pretrain/Loss (Raw)": 2.5251996517181396, "Pretrain/Step": 112, "Pretrain/Step Time": 8.394133863704544} +{"Pretrain/Learning Rate": 9.877622377622379e-06, "Pretrain/Loss": 2.5960092544555664, "Pretrain/Loss (Raw)": 2.101733684539795, "Pretrain/Step": 113, "Pretrain/Step Time": 8.393087720448992} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.5936338901519775, "Pretrain/Loss (Raw)": 2.3251659870147705, "Pretrain/Step": 114, "Pretrain/Step Time": 8.394566594508657} +{"Pretrain/Learning Rate": 1.0052447552447552e-05, "Pretrain/Loss": 2.5901899337768555, "Pretrain/Loss (Raw)": 2.197627067565918, "Pretrain/Step": 115, "Pretrain/Step Time": 8.397004944345225} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.5880720615386963, "Pretrain/Loss (Raw)": 2.344524621963501, "Pretrain/Step": 116, "Pretrain/Step Time": 8.394627932844491} +{"Pretrain/Learning Rate": 1.0227272727272729e-05, "Pretrain/Loss": 2.58604097366333, "Pretrain/Loss (Raw)": 2.350400447845459, "Pretrain/Step": 117, "Pretrain/Step Time": 8.392688753258469} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.5833051204681396, "Pretrain/Loss (Raw)": 2.26322078704834, "Pretrain/Step": 118, "Pretrain/Step Time": 8.393264192645832} +{"Pretrain/Learning Rate": 1.0402097902097904e-05, "Pretrain/Loss": 2.5813989639282227, "Pretrain/Loss (Raw)": 2.3564250469207764, "Pretrain/Step": 119, "Pretrain/Step Time": 8.3902904045682} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.5791029930114746, "Pretrain/Loss (Raw)": 2.3059000968933105, "Pretrain/Step": 120, "Pretrain/Step Time": 8.388868045806884} +{"Pretrain/Learning Rate": 1.0576923076923077e-05, "Pretrain/Loss": 2.57666015625, "Pretrain/Loss (Raw)": 2.283533811569214, "Pretrain/Step": 121, "Pretrain/Step Time": 8.386849277275653} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.572185516357422, "Pretrain/Loss (Raw)": 2.0307419300079346, "Pretrain/Step": 122, "Pretrain/Step Time": 8.385204346453557} +{"Pretrain/Learning Rate": 1.0751748251748252e-05, "Pretrain/Loss": 2.570934772491455, "Pretrain/Loss (Raw)": 2.4183576107025146, "Pretrain/Step": 123, "Pretrain/Step Time": 8.384920942104928} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.56927227973938, "Pretrain/Loss (Raw)": 2.3648157119750977, "Pretrain/Step": 124, "Pretrain/Step Time": 8.389622711366222} +{"Pretrain/Learning Rate": 1.0926573426573428e-05, "Pretrain/Loss": 2.566063165664673, "Pretrain/Loss (Raw)": 2.1680824756622314, "Pretrain/Step": 125, "Pretrain/Step Time": 8.386516839981079} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.5643961429595947, "Pretrain/Loss (Raw)": 2.3560028076171875, "Pretrain/Step": 126, "Pretrain/Step Time": 8.388834894649566} +{"Pretrain/Learning Rate": 1.1101398601398601e-05, "Pretrain/Loss": 2.5636463165283203, "Pretrain/Loss (Raw)": 2.469191312789917, "Pretrain/Step": 127, "Pretrain/Step Time": 8.396212453917256} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.5607500076293945, "Pretrain/Loss (Raw)": 2.1929211616516113, "Pretrain/Step": 128, "Pretrain/Step Time": 8.398266911506653} +{"Pretrain/Learning Rate": 1.1276223776223776e-05, "Pretrain/Loss": 2.5566418170928955, "Pretrain/Loss (Raw)": 2.3374834060668945, "Pretrain/Step": 129, "Pretrain/Step Time": 8.37213982641697} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.532299757003784, "Pretrain/Loss (Raw)": 2.1131253242492676, "Pretrain/Step": 130, "Pretrain/Step Time": 8.370484225451946} +{"Pretrain/Learning Rate": 1.1451048951048951e-05, "Pretrain/Loss": 2.522064208984375, "Pretrain/Loss (Raw)": 2.0427632331848145, "Pretrain/Step": 131, "Pretrain/Step Time": 8.372855510562658} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.5105526447296143, "Pretrain/Loss (Raw)": 2.1204416751861572, "Pretrain/Step": 132, "Pretrain/Step Time": 8.372227050364017} +{"Pretrain/Learning Rate": 1.1625874125874126e-05, "Pretrain/Loss": 2.503540277481079, "Pretrain/Loss (Raw)": 2.200019121170044, "Pretrain/Step": 133, "Pretrain/Step Time": 8.374791655689478} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.490773916244507, "Pretrain/Loss (Raw)": 2.122925043106079, "Pretrain/Step": 134, "Pretrain/Step Time": 8.374751368537545} +{"Pretrain/Learning Rate": 1.1800699300699301e-05, "Pretrain/Loss": 2.479224681854248, "Pretrain/Loss (Raw)": 2.1056509017944336, "Pretrain/Step": 135, "Pretrain/Step Time": 8.375599224120378} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.473616123199463, "Pretrain/Loss (Raw)": 2.1543562412261963, "Pretrain/Step": 136, "Pretrain/Step Time": 8.379766708239913} +{"Pretrain/Learning Rate": 1.1975524475524476e-05, "Pretrain/Loss": 2.470869302749634, "Pretrain/Loss (Raw)": 2.730731725692749, "Pretrain/Step": 137, "Pretrain/Step Time": 8.381762694567442} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.4593329429626465, "Pretrain/Loss (Raw)": 2.5980165004730225, "Pretrain/Step": 138, "Pretrain/Step Time": 8.383610041812062} +{"Pretrain/Learning Rate": 1.215034965034965e-05, "Pretrain/Loss": 2.450080156326294, "Pretrain/Loss (Raw)": 2.509382963180542, "Pretrain/Step": 139, "Pretrain/Step Time": 8.383149202913046} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.433223247528076, "Pretrain/Loss (Raw)": 2.2219066619873047, "Pretrain/Step": 140, "Pretrain/Step Time": 8.387065095826983} +{"Pretrain/Learning Rate": 1.2325174825174826e-05, "Pretrain/Loss": 2.4311861991882324, "Pretrain/Loss (Raw)": 2.486985683441162, "Pretrain/Step": 141, "Pretrain/Step Time": 8.387544438242912} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.424237012863159, "Pretrain/Loss (Raw)": 2.5342159271240234, "Pretrain/Step": 142, "Pretrain/Step Time": 8.383482614532113} +{"Pretrain/Learning Rate": 1.25e-05, "Pretrain/Loss": 2.4227209091186523, "Pretrain/Loss (Raw)": 2.3483800888061523, "Pretrain/Step": 143, "Pretrain/Step Time": 8.37925037369132} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.406473159790039, "Pretrain/Loss (Raw)": 2.237748622894287, "Pretrain/Step": 144, "Pretrain/Step Time": 8.380073560401797} +{"Pretrain/Learning Rate": 1.2674825174825175e-05, "Pretrain/Loss": 2.402494430541992, "Pretrain/Loss (Raw)": 2.064884662628174, "Pretrain/Step": 145, "Pretrain/Step Time": 8.383611282333732} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.3967971801757812, "Pretrain/Loss (Raw)": 2.24265456199646, "Pretrain/Step": 146, "Pretrain/Step Time": 8.38436521962285} +{"Pretrain/Learning Rate": 1.2849650349650349e-05, "Pretrain/Loss": 2.3919806480407715, "Pretrain/Loss (Raw)": 2.377392053604126, "Pretrain/Step": 147, "Pretrain/Step Time": 8.390538277104497} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.388171672821045, "Pretrain/Loss (Raw)": 2.354632616043091, "Pretrain/Step": 148, "Pretrain/Step Time": 8.392685603350401} +{"Pretrain/Learning Rate": 1.3024475524475524e-05, "Pretrain/Loss": 2.382549285888672, "Pretrain/Loss (Raw)": 2.171211004257202, "Pretrain/Step": 149, "Pretrain/Step Time": 8.39420972764492} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.3788161277770996, "Pretrain/Loss (Raw)": 2.096919059753418, "Pretrain/Step": 150, "Pretrain/Step Time": 8.396571459248662} +{"Pretrain/Learning Rate": 1.3199300699300702e-05, "Pretrain/Loss": 2.376234769821167, "Pretrain/Loss (Raw)": 2.262991189956665, "Pretrain/Step": 151, "Pretrain/Step Time": 8.39630145393312} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.3707377910614014, "Pretrain/Loss (Raw)": 2.507786273956299, "Pretrain/Step": 152, "Pretrain/Step Time": 8.394984733313322} +{"Pretrain/Learning Rate": 1.3374125874125875e-05, "Pretrain/Loss": 2.3671035766601562, "Pretrain/Loss (Raw)": 2.183250665664673, "Pretrain/Step": 153, "Pretrain/Step Time": 8.39447203092277} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.3581409454345703, "Pretrain/Loss (Raw)": 2.23000168800354, "Pretrain/Step": 154, "Pretrain/Step Time": 8.39595939964056} +{"Pretrain/Learning Rate": 1.354895104895105e-05, "Pretrain/Loss": 2.3549115657806396, "Pretrain/Loss (Raw)": 2.2775492668151855, "Pretrain/Step": 155, "Pretrain/Step Time": 8.397838082164526} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.351194143295288, "Pretrain/Loss (Raw)": 1.9819469451904297, "Pretrain/Step": 156, "Pretrain/Step Time": 8.398238940164447} +{"Pretrain/Learning Rate": 1.3723776223776225e-05, "Pretrain/Loss": 2.34584379196167, "Pretrain/Loss (Raw)": 2.2519073486328125, "Pretrain/Step": 157, "Pretrain/Step Time": 8.397588668391109} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.3433427810668945, "Pretrain/Loss (Raw)": 2.2887322902679443, "Pretrain/Step": 158, "Pretrain/Step Time": 8.395792054012418} +{"Pretrain/Learning Rate": 1.38986013986014e-05, "Pretrain/Loss": 2.3414621353149414, "Pretrain/Loss (Raw)": 2.247925043106079, "Pretrain/Step": 159, "Pretrain/Step Time": 8.39195610024035} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.3408238887786865, "Pretrain/Loss (Raw)": 2.214728355407715, "Pretrain/Step": 160, "Pretrain/Step Time": 8.389310574159026} +{"Pretrain/Learning Rate": 1.4073426573426573e-05, "Pretrain/Loss": 2.3388290405273438, "Pretrain/Loss (Raw)": 2.328277826309204, "Pretrain/Step": 161, "Pretrain/Step Time": 8.391853492707014} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.3349428176879883, "Pretrain/Loss (Raw)": 2.214773416519165, "Pretrain/Step": 162, "Pretrain/Step Time": 8.404526436701417} +{"Pretrain/Learning Rate": 1.4248251748251748e-05, "Pretrain/Loss": 2.3374104499816895, "Pretrain/Loss (Raw)": 2.7644107341766357, "Pretrain/Step": 163, "Pretrain/Step Time": 8.40645306557417} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.335136890411377, "Pretrain/Loss (Raw)": 2.3715426921844482, "Pretrain/Step": 164, "Pretrain/Step Time": 8.409646669402719} +{"Pretrain/Learning Rate": 1.4423076923076923e-05, "Pretrain/Loss": 2.3325705528259277, "Pretrain/Loss (Raw)": 2.190129280090332, "Pretrain/Step": 165, "Pretrain/Step Time": 8.411972671747208} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.332503318786621, "Pretrain/Loss (Raw)": 2.2273619174957275, "Pretrain/Step": 166, "Pretrain/Step Time": 8.41065681912005} +{"Pretrain/Learning Rate": 1.45979020979021e-05, "Pretrain/Loss": 2.3325700759887695, "Pretrain/Loss (Raw)": 2.426391124725342, "Pretrain/Step": 167, "Pretrain/Step Time": 8.411625985056162} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.331996440887451, "Pretrain/Loss (Raw)": 2.195425510406494, "Pretrain/Step": 168, "Pretrain/Step Time": 8.412860173732042} +{"Pretrain/Learning Rate": 1.4772727272727274e-05, "Pretrain/Loss": 2.3321902751922607, "Pretrain/Loss (Raw)": 2.237828493118286, "Pretrain/Step": 169, "Pretrain/Step Time": 8.411417754366994} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.3315305709838867, "Pretrain/Loss (Raw)": 2.275630474090576, "Pretrain/Step": 170, "Pretrain/Step Time": 8.410015940666199} +{"Pretrain/Learning Rate": 1.4947552447552449e-05, "Pretrain/Loss": 2.330366611480713, "Pretrain/Loss (Raw)": 2.1015877723693848, "Pretrain/Step": 171, "Pretrain/Step Time": 8.410018134862185} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.3262863159179688, "Pretrain/Loss (Raw)": 2.006950616836548, "Pretrain/Step": 172, "Pretrain/Step Time": 8.410219805315137} +{"Pretrain/Learning Rate": 1.5122377622377622e-05, "Pretrain/Loss": 2.325777053833008, "Pretrain/Loss (Raw)": 2.3519248962402344, "Pretrain/Step": 173, "Pretrain/Step Time": 8.409891018643975} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.325589656829834, "Pretrain/Loss (Raw)": 2.4094035625457764, "Pretrain/Step": 174, "Pretrain/Step Time": 8.40651217661798} +{"Pretrain/Learning Rate": 1.5297202797202797e-05, "Pretrain/Loss": 2.326923370361328, "Pretrain/Loss (Raw)": 2.3456201553344727, "Pretrain/Step": 175, "Pretrain/Step Time": 8.40491890721023} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.3223929405212402, "Pretrain/Loss (Raw)": 2.262744426727295, "Pretrain/Step": 176, "Pretrain/Step Time": 8.401401467621326} +{"Pretrain/Learning Rate": 1.547202797202797e-05, "Pretrain/Loss": 2.3198342323303223, "Pretrain/Loss (Raw)": 2.114682197570801, "Pretrain/Step": 177, "Pretrain/Step Time": 8.404384024441242} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.317688226699829, "Pretrain/Loss (Raw)": 2.0490548610687256, "Pretrain/Step": 178, "Pretrain/Step Time": 8.404763974249363} +{"Pretrain/Learning Rate": 1.5646853146853147e-05, "Pretrain/Loss": 2.3181381225585938, "Pretrain/Loss (Raw)": 2.2500672340393066, "Pretrain/Step": 179, "Pretrain/Step Time": 8.410837884992361} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.3185882568359375, "Pretrain/Loss (Raw)": 2.334411859512329, "Pretrain/Step": 180, "Pretrain/Step Time": 8.41537562571466} +{"Pretrain/Learning Rate": 1.5821678321678324e-05, "Pretrain/Loss": 2.3155908584594727, "Pretrain/Loss (Raw)": 2.190147638320923, "Pretrain/Step": 181, "Pretrain/Step Time": 8.417837750166655} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.3162841796875, "Pretrain/Loss (Raw)": 2.5124852657318115, "Pretrain/Step": 182, "Pretrain/Step Time": 8.420972526073456} +{"Pretrain/Learning Rate": 1.5996503496503497e-05, "Pretrain/Loss": 2.3156495094299316, "Pretrain/Loss (Raw)": 2.3661880493164062, "Pretrain/Step": 183, "Pretrain/Step Time": 8.423577228561044} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.3145456314086914, "Pretrain/Loss (Raw)": 2.273611307144165, "Pretrain/Step": 184, "Pretrain/Step Time": 8.425282299518585} +{"Pretrain/Learning Rate": 1.6171328671328673e-05, "Pretrain/Loss": 2.314079999923706, "Pretrain/Loss (Raw)": 2.233088493347168, "Pretrain/Step": 185, "Pretrain/Step Time": 8.423670889809728} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.3141398429870605, "Pretrain/Loss (Raw)": 2.3430562019348145, "Pretrain/Step": 186, "Pretrain/Step Time": 8.423519689589739} +{"Pretrain/Learning Rate": 1.6346153846153847e-05, "Pretrain/Loss": 2.316269636154175, "Pretrain/Loss (Raw)": 2.576838731765747, "Pretrain/Step": 187, "Pretrain/Step Time": 8.42606789432466} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.3145911693573, "Pretrain/Loss (Raw)": 2.1837141513824463, "Pretrain/Step": 188, "Pretrain/Step Time": 8.425497233867645} +{"Pretrain/Learning Rate": 1.6520979020979023e-05, "Pretrain/Loss": 2.312363386154175, "Pretrain/Loss (Raw)": 2.3117125034332275, "Pretrain/Step": 189, "Pretrain/Step Time": 8.427263751626015} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.3124470710754395, "Pretrain/Loss (Raw)": 2.3010029792785645, "Pretrain/Step": 190, "Pretrain/Step Time": 8.426616812124848} +{"Pretrain/Learning Rate": 1.6695804195804196e-05, "Pretrain/Loss": 2.3122200965881348, "Pretrain/Loss (Raw)": 2.292311191558838, "Pretrain/Step": 191, "Pretrain/Step Time": 8.425361284986138} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.3106982707977295, "Pretrain/Loss (Raw)": 2.244364023208618, "Pretrain/Step": 192, "Pretrain/Step Time": 8.4192501232028} +{"Pretrain/Learning Rate": 1.687062937062937e-05, "Pretrain/Loss": 2.31459903717041, "Pretrain/Loss (Raw)": 2.656047821044922, "Pretrain/Step": 193, "Pretrain/Step Time": 8.423742696642876} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.3118724822998047, "Pretrain/Loss (Raw)": 2.1068062782287598, "Pretrain/Step": 194, "Pretrain/Step Time": 8.422632919624448} +{"Pretrain/Learning Rate": 1.7045454545454546e-05, "Pretrain/Loss": 2.309581756591797, "Pretrain/Loss (Raw)": 2.0343756675720215, "Pretrain/Step": 195, "Pretrain/Step Time": 8.43314272351563} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.3080692291259766, "Pretrain/Loss (Raw)": 2.155672788619995, "Pretrain/Step": 196, "Pretrain/Step Time": 8.43354825489223} +{"Pretrain/Learning Rate": 1.7220279720279723e-05, "Pretrain/Loss": 2.305262804031372, "Pretrain/Loss (Raw)": 2.125401496887207, "Pretrain/Step": 197, "Pretrain/Step Time": 8.433377839624882} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.3047373294830322, "Pretrain/Loss (Raw)": 2.173947334289551, "Pretrain/Step": 198, "Pretrain/Step Time": 8.43505510315299} +{"Pretrain/Learning Rate": 1.7395104895104896e-05, "Pretrain/Loss": 2.30257511138916, "Pretrain/Loss (Raw)": 2.1594901084899902, "Pretrain/Step": 199, "Pretrain/Step Time": 8.437046580016613} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.301433563232422, "Pretrain/Loss (Raw)": 2.3208484649658203, "Pretrain/Step": 200, "Pretrain/Step Time": 8.435697063803673} +{"Pretrain/Learning Rate": 1.7569930069930072e-05, "Pretrain/Loss": 2.301593780517578, "Pretrain/Loss (Raw)": 2.2130842208862305, "Pretrain/Step": 201, "Pretrain/Step Time": 8.438346859067678} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.2991673946380615, "Pretrain/Loss (Raw)": 2.041038751602173, "Pretrain/Step": 202, "Pretrain/Step Time": 8.434087228029966} +{"Pretrain/Learning Rate": 1.7744755244755246e-05, "Pretrain/Loss": 2.30130672454834, "Pretrain/Loss (Raw)": 2.438555955886841, "Pretrain/Step": 203, "Pretrain/Step Time": 8.438697746023536} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.298656940460205, "Pretrain/Loss (Raw)": 2.214433193206787, "Pretrain/Step": 204, "Pretrain/Step Time": 8.435290820896626} +{"Pretrain/Learning Rate": 1.791958041958042e-05, "Pretrain/Loss": 2.2950587272644043, "Pretrain/Loss (Raw)": 2.121542453765869, "Pretrain/Step": 205, "Pretrain/Step Time": 8.433895278722048} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.29219388961792, "Pretrain/Loss (Raw)": 2.3346033096313477, "Pretrain/Step": 206, "Pretrain/Step Time": 8.431322081014514} +{"Pretrain/Learning Rate": 1.8094405594405595e-05, "Pretrain/Loss": 2.291703939437866, "Pretrain/Loss (Raw)": 2.2629308700561523, "Pretrain/Step": 207, "Pretrain/Step Time": 8.43015238828957} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.296515941619873, "Pretrain/Loss (Raw)": 2.897399663925171, "Pretrain/Step": 208, "Pretrain/Step Time": 8.429236529394984} +{"Pretrain/Learning Rate": 1.826923076923077e-05, "Pretrain/Loss": 2.2998046875, "Pretrain/Loss (Raw)": 2.663660764694214, "Pretrain/Step": 209, "Pretrain/Step Time": 8.426779739558697} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.2958860397338867, "Pretrain/Loss (Raw)": 2.281975269317627, "Pretrain/Step": 210, "Pretrain/Step Time": 8.430193750187755} +{"Pretrain/Learning Rate": 1.8444055944055945e-05, "Pretrain/Loss": 2.2941761016845703, "Pretrain/Loss (Raw)": 2.2350776195526123, "Pretrain/Step": 211, "Pretrain/Step Time": 8.43448449857533} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.294534683227539, "Pretrain/Loss (Raw)": 2.3004868030548096, "Pretrain/Step": 212, "Pretrain/Step Time": 8.435425689443946} +{"Pretrain/Learning Rate": 1.8618881118881122e-05, "Pretrain/Loss": 2.2930233478546143, "Pretrain/Loss (Raw)": 2.151516914367676, "Pretrain/Step": 213, "Pretrain/Step Time": 8.434597639366984} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.29276704788208, "Pretrain/Loss (Raw)": 2.2556233406066895, "Pretrain/Step": 214, "Pretrain/Step Time": 8.434857299551368} +{"Pretrain/Learning Rate": 1.8793706293706295e-05, "Pretrain/Loss": 2.2925820350646973, "Pretrain/Loss (Raw)": 2.072350025177002, "Pretrain/Step": 215, "Pretrain/Step Time": 8.437318509444594} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.293887138366699, "Pretrain/Loss (Raw)": 2.265105962753296, "Pretrain/Step": 216, "Pretrain/Step Time": 8.435751030221581} +{"Pretrain/Learning Rate": 1.8968531468531468e-05, "Pretrain/Loss": 2.2943170070648193, "Pretrain/Loss (Raw)": 2.334578275680542, "Pretrain/Step": 217, "Pretrain/Step Time": 8.437827091664076} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.2937517166137695, "Pretrain/Loss (Raw)": 2.089836359024048, "Pretrain/Step": 218, "Pretrain/Step Time": 8.440206663683057} +{"Pretrain/Learning Rate": 1.9143356643356645e-05, "Pretrain/Loss": 2.293149948120117, "Pretrain/Loss (Raw)": 2.200432062149048, "Pretrain/Step": 219, "Pretrain/Step Time": 8.439563577994704} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.293595790863037, "Pretrain/Loss (Raw)": 2.417102336883545, "Pretrain/Step": 220, "Pretrain/Step Time": 8.442179402336478} +{"Pretrain/Learning Rate": 1.9318181818181818e-05, "Pretrain/Loss": 2.2906792163848877, "Pretrain/Loss (Raw)": 2.2900478839874268, "Pretrain/Step": 221, "Pretrain/Step Time": 8.436470128595829} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.2897653579711914, "Pretrain/Loss (Raw)": 2.234074354171753, "Pretrain/Step": 222, "Pretrain/Step Time": 8.439415661618114} +{"Pretrain/Learning Rate": 1.9493006993006995e-05, "Pretrain/Loss": 2.283935546875, "Pretrain/Loss (Raw)": 2.1065075397491455, "Pretrain/Step": 223, "Pretrain/Step Time": 8.433029824867845} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.282613515853882, "Pretrain/Loss (Raw)": 2.1709675788879395, "Pretrain/Step": 224, "Pretrain/Step Time": 8.42814714461565} +{"Pretrain/Learning Rate": 1.9667832167832168e-05, "Pretrain/Loss": 2.2850406169891357, "Pretrain/Loss (Raw)": 2.884129047393799, "Pretrain/Step": 225, "Pretrain/Step Time": 8.429538244381547} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.281792640686035, "Pretrain/Loss (Raw)": 2.092855215072632, "Pretrain/Step": 226, "Pretrain/Step Time": 8.425531094893813} +{"Pretrain/Learning Rate": 1.9842657342657344e-05, "Pretrain/Loss": 2.2824108600616455, "Pretrain/Loss (Raw)": 2.2073721885681152, "Pretrain/Step": 227, "Pretrain/Step Time": 8.434392292052507} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.2807388305664062, "Pretrain/Loss (Raw)": 2.360372304916382, "Pretrain/Step": 228, "Pretrain/Step Time": 8.430363165214658} +{"Pretrain/Learning Rate": 2.0017482517482518e-05, "Pretrain/Loss": 2.2794814109802246, "Pretrain/Loss (Raw)": 2.103506326675415, "Pretrain/Step": 229, "Pretrain/Step Time": 8.43812814541161} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.277466297149658, "Pretrain/Loss (Raw)": 2.105348825454712, "Pretrain/Step": 230, "Pretrain/Step Time": 8.439282959327102} +{"Pretrain/Learning Rate": 2.0192307692307694e-05, "Pretrain/Loss": 2.2789692878723145, "Pretrain/Loss (Raw)": 2.4448091983795166, "Pretrain/Step": 231, "Pretrain/Step Time": 8.440444525331259} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.2774932384490967, "Pretrain/Loss (Raw)": 2.3733229637145996, "Pretrain/Step": 232, "Pretrain/Step Time": 8.443612426519394} +{"Pretrain/Learning Rate": 2.0367132867132867e-05, "Pretrain/Loss": 2.2769179344177246, "Pretrain/Loss (Raw)": 2.305083990097046, "Pretrain/Step": 233, "Pretrain/Step Time": 8.444620652124286} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.2782115936279297, "Pretrain/Loss (Raw)": 2.3216171264648438, "Pretrain/Step": 234, "Pretrain/Step Time": 8.444036081433296} +{"Pretrain/Learning Rate": 2.0541958041958044e-05, "Pretrain/Loss": 2.278562545776367, "Pretrain/Loss (Raw)": 2.3538763523101807, "Pretrain/Step": 235, "Pretrain/Step Time": 8.442226808518171} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.2764196395874023, "Pretrain/Loss (Raw)": 2.049431562423706, "Pretrain/Step": 236, "Pretrain/Step Time": 8.439712414517999} +{"Pretrain/Learning Rate": 2.0716783216783217e-05, "Pretrain/Loss": 2.276764392852783, "Pretrain/Loss (Raw)": 2.2367513179779053, "Pretrain/Step": 237, "Pretrain/Step Time": 8.437254140153527} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.2788774967193604, "Pretrain/Loss (Raw)": 2.374694585800171, "Pretrain/Step": 238, "Pretrain/Step Time": 8.437843583524227} +{"Pretrain/Learning Rate": 2.089160839160839e-05, "Pretrain/Loss": 2.280447006225586, "Pretrain/Loss (Raw)": 2.3993115425109863, "Pretrain/Step": 239, "Pretrain/Step Time": 8.436314990743995} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.2775790691375732, "Pretrain/Loss (Raw)": 2.1581056118011475, "Pretrain/Step": 240, "Pretrain/Step Time": 8.430081471800804} +{"Pretrain/Learning Rate": 2.106643356643357e-05, "Pretrain/Loss": 2.277310371398926, "Pretrain/Loss (Raw)": 2.0673141479492188, "Pretrain/Step": 241, "Pretrain/Step Time": 8.434354411438107} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.2746894359588623, "Pretrain/Loss (Raw)": 1.9897047281265259, "Pretrain/Step": 242, "Pretrain/Step Time": 8.432311730459332} +{"Pretrain/Learning Rate": 2.1241258741258744e-05, "Pretrain/Loss": 2.274280309677124, "Pretrain/Loss (Raw)": 2.1452476978302, "Pretrain/Step": 243, "Pretrain/Step Time": 8.43178103864193} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.271615982055664, "Pretrain/Loss (Raw)": 2.0034823417663574, "Pretrain/Step": 244, "Pretrain/Step Time": 8.440154114738107} +{"Pretrain/Learning Rate": 2.1416083916083917e-05, "Pretrain/Loss": 2.2702341079711914, "Pretrain/Loss (Raw)": 2.173534631729126, "Pretrain/Step": 245, "Pretrain/Step Time": 8.439165538176894} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.269418239593506, "Pretrain/Loss (Raw)": 2.1587743759155273, "Pretrain/Step": 246, "Pretrain/Step Time": 8.44488344155252} +{"Pretrain/Learning Rate": 2.1590909090909093e-05, "Pretrain/Loss": 2.267745018005371, "Pretrain/Loss (Raw)": 2.1422672271728516, "Pretrain/Step": 247, "Pretrain/Step Time": 8.446890257298946} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.265472412109375, "Pretrain/Loss (Raw)": 2.015010356903076, "Pretrain/Step": 248, "Pretrain/Step Time": 8.446108205243945} +{"Pretrain/Learning Rate": 2.1765734265734267e-05, "Pretrain/Loss": 2.264413833618164, "Pretrain/Loss (Raw)": 2.148029088973999, "Pretrain/Step": 249, "Pretrain/Step Time": 8.447387650609016} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.2636852264404297, "Pretrain/Loss (Raw)": 1.9374792575836182, "Pretrain/Step": 250, "Pretrain/Step Time": 8.450819263234735} +{"Pretrain/Learning Rate": 2.194055944055944e-05, "Pretrain/Loss": 2.2628865242004395, "Pretrain/Loss (Raw)": 2.3161263465881348, "Pretrain/Step": 251, "Pretrain/Step Time": 8.44763232767582} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.2618491649627686, "Pretrain/Loss (Raw)": 2.232051372528076, "Pretrain/Step": 252, "Pretrain/Step Time": 8.444111863151193} +{"Pretrain/Learning Rate": 2.2115384615384616e-05, "Pretrain/Loss": 2.2629804611206055, "Pretrain/Loss (Raw)": 2.3128626346588135, "Pretrain/Step": 253, "Pretrain/Step Time": 8.445146407932043} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.26259708404541, "Pretrain/Loss (Raw)": 2.306928873062134, "Pretrain/Step": 254, "Pretrain/Step Time": 8.441784221678972} +{"Pretrain/Learning Rate": 2.229020979020979e-05, "Pretrain/Loss": 2.261404275894165, "Pretrain/Loss (Raw)": 2.316516876220703, "Pretrain/Step": 255, "Pretrain/Step Time": 8.434661567211151} +{"Pretrain/Learning Rate": 2.237762237762238e-05, "Pretrain/Loss": 2.2600224018096924, "Pretrain/Loss (Raw)": 2.016042709350586, "Pretrain/Step": 256, "Pretrain/Step Time": 8.429808227345347} +{"Pretrain/Learning Rate": 2.2465034965034966e-05, "Pretrain/Loss": 2.258945941925049, "Pretrain/Loss (Raw)": 2.199704647064209, "Pretrain/Step": 257, "Pretrain/Step Time": 8.427519250661135} +{"Pretrain/Learning Rate": 2.2552447552447553e-05, "Pretrain/Loss": 2.260491132736206, "Pretrain/Loss (Raw)": 2.310899257659912, "Pretrain/Step": 258, "Pretrain/Step Time": 8.432921543717384} +{"Pretrain/Learning Rate": 2.2639860139860143e-05, "Pretrain/Loss": 2.266132354736328, "Pretrain/Loss (Raw)": 2.7648394107818604, "Pretrain/Step": 259, "Pretrain/Step Time": 8.43562432564795} +{"Pretrain/Learning Rate": 2.272727272727273e-05, "Pretrain/Loss": 2.266299247741699, "Pretrain/Loss (Raw)": 2.1418023109436035, "Pretrain/Step": 260, "Pretrain/Step Time": 8.441097335889935} +{"Pretrain/Learning Rate": 2.2814685314685316e-05, "Pretrain/Loss": 2.2662010192871094, "Pretrain/Loss (Raw)": 2.1874516010284424, "Pretrain/Step": 261, "Pretrain/Step Time": 8.44509121030569} +{"Pretrain/Learning Rate": 2.2902097902097902e-05, "Pretrain/Loss": 2.2663440704345703, "Pretrain/Loss (Raw)": 2.141240358352661, "Pretrain/Step": 262, "Pretrain/Step Time": 8.446913581341505} +{"Pretrain/Learning Rate": 2.298951048951049e-05, "Pretrain/Loss": 2.2654967308044434, "Pretrain/Loss (Raw)": 1.9972041845321655, "Pretrain/Step": 263, "Pretrain/Step Time": 8.44498141668737} +{"Pretrain/Learning Rate": 2.307692307692308e-05, "Pretrain/Loss": 2.2652487754821777, "Pretrain/Loss (Raw)": 2.122614622116089, "Pretrain/Step": 264, "Pretrain/Step Time": 8.446107832714915} +{"Pretrain/Learning Rate": 2.3164335664335666e-05, "Pretrain/Loss": 2.261927843093872, "Pretrain/Loss (Raw)": 2.3056366443634033, "Pretrain/Step": 265, "Pretrain/Step Time": 8.442637596279383} +{"Pretrain/Learning Rate": 2.3251748251748252e-05, "Pretrain/Loss": 2.2568893432617188, "Pretrain/Loss (Raw)": 1.9530844688415527, "Pretrain/Step": 266, "Pretrain/Step Time": 8.443152805790305} +{"Pretrain/Learning Rate": 2.333916083916084e-05, "Pretrain/Loss": 2.2548153400421143, "Pretrain/Loss (Raw)": 2.2439069747924805, "Pretrain/Step": 267, "Pretrain/Step Time": 8.44699607975781} +{"Pretrain/Learning Rate": 2.342657342657343e-05, "Pretrain/Loss": 2.254673719406128, "Pretrain/Loss (Raw)": 2.2037909030914307, "Pretrain/Step": 268, "Pretrain/Step Time": 8.443970946595073} +{"Pretrain/Learning Rate": 2.3513986013986015e-05, "Pretrain/Loss": 2.2526445388793945, "Pretrain/Loss (Raw)": 2.2272393703460693, "Pretrain/Step": 269, "Pretrain/Step Time": 8.440797951072454} +{"Pretrain/Learning Rate": 2.3601398601398602e-05, "Pretrain/Loss": 2.2517523765563965, "Pretrain/Loss (Raw)": 2.4200243949890137, "Pretrain/Step": 270, "Pretrain/Step Time": 8.440416863188148} +{"Pretrain/Learning Rate": 2.3688811188811192e-05, "Pretrain/Loss": 2.2494077682495117, "Pretrain/Loss (Raw)": 2.0482730865478516, "Pretrain/Step": 271, "Pretrain/Step Time": 8.440711924806237} +{"Pretrain/Learning Rate": 2.377622377622378e-05, "Pretrain/Loss": 2.2493717670440674, "Pretrain/Loss (Raw)": 2.2331342697143555, "Pretrain/Step": 272, "Pretrain/Step Time": 8.4380918815732} +{"Pretrain/Learning Rate": 2.3863636363636365e-05, "Pretrain/Loss": 2.2508420944213867, "Pretrain/Loss (Raw)": 2.2530815601348877, "Pretrain/Step": 273, "Pretrain/Step Time": 8.435203652828932} +{"Pretrain/Learning Rate": 2.3951048951048952e-05, "Pretrain/Loss": 2.2509636878967285, "Pretrain/Loss (Raw)": 2.258220911026001, "Pretrain/Step": 274, "Pretrain/Step Time": 8.436861289665103} +{"Pretrain/Learning Rate": 2.4038461538461542e-05, "Pretrain/Loss": 2.2502925395965576, "Pretrain/Loss (Raw)": 2.2915029525756836, "Pretrain/Step": 275, "Pretrain/Step Time": 8.439840136095881} +{"Pretrain/Learning Rate": 2.4125874125874125e-05, "Pretrain/Loss": 2.249403953552246, "Pretrain/Loss (Raw)": 2.2408740520477295, "Pretrain/Step": 276, "Pretrain/Step Time": 8.438797935843468} +{"Pretrain/Learning Rate": 2.4213286713286715e-05, "Pretrain/Loss": 2.249215602874756, "Pretrain/Loss (Raw)": 2.1471188068389893, "Pretrain/Step": 277, "Pretrain/Step Time": 8.43814006820321} +{"Pretrain/Learning Rate": 2.43006993006993e-05, "Pretrain/Loss": 2.250180721282959, "Pretrain/Loss (Raw)": 2.220418930053711, "Pretrain/Step": 278, "Pretrain/Step Time": 8.445159502327442} +{"Pretrain/Learning Rate": 2.4388111888111888e-05, "Pretrain/Loss": 2.248786211013794, "Pretrain/Loss (Raw)": 2.0845141410827637, "Pretrain/Step": 279, "Pretrain/Step Time": 8.44860983453691} +{"Pretrain/Learning Rate": 2.4475524475524478e-05, "Pretrain/Loss": 2.243856430053711, "Pretrain/Loss (Raw)": 1.876796007156372, "Pretrain/Step": 280, "Pretrain/Step Time": 8.452714594081044} +{"Pretrain/Learning Rate": 2.4562937062937065e-05, "Pretrain/Loss": 2.243849754333496, "Pretrain/Loss (Raw)": 2.1823642253875732, "Pretrain/Step": 281, "Pretrain/Step Time": 8.454678097739816} +{"Pretrain/Learning Rate": 2.465034965034965e-05, "Pretrain/Loss": 2.2450151443481445, "Pretrain/Loss (Raw)": 2.3791768550872803, "Pretrain/Step": 282, "Pretrain/Step Time": 8.454163953661919} +{"Pretrain/Learning Rate": 2.4737762237762238e-05, "Pretrain/Loss": 2.2429869174957275, "Pretrain/Loss (Raw)": 2.0179409980773926, "Pretrain/Step": 283, "Pretrain/Step Time": 8.454693442210555} +{"Pretrain/Learning Rate": 2.4825174825174828e-05, "Pretrain/Loss": 2.244630813598633, "Pretrain/Loss (Raw)": 2.1923599243164062, "Pretrain/Step": 284, "Pretrain/Step Time": 8.456929618492723} +{"Pretrain/Learning Rate": 2.491258741258741e-05, "Pretrain/Loss": 2.243767738342285, "Pretrain/Loss (Raw)": 2.1414339542388916, "Pretrain/Step": 285, "Pretrain/Step Time": 8.455436317250133} +{"Pretrain/Learning Rate": 2.5e-05, "Pretrain/Loss": 2.244993209838867, "Pretrain/Loss (Raw)": 2.4455950260162354, "Pretrain/Step": 286, "Pretrain/Step Time": 8.452519983053207} +{"Pretrain/Learning Rate": 2.508741258741259e-05, "Pretrain/Loss": 2.245441436767578, "Pretrain/Loss (Raw)": 2.3053226470947266, "Pretrain/Step": 287, "Pretrain/Step Time": 8.453893460333347} +{"Pretrain/Learning Rate": 2.5174825174825178e-05, "Pretrain/Loss": 2.246518135070801, "Pretrain/Loss (Raw)": 2.352550506591797, "Pretrain/Step": 288, "Pretrain/Step Time": 8.454016430303454} +{"Pretrain/Learning Rate": 2.526223776223776e-05, "Pretrain/Loss": 2.245332956314087, "Pretrain/Loss (Raw)": 2.1765599250793457, "Pretrain/Step": 289, "Pretrain/Step Time": 8.451688287779689} +{"Pretrain/Learning Rate": 2.534965034965035e-05, "Pretrain/Loss": 2.245317220687866, "Pretrain/Loss (Raw)": 2.212736129760742, "Pretrain/Step": 290, "Pretrain/Step Time": 8.444706231355667} +{"Pretrain/Learning Rate": 2.5437062937062938e-05, "Pretrain/Loss": 2.239760637283325, "Pretrain/Loss (Raw)": 2.053208112716675, "Pretrain/Step": 291, "Pretrain/Step Time": 8.44627920165658} +{"Pretrain/Learning Rate": 2.5524475524475528e-05, "Pretrain/Loss": 2.237837314605713, "Pretrain/Loss (Raw)": 2.1253502368927, "Pretrain/Step": 292, "Pretrain/Step Time": 8.445167807862163} +{"Pretrain/Learning Rate": 2.561188811188811e-05, "Pretrain/Loss": 2.2380971908569336, "Pretrain/Loss (Raw)": 2.223398208618164, "Pretrain/Step": 293, "Pretrain/Step Time": 8.4562868475914} +{"Pretrain/Learning Rate": 2.5699300699300697e-05, "Pretrain/Loss": 2.2384181022644043, "Pretrain/Loss (Raw)": 2.268420457839966, "Pretrain/Step": 294, "Pretrain/Step Time": 8.460959313437343} +{"Pretrain/Learning Rate": 2.5786713286713287e-05, "Pretrain/Loss": 2.2355244159698486, "Pretrain/Loss (Raw)": 2.0559985637664795, "Pretrain/Step": 295, "Pretrain/Step Time": 8.46257441304624} +{"Pretrain/Learning Rate": 2.5874125874125877e-05, "Pretrain/Loss": 2.2343153953552246, "Pretrain/Loss (Raw)": 2.0406670570373535, "Pretrain/Step": 296, "Pretrain/Step Time": 8.461836006492376} +{"Pretrain/Learning Rate": 2.5961538461538464e-05, "Pretrain/Loss": 2.233196496963501, "Pretrain/Loss (Raw)": 2.094620704650879, "Pretrain/Step": 297, "Pretrain/Step Time": 8.461382379755378} +{"Pretrain/Learning Rate": 2.6048951048951047e-05, "Pretrain/Loss": 2.2319679260253906, "Pretrain/Loss (Raw)": 2.1183879375457764, "Pretrain/Step": 298, "Pretrain/Step Time": 8.465624129399657} +{"Pretrain/Learning Rate": 2.6136363636363637e-05, "Pretrain/Loss": 2.231722354888916, "Pretrain/Loss (Raw)": 2.070129632949829, "Pretrain/Step": 299, "Pretrain/Step Time": 8.464548375457525} +{"Pretrain/Learning Rate": 2.6223776223776224e-05, "Pretrain/Loss": 2.2360081672668457, "Pretrain/Loss (Raw)": 2.5555381774902344, "Pretrain/Step": 300, "Pretrain/Step Time": 8.463131470605731} +{"Pretrain/Learning Rate": 2.6311188811188814e-05, "Pretrain/Loss": 2.2362709045410156, "Pretrain/Loss (Raw)": 2.3855397701263428, "Pretrain/Step": 301, "Pretrain/Step Time": 8.466500824317336} +{"Pretrain/Learning Rate": 2.6398601398601404e-05, "Pretrain/Loss": 2.2348883152008057, "Pretrain/Loss (Raw)": 2.23245906829834, "Pretrain/Step": 302, "Pretrain/Step Time": 8.465313764289021} +{"Pretrain/Learning Rate": 2.6486013986013987e-05, "Pretrain/Loss": 2.2332241535186768, "Pretrain/Loss (Raw)": 2.1326019763946533, "Pretrain/Step": 303, "Pretrain/Step Time": 8.461499342694879} +{"Pretrain/Learning Rate": 2.6573426573426574e-05, "Pretrain/Loss": 2.2330453395843506, "Pretrain/Loss (Raw)": 2.2398500442504883, "Pretrain/Step": 304, "Pretrain/Step Time": 8.455359349027276} +{"Pretrain/Learning Rate": 2.6660839160839164e-05, "Pretrain/Loss": 2.2363667488098145, "Pretrain/Loss (Raw)": 2.539839029312134, "Pretrain/Step": 305, "Pretrain/Step Time": 8.452573331072927} +{"Pretrain/Learning Rate": 2.674825174825175e-05, "Pretrain/Loss": 2.2369117736816406, "Pretrain/Loss (Raw)": 2.1188056468963623, "Pretrain/Step": 306, "Pretrain/Step Time": 8.453987082466483} +{"Pretrain/Learning Rate": 2.6835664335664333e-05, "Pretrain/Loss": 2.2382805347442627, "Pretrain/Loss (Raw)": 2.4252686500549316, "Pretrain/Step": 307, "Pretrain/Step Time": 8.451014740392566} +{"Pretrain/Learning Rate": 2.6923076923076923e-05, "Pretrain/Loss": 2.2388687133789062, "Pretrain/Loss (Raw)": 2.409727096557617, "Pretrain/Step": 308, "Pretrain/Step Time": 8.450624518096447} +{"Pretrain/Learning Rate": 2.7010489510489513e-05, "Pretrain/Loss": 2.2375411987304688, "Pretrain/Loss (Raw)": 2.0202176570892334, "Pretrain/Step": 309, "Pretrain/Step Time": 8.44914560765028} +{"Pretrain/Learning Rate": 2.70979020979021e-05, "Pretrain/Loss": 2.236342191696167, "Pretrain/Loss (Raw)": 2.358982563018799, "Pretrain/Step": 310, "Pretrain/Step Time": 8.455798970535398} +{"Pretrain/Learning Rate": 2.718531468531469e-05, "Pretrain/Loss": 2.2367942333221436, "Pretrain/Loss (Raw)": 2.4240612983703613, "Pretrain/Step": 311, "Pretrain/Step Time": 8.455742819234729} +{"Pretrain/Learning Rate": 2.7272727272727273e-05, "Pretrain/Loss": 2.237121105194092, "Pretrain/Loss (Raw)": 2.3154618740081787, "Pretrain/Step": 312, "Pretrain/Step Time": 8.457619423046708} +{"Pretrain/Learning Rate": 2.736013986013986e-05, "Pretrain/Loss": 2.2357404232025146, "Pretrain/Loss (Raw)": 2.0563626289367676, "Pretrain/Step": 313, "Pretrain/Step Time": 8.455968413501978} +{"Pretrain/Learning Rate": 2.744755244755245e-05, "Pretrain/Loss": 2.2360591888427734, "Pretrain/Loss (Raw)": 2.3838324546813965, "Pretrain/Step": 314, "Pretrain/Step Time": 8.457453882321715} +{"Pretrain/Learning Rate": 2.7534965034965036e-05, "Pretrain/Loss": 2.234313726425171, "Pretrain/Loss (Raw)": 2.353421449661255, "Pretrain/Step": 315, "Pretrain/Step Time": 8.457964865490794} +{"Pretrain/Learning Rate": 2.762237762237762e-05, "Pretrain/Loss": 2.2341814041137695, "Pretrain/Loss (Raw)": 2.166795253753662, "Pretrain/Step": 316, "Pretrain/Step Time": 8.457297576591372} +{"Pretrain/Learning Rate": 2.770979020979021e-05, "Pretrain/Loss": 2.2319469451904297, "Pretrain/Loss (Raw)": 2.025697946548462, "Pretrain/Step": 317, "Pretrain/Step Time": 8.455159595236182} +{"Pretrain/Learning Rate": 2.77972027972028e-05, "Pretrain/Loss": 2.231809139251709, "Pretrain/Loss (Raw)": 2.2833540439605713, "Pretrain/Step": 318, "Pretrain/Step Time": 8.45414592884481} +{"Pretrain/Learning Rate": 2.7884615384615386e-05, "Pretrain/Loss": 2.2310171127319336, "Pretrain/Loss (Raw)": 2.1909358501434326, "Pretrain/Step": 319, "Pretrain/Step Time": 8.450948210433125} +{"Pretrain/Learning Rate": 2.7972027972027976e-05, "Pretrain/Loss": 2.2317090034484863, "Pretrain/Loss (Raw)": 2.332923173904419, "Pretrain/Step": 320, "Pretrain/Step Time": 8.449223695322871} +{"Pretrain/Learning Rate": 2.805944055944056e-05, "Pretrain/Loss": 2.228031635284424, "Pretrain/Loss (Raw)": 2.18536114692688, "Pretrain/Step": 321, "Pretrain/Step Time": 8.444039953872561} +{"Pretrain/Learning Rate": 2.8146853146853146e-05, "Pretrain/Loss": 2.2276721000671387, "Pretrain/Loss (Raw)": 2.0607430934906006, "Pretrain/Step": 322, "Pretrain/Step Time": 8.447904571890831} +{"Pretrain/Learning Rate": 2.8234265734265736e-05, "Pretrain/Loss": 2.2294135093688965, "Pretrain/Loss (Raw)": 2.257294178009033, "Pretrain/Step": 323, "Pretrain/Step Time": 8.438875287771225} +{"Pretrain/Learning Rate": 2.8321678321678326e-05, "Pretrain/Loss": 2.231128692626953, "Pretrain/Loss (Raw)": 2.375232458114624, "Pretrain/Step": 324, "Pretrain/Step Time": 8.438013345003128} +{"Pretrain/Learning Rate": 2.8409090909090912e-05, "Pretrain/Loss": 2.231501817703247, "Pretrain/Loss (Raw)": 2.173158645629883, "Pretrain/Step": 325, "Pretrain/Step Time": 8.441926211118698} +{"Pretrain/Learning Rate": 2.8496503496503496e-05, "Pretrain/Loss": 2.2318344116210938, "Pretrain/Loss (Raw)": 2.2165372371673584, "Pretrain/Step": 326, "Pretrain/Step Time": 8.445087878033519} +{"Pretrain/Learning Rate": 2.8583916083916086e-05, "Pretrain/Loss": 2.230985164642334, "Pretrain/Loss (Raw)": 2.0507662296295166, "Pretrain/Step": 327, "Pretrain/Step Time": 8.446712067350745} +{"Pretrain/Learning Rate": 2.8671328671328672e-05, "Pretrain/Loss": 2.232097864151001, "Pretrain/Loss (Raw)": 2.4632725715637207, "Pretrain/Step": 328, "Pretrain/Step Time": 8.448932252824306} +{"Pretrain/Learning Rate": 2.8758741258741262e-05, "Pretrain/Loss": 2.2323172092437744, "Pretrain/Loss (Raw)": 2.2411649227142334, "Pretrain/Step": 329, "Pretrain/Step Time": 8.449214970692992} +{"Pretrain/Learning Rate": 2.8846153846153845e-05, "Pretrain/Loss": 2.2359676361083984, "Pretrain/Loss (Raw)": 2.508298873901367, "Pretrain/Step": 330, "Pretrain/Step Time": 8.44823869690299} +{"Pretrain/Learning Rate": 2.8933566433566432e-05, "Pretrain/Loss": 2.234147548675537, "Pretrain/Loss (Raw)": 2.205559015274048, "Pretrain/Step": 331, "Pretrain/Step Time": 8.448990017175674} +{"Pretrain/Learning Rate": 2.9020979020979022e-05, "Pretrain/Loss": 2.2329752445220947, "Pretrain/Loss (Raw)": 2.064387798309326, "Pretrain/Step": 332, "Pretrain/Step Time": 8.45004564896226} +{"Pretrain/Learning Rate": 2.9108391608391612e-05, "Pretrain/Loss": 2.2346303462982178, "Pretrain/Loss (Raw)": 2.3333826065063477, "Pretrain/Step": 333, "Pretrain/Step Time": 8.449109729379416} +{"Pretrain/Learning Rate": 2.91958041958042e-05, "Pretrain/Loss": 2.232593059539795, "Pretrain/Loss (Raw)": 2.073819160461426, "Pretrain/Step": 334, "Pretrain/Step Time": 8.449202401563525} +{"Pretrain/Learning Rate": 2.9283216783216782e-05, "Pretrain/Loss": 2.231630802154541, "Pretrain/Loss (Raw)": 2.139813184738159, "Pretrain/Step": 335, "Pretrain/Step Time": 8.449307540431619} +{"Pretrain/Learning Rate": 2.9370629370629372e-05, "Pretrain/Loss": 2.2275896072387695, "Pretrain/Loss (Raw)": 2.380129337310791, "Pretrain/Step": 336, "Pretrain/Step Time": 8.444946056231856} +{"Pretrain/Learning Rate": 2.945804195804196e-05, "Pretrain/Loss": 2.2241134643554688, "Pretrain/Loss (Raw)": 2.218708038330078, "Pretrain/Step": 337, "Pretrain/Step Time": 8.448244377970695} +{"Pretrain/Learning Rate": 2.954545454545455e-05, "Pretrain/Loss": 2.2233684062957764, "Pretrain/Loss (Raw)": 2.1865882873535156, "Pretrain/Step": 338, "Pretrain/Step Time": 8.446071300655603} +{"Pretrain/Learning Rate": 2.963286713286714e-05, "Pretrain/Loss": 2.2249159812927246, "Pretrain/Loss (Raw)": 2.4331600666046143, "Pretrain/Step": 339, "Pretrain/Step Time": 8.44549261406064} +{"Pretrain/Learning Rate": 2.972027972027972e-05, "Pretrain/Loss": 2.224546432495117, "Pretrain/Loss (Raw)": 2.253188133239746, "Pretrain/Step": 340, "Pretrain/Step Time": 8.44251411408186} +{"Pretrain/Learning Rate": 2.9807692307692308e-05, "Pretrain/Loss": 2.2259936332702637, "Pretrain/Loss (Raw)": 2.3367464542388916, "Pretrain/Step": 341, "Pretrain/Step Time": 8.445672715082765} +{"Pretrain/Learning Rate": 2.9895104895104898e-05, "Pretrain/Loss": 2.22629714012146, "Pretrain/Loss (Raw)": 2.294489622116089, "Pretrain/Step": 342, "Pretrain/Step Time": 8.448424460366368} +{"Pretrain/Learning Rate": 2.9982517482517485e-05, "Pretrain/Loss": 2.22753643989563, "Pretrain/Loss (Raw)": 2.2309725284576416, "Pretrain/Step": 343, "Pretrain/Step Time": 8.445520527660847} +{"Pretrain/Learning Rate": 3.0069930069930068e-05, "Pretrain/Loss": 2.227595567703247, "Pretrain/Loss (Raw)": 2.2726762294769287, "Pretrain/Step": 344, "Pretrain/Step Time": 8.4481456335634} +{"Pretrain/Learning Rate": 3.0157342657342658e-05, "Pretrain/Loss": 2.226269006729126, "Pretrain/Loss (Raw)": 2.164788246154785, "Pretrain/Step": 345, "Pretrain/Step Time": 8.444935817271471} +{"Pretrain/Learning Rate": 3.0244755244755245e-05, "Pretrain/Loss": 2.2274022102355957, "Pretrain/Loss (Raw)": 2.2348673343658447, "Pretrain/Step": 346, "Pretrain/Step Time": 8.447680169716477} +{"Pretrain/Learning Rate": 3.0332167832167835e-05, "Pretrain/Loss": 2.2274584770202637, "Pretrain/Loss (Raw)": 2.2076468467712402, "Pretrain/Step": 347, "Pretrain/Step Time": 8.449782252311707} +{"Pretrain/Learning Rate": 3.0419580419580425e-05, "Pretrain/Loss": 2.225482225418091, "Pretrain/Loss (Raw)": 2.1641223430633545, "Pretrain/Step": 348, "Pretrain/Step Time": 8.44693885743618} +{"Pretrain/Learning Rate": 3.0506993006993008e-05, "Pretrain/Loss": 2.2252185344696045, "Pretrain/Loss (Raw)": 2.256314516067505, "Pretrain/Step": 349, "Pretrain/Step Time": 8.449575297534466} +{"Pretrain/Learning Rate": 3.0594405594405594e-05, "Pretrain/Loss": 2.2255287170410156, "Pretrain/Loss (Raw)": 2.273784637451172, "Pretrain/Step": 350, "Pretrain/Step Time": 8.445139529183507} +{"Pretrain/Learning Rate": 3.068181818181818e-05, "Pretrain/Loss": 2.228343963623047, "Pretrain/Loss (Raw)": 2.466852903366089, "Pretrain/Step": 351, "Pretrain/Step Time": 8.441570838913321} +{"Pretrain/Learning Rate": 3.0769230769230774e-05, "Pretrain/Loss": 2.2281317710876465, "Pretrain/Loss (Raw)": 2.143812894821167, "Pretrain/Step": 352, "Pretrain/Step Time": 8.442146852612495} +{"Pretrain/Learning Rate": 3.0856643356643354e-05, "Pretrain/Loss": 2.223724365234375, "Pretrain/Loss (Raw)": 2.3199994564056396, "Pretrain/Step": 353, "Pretrain/Step Time": 8.443097088485956} +{"Pretrain/Learning Rate": 3.094405594405594e-05, "Pretrain/Loss": 2.2262158393859863, "Pretrain/Loss (Raw)": 2.4117519855499268, "Pretrain/Step": 354, "Pretrain/Step Time": 8.44580383040011} +{"Pretrain/Learning Rate": 3.1031468531468534e-05, "Pretrain/Loss": 2.226980447769165, "Pretrain/Loss (Raw)": 2.30521297454834, "Pretrain/Step": 355, "Pretrain/Step Time": 8.436292510479689} +{"Pretrain/Learning Rate": 3.111888111888112e-05, "Pretrain/Loss": 2.225489616394043, "Pretrain/Loss (Raw)": 2.1695504188537598, "Pretrain/Step": 356, "Pretrain/Step Time": 8.443802690133452} +{"Pretrain/Learning Rate": 3.120629370629371e-05, "Pretrain/Loss": 2.2273898124694824, "Pretrain/Loss (Raw)": 2.346736431121826, "Pretrain/Step": 357, "Pretrain/Step Time": 8.437438556924462} +{"Pretrain/Learning Rate": 3.1293706293706294e-05, "Pretrain/Loss": 2.230222225189209, "Pretrain/Loss (Raw)": 2.467914581298828, "Pretrain/Step": 358, "Pretrain/Step Time": 8.438238803297281} +{"Pretrain/Learning Rate": 3.138111888111888e-05, "Pretrain/Loss": 2.2285916805267334, "Pretrain/Loss (Raw)": 2.236074924468994, "Pretrain/Step": 359, "Pretrain/Step Time": 8.438349355012178} +{"Pretrain/Learning Rate": 3.146853146853147e-05, "Pretrain/Loss": 2.22866153717041, "Pretrain/Loss (Raw)": 2.38230299949646, "Pretrain/Step": 360, "Pretrain/Step Time": 8.438708700239658} +{"Pretrain/Learning Rate": 3.155594405594406e-05, "Pretrain/Loss": 2.2279436588287354, "Pretrain/Loss (Raw)": 2.213179588317871, "Pretrain/Step": 361, "Pretrain/Step Time": 8.43925366550684} +{"Pretrain/Learning Rate": 3.164335664335665e-05, "Pretrain/Loss": 2.2281599044799805, "Pretrain/Loss (Raw)": 2.3493051528930664, "Pretrain/Step": 362, "Pretrain/Step Time": 8.441380495205522} +{"Pretrain/Learning Rate": 3.1730769230769234e-05, "Pretrain/Loss": 2.225551128387451, "Pretrain/Loss (Raw)": 2.019932508468628, "Pretrain/Step": 363, "Pretrain/Step Time": 8.439373066648841} +{"Pretrain/Learning Rate": 3.181818181818182e-05, "Pretrain/Loss": 2.2271838188171387, "Pretrain/Loss (Raw)": 2.2584023475646973, "Pretrain/Step": 364, "Pretrain/Step Time": 8.440911928191781} +{"Pretrain/Learning Rate": 3.190559440559441e-05, "Pretrain/Loss": 2.227884292602539, "Pretrain/Loss (Raw)": 2.3264577388763428, "Pretrain/Step": 365, "Pretrain/Step Time": 8.442026380449533} +{"Pretrain/Learning Rate": 3.1993006993006994e-05, "Pretrain/Loss": 2.2268574237823486, "Pretrain/Loss (Raw)": 2.243236780166626, "Pretrain/Step": 366, "Pretrain/Step Time": 8.441090434789658} +{"Pretrain/Learning Rate": 3.208041958041958e-05, "Pretrain/Loss": 2.224459171295166, "Pretrain/Loss (Raw)": 2.092308521270752, "Pretrain/Step": 367, "Pretrain/Step Time": 8.438150458037853} +{"Pretrain/Learning Rate": 3.216783216783217e-05, "Pretrain/Loss": 2.2252166271209717, "Pretrain/Loss (Raw)": 2.2550792694091797, "Pretrain/Step": 368, "Pretrain/Step Time": 8.436184095218778} +{"Pretrain/Learning Rate": 3.225524475524476e-05, "Pretrain/Loss": 2.227602005004883, "Pretrain/Loss (Raw)": 2.372664451599121, "Pretrain/Step": 369, "Pretrain/Step Time": 8.429757837206125} +{"Pretrain/Learning Rate": 3.234265734265735e-05, "Pretrain/Loss": 2.2303972244262695, "Pretrain/Loss (Raw)": 2.347463607788086, "Pretrain/Step": 370, "Pretrain/Step Time": 8.432763392105699} +{"Pretrain/Learning Rate": 3.243006993006993e-05, "Pretrain/Loss": 2.2324092388153076, "Pretrain/Loss (Raw)": 2.4027798175811768, "Pretrain/Step": 371, "Pretrain/Step Time": 8.427658434957266} +{"Pretrain/Learning Rate": 3.251748251748252e-05, "Pretrain/Loss": 2.2333664894104004, "Pretrain/Loss (Raw)": 2.1260194778442383, "Pretrain/Step": 372, "Pretrain/Step Time": 8.425777850672603} +{"Pretrain/Learning Rate": 3.2604895104895106e-05, "Pretrain/Loss": 2.2342324256896973, "Pretrain/Loss (Raw)": 2.2843947410583496, "Pretrain/Step": 373, "Pretrain/Step Time": 8.434401974081993} +{"Pretrain/Learning Rate": 3.269230769230769e-05, "Pretrain/Loss": 2.234591007232666, "Pretrain/Loss (Raw)": 2.204685688018799, "Pretrain/Step": 374, "Pretrain/Step Time": 8.427211485803127} +{"Pretrain/Learning Rate": 3.277972027972028e-05, "Pretrain/Loss": 2.236320972442627, "Pretrain/Loss (Raw)": 2.363678455352783, "Pretrain/Step": 375, "Pretrain/Step Time": 8.425664683803916} +{"Pretrain/Learning Rate": 3.2867132867132866e-05, "Pretrain/Loss": 2.2364120483398438, "Pretrain/Loss (Raw)": 2.026668071746826, "Pretrain/Step": 376, "Pretrain/Step Time": 8.430130632594228} +{"Pretrain/Learning Rate": 3.295454545454545e-05, "Pretrain/Loss": 2.2348880767822266, "Pretrain/Loss (Raw)": 1.9529308080673218, "Pretrain/Step": 377, "Pretrain/Step Time": 8.430479811504483} +{"Pretrain/Learning Rate": 3.3041958041958046e-05, "Pretrain/Loss": 2.237135887145996, "Pretrain/Loss (Raw)": 2.2252421379089355, "Pretrain/Step": 378, "Pretrain/Step Time": 8.42683564312756} +{"Pretrain/Learning Rate": 3.312937062937063e-05, "Pretrain/Loss": 2.2352447509765625, "Pretrain/Loss (Raw)": 2.0740280151367188, "Pretrain/Step": 379, "Pretrain/Step Time": 8.430390443652868} +{"Pretrain/Learning Rate": 3.321678321678322e-05, "Pretrain/Loss": 2.2366883754730225, "Pretrain/Loss (Raw)": 2.416837215423584, "Pretrain/Step": 380, "Pretrain/Step Time": 8.429562294855714} +{"Pretrain/Learning Rate": 3.3304195804195806e-05, "Pretrain/Loss": 2.237490653991699, "Pretrain/Loss (Raw)": 2.415588617324829, "Pretrain/Step": 381, "Pretrain/Step Time": 8.43201282992959} +{"Pretrain/Learning Rate": 3.339160839160839e-05, "Pretrain/Loss": 2.2367005348205566, "Pretrain/Loss (Raw)": 2.2057924270629883, "Pretrain/Step": 382, "Pretrain/Step Time": 8.43099744990468} +{"Pretrain/Learning Rate": 3.347902097902098e-05, "Pretrain/Loss": 2.236921787261963, "Pretrain/Loss (Raw)": 2.3448030948638916, "Pretrain/Step": 383, "Pretrain/Step Time": 8.431758249178529} +{"Pretrain/Learning Rate": 3.356643356643357e-05, "Pretrain/Loss": 2.2394933700561523, "Pretrain/Loss (Raw)": 2.345212697982788, "Pretrain/Step": 384, "Pretrain/Step Time": 8.431752227246761} +{"Pretrain/Learning Rate": 3.365384615384616e-05, "Pretrain/Loss": 2.2397799491882324, "Pretrain/Loss (Raw)": 2.236370325088501, "Pretrain/Step": 385, "Pretrain/Step Time": 8.429471800103784} +{"Pretrain/Learning Rate": 3.374125874125874e-05, "Pretrain/Loss": 2.2394320964813232, "Pretrain/Loss (Raw)": 2.2663991451263428, "Pretrain/Step": 386, "Pretrain/Step Time": 8.424159403890371} +{"Pretrain/Learning Rate": 3.382867132867133e-05, "Pretrain/Loss": 2.2358951568603516, "Pretrain/Loss (Raw)": 2.3121070861816406, "Pretrain/Step": 387, "Pretrain/Step Time": 8.421413058415055} +{"Pretrain/Learning Rate": 3.391608391608392e-05, "Pretrain/Loss": 2.235652208328247, "Pretrain/Loss (Raw)": 2.110722541809082, "Pretrain/Step": 388, "Pretrain/Step Time": 8.418381361290812} +{"Pretrain/Learning Rate": 3.4003496503496506e-05, "Pretrain/Loss": 2.2348785400390625, "Pretrain/Loss (Raw)": 2.088376998901367, "Pretrain/Step": 389, "Pretrain/Step Time": 8.41783863864839} +{"Pretrain/Learning Rate": 3.409090909090909e-05, "Pretrain/Loss": 2.2379891872406006, "Pretrain/Loss (Raw)": 2.539443016052246, "Pretrain/Step": 390, "Pretrain/Step Time": 8.422944912686944} +{"Pretrain/Learning Rate": 3.417832167832168e-05, "Pretrain/Loss": 2.2400825023651123, "Pretrain/Loss (Raw)": 2.265148162841797, "Pretrain/Step": 391, "Pretrain/Step Time": 8.421103714033961} +{"Pretrain/Learning Rate": 3.4265734265734265e-05, "Pretrain/Loss": 2.2416279315948486, "Pretrain/Loss (Raw)": 2.320427656173706, "Pretrain/Step": 392, "Pretrain/Step Time": 8.424245530739427} +{"Pretrain/Learning Rate": 3.435314685314686e-05, "Pretrain/Loss": 2.240067958831787, "Pretrain/Loss (Raw)": 2.105928897857666, "Pretrain/Step": 393, "Pretrain/Step Time": 8.42500145174563} +{"Pretrain/Learning Rate": 3.4440559440559445e-05, "Pretrain/Loss": 2.2410531044006348, "Pretrain/Loss (Raw)": 2.079190969467163, "Pretrain/Step": 394, "Pretrain/Step Time": 8.427027463912964} +{"Pretrain/Learning Rate": 3.4527972027972025e-05, "Pretrain/Loss": 2.240067481994629, "Pretrain/Loss (Raw)": 2.1177663803100586, "Pretrain/Step": 395, "Pretrain/Step Time": 8.42339844442904} +{"Pretrain/Learning Rate": 3.461538461538462e-05, "Pretrain/Loss": 2.2395541667938232, "Pretrain/Loss (Raw)": 2.1380741596221924, "Pretrain/Step": 396, "Pretrain/Step Time": 8.423849817365408} +{"Pretrain/Learning Rate": 3.4702797202797205e-05, "Pretrain/Loss": 2.238844156265259, "Pretrain/Loss (Raw)": 2.1363613605499268, "Pretrain/Step": 397, "Pretrain/Step Time": 8.424231605604291} +{"Pretrain/Learning Rate": 3.479020979020979e-05, "Pretrain/Loss": 2.23758864402771, "Pretrain/Loss (Raw)": 2.259333848953247, "Pretrain/Step": 398, "Pretrain/Step Time": 8.42422110028565} +{"Pretrain/Learning Rate": 3.4877622377622385e-05, "Pretrain/Loss": 2.2441048622131348, "Pretrain/Loss (Raw)": 2.8823328018188477, "Pretrain/Step": 399, "Pretrain/Step Time": 8.424166347831488} +{"Pretrain/Learning Rate": 3.4965034965034965e-05, "Pretrain/Loss": 2.2433338165283203, "Pretrain/Loss (Raw)": 2.134469509124756, "Pretrain/Step": 400, "Pretrain/Step Time": 8.421540476381779} +{"Pretrain/Learning Rate": 3.505244755244755e-05, "Pretrain/Loss": 2.244774103164673, "Pretrain/Loss (Raw)": 2.4374141693115234, "Pretrain/Step": 401, "Pretrain/Step Time": 8.421855540946126} +{"Pretrain/Learning Rate": 3.5139860139860145e-05, "Pretrain/Loss": 2.244114637374878, "Pretrain/Loss (Raw)": 2.1738128662109375, "Pretrain/Step": 402, "Pretrain/Step Time": 8.421331629157066} +{"Pretrain/Learning Rate": 3.522727272727273e-05, "Pretrain/Loss": 2.2425875663757324, "Pretrain/Loss (Raw)": 2.0960352420806885, "Pretrain/Step": 403, "Pretrain/Step Time": 8.414058234542608} +{"Pretrain/Learning Rate": 3.531468531468531e-05, "Pretrain/Loss": 2.241266965866089, "Pretrain/Loss (Raw)": 2.0718507766723633, "Pretrain/Step": 404, "Pretrain/Step Time": 8.419279478490353} +{"Pretrain/Learning Rate": 3.5402097902097905e-05, "Pretrain/Loss": 2.2424070835113525, "Pretrain/Loss (Raw)": 2.2930221557617188, "Pretrain/Step": 405, "Pretrain/Step Time": 8.420650774613023} +{"Pretrain/Learning Rate": 3.548951048951049e-05, "Pretrain/Loss": 2.2442877292633057, "Pretrain/Loss (Raw)": 2.4611706733703613, "Pretrain/Step": 406, "Pretrain/Step Time": 8.414184564724565} +{"Pretrain/Learning Rate": 3.557692307692308e-05, "Pretrain/Loss": 2.2460994720458984, "Pretrain/Loss (Raw)": 2.316392183303833, "Pretrain/Step": 407, "Pretrain/Step Time": 8.413542851805687} +{"Pretrain/Learning Rate": 3.566433566433567e-05, "Pretrain/Loss": 2.248239040374756, "Pretrain/Loss (Raw)": 2.150689125061035, "Pretrain/Step": 408, "Pretrain/Step Time": 8.413361944258213} +{"Pretrain/Learning Rate": 3.575174825174825e-05, "Pretrain/Loss": 2.2476842403411865, "Pretrain/Loss (Raw)": 2.1113362312316895, "Pretrain/Step": 409, "Pretrain/Step Time": 8.416171383112669} +{"Pretrain/Learning Rate": 3.583916083916084e-05, "Pretrain/Loss": 2.24504017829895, "Pretrain/Loss (Raw)": 2.040750026702881, "Pretrain/Step": 410, "Pretrain/Step Time": 8.41742298938334} +{"Pretrain/Learning Rate": 3.592657342657343e-05, "Pretrain/Loss": 2.245786190032959, "Pretrain/Loss (Raw)": 2.1134164333343506, "Pretrain/Step": 411, "Pretrain/Step Time": 8.4164848793298} +{"Pretrain/Learning Rate": 3.601398601398602e-05, "Pretrain/Loss": 2.247218132019043, "Pretrain/Loss (Raw)": 2.3756589889526367, "Pretrain/Step": 412, "Pretrain/Step Time": 8.416206086054444} +{"Pretrain/Learning Rate": 3.61013986013986e-05, "Pretrain/Loss": 2.247753858566284, "Pretrain/Loss (Raw)": 2.209990978240967, "Pretrain/Step": 413, "Pretrain/Step Time": 8.419559765607119} +{"Pretrain/Learning Rate": 3.618881118881119e-05, "Pretrain/Loss": 2.244870662689209, "Pretrain/Loss (Raw)": 2.0765631198883057, "Pretrain/Step": 414, "Pretrain/Step Time": 8.418174777179956} +{"Pretrain/Learning Rate": 3.627622377622378e-05, "Pretrain/Loss": 2.24290132522583, "Pretrain/Loss (Raw)": 2.0532338619232178, "Pretrain/Step": 415, "Pretrain/Step Time": 8.418672285974026} +{"Pretrain/Learning Rate": 3.6363636363636364e-05, "Pretrain/Loss": 2.2407643795013428, "Pretrain/Loss (Raw)": 2.079024076461792, "Pretrain/Step": 416, "Pretrain/Step Time": 8.421336982399225} +{"Pretrain/Learning Rate": 3.645104895104896e-05, "Pretrain/Loss": 2.240687608718872, "Pretrain/Loss (Raw)": 2.166733980178833, "Pretrain/Step": 417, "Pretrain/Step Time": 8.41796494461596} +{"Pretrain/Learning Rate": 3.653846153846154e-05, "Pretrain/Loss": 2.239811897277832, "Pretrain/Loss (Raw)": 2.1006476879119873, "Pretrain/Step": 418, "Pretrain/Step Time": 8.413241878151894} +{"Pretrain/Learning Rate": 3.6625874125874124e-05, "Pretrain/Loss": 2.242434024810791, "Pretrain/Loss (Raw)": 2.3888416290283203, "Pretrain/Step": 419, "Pretrain/Step Time": 8.413690963760018} +{"Pretrain/Learning Rate": 3.671328671328672e-05, "Pretrain/Loss": 2.2419075965881348, "Pretrain/Loss (Raw)": 2.057950019836426, "Pretrain/Step": 420, "Pretrain/Step Time": 8.41428973339498} +{"Pretrain/Learning Rate": 3.6800699300699304e-05, "Pretrain/Loss": 2.2413411140441895, "Pretrain/Loss (Raw)": 2.1508805751800537, "Pretrain/Step": 421, "Pretrain/Step Time": 8.404949115589261} +{"Pretrain/Learning Rate": 3.688811188811189e-05, "Pretrain/Loss": 2.2424168586730957, "Pretrain/Loss (Raw)": 2.406169891357422, "Pretrain/Step": 422, "Pretrain/Step Time": 8.401240220293403} +{"Pretrain/Learning Rate": 3.697552447552448e-05, "Pretrain/Loss": 2.2433948516845703, "Pretrain/Loss (Raw)": 2.181152820587158, "Pretrain/Step": 423, "Pretrain/Step Time": 8.399269413203001} +{"Pretrain/Learning Rate": 3.7062937062937064e-05, "Pretrain/Loss": 2.2457656860351562, "Pretrain/Loss (Raw)": 2.3441479206085205, "Pretrain/Step": 424, "Pretrain/Step Time": 8.401071287691593} +{"Pretrain/Learning Rate": 3.715034965034965e-05, "Pretrain/Loss": 2.2459464073181152, "Pretrain/Loss (Raw)": 2.1177265644073486, "Pretrain/Step": 425, "Pretrain/Step Time": 8.403625328093767} +{"Pretrain/Learning Rate": 3.7237762237762244e-05, "Pretrain/Loss": 2.247584819793701, "Pretrain/Loss (Raw)": 2.32814359664917, "Pretrain/Step": 426, "Pretrain/Step Time": 8.401669561862946} +{"Pretrain/Learning Rate": 3.7325174825174824e-05, "Pretrain/Loss": 2.247704029083252, "Pretrain/Loss (Raw)": 2.0853347778320312, "Pretrain/Step": 427, "Pretrain/Step Time": 8.405979478731751} +{"Pretrain/Learning Rate": 3.741258741258741e-05, "Pretrain/Loss": 2.2442691326141357, "Pretrain/Loss (Raw)": 2.115889072418213, "Pretrain/Step": 428, "Pretrain/Step Time": 8.406175838783383} +{"Pretrain/Learning Rate": 3.7500000000000003e-05, "Pretrain/Loss": 2.2430715560913086, "Pretrain/Loss (Raw)": 2.2322444915771484, "Pretrain/Step": 429, "Pretrain/Step Time": 8.40745604597032} +{"Pretrain/Learning Rate": 3.758741258741259e-05, "Pretrain/Loss": 2.2414047718048096, "Pretrain/Loss (Raw)": 2.019138813018799, "Pretrain/Step": 430, "Pretrain/Step Time": 8.406692933291197} +{"Pretrain/Learning Rate": 3.767482517482518e-05, "Pretrain/Loss": 2.242779493331909, "Pretrain/Loss (Raw)": 2.308547258377075, "Pretrain/Step": 431, "Pretrain/Step Time": 8.407638426870108} +{"Pretrain/Learning Rate": 3.776223776223776e-05, "Pretrain/Loss": 2.243607759475708, "Pretrain/Loss (Raw)": 2.3458547592163086, "Pretrain/Step": 432, "Pretrain/Step Time": 8.407671874389052} +{"Pretrain/Learning Rate": 3.784965034965035e-05, "Pretrain/Loss": 2.240880012512207, "Pretrain/Loss (Raw)": 2.190666675567627, "Pretrain/Step": 433, "Pretrain/Step Time": 8.410806013271213} +{"Pretrain/Learning Rate": 3.7937062937062936e-05, "Pretrain/Loss": 2.240370035171509, "Pretrain/Loss (Raw)": 2.053582191467285, "Pretrain/Step": 434, "Pretrain/Step Time": 8.40878239646554} +{"Pretrain/Learning Rate": 3.802447552447553e-05, "Pretrain/Loss": 2.238121509552002, "Pretrain/Loss (Raw)": 2.1374526023864746, "Pretrain/Step": 435, "Pretrain/Step Time": 8.405565237626433} +{"Pretrain/Learning Rate": 3.811188811188811e-05, "Pretrain/Loss": 2.2356793880462646, "Pretrain/Loss (Raw)": 2.0971152782440186, "Pretrain/Step": 436, "Pretrain/Step Time": 8.40443767607212} +{"Pretrain/Learning Rate": 3.8199300699300696e-05, "Pretrain/Loss": 2.2367615699768066, "Pretrain/Loss (Raw)": 2.1587719917297363, "Pretrain/Step": 437, "Pretrain/Step Time": 8.41026403568685} +{"Pretrain/Learning Rate": 3.828671328671329e-05, "Pretrain/Loss": 2.234635353088379, "Pretrain/Loss (Raw)": 2.086808681488037, "Pretrain/Step": 438, "Pretrain/Step Time": 8.40273455530405} +{"Pretrain/Learning Rate": 3.8374125874125876e-05, "Pretrain/Loss": 2.232404947280884, "Pretrain/Loss (Raw)": 2.138547420501709, "Pretrain/Step": 439, "Pretrain/Step Time": 8.403456132858992} +{"Pretrain/Learning Rate": 3.846153846153846e-05, "Pretrain/Loss": 2.230362892150879, "Pretrain/Loss (Raw)": 2.0541136264801025, "Pretrain/Step": 440, "Pretrain/Step Time": 8.406489834189415} +{"Pretrain/Learning Rate": 3.854895104895105e-05, "Pretrain/Loss": 2.230682373046875, "Pretrain/Loss (Raw)": 2.0972280502319336, "Pretrain/Step": 441, "Pretrain/Step Time": 8.411283181980252} +{"Pretrain/Learning Rate": 3.8636363636363636e-05, "Pretrain/Loss": 2.2292041778564453, "Pretrain/Loss (Raw)": 2.194631814956665, "Pretrain/Step": 442, "Pretrain/Step Time": 8.4095612578094} +{"Pretrain/Learning Rate": 3.872377622377622e-05, "Pretrain/Loss": 2.2307963371276855, "Pretrain/Loss (Raw)": 2.557199239730835, "Pretrain/Step": 443, "Pretrain/Step Time": 8.411736905574799} +{"Pretrain/Learning Rate": 3.8811188811188816e-05, "Pretrain/Loss": 2.2312748432159424, "Pretrain/Loss (Raw)": 2.2280502319335938, "Pretrain/Step": 444, "Pretrain/Step Time": 8.411697028204799} +{"Pretrain/Learning Rate": 3.88986013986014e-05, "Pretrain/Loss": 2.2314858436584473, "Pretrain/Loss (Raw)": 2.0526888370513916, "Pretrain/Step": 445, "Pretrain/Step Time": 8.415589082986116} +{"Pretrain/Learning Rate": 3.898601398601399e-05, "Pretrain/Loss": 2.2313919067382812, "Pretrain/Loss (Raw)": 2.2713658809661865, "Pretrain/Step": 446, "Pretrain/Step Time": 8.413849709555507} +{"Pretrain/Learning Rate": 3.9073426573426576e-05, "Pretrain/Loss": 2.232741117477417, "Pretrain/Loss (Raw)": 2.3636341094970703, "Pretrain/Step": 447, "Pretrain/Step Time": 8.413333358243108} +{"Pretrain/Learning Rate": 3.916083916083916e-05, "Pretrain/Loss": 2.2330877780914307, "Pretrain/Loss (Raw)": 2.3772640228271484, "Pretrain/Step": 448, "Pretrain/Step Time": 8.414325904101133} +{"Pretrain/Learning Rate": 3.924825174825175e-05, "Pretrain/Loss": 2.2329375743865967, "Pretrain/Loss (Raw)": 2.166141986846924, "Pretrain/Step": 449, "Pretrain/Step Time": 8.415664155036211} +{"Pretrain/Learning Rate": 3.9335664335664336e-05, "Pretrain/Loss": 2.2343814373016357, "Pretrain/Loss (Raw)": 2.2455902099609375, "Pretrain/Step": 450, "Pretrain/Step Time": 8.41182616353035} +{"Pretrain/Learning Rate": 3.942307692307692e-05, "Pretrain/Loss": 2.2340986728668213, "Pretrain/Loss (Raw)": 2.221073865890503, "Pretrain/Step": 451, "Pretrain/Step Time": 8.412338083609939} +{"Pretrain/Learning Rate": 3.9510489510489516e-05, "Pretrain/Loss": 2.233410358428955, "Pretrain/Loss (Raw)": 2.287149429321289, "Pretrain/Step": 452, "Pretrain/Step Time": 8.412729172036052} +{"Pretrain/Learning Rate": 3.95979020979021e-05, "Pretrain/Loss": 2.234504222869873, "Pretrain/Loss (Raw)": 2.3131794929504395, "Pretrain/Step": 453, "Pretrain/Step Time": 8.416908010840416} +{"Pretrain/Learning Rate": 3.968531468531469e-05, "Pretrain/Loss": 2.234347343444824, "Pretrain/Loss (Raw)": 2.1964316368103027, "Pretrain/Step": 454, "Pretrain/Step Time": 8.412712777033448} +{"Pretrain/Learning Rate": 3.9772727272727275e-05, "Pretrain/Loss": 2.2345354557037354, "Pretrain/Loss (Raw)": 2.0748403072357178, "Pretrain/Step": 455, "Pretrain/Step Time": 8.414637168869376} +{"Pretrain/Learning Rate": 3.986013986013986e-05, "Pretrain/Loss": 2.232069969177246, "Pretrain/Loss (Raw)": 2.1476852893829346, "Pretrain/Step": 456, "Pretrain/Step Time": 8.412052012979984} +{"Pretrain/Learning Rate": 3.994755244755245e-05, "Pretrain/Loss": 2.231572151184082, "Pretrain/Loss (Raw)": 2.1774513721466064, "Pretrain/Step": 457, "Pretrain/Step Time": 8.4135279096663} +{"Pretrain/Learning Rate": 4.0034965034965035e-05, "Pretrain/Loss": 2.2296009063720703, "Pretrain/Loss (Raw)": 2.2559993267059326, "Pretrain/Step": 458, "Pretrain/Step Time": 8.41460551135242} +{"Pretrain/Learning Rate": 4.012237762237762e-05, "Pretrain/Loss": 2.2298781871795654, "Pretrain/Loss (Raw)": 2.2410378456115723, "Pretrain/Step": 459, "Pretrain/Step Time": 8.41171413473785} +{"Pretrain/Learning Rate": 4.020979020979021e-05, "Pretrain/Loss": 2.2309536933898926, "Pretrain/Loss (Raw)": 2.2020201683044434, "Pretrain/Step": 460, "Pretrain/Step Time": 8.41426401026547} +{"Pretrain/Learning Rate": 4.02972027972028e-05, "Pretrain/Loss": 2.2301454544067383, "Pretrain/Loss (Raw)": 2.229943037033081, "Pretrain/Step": 461, "Pretrain/Step Time": 8.416823660954833} +{"Pretrain/Learning Rate": 4.038461538461539e-05, "Pretrain/Loss": 2.23073148727417, "Pretrain/Loss (Raw)": 2.1488630771636963, "Pretrain/Step": 462, "Pretrain/Step Time": 8.414907190948725} +{"Pretrain/Learning Rate": 4.0472027972027975e-05, "Pretrain/Loss": 2.231755256652832, "Pretrain/Loss (Raw)": 2.2708580493927, "Pretrain/Step": 463, "Pretrain/Step Time": 8.415562964975834} +{"Pretrain/Learning Rate": 4.055944055944056e-05, "Pretrain/Loss": 2.2305643558502197, "Pretrain/Loss (Raw)": 2.2276618480682373, "Pretrain/Step": 464, "Pretrain/Step Time": 8.413309270516038} +{"Pretrain/Learning Rate": 4.064685314685315e-05, "Pretrain/Loss": 2.2315964698791504, "Pretrain/Loss (Raw)": 2.350829601287842, "Pretrain/Step": 465, "Pretrain/Step Time": 8.413526341319084} +{"Pretrain/Learning Rate": 4.0734265734265735e-05, "Pretrain/Loss": 2.2310891151428223, "Pretrain/Loss (Raw)": 2.121666193008423, "Pretrain/Step": 466, "Pretrain/Step Time": 8.412269176915288} +{"Pretrain/Learning Rate": 4.082167832167833e-05, "Pretrain/Loss": 2.229548454284668, "Pretrain/Loss (Raw)": 2.2359602451324463, "Pretrain/Step": 467, "Pretrain/Step Time": 8.407354414463043} +{"Pretrain/Learning Rate": 4.0909090909090915e-05, "Pretrain/Loss": 2.2281155586242676, "Pretrain/Loss (Raw)": 2.069772243499756, "Pretrain/Step": 468, "Pretrain/Step Time": 8.4041014816612} +{"Pretrain/Learning Rate": 4.0996503496503495e-05, "Pretrain/Loss": 2.226311206817627, "Pretrain/Loss (Raw)": 2.1057915687561035, "Pretrain/Step": 469, "Pretrain/Step Time": 8.402503730729222} +{"Pretrain/Learning Rate": 4.108391608391609e-05, "Pretrain/Loss": 2.2253928184509277, "Pretrain/Loss (Raw)": 2.1769297122955322, "Pretrain/Step": 470, "Pretrain/Step Time": 8.401603823527694} +{"Pretrain/Learning Rate": 4.1171328671328675e-05, "Pretrain/Loss": 2.2255754470825195, "Pretrain/Loss (Raw)": 2.254315137863159, "Pretrain/Step": 471, "Pretrain/Step Time": 8.405396407470107} +{"Pretrain/Learning Rate": 4.125874125874126e-05, "Pretrain/Loss": 2.2246673107147217, "Pretrain/Loss (Raw)": 2.156446695327759, "Pretrain/Step": 472, "Pretrain/Step Time": 8.405803747475147} +{"Pretrain/Learning Rate": 4.134615384615385e-05, "Pretrain/Loss": 2.2247114181518555, "Pretrain/Loss (Raw)": 2.1704394817352295, "Pretrain/Step": 473, "Pretrain/Step Time": 8.412469174712896} +{"Pretrain/Learning Rate": 4.1433566433566434e-05, "Pretrain/Loss": 2.224029302597046, "Pretrain/Loss (Raw)": 2.147556781768799, "Pretrain/Step": 474, "Pretrain/Step Time": 8.407560331746936} +{"Pretrain/Learning Rate": 4.152097902097902e-05, "Pretrain/Loss": 2.226060152053833, "Pretrain/Loss (Raw)": 2.4676053524017334, "Pretrain/Step": 475, "Pretrain/Step Time": 8.408628094941378} +{"Pretrain/Learning Rate": 4.1608391608391614e-05, "Pretrain/Loss": 2.225243091583252, "Pretrain/Loss (Raw)": 2.059522867202759, "Pretrain/Step": 476, "Pretrain/Step Time": 8.413215685635805} +{"Pretrain/Learning Rate": 4.16958041958042e-05, "Pretrain/Loss": 2.2223775386810303, "Pretrain/Loss (Raw)": 1.8895267248153687, "Pretrain/Step": 477, "Pretrain/Step Time": 8.410970175638795} +{"Pretrain/Learning Rate": 4.178321678321678e-05, "Pretrain/Loss": 2.2205734252929688, "Pretrain/Loss (Raw)": 2.042900562286377, "Pretrain/Step": 478, "Pretrain/Step Time": 8.409220008179545} +{"Pretrain/Learning Rate": 4.1870629370629374e-05, "Pretrain/Loss": 2.217799186706543, "Pretrain/Loss (Raw)": 2.1117148399353027, "Pretrain/Step": 479, "Pretrain/Step Time": 8.411212323233485} +{"Pretrain/Learning Rate": 4.195804195804196e-05, "Pretrain/Loss": 2.219054698944092, "Pretrain/Loss (Raw)": 2.3045313358306885, "Pretrain/Step": 480, "Pretrain/Step Time": 8.410362351685762} +{"Pretrain/Learning Rate": 4.204545454545455e-05, "Pretrain/Loss": 2.216952323913574, "Pretrain/Loss (Raw)": 2.0508873462677, "Pretrain/Step": 481, "Pretrain/Step Time": 8.40508477203548} +{"Pretrain/Learning Rate": 4.213286713286714e-05, "Pretrain/Loss": 2.21433687210083, "Pretrain/Loss (Raw)": 2.076993703842163, "Pretrain/Step": 482, "Pretrain/Step Time": 8.401289971545339} +{"Pretrain/Learning Rate": 4.222027972027972e-05, "Pretrain/Loss": 2.2132396697998047, "Pretrain/Loss (Raw)": 2.1647493839263916, "Pretrain/Step": 483, "Pretrain/Step Time": 8.402258183807135} +{"Pretrain/Learning Rate": 4.230769230769231e-05, "Pretrain/Loss": 2.213250160217285, "Pretrain/Loss (Raw)": 2.1709110736846924, "Pretrain/Step": 484, "Pretrain/Step Time": 8.396918304264545} +{"Pretrain/Learning Rate": 4.23951048951049e-05, "Pretrain/Loss": 2.211251735687256, "Pretrain/Loss (Raw)": 2.0909194946289062, "Pretrain/Step": 485, "Pretrain/Step Time": 8.40539557300508} +{"Pretrain/Learning Rate": 4.248251748251749e-05, "Pretrain/Loss": 2.2077646255493164, "Pretrain/Loss (Raw)": 2.0215840339660645, "Pretrain/Step": 486, "Pretrain/Step Time": 8.402956996113062} +{"Pretrain/Learning Rate": 4.256993006993007e-05, "Pretrain/Loss": 2.2068192958831787, "Pretrain/Loss (Raw)": 2.1150524616241455, "Pretrain/Step": 487, "Pretrain/Step Time": 8.402068994939327} +{"Pretrain/Learning Rate": 4.265734265734266e-05, "Pretrain/Loss": 2.2047600746154785, "Pretrain/Loss (Raw)": 2.1187078952789307, "Pretrain/Step": 488, "Pretrain/Step Time": 8.399646861478686} +{"Pretrain/Learning Rate": 4.274475524475525e-05, "Pretrain/Loss": 2.20447039604187, "Pretrain/Loss (Raw)": 2.1761298179626465, "Pretrain/Step": 489, "Pretrain/Step Time": 8.409979585558176} +{"Pretrain/Learning Rate": 4.2832167832167833e-05, "Pretrain/Loss": 2.203925609588623, "Pretrain/Loss (Raw)": 2.279557704925537, "Pretrain/Step": 490, "Pretrain/Step Time": 8.407756365835667} +{"Pretrain/Learning Rate": 4.291958041958043e-05, "Pretrain/Loss": 2.203996419906616, "Pretrain/Loss (Raw)": 2.029001474380493, "Pretrain/Step": 491, "Pretrain/Step Time": 8.414263056591153} +{"Pretrain/Learning Rate": 4.300699300699301e-05, "Pretrain/Loss": 2.2020981311798096, "Pretrain/Loss (Raw)": 2.0154147148132324, "Pretrain/Step": 492, "Pretrain/Step Time": 8.413652231916785} +{"Pretrain/Learning Rate": 4.309440559440559e-05, "Pretrain/Loss": 2.201129198074341, "Pretrain/Loss (Raw)": 2.202443838119507, "Pretrain/Step": 493, "Pretrain/Step Time": 8.413008965551853} +{"Pretrain/Learning Rate": 4.318181818181819e-05, "Pretrain/Loss": 2.2018065452575684, "Pretrain/Loss (Raw)": 2.3299005031585693, "Pretrain/Step": 494, "Pretrain/Step Time": 8.413068599998951} +{"Pretrain/Learning Rate": 4.326923076923077e-05, "Pretrain/Loss": 2.20392107963562, "Pretrain/Loss (Raw)": 2.3629848957061768, "Pretrain/Step": 495, "Pretrain/Step Time": 8.413152137771249} +{"Pretrain/Learning Rate": 4.335664335664335e-05, "Pretrain/Loss": 2.2025625705718994, "Pretrain/Loss (Raw)": 2.08120059967041, "Pretrain/Step": 496, "Pretrain/Step Time": 8.414519211277366} +{"Pretrain/Learning Rate": 4.3444055944055946e-05, "Pretrain/Loss": 2.200730323791504, "Pretrain/Loss (Raw)": 2.1381375789642334, "Pretrain/Step": 497, "Pretrain/Step Time": 8.415742607787251} +{"Pretrain/Learning Rate": 4.353146853146853e-05, "Pretrain/Loss": 2.199219226837158, "Pretrain/Loss (Raw)": 2.154040575027466, "Pretrain/Step": 498, "Pretrain/Step Time": 8.41172774322331} +{"Pretrain/Learning Rate": 4.361888111888112e-05, "Pretrain/Loss": 2.198516845703125, "Pretrain/Loss (Raw)": 2.3128597736358643, "Pretrain/Step": 499, "Pretrain/Step Time": 8.414926143363118} +{"Pretrain/Learning Rate": 4.370629370629371e-05, "Pretrain/Loss": 2.1976258754730225, "Pretrain/Loss (Raw)": 2.0120198726654053, "Pretrain/Step": 500, "Pretrain/Step Time": 8.410748224705458} +{"Pretrain/Learning Rate": 4.379370629370629e-05, "Pretrain/Loss": 2.195098400115967, "Pretrain/Loss (Raw)": 1.9608575105667114, "Pretrain/Step": 501, "Pretrain/Step Time": 8.40301670320332} +{"Pretrain/Learning Rate": 4.388111888111888e-05, "Pretrain/Loss": 2.194406032562256, "Pretrain/Loss (Raw)": 2.1160457134246826, "Pretrain/Step": 502, "Pretrain/Step Time": 8.406087439507246} +{"Pretrain/Learning Rate": 4.396853146853147e-05, "Pretrain/Loss": 2.1921257972717285, "Pretrain/Loss (Raw)": 2.0718395709991455, "Pretrain/Step": 503, "Pretrain/Step Time": 8.406687900424004} +{"Pretrain/Learning Rate": 4.405594405594406e-05, "Pretrain/Loss": 2.198296546936035, "Pretrain/Loss (Raw)": 2.8165225982666016, "Pretrain/Step": 504, "Pretrain/Step Time": 8.405750581994653} +{"Pretrain/Learning Rate": 4.4143356643356646e-05, "Pretrain/Loss": 2.199723958969116, "Pretrain/Loss (Raw)": 2.135622978210449, "Pretrain/Step": 505, "Pretrain/Step Time": 8.409650200977921} +{"Pretrain/Learning Rate": 4.423076923076923e-05, "Pretrain/Loss": 2.1982874870300293, "Pretrain/Loss (Raw)": 2.0413551330566406, "Pretrain/Step": 506, "Pretrain/Step Time": 8.411235926672816} +{"Pretrain/Learning Rate": 4.431818181818182e-05, "Pretrain/Loss": 2.199533700942993, "Pretrain/Loss (Raw)": 2.2335572242736816, "Pretrain/Step": 507, "Pretrain/Step Time": 8.41081415489316} +{"Pretrain/Learning Rate": 4.4405594405594406e-05, "Pretrain/Loss": 2.197272777557373, "Pretrain/Loss (Raw)": 2.1274731159210205, "Pretrain/Step": 508, "Pretrain/Step Time": 8.410700900480151} +{"Pretrain/Learning Rate": 4.4493006993007e-05, "Pretrain/Loss": 2.1959927082061768, "Pretrain/Loss (Raw)": 2.2517356872558594, "Pretrain/Step": 509, "Pretrain/Step Time": 8.410262048244476} +{"Pretrain/Learning Rate": 4.458041958041958e-05, "Pretrain/Loss": 2.195932388305664, "Pretrain/Loss (Raw)": 2.19803524017334, "Pretrain/Step": 510, "Pretrain/Step Time": 8.412539903074503} +{"Pretrain/Learning Rate": 4.4667832167832166e-05, "Pretrain/Loss": 2.1951093673706055, "Pretrain/Loss (Raw)": 2.2394602298736572, "Pretrain/Step": 511, "Pretrain/Step Time": 8.409850299358368} +{"Pretrain/Learning Rate": 4.475524475524476e-05, "Pretrain/Loss": 2.1928484439849854, "Pretrain/Loss (Raw)": 2.055826187133789, "Pretrain/Step": 512, "Pretrain/Step Time": 8.409714628010988} +{"Pretrain/Learning Rate": 4.4842657342657346e-05, "Pretrain/Loss": 2.189845085144043, "Pretrain/Loss (Raw)": 1.8519495725631714, "Pretrain/Step": 513, "Pretrain/Step Time": 8.409995896741748} +{"Pretrain/Learning Rate": 4.493006993006993e-05, "Pretrain/Loss": 2.1880688667297363, "Pretrain/Loss (Raw)": 2.0390119552612305, "Pretrain/Step": 514, "Pretrain/Step Time": 8.408039754256606} +{"Pretrain/Learning Rate": 4.501748251748252e-05, "Pretrain/Loss": 2.190061569213867, "Pretrain/Loss (Raw)": 2.567188262939453, "Pretrain/Step": 515, "Pretrain/Step Time": 8.406904755160213} +{"Pretrain/Learning Rate": 4.5104895104895105e-05, "Pretrain/Loss": 2.190711259841919, "Pretrain/Loss (Raw)": 2.1939046382904053, "Pretrain/Step": 516, "Pretrain/Step Time": 8.409827606752515} +{"Pretrain/Learning Rate": 4.519230769230769e-05, "Pretrain/Loss": 2.190744400024414, "Pretrain/Loss (Raw)": 2.0926101207733154, "Pretrain/Step": 517, "Pretrain/Step Time": 8.409435940906405} +{"Pretrain/Learning Rate": 4.5279720279720285e-05, "Pretrain/Loss": 2.187039375305176, "Pretrain/Loss (Raw)": 2.0651979446411133, "Pretrain/Step": 518, "Pretrain/Step Time": 8.405347546562552} +{"Pretrain/Learning Rate": 4.5367132867132865e-05, "Pretrain/Loss": 2.1855363845825195, "Pretrain/Loss (Raw)": 2.0727455615997314, "Pretrain/Step": 519, "Pretrain/Step Time": 8.406129211187363} +{"Pretrain/Learning Rate": 4.545454545454546e-05, "Pretrain/Loss": 2.182889461517334, "Pretrain/Loss (Raw)": 1.9816372394561768, "Pretrain/Step": 520, "Pretrain/Step Time": 8.400452533736825} +{"Pretrain/Learning Rate": 4.5541958041958045e-05, "Pretrain/Loss": 2.1834099292755127, "Pretrain/Loss (Raw)": 2.1725497245788574, "Pretrain/Step": 521, "Pretrain/Step Time": 8.405460162088275} +{"Pretrain/Learning Rate": 4.562937062937063e-05, "Pretrain/Loss": 2.184650421142578, "Pretrain/Loss (Raw)": 2.2379560470581055, "Pretrain/Step": 522, "Pretrain/Step Time": 8.409655924886465} +{"Pretrain/Learning Rate": 4.571678321678322e-05, "Pretrain/Loss": 2.185222625732422, "Pretrain/Loss (Raw)": 2.1910338401794434, "Pretrain/Step": 523, "Pretrain/Step Time": 8.414946842938662} +{"Pretrain/Learning Rate": 4.5804195804195805e-05, "Pretrain/Loss": 2.184929370880127, "Pretrain/Loss (Raw)": 2.1005144119262695, "Pretrain/Step": 524, "Pretrain/Step Time": 8.416446506977081} +{"Pretrain/Learning Rate": 4.589160839160839e-05, "Pretrain/Loss": 2.1854758262634277, "Pretrain/Loss (Raw)": 2.206324815750122, "Pretrain/Step": 525, "Pretrain/Step Time": 8.4176284391433} +{"Pretrain/Learning Rate": 4.597902097902098e-05, "Pretrain/Loss": 2.1841883659362793, "Pretrain/Loss (Raw)": 2.094545602798462, "Pretrain/Step": 526, "Pretrain/Step Time": 8.415576726198196} +{"Pretrain/Learning Rate": 4.606643356643357e-05, "Pretrain/Loss": 2.178386688232422, "Pretrain/Loss (Raw)": 2.1396913528442383, "Pretrain/Step": 527, "Pretrain/Step Time": 8.413662441074848} +{"Pretrain/Learning Rate": 4.615384615384616e-05, "Pretrain/Loss": 2.178647041320801, "Pretrain/Loss (Raw)": 2.167841911315918, "Pretrain/Step": 528, "Pretrain/Step Time": 8.413836739957333} +{"Pretrain/Learning Rate": 4.6241258741258745e-05, "Pretrain/Loss": 2.174903631210327, "Pretrain/Loss (Raw)": 1.9582387208938599, "Pretrain/Step": 529, "Pretrain/Step Time": 8.411834524944425} +{"Pretrain/Learning Rate": 4.632867132867133e-05, "Pretrain/Loss": 2.1749541759490967, "Pretrain/Loss (Raw)": 2.1802687644958496, "Pretrain/Step": 530, "Pretrain/Step Time": 8.414576133713126} +{"Pretrain/Learning Rate": 4.641608391608392e-05, "Pretrain/Loss": 2.173921585083008, "Pretrain/Loss (Raw)": 1.963851809501648, "Pretrain/Step": 531, "Pretrain/Step Time": 8.412859784439206} +{"Pretrain/Learning Rate": 4.6503496503496505e-05, "Pretrain/Loss": 2.172868490219116, "Pretrain/Loss (Raw)": 1.9370616674423218, "Pretrain/Step": 532, "Pretrain/Step Time": 8.408879535272717} +{"Pretrain/Learning Rate": 4.659090909090909e-05, "Pretrain/Loss": 2.172999858856201, "Pretrain/Loss (Raw)": 2.309845209121704, "Pretrain/Step": 533, "Pretrain/Step Time": 8.408327592536807} +{"Pretrain/Learning Rate": 4.667832167832168e-05, "Pretrain/Loss": 2.1695258617401123, "Pretrain/Loss (Raw)": 2.0165045261383057, "Pretrain/Step": 534, "Pretrain/Step Time": 8.408106630668044} +{"Pretrain/Learning Rate": 4.676573426573427e-05, "Pretrain/Loss": 2.170036792755127, "Pretrain/Loss (Raw)": 2.3817636966705322, "Pretrain/Step": 535, "Pretrain/Step Time": 8.408854698762298} +{"Pretrain/Learning Rate": 4.685314685314686e-05, "Pretrain/Loss": 2.1700439453125, "Pretrain/Loss (Raw)": 2.151655673980713, "Pretrain/Step": 536, "Pretrain/Step Time": 8.405495377257466} +{"Pretrain/Learning Rate": 4.6940559440559444e-05, "Pretrain/Loss": 2.171820640563965, "Pretrain/Loss (Raw)": 2.3387222290039062, "Pretrain/Step": 537, "Pretrain/Step Time": 8.402359709143639} +{"Pretrain/Learning Rate": 4.702797202797203e-05, "Pretrain/Loss": 2.172586441040039, "Pretrain/Loss (Raw)": 2.138775110244751, "Pretrain/Step": 538, "Pretrain/Step Time": 8.408212365582585} +{"Pretrain/Learning Rate": 4.711538461538462e-05, "Pretrain/Loss": 2.1727566719055176, "Pretrain/Loss (Raw)": 2.1352198123931885, "Pretrain/Step": 539, "Pretrain/Step Time": 8.408106248825788} +{"Pretrain/Learning Rate": 4.7202797202797204e-05, "Pretrain/Loss": 2.1712028980255127, "Pretrain/Loss (Raw)": 2.1767473220825195, "Pretrain/Step": 540, "Pretrain/Step Time": 8.41112825833261} +{"Pretrain/Learning Rate": 4.729020979020979e-05, "Pretrain/Loss": 2.1692347526550293, "Pretrain/Loss (Raw)": 1.9580825567245483, "Pretrain/Step": 541, "Pretrain/Step Time": 8.410174706950784} +{"Pretrain/Learning Rate": 4.7377622377622384e-05, "Pretrain/Loss": 2.170224189758301, "Pretrain/Loss (Raw)": 2.203228235244751, "Pretrain/Step": 542, "Pretrain/Step Time": 8.41176831535995} +{"Pretrain/Learning Rate": 4.7465034965034964e-05, "Pretrain/Loss": 2.1716301441192627, "Pretrain/Loss (Raw)": 2.2331478595733643, "Pretrain/Step": 543, "Pretrain/Step Time": 8.409932458773255} +{"Pretrain/Learning Rate": 4.755244755244756e-05, "Pretrain/Loss": 2.170769691467285, "Pretrain/Loss (Raw)": 1.9689149856567383, "Pretrain/Step": 544, "Pretrain/Step Time": 8.406014678999782} +{"Pretrain/Learning Rate": 4.7639860139860144e-05, "Pretrain/Loss": 2.171374559402466, "Pretrain/Loss (Raw)": 2.244162082672119, "Pretrain/Step": 545, "Pretrain/Step Time": 8.407367518171668} +{"Pretrain/Learning Rate": 4.772727272727273e-05, "Pretrain/Loss": 2.1729800701141357, "Pretrain/Loss (Raw)": 2.3061373233795166, "Pretrain/Step": 546, "Pretrain/Step Time": 8.40719946846366} +{"Pretrain/Learning Rate": 4.781468531468532e-05, "Pretrain/Loss": 2.171205520629883, "Pretrain/Loss (Raw)": 2.16167950630188, "Pretrain/Step": 547, "Pretrain/Step Time": 8.405099306255579} +{"Pretrain/Learning Rate": 4.7902097902097904e-05, "Pretrain/Loss": 2.1722400188446045, "Pretrain/Loss (Raw)": 2.190384864807129, "Pretrain/Step": 548, "Pretrain/Step Time": 8.408199895173311} +{"Pretrain/Learning Rate": 4.798951048951049e-05, "Pretrain/Loss": 2.1721887588500977, "Pretrain/Loss (Raw)": 2.144350051879883, "Pretrain/Step": 549, "Pretrain/Step Time": 8.407143525779247} +{"Pretrain/Learning Rate": 4.8076923076923084e-05, "Pretrain/Loss": 2.170620918273926, "Pretrain/Loss (Raw)": 2.205461025238037, "Pretrain/Step": 550, "Pretrain/Step Time": 8.409105697646737} +{"Pretrain/Learning Rate": 4.816433566433567e-05, "Pretrain/Loss": 2.170243740081787, "Pretrain/Loss (Raw)": 2.132855176925659, "Pretrain/Step": 551, "Pretrain/Step Time": 8.40991029702127} +{"Pretrain/Learning Rate": 4.825174825174825e-05, "Pretrain/Loss": 2.169970989227295, "Pretrain/Loss (Raw)": 2.3092856407165527, "Pretrain/Step": 552, "Pretrain/Step Time": 8.4097338616848} +{"Pretrain/Learning Rate": 4.8339160839160843e-05, "Pretrain/Loss": 2.169860363006592, "Pretrain/Loss (Raw)": 2.103541612625122, "Pretrain/Step": 553, "Pretrain/Step Time": 8.409406311810017} +{"Pretrain/Learning Rate": 4.842657342657343e-05, "Pretrain/Loss": 2.168337345123291, "Pretrain/Loss (Raw)": 2.133167028427124, "Pretrain/Step": 554, "Pretrain/Step Time": 8.414153648540378} +{"Pretrain/Learning Rate": 4.851398601398602e-05, "Pretrain/Loss": 2.169281482696533, "Pretrain/Loss (Raw)": 2.206228256225586, "Pretrain/Step": 555, "Pretrain/Step Time": 8.41138170287013} +{"Pretrain/Learning Rate": 4.86013986013986e-05, "Pretrain/Loss": 2.1724390983581543, "Pretrain/Loss (Raw)": 2.520063877105713, "Pretrain/Step": 556, "Pretrain/Step Time": 8.414486287161708} +{"Pretrain/Learning Rate": 4.868881118881119e-05, "Pretrain/Loss": 2.1723811626434326, "Pretrain/Loss (Raw)": 2.2248220443725586, "Pretrain/Step": 557, "Pretrain/Step Time": 8.414414461702108} +{"Pretrain/Learning Rate": 4.8776223776223776e-05, "Pretrain/Loss": 2.1742899417877197, "Pretrain/Loss (Raw)": 2.263467311859131, "Pretrain/Step": 558, "Pretrain/Step Time": 8.415956243872643} +{"Pretrain/Learning Rate": 4.886363636363637e-05, "Pretrain/Loss": 2.1716151237487793, "Pretrain/Loss (Raw)": 1.9661422967910767, "Pretrain/Step": 559, "Pretrain/Step Time": 8.413988471031189} +{"Pretrain/Learning Rate": 4.8951048951048956e-05, "Pretrain/Loss": 2.1730966567993164, "Pretrain/Loss (Raw)": 2.535526752471924, "Pretrain/Step": 560, "Pretrain/Step Time": 8.414711939170957} +{"Pretrain/Learning Rate": 4.9038461538461536e-05, "Pretrain/Loss": 2.1734375953674316, "Pretrain/Loss (Raw)": 2.234278917312622, "Pretrain/Step": 561, "Pretrain/Step Time": 8.412415444850922} +{"Pretrain/Learning Rate": 4.912587412587413e-05, "Pretrain/Loss": 2.174337387084961, "Pretrain/Loss (Raw)": 2.168774127960205, "Pretrain/Step": 562, "Pretrain/Step Time": 8.411184092983603} +{"Pretrain/Learning Rate": 4.9213286713286716e-05, "Pretrain/Loss": 2.173281192779541, "Pretrain/Loss (Raw)": 2.0022456645965576, "Pretrain/Step": 563, "Pretrain/Step Time": 8.413287540897727} +{"Pretrain/Learning Rate": 4.93006993006993e-05, "Pretrain/Loss": 2.174013614654541, "Pretrain/Loss (Raw)": 2.190865993499756, "Pretrain/Step": 564, "Pretrain/Step Time": 8.412102609872818} +{"Pretrain/Learning Rate": 4.9388111888111896e-05, "Pretrain/Loss": 2.173431158065796, "Pretrain/Loss (Raw)": 2.0842185020446777, "Pretrain/Step": 565, "Pretrain/Step Time": 8.405665313825011} +{"Pretrain/Learning Rate": 4.9475524475524476e-05, "Pretrain/Loss": 2.174165964126587, "Pretrain/Loss (Raw)": 2.1808595657348633, "Pretrain/Step": 566, "Pretrain/Step Time": 8.409679071977735} +{"Pretrain/Learning Rate": 4.956293706293706e-05, "Pretrain/Loss": 2.1750707626342773, "Pretrain/Loss (Raw)": 2.25437593460083, "Pretrain/Step": 567, "Pretrain/Step Time": 8.408486559987068} +{"Pretrain/Learning Rate": 4.9650349650349656e-05, "Pretrain/Loss": 2.176758289337158, "Pretrain/Loss (Raw)": 2.270134449005127, "Pretrain/Step": 568, "Pretrain/Step Time": 8.405485743656754} +{"Pretrain/Learning Rate": 4.973776223776224e-05, "Pretrain/Loss": 2.178548812866211, "Pretrain/Loss (Raw)": 2.326371908187866, "Pretrain/Step": 569, "Pretrain/Step Time": 8.40214498899877} +{"Pretrain/Learning Rate": 4.982517482517482e-05, "Pretrain/Loss": 2.1779913902282715, "Pretrain/Loss (Raw)": 2.1232826709747314, "Pretrain/Step": 570, "Pretrain/Step Time": 8.40368909202516} +{"Pretrain/Learning Rate": 4.9912587412587416e-05, "Pretrain/Loss": 2.174818992614746, "Pretrain/Loss (Raw)": 2.151154041290283, "Pretrain/Step": 571, "Pretrain/Step Time": 8.405227910727262} +{"Pretrain/Learning Rate": 5e-05, "Pretrain/Loss": 2.17284893989563, "Pretrain/Loss (Raw)": 1.975892186164856, "Pretrain/Step": 572, "Pretrain/Step Time": 8.408155761659145} +{"Pretrain/Learning Rate": 4.9999999639571315e-05, "Pretrain/Loss": 2.1745619773864746, "Pretrain/Loss (Raw)": 2.271939992904663, "Pretrain/Step": 573, "Pretrain/Step Time": 8.411442063748837} +{"Pretrain/Learning Rate": 4.999999855828526e-05, "Pretrain/Loss": 2.1741902828216553, "Pretrain/Loss (Raw)": 2.2237906455993652, "Pretrain/Step": 574, "Pretrain/Step Time": 8.415900966152549} +{"Pretrain/Learning Rate": 4.999999675614188e-05, "Pretrain/Loss": 2.1726982593536377, "Pretrain/Loss (Raw)": 2.1726491451263428, "Pretrain/Step": 575, "Pretrain/Step Time": 8.4191649928689} +{"Pretrain/Learning Rate": 4.99999942331412e-05, "Pretrain/Loss": 2.171471357345581, "Pretrain/Loss (Raw)": 2.2202224731445312, "Pretrain/Step": 576, "Pretrain/Step Time": 8.4166105017066} +{"Pretrain/Learning Rate": 4.9999990989283317e-05, "Pretrain/Loss": 2.172701597213745, "Pretrain/Loss (Raw)": 2.323625087738037, "Pretrain/Step": 577, "Pretrain/Step Time": 8.41659096814692} +{"Pretrain/Learning Rate": 4.9999987024568326e-05, "Pretrain/Loss": 2.1690926551818848, "Pretrain/Loss (Raw)": 1.7836276292800903, "Pretrain/Step": 578, "Pretrain/Step Time": 8.415837358683348} +{"Pretrain/Learning Rate": 4.999998233899632e-05, "Pretrain/Loss": 2.169332504272461, "Pretrain/Loss (Raw)": 2.2518038749694824, "Pretrain/Step": 579, "Pretrain/Step Time": 8.416085716336966} +{"Pretrain/Learning Rate": 4.999997693256746e-05, "Pretrain/Loss": 2.1671500205993652, "Pretrain/Loss (Raw)": 2.0077767372131348, "Pretrain/Step": 580, "Pretrain/Step Time": 8.419070921838284} +{"Pretrain/Learning Rate": 4.999997080528188e-05, "Pretrain/Loss": 2.165637969970703, "Pretrain/Loss (Raw)": 2.1196341514587402, "Pretrain/Step": 581, "Pretrain/Step Time": 8.410774873569608} +{"Pretrain/Learning Rate": 4.9999963957139764e-05, "Pretrain/Loss": 2.1659350395202637, "Pretrain/Loss (Raw)": 2.2344553470611572, "Pretrain/Step": 582, "Pretrain/Step Time": 8.415272453799844} +{"Pretrain/Learning Rate": 4.9999956388141324e-05, "Pretrain/Loss": 2.165862560272217, "Pretrain/Loss (Raw)": 2.065575361251831, "Pretrain/Step": 583, "Pretrain/Step Time": 8.413138626143336} +{"Pretrain/Learning Rate": 4.9999948098286756e-05, "Pretrain/Loss": 2.1651878356933594, "Pretrain/Loss (Raw)": 2.0613181591033936, "Pretrain/Step": 584, "Pretrain/Step Time": 8.416709316894412} +{"Pretrain/Learning Rate": 4.999993908757631e-05, "Pretrain/Loss": 2.164933443069458, "Pretrain/Loss (Raw)": 2.144880771636963, "Pretrain/Step": 585, "Pretrain/Step Time": 8.413246786221862} +{"Pretrain/Learning Rate": 4.999992935601024e-05, "Pretrain/Loss": 2.163682222366333, "Pretrain/Loss (Raw)": 2.095853805541992, "Pretrain/Step": 586, "Pretrain/Step Time": 8.418400309979916} +{"Pretrain/Learning Rate": 4.9999918903588834e-05, "Pretrain/Loss": 2.162569522857666, "Pretrain/Loss (Raw)": 2.098578691482544, "Pretrain/Step": 587, "Pretrain/Step Time": 8.418921487405896} +{"Pretrain/Learning Rate": 4.999990773031239e-05, "Pretrain/Loss": 2.166978359222412, "Pretrain/Loss (Raw)": 2.7663559913635254, "Pretrain/Step": 588, "Pretrain/Step Time": 8.417541766539216} +{"Pretrain/Learning Rate": 4.999989583618123e-05, "Pretrain/Loss": 2.1661365032196045, "Pretrain/Loss (Raw)": 2.1221964359283447, "Pretrain/Step": 589, "Pretrain/Step Time": 8.427555844187737} +{"Pretrain/Learning Rate": 4.99998832211957e-05, "Pretrain/Loss": 2.166048049926758, "Pretrain/Loss (Raw)": 2.1375510692596436, "Pretrain/Step": 590, "Pretrain/Step Time": 8.430242436006665} +{"Pretrain/Learning Rate": 4.999986988535616e-05, "Pretrain/Loss": 2.1655526161193848, "Pretrain/Loss (Raw)": 2.207454204559326, "Pretrain/Step": 591, "Pretrain/Step Time": 8.430107347667217} +{"Pretrain/Learning Rate": 4.9999855828663e-05, "Pretrain/Loss": 2.1643126010894775, "Pretrain/Loss (Raw)": 2.068913221359253, "Pretrain/Step": 592, "Pretrain/Step Time": 8.433673810213804} +{"Pretrain/Learning Rate": 4.999984105111661e-05, "Pretrain/Loss": 2.1628921031951904, "Pretrain/Loss (Raw)": 2.1690189838409424, "Pretrain/Step": 593, "Pretrain/Step Time": 8.43118672631681} +{"Pretrain/Learning Rate": 4.9999825552717435e-05, "Pretrain/Loss": 2.1648600101470947, "Pretrain/Loss (Raw)": 2.373552083969116, "Pretrain/Step": 594, "Pretrain/Step Time": 8.42927260324359} +{"Pretrain/Learning Rate": 4.999980933346591e-05, "Pretrain/Loss": 2.1652839183807373, "Pretrain/Loss (Raw)": 2.29022479057312, "Pretrain/Step": 595, "Pretrain/Step Time": 8.428223306313157} +{"Pretrain/Learning Rate": 4.999979239336251e-05, "Pretrain/Loss": 2.16872501373291, "Pretrain/Loss (Raw)": 2.510232925415039, "Pretrain/Step": 596, "Pretrain/Step Time": 8.428760165348649} +{"Pretrain/Learning Rate": 4.999977473240771e-05, "Pretrain/Loss": 2.168776035308838, "Pretrain/Loss (Raw)": 2.112311840057373, "Pretrain/Step": 597, "Pretrain/Step Time": 8.430630296468735} +{"Pretrain/Learning Rate": 4.999975635060204e-05, "Pretrain/Loss": 2.168895721435547, "Pretrain/Loss (Raw)": 2.192272424697876, "Pretrain/Step": 598, "Pretrain/Step Time": 8.43041367083788} +{"Pretrain/Learning Rate": 4.999973724794602e-05, "Pretrain/Loss": 2.1672263145446777, "Pretrain/Loss (Raw)": 2.040646553039551, "Pretrain/Step": 599, "Pretrain/Step Time": 8.426235061138868} +{"Pretrain/Learning Rate": 4.9999717424440195e-05, "Pretrain/Loss": 2.1684536933898926, "Pretrain/Loss (Raw)": 2.3135430812835693, "Pretrain/Step": 600, "Pretrain/Step Time": 8.426119234412909} +{"Pretrain/Learning Rate": 4.9999696880085146e-05, "Pretrain/Loss": 2.1670637130737305, "Pretrain/Loss (Raw)": 1.992519497871399, "Pretrain/Step": 601, "Pretrain/Step Time": 8.422776969149709} +{"Pretrain/Learning Rate": 4.999967561488146e-05, "Pretrain/Loss": 2.1670725345611572, "Pretrain/Loss (Raw)": 2.1486754417419434, "Pretrain/Step": 602, "Pretrain/Step Time": 8.423603493720293} +{"Pretrain/Learning Rate": 4.9999653628829745e-05, "Pretrain/Loss": 2.1632237434387207, "Pretrain/Loss (Raw)": 1.97494375705719, "Pretrain/Step": 603, "Pretrain/Step Time": 8.421952541917562} +{"Pretrain/Learning Rate": 4.999963092193065e-05, "Pretrain/Loss": 2.164506435394287, "Pretrain/Loss (Raw)": 2.223710775375366, "Pretrain/Step": 604, "Pretrain/Step Time": 8.421452235430479} +{"Pretrain/Learning Rate": 4.999960749418482e-05, "Pretrain/Loss": 2.1661858558654785, "Pretrain/Loss (Raw)": 2.104483127593994, "Pretrain/Step": 605, "Pretrain/Step Time": 8.427133798599243} +{"Pretrain/Learning Rate": 4.999958334559293e-05, "Pretrain/Loss": 2.168029308319092, "Pretrain/Loss (Raw)": 2.2788894176483154, "Pretrain/Step": 606, "Pretrain/Step Time": 8.430012887343764} +{"Pretrain/Learning Rate": 4.9999558476155675e-05, "Pretrain/Loss": 2.171757698059082, "Pretrain/Loss (Raw)": 2.588948965072632, "Pretrain/Step": 607, "Pretrain/Step Time": 8.428418351337314} +{"Pretrain/Learning Rate": 4.9999532885873774e-05, "Pretrain/Loss": 2.170989751815796, "Pretrain/Loss (Raw)": 2.206228494644165, "Pretrain/Step": 608, "Pretrain/Step Time": 8.430571531876922} +{"Pretrain/Learning Rate": 4.999950657474797e-05, "Pretrain/Loss": 2.171424150466919, "Pretrain/Loss (Raw)": 2.106471538543701, "Pretrain/Step": 609, "Pretrain/Step Time": 8.429799936711788} +{"Pretrain/Learning Rate": 4.9999479542779015e-05, "Pretrain/Loss": 2.1715445518493652, "Pretrain/Loss (Raw)": 2.0924124717712402, "Pretrain/Step": 610, "Pretrain/Step Time": 8.428195003420115} +{"Pretrain/Learning Rate": 4.999945178996769e-05, "Pretrain/Loss": 2.171785354614258, "Pretrain/Loss (Raw)": 2.195587158203125, "Pretrain/Step": 611, "Pretrain/Step Time": 8.430613158270717} +{"Pretrain/Learning Rate": 4.9999423316314795e-05, "Pretrain/Loss": 2.1734466552734375, "Pretrain/Loss (Raw)": 2.3835413455963135, "Pretrain/Step": 612, "Pretrain/Step Time": 8.428449805825949} +{"Pretrain/Learning Rate": 4.999939412182115e-05, "Pretrain/Loss": 2.1734585762023926, "Pretrain/Loss (Raw)": 2.0924339294433594, "Pretrain/Step": 613, "Pretrain/Step Time": 8.42275071144104} +{"Pretrain/Learning Rate": 4.999936420648761e-05, "Pretrain/Loss": 2.1752209663391113, "Pretrain/Loss (Raw)": 2.2471859455108643, "Pretrain/Step": 614, "Pretrain/Step Time": 8.42668848671019} +{"Pretrain/Learning Rate": 4.999933357031502e-05, "Pretrain/Loss": 2.1743674278259277, "Pretrain/Loss (Raw)": 2.0058016777038574, "Pretrain/Step": 615, "Pretrain/Step Time": 8.427248807623982} +{"Pretrain/Learning Rate": 4.999930221330427e-05, "Pretrain/Loss": 2.1719117164611816, "Pretrain/Loss (Raw)": 1.80436372756958, "Pretrain/Step": 616, "Pretrain/Step Time": 8.430643728002906} +{"Pretrain/Learning Rate": 4.999927013545627e-05, "Pretrain/Loss": 2.1737260818481445, "Pretrain/Loss (Raw)": 2.4083707332611084, "Pretrain/Step": 617, "Pretrain/Step Time": 8.421073116362095} +{"Pretrain/Learning Rate": 4.9999237336771926e-05, "Pretrain/Loss": 2.171928882598877, "Pretrain/Loss (Raw)": 2.0495362281799316, "Pretrain/Step": 618, "Pretrain/Step Time": 8.421462282538414} +{"Pretrain/Learning Rate": 4.9999203817252206e-05, "Pretrain/Loss": 2.1719517707824707, "Pretrain/Loss (Raw)": 2.0319478511810303, "Pretrain/Step": 619, "Pretrain/Step Time": 8.42165674827993} +{"Pretrain/Learning Rate": 4.999916957689806e-05, "Pretrain/Loss": 2.1733574867248535, "Pretrain/Loss (Raw)": 2.1953048706054688, "Pretrain/Step": 620, "Pretrain/Step Time": 8.425157649442554} +{"Pretrain/Learning Rate": 4.9999134615710486e-05, "Pretrain/Loss": 2.1733977794647217, "Pretrain/Loss (Raw)": 2.2076027393341064, "Pretrain/Step": 621, "Pretrain/Step Time": 8.424964023754} +{"Pretrain/Learning Rate": 4.999909893369049e-05, "Pretrain/Loss": 2.1716601848602295, "Pretrain/Loss (Raw)": 2.1075007915496826, "Pretrain/Step": 622, "Pretrain/Step Time": 8.426492696627975} +{"Pretrain/Learning Rate": 4.99990625308391e-05, "Pretrain/Loss": 2.169724941253662, "Pretrain/Loss (Raw)": 2.1152536869049072, "Pretrain/Step": 623, "Pretrain/Step Time": 8.42999772168696} +{"Pretrain/Learning Rate": 4.999902540715736e-05, "Pretrain/Loss": 2.171886444091797, "Pretrain/Loss (Raw)": 2.357905626296997, "Pretrain/Step": 624, "Pretrain/Step Time": 8.427459666505456} +{"Pretrain/Learning Rate": 4.999898756264636e-05, "Pretrain/Loss": 2.1750035285949707, "Pretrain/Loss (Raw)": 2.5371148586273193, "Pretrain/Step": 625, "Pretrain/Step Time": 8.430218307301402} +{"Pretrain/Learning Rate": 4.999894899730716e-05, "Pretrain/Loss": 2.1779820919036865, "Pretrain/Loss (Raw)": 2.535299062728882, "Pretrain/Step": 626, "Pretrain/Step Time": 8.429069064557552} +{"Pretrain/Learning Rate": 4.9998909711140895e-05, "Pretrain/Loss": 2.177368640899658, "Pretrain/Loss (Raw)": 2.2343215942382812, "Pretrain/Step": 627, "Pretrain/Step Time": 8.426733367145061} +{"Pretrain/Learning Rate": 4.9998869704148696e-05, "Pretrain/Loss": 2.179286479949951, "Pretrain/Loss (Raw)": 2.2575228214263916, "Pretrain/Step": 628, "Pretrain/Step Time": 8.425922883674502} +{"Pretrain/Learning Rate": 4.999882897633171e-05, "Pretrain/Loss": 2.179643154144287, "Pretrain/Loss (Raw)": 2.006521463394165, "Pretrain/Step": 629, "Pretrain/Step Time": 8.430025935173035} +{"Pretrain/Learning Rate": 4.999878752769111e-05, "Pretrain/Loss": 2.178640365600586, "Pretrain/Loss (Raw)": 1.987654209136963, "Pretrain/Step": 630, "Pretrain/Step Time": 8.42551133222878} +{"Pretrain/Learning Rate": 4.999874535822809e-05, "Pretrain/Loss": 2.178950071334839, "Pretrain/Loss (Raw)": 2.1114957332611084, "Pretrain/Step": 631, "Pretrain/Step Time": 8.427413629367948} +{"Pretrain/Learning Rate": 4.999870246794388e-05, "Pretrain/Loss": 2.174361228942871, "Pretrain/Loss (Raw)": 2.2291808128356934, "Pretrain/Step": 632, "Pretrain/Step Time": 8.42579641006887} +{"Pretrain/Learning Rate": 4.999865885683971e-05, "Pretrain/Loss": 2.174595355987549, "Pretrain/Loss (Raw)": 2.165572166442871, "Pretrain/Step": 633, "Pretrain/Step Time": 8.425309341400862} +{"Pretrain/Learning Rate": 4.9998614524916825e-05, "Pretrain/Loss": 2.1756274700164795, "Pretrain/Loss (Raw)": 2.1734676361083984, "Pretrain/Step": 634, "Pretrain/Step Time": 8.429216027259827} +{"Pretrain/Learning Rate": 4.999856947217651e-05, "Pretrain/Loss": 2.1740870475769043, "Pretrain/Loss (Raw)": 2.036358118057251, "Pretrain/Step": 635, "Pretrain/Step Time": 8.428934948518872} +{"Pretrain/Learning Rate": 4.999852369862008e-05, "Pretrain/Loss": 2.173274278640747, "Pretrain/Loss (Raw)": 2.023477077484131, "Pretrain/Step": 636, "Pretrain/Step Time": 8.428080264478922} +{"Pretrain/Learning Rate": 4.999847720424884e-05, "Pretrain/Loss": 2.172180414199829, "Pretrain/Loss (Raw)": 2.1116907596588135, "Pretrain/Step": 637, "Pretrain/Step Time": 8.430804286152124} +{"Pretrain/Learning Rate": 4.999842998906412e-05, "Pretrain/Loss": 2.1731839179992676, "Pretrain/Loss (Raw)": 2.326470375061035, "Pretrain/Step": 638, "Pretrain/Step Time": 8.428865864872932} +{"Pretrain/Learning Rate": 4.999838205306731e-05, "Pretrain/Loss": 2.1724436283111572, "Pretrain/Loss (Raw)": 2.144702911376953, "Pretrain/Step": 639, "Pretrain/Step Time": 8.43181856162846} +{"Pretrain/Learning Rate": 4.999833339625977e-05, "Pretrain/Loss": 2.176096200942993, "Pretrain/Loss (Raw)": 2.5233914852142334, "Pretrain/Step": 640, "Pretrain/Step Time": 8.436137383803725} +{"Pretrain/Learning Rate": 4.9998284018642905e-05, "Pretrain/Loss": 2.178054094314575, "Pretrain/Loss (Raw)": 2.102525472640991, "Pretrain/Step": 641, "Pretrain/Step Time": 8.435036435723305} +{"Pretrain/Learning Rate": 4.999823392021815e-05, "Pretrain/Loss": 2.1797380447387695, "Pretrain/Loss (Raw)": 2.254591226577759, "Pretrain/Step": 642, "Pretrain/Step Time": 8.434557534754276} +{"Pretrain/Learning Rate": 4.999818310098693e-05, "Pretrain/Loss": 2.1767959594726562, "Pretrain/Loss (Raw)": 2.1905994415283203, "Pretrain/Step": 643, "Pretrain/Step Time": 8.43400995992124} +{"Pretrain/Learning Rate": 4.999813156095074e-05, "Pretrain/Loss": 2.1764838695526123, "Pretrain/Loss (Raw)": 2.153954267501831, "Pretrain/Step": 644, "Pretrain/Step Time": 8.431544875726104} +{"Pretrain/Learning Rate": 4.999807930011103e-05, "Pretrain/Loss": 2.1768267154693604, "Pretrain/Loss (Raw)": 2.1364998817443848, "Pretrain/Step": 645, "Pretrain/Step Time": 8.427332865074277} +{"Pretrain/Learning Rate": 4.999802631846934e-05, "Pretrain/Loss": 2.1778972148895264, "Pretrain/Loss (Raw)": 2.202202081680298, "Pretrain/Step": 646, "Pretrain/Step Time": 8.424153938889503} +{"Pretrain/Learning Rate": 4.9997972616027176e-05, "Pretrain/Loss": 2.1786417961120605, "Pretrain/Loss (Raw)": 2.1680727005004883, "Pretrain/Step": 647, "Pretrain/Step Time": 8.430932821705937} +{"Pretrain/Learning Rate": 4.99979181927861e-05, "Pretrain/Loss": 2.179553985595703, "Pretrain/Loss (Raw)": 2.0983779430389404, "Pretrain/Step": 648, "Pretrain/Step Time": 8.431645596399903} +{"Pretrain/Learning Rate": 4.999786304874767e-05, "Pretrain/Loss": 2.1800971031188965, "Pretrain/Loss (Raw)": 2.242046594619751, "Pretrain/Step": 649, "Pretrain/Step Time": 8.427619693800807} +{"Pretrain/Learning Rate": 4.999780718391349e-05, "Pretrain/Loss": 2.179389476776123, "Pretrain/Loss (Raw)": 2.14739727973938, "Pretrain/Step": 650, "Pretrain/Step Time": 8.425088420510292} +{"Pretrain/Learning Rate": 4.9997750598285155e-05, "Pretrain/Loss": 2.178701877593994, "Pretrain/Loss (Raw)": 2.1030216217041016, "Pretrain/Step": 651, "Pretrain/Step Time": 8.418724086135626} +{"Pretrain/Learning Rate": 4.999769329186431e-05, "Pretrain/Loss": 2.1808197498321533, "Pretrain/Loss (Raw)": 2.371631622314453, "Pretrain/Step": 652, "Pretrain/Step Time": 8.41791963018477} +{"Pretrain/Learning Rate": 4.999763526465259e-05, "Pretrain/Loss": 2.18053936958313, "Pretrain/Loss (Raw)": 2.170403480529785, "Pretrain/Step": 653, "Pretrain/Step Time": 8.419622454792261} +{"Pretrain/Learning Rate": 4.999757651665169e-05, "Pretrain/Loss": 2.180853843688965, "Pretrain/Loss (Raw)": 2.1347944736480713, "Pretrain/Step": 654, "Pretrain/Step Time": 8.42558722384274} +{"Pretrain/Learning Rate": 4.999751704786329e-05, "Pretrain/Loss": 2.1808202266693115, "Pretrain/Loss (Raw)": 2.1353824138641357, "Pretrain/Step": 655, "Pretrain/Step Time": 8.425434252247214} +{"Pretrain/Learning Rate": 4.9997456858289104e-05, "Pretrain/Loss": 2.180894374847412, "Pretrain/Loss (Raw)": 2.1773674488067627, "Pretrain/Step": 656, "Pretrain/Step Time": 8.428381346166134} +{"Pretrain/Learning Rate": 4.999739594793087e-05, "Pretrain/Loss": 2.182741641998291, "Pretrain/Loss (Raw)": 2.194664716720581, "Pretrain/Step": 657, "Pretrain/Step Time": 8.430826527997851} +{"Pretrain/Learning Rate": 4.999733431679036e-05, "Pretrain/Loss": 2.182821035385132, "Pretrain/Loss (Raw)": 2.19044828414917, "Pretrain/Step": 658, "Pretrain/Step Time": 8.427166182547808} +{"Pretrain/Learning Rate": 4.999727196486932e-05, "Pretrain/Loss": 2.184603691101074, "Pretrain/Loss (Raw)": 2.1920149326324463, "Pretrain/Step": 659, "Pretrain/Step Time": 8.426647879183292} +{"Pretrain/Learning Rate": 4.999720889216957e-05, "Pretrain/Loss": 2.1866869926452637, "Pretrain/Loss (Raw)": 2.203730583190918, "Pretrain/Step": 660, "Pretrain/Step Time": 8.42840670235455} +{"Pretrain/Learning Rate": 4.9997145098692924e-05, "Pretrain/Loss": 2.1859636306762695, "Pretrain/Loss (Raw)": 2.2172701358795166, "Pretrain/Step": 661, "Pretrain/Step Time": 8.42840639129281} +{"Pretrain/Learning Rate": 4.999708058444122e-05, "Pretrain/Loss": 2.1886343955993652, "Pretrain/Loss (Raw)": 2.358365535736084, "Pretrain/Step": 662, "Pretrain/Step Time": 8.425436524674296} +{"Pretrain/Learning Rate": 4.999701534941633e-05, "Pretrain/Loss": 2.185866117477417, "Pretrain/Loss (Raw)": 2.0273969173431396, "Pretrain/Step": 663, "Pretrain/Step Time": 8.425194153562188} +{"Pretrain/Learning Rate": 4.999694939362011e-05, "Pretrain/Loss": 2.185657024383545, "Pretrain/Loss (Raw)": 2.1248927116394043, "Pretrain/Step": 664, "Pretrain/Step Time": 8.426458539441228} +{"Pretrain/Learning Rate": 4.999688271705448e-05, "Pretrain/Loss": 2.1862130165100098, "Pretrain/Loss (Raw)": 2.409876585006714, "Pretrain/Step": 665, "Pretrain/Step Time": 8.426835551857948} +{"Pretrain/Learning Rate": 4.9996815319721364e-05, "Pretrain/Loss": 2.1847763061523438, "Pretrain/Loss (Raw)": 1.9549086093902588, "Pretrain/Step": 666, "Pretrain/Step Time": 8.419038152322173} +{"Pretrain/Learning Rate": 4.99967472016227e-05, "Pretrain/Loss": 2.1818201541900635, "Pretrain/Loss (Raw)": 1.75681471824646, "Pretrain/Step": 667, "Pretrain/Step Time": 8.423180738463998} +{"Pretrain/Learning Rate": 4.999667836276044e-05, "Pretrain/Loss": 2.1809864044189453, "Pretrain/Loss (Raw)": 2.070054769515991, "Pretrain/Step": 668, "Pretrain/Step Time": 8.418301349505782} +{"Pretrain/Learning Rate": 4.999660880313659e-05, "Pretrain/Loss": 2.1829638481140137, "Pretrain/Loss (Raw)": 2.2111666202545166, "Pretrain/Step": 669, "Pretrain/Step Time": 8.416285751387477} +{"Pretrain/Learning Rate": 4.9996538522753145e-05, "Pretrain/Loss": 2.18121337890625, "Pretrain/Loss (Raw)": 1.979179859161377, "Pretrain/Step": 670, "Pretrain/Step Time": 8.42313202098012} +{"Pretrain/Learning Rate": 4.9996467521612136e-05, "Pretrain/Loss": 2.1808509826660156, "Pretrain/Loss (Raw)": 2.1867523193359375, "Pretrain/Step": 671, "Pretrain/Step Time": 8.424664633348584} +{"Pretrain/Learning Rate": 4.999639579971561e-05, "Pretrain/Loss": 2.183500051498413, "Pretrain/Loss (Raw)": 2.307995080947876, "Pretrain/Step": 672, "Pretrain/Step Time": 8.426198294386268} +{"Pretrain/Learning Rate": 4.9996323357065625e-05, "Pretrain/Loss": 2.182708263397217, "Pretrain/Loss (Raw)": 2.1427996158599854, "Pretrain/Step": 673, "Pretrain/Step Time": 8.431307908147573} +{"Pretrain/Learning Rate": 4.9996250193664276e-05, "Pretrain/Loss": 2.1816487312316895, "Pretrain/Loss (Raw)": 2.1705219745635986, "Pretrain/Step": 674, "Pretrain/Step Time": 8.429960813373327} +{"Pretrain/Learning Rate": 4.9996176309513674e-05, "Pretrain/Loss": 2.18056583404541, "Pretrain/Loss (Raw)": 2.0230891704559326, "Pretrain/Step": 675, "Pretrain/Step Time": 8.432570345699787} +{"Pretrain/Learning Rate": 4.999610170461596e-05, "Pretrain/Loss": 2.180077314376831, "Pretrain/Loss (Raw)": 2.12785005569458, "Pretrain/Step": 676, "Pretrain/Step Time": 8.426529236137867} +{"Pretrain/Learning Rate": 4.9996026378973266e-05, "Pretrain/Loss": 2.179643154144287, "Pretrain/Loss (Raw)": 2.088793992996216, "Pretrain/Step": 677, "Pretrain/Step Time": 8.425436088815331} +{"Pretrain/Learning Rate": 4.999595033258777e-05, "Pretrain/Loss": 2.180534839630127, "Pretrain/Loss (Raw)": 2.3195998668670654, "Pretrain/Step": 678, "Pretrain/Step Time": 8.424598596990108} +{"Pretrain/Learning Rate": 4.999587356546167e-05, "Pretrain/Loss": 2.1808016300201416, "Pretrain/Loss (Raw)": 2.166971445083618, "Pretrain/Step": 679, "Pretrain/Step Time": 8.423772247508168} +{"Pretrain/Learning Rate": 4.999579607759718e-05, "Pretrain/Loss": 2.179523468017578, "Pretrain/Loss (Raw)": 2.1457183361053467, "Pretrain/Step": 680, "Pretrain/Step Time": 8.426498120650649} +{"Pretrain/Learning Rate": 4.9995717868996525e-05, "Pretrain/Loss": 2.1786680221557617, "Pretrain/Loss (Raw)": 1.9939939975738525, "Pretrain/Step": 681, "Pretrain/Step Time": 8.427693573758006} +{"Pretrain/Learning Rate": 4.9995638939661973e-05, "Pretrain/Loss": 2.178928852081299, "Pretrain/Loss (Raw)": 2.166569232940674, "Pretrain/Step": 682, "Pretrain/Step Time": 8.425838837400079} +{"Pretrain/Learning Rate": 4.999555928959579e-05, "Pretrain/Loss": 2.179216146469116, "Pretrain/Loss (Raw)": 2.2430145740509033, "Pretrain/Step": 683, "Pretrain/Step Time": 8.424214404076338} +{"Pretrain/Learning Rate": 4.999547891880027e-05, "Pretrain/Loss": 2.1757445335388184, "Pretrain/Loss (Raw)": 2.075713872909546, "Pretrain/Step": 684, "Pretrain/Step Time": 8.423364182934165} +{"Pretrain/Learning Rate": 4.9995397827277744e-05, "Pretrain/Loss": 2.1748642921447754, "Pretrain/Loss (Raw)": 2.1121366024017334, "Pretrain/Step": 685, "Pretrain/Step Time": 8.418661443516612} +{"Pretrain/Learning Rate": 4.9995316015030535e-05, "Pretrain/Loss": 2.174666404724121, "Pretrain/Loss (Raw)": 2.2381296157836914, "Pretrain/Step": 686, "Pretrain/Step Time": 8.419257000088692} +{"Pretrain/Learning Rate": 4.999523348206102e-05, "Pretrain/Loss": 2.1778719425201416, "Pretrain/Loss (Raw)": 2.3764541149139404, "Pretrain/Step": 687, "Pretrain/Step Time": 8.426135653629899} +{"Pretrain/Learning Rate": 4.999515022837156e-05, "Pretrain/Loss": 2.1759486198425293, "Pretrain/Loss (Raw)": 2.289355516433716, "Pretrain/Step": 688, "Pretrain/Step Time": 8.428058655932546} +{"Pretrain/Learning Rate": 4.999506625396456e-05, "Pretrain/Loss": 2.1745705604553223, "Pretrain/Loss (Raw)": 2.057858467102051, "Pretrain/Step": 689, "Pretrain/Step Time": 8.426800357177854} +{"Pretrain/Learning Rate": 4.9994981558842455e-05, "Pretrain/Loss": 2.17429780960083, "Pretrain/Loss (Raw)": 2.133862257003784, "Pretrain/Step": 690, "Pretrain/Step Time": 8.429437544196844} +{"Pretrain/Learning Rate": 4.9994896143007676e-05, "Pretrain/Loss": 2.1756834983825684, "Pretrain/Loss (Raw)": 2.179623603820801, "Pretrain/Step": 691, "Pretrain/Step Time": 8.428749743849039} +{"Pretrain/Learning Rate": 4.999481000646268e-05, "Pretrain/Loss": 2.1736135482788086, "Pretrain/Loss (Raw)": 1.925934076309204, "Pretrain/Step": 692, "Pretrain/Step Time": 8.426781240850687} +{"Pretrain/Learning Rate": 4.999472314920996e-05, "Pretrain/Loss": 2.1737613677978516, "Pretrain/Loss (Raw)": 2.1031391620635986, "Pretrain/Step": 693, "Pretrain/Step Time": 8.4258419200778} +{"Pretrain/Learning Rate": 4.9994635571252016e-05, "Pretrain/Loss": 2.1738317012786865, "Pretrain/Loss (Raw)": 2.18984055519104, "Pretrain/Step": 694, "Pretrain/Step Time": 8.421563183888793} +{"Pretrain/Learning Rate": 4.999454727259138e-05, "Pretrain/Loss": 2.171837091445923, "Pretrain/Loss (Raw)": 1.999068021774292, "Pretrain/Step": 695, "Pretrain/Step Time": 8.419806031510234} +{"Pretrain/Learning Rate": 4.999445825323059e-05, "Pretrain/Loss": 2.1697802543640137, "Pretrain/Loss (Raw)": 2.006885051727295, "Pretrain/Step": 696, "Pretrain/Step Time": 8.4213026445359} +{"Pretrain/Learning Rate": 4.999436851317222e-05, "Pretrain/Loss": 2.167285442352295, "Pretrain/Loss (Raw)": 2.0070059299468994, "Pretrain/Step": 697, "Pretrain/Step Time": 8.421811670064926} +{"Pretrain/Learning Rate": 4.9994278052418854e-05, "Pretrain/Loss": 2.1671862602233887, "Pretrain/Loss (Raw)": 2.1106162071228027, "Pretrain/Step": 698, "Pretrain/Step Time": 8.4230942633003} +{"Pretrain/Learning Rate": 4.999418687097309e-05, "Pretrain/Loss": 2.166891574859619, "Pretrain/Loss (Raw)": 2.1133992671966553, "Pretrain/Step": 699, "Pretrain/Step Time": 8.41992305032909} +{"Pretrain/Learning Rate": 4.999409496883758e-05, "Pretrain/Loss": 2.1681182384490967, "Pretrain/Loss (Raw)": 2.1329257488250732, "Pretrain/Step": 700, "Pretrain/Step Time": 8.418082928285003} +{"Pretrain/Learning Rate": 4.999400234601496e-05, "Pretrain/Loss": 2.167846918106079, "Pretrain/Loss (Raw)": 2.237210988998413, "Pretrain/Step": 701, "Pretrain/Step Time": 8.414696596562862} +{"Pretrain/Learning Rate": 4.999390900250789e-05, "Pretrain/Loss": 2.169013738632202, "Pretrain/Loss (Raw)": 2.373129367828369, "Pretrain/Step": 702, "Pretrain/Step Time": 8.410632448270917} +{"Pretrain/Learning Rate": 4.9993814938319085e-05, "Pretrain/Loss": 2.169315814971924, "Pretrain/Loss (Raw)": 2.211308002471924, "Pretrain/Step": 703, "Pretrain/Step Time": 8.4171233586967} +{"Pretrain/Learning Rate": 4.9993720153451243e-05, "Pretrain/Loss": 2.168668746948242, "Pretrain/Loss (Raw)": 2.1374194622039795, "Pretrain/Step": 704, "Pretrain/Step Time": 8.424611052498221} +{"Pretrain/Learning Rate": 4.99936246479071e-05, "Pretrain/Loss": 2.1665754318237305, "Pretrain/Loss (Raw)": 2.0556623935699463, "Pretrain/Step": 705, "Pretrain/Step Time": 8.424653105437756} +{"Pretrain/Learning Rate": 4.999352842168941e-05, "Pretrain/Loss": 2.168419122695923, "Pretrain/Loss (Raw)": 2.019639492034912, "Pretrain/Step": 706, "Pretrain/Step Time": 8.42688418738544} +{"Pretrain/Learning Rate": 4.9993431474800944e-05, "Pretrain/Loss": 2.1665310859680176, "Pretrain/Loss (Raw)": 2.0101280212402344, "Pretrain/Step": 707, "Pretrain/Step Time": 8.424162784591317} +{"Pretrain/Learning Rate": 4.99933338072445e-05, "Pretrain/Loss": 2.167670488357544, "Pretrain/Loss (Raw)": 2.1536474227905273, "Pretrain/Step": 708, "Pretrain/Step Time": 8.42550902813673} +{"Pretrain/Learning Rate": 4.99932354190229e-05, "Pretrain/Loss": 2.1681599617004395, "Pretrain/Loss (Raw)": 2.1822731494903564, "Pretrain/Step": 709, "Pretrain/Step Time": 8.42545123770833} +{"Pretrain/Learning Rate": 4.999313631013897e-05, "Pretrain/Loss": 2.1660921573638916, "Pretrain/Loss (Raw)": 1.9697470664978027, "Pretrain/Step": 710, "Pretrain/Step Time": 8.425101399421692} +{"Pretrain/Learning Rate": 4.999303648059558e-05, "Pretrain/Loss": 2.1652517318725586, "Pretrain/Loss (Raw)": 1.9580090045928955, "Pretrain/Step": 711, "Pretrain/Step Time": 8.423773301765323} +{"Pretrain/Learning Rate": 4.9992935930395595e-05, "Pretrain/Loss": 2.1654248237609863, "Pretrain/Loss (Raw)": 2.083462953567505, "Pretrain/Step": 712, "Pretrain/Step Time": 8.424814196303487} +{"Pretrain/Learning Rate": 4.9992834659541926e-05, "Pretrain/Loss": 2.166883945465088, "Pretrain/Loss (Raw)": 2.331658124923706, "Pretrain/Step": 713, "Pretrain/Step Time": 8.424901464954019} +{"Pretrain/Learning Rate": 4.999273266803749e-05, "Pretrain/Loss": 2.1689372062683105, "Pretrain/Loss (Raw)": 2.358708143234253, "Pretrain/Step": 714, "Pretrain/Step Time": 8.424290023744106} +{"Pretrain/Learning Rate": 4.9992629955885225e-05, "Pretrain/Loss": 2.1705856323242188, "Pretrain/Loss (Raw)": 2.309556484222412, "Pretrain/Step": 715, "Pretrain/Step Time": 8.422658011317253} +{"Pretrain/Learning Rate": 4.999252652308809e-05, "Pretrain/Loss": 2.164970874786377, "Pretrain/Loss (Raw)": 2.0476748943328857, "Pretrain/Step": 716, "Pretrain/Step Time": 8.421716514974833} +{"Pretrain/Learning Rate": 4.9992422369649074e-05, "Pretrain/Loss": 2.164435863494873, "Pretrain/Loss (Raw)": 2.0536916255950928, "Pretrain/Step": 717, "Pretrain/Step Time": 8.410123448818922} +{"Pretrain/Learning Rate": 4.999231749557117e-05, "Pretrain/Loss": 2.1648480892181396, "Pretrain/Loss (Raw)": 2.190321922302246, "Pretrain/Step": 718, "Pretrain/Step Time": 8.409481596201658} +{"Pretrain/Learning Rate": 4.999221190085742e-05, "Pretrain/Loss": 2.1640586853027344, "Pretrain/Loss (Raw)": 2.1064000129699707, "Pretrain/Step": 719, "Pretrain/Step Time": 8.411399913951755} +{"Pretrain/Learning Rate": 4.999210558551086e-05, "Pretrain/Loss": 2.1650586128234863, "Pretrain/Loss (Raw)": 2.196931838989258, "Pretrain/Step": 720, "Pretrain/Step Time": 8.411650579422712} +{"Pretrain/Learning Rate": 4.9991998549534545e-05, "Pretrain/Loss": 2.1639773845672607, "Pretrain/Loss (Raw)": 2.0305893421173096, "Pretrain/Step": 721, "Pretrain/Step Time": 8.41306733340025} +{"Pretrain/Learning Rate": 4.9991890792931575e-05, "Pretrain/Loss": 2.1623640060424805, "Pretrain/Loss (Raw)": 2.1670491695404053, "Pretrain/Step": 722, "Pretrain/Step Time": 8.414003008976579} +{"Pretrain/Learning Rate": 4.999178231570505e-05, "Pretrain/Loss": 2.161194324493408, "Pretrain/Loss (Raw)": 2.1405258178710938, "Pretrain/Step": 723, "Pretrain/Step Time": 8.414414580911398} +{"Pretrain/Learning Rate": 4.99916731178581e-05, "Pretrain/Loss": 2.158735990524292, "Pretrain/Loss (Raw)": 2.1955814361572266, "Pretrain/Step": 724, "Pretrain/Step Time": 8.41756121814251} +{"Pretrain/Learning Rate": 4.9991563199393876e-05, "Pretrain/Loss": 2.1588168144226074, "Pretrain/Loss (Raw)": 2.1226019859313965, "Pretrain/Step": 725, "Pretrain/Step Time": 8.41299607604742} +{"Pretrain/Learning Rate": 4.9991452560315547e-05, "Pretrain/Loss": 2.158191680908203, "Pretrain/Loss (Raw)": 2.1122865676879883, "Pretrain/Step": 726, "Pretrain/Step Time": 8.413394497707486} +{"Pretrain/Learning Rate": 4.9991341200626295e-05, "Pretrain/Loss": 2.159339666366577, "Pretrain/Loss (Raw)": 2.187589406967163, "Pretrain/Step": 727, "Pretrain/Step Time": 8.410627087578177} +{"Pretrain/Learning Rate": 4.999122912032934e-05, "Pretrain/Loss": 2.1566877365112305, "Pretrain/Loss (Raw)": 1.9740864038467407, "Pretrain/Step": 728, "Pretrain/Step Time": 8.411905216053128} +{"Pretrain/Learning Rate": 4.999111631942791e-05, "Pretrain/Loss": 2.1554455757141113, "Pretrain/Loss (Raw)": 1.8335223197937012, "Pretrain/Step": 729, "Pretrain/Step Time": 8.411236710846424} +{"Pretrain/Learning Rate": 4.999100279792526e-05, "Pretrain/Loss": 2.155543327331543, "Pretrain/Loss (Raw)": 2.1612133979797363, "Pretrain/Step": 730, "Pretrain/Step Time": 8.411875205114484} +{"Pretrain/Learning Rate": 4.999088855582466e-05, "Pretrain/Loss": 2.1569435596466064, "Pretrain/Loss (Raw)": 2.1541624069213867, "Pretrain/Step": 731, "Pretrain/Step Time": 8.414096988737583} +{"Pretrain/Learning Rate": 4.99907735931294e-05, "Pretrain/Loss": 2.155973434448242, "Pretrain/Loss (Raw)": 2.0995304584503174, "Pretrain/Step": 732, "Pretrain/Step Time": 8.410499708727002} +{"Pretrain/Learning Rate": 4.999065790984282e-05, "Pretrain/Loss": 2.1564879417419434, "Pretrain/Loss (Raw)": 2.170342206954956, "Pretrain/Step": 733, "Pretrain/Step Time": 8.407851899042726} +{"Pretrain/Learning Rate": 4.999054150596822e-05, "Pretrain/Loss": 2.156068801879883, "Pretrain/Loss (Raw)": 2.225254774093628, "Pretrain/Step": 734, "Pretrain/Step Time": 8.412065839394927} +{"Pretrain/Learning Rate": 4.999042438150898e-05, "Pretrain/Loss": 2.152695417404175, "Pretrain/Loss (Raw)": 2.157123565673828, "Pretrain/Step": 735, "Pretrain/Step Time": 8.412534756585956} +{"Pretrain/Learning Rate": 4.9990306536468464e-05, "Pretrain/Loss": 2.1533451080322266, "Pretrain/Loss (Raw)": 2.289405107498169, "Pretrain/Step": 736, "Pretrain/Step Time": 8.415347253903747} +{"Pretrain/Learning Rate": 4.9990187970850074e-05, "Pretrain/Loss": 2.1552226543426514, "Pretrain/Loss (Raw)": 2.3467798233032227, "Pretrain/Step": 737, "Pretrain/Step Time": 8.416688984259963} +{"Pretrain/Learning Rate": 4.9990068684657246e-05, "Pretrain/Loss": 2.155721664428711, "Pretrain/Loss (Raw)": 2.156303882598877, "Pretrain/Step": 738, "Pretrain/Step Time": 8.417828803882003} +{"Pretrain/Learning Rate": 4.998994867789339e-05, "Pretrain/Loss": 2.158032178878784, "Pretrain/Loss (Raw)": 2.4913413524627686, "Pretrain/Step": 739, "Pretrain/Step Time": 8.415612533688545} +{"Pretrain/Learning Rate": 4.9989827950561984e-05, "Pretrain/Loss": 2.1553149223327637, "Pretrain/Loss (Raw)": 2.0357322692871094, "Pretrain/Step": 740, "Pretrain/Step Time": 8.414987774565816} +{"Pretrain/Learning Rate": 4.998970650266651e-05, "Pretrain/Loss": 2.1570229530334473, "Pretrain/Loss (Raw)": 2.311042308807373, "Pretrain/Step": 741, "Pretrain/Step Time": 8.412902051582932} +{"Pretrain/Learning Rate": 4.998958433421046e-05, "Pretrain/Loss": 2.1566720008850098, "Pretrain/Loss (Raw)": 2.202301025390625, "Pretrain/Step": 742, "Pretrain/Step Time": 8.412891952320933} +{"Pretrain/Learning Rate": 4.998946144519736e-05, "Pretrain/Loss": 2.1592206954956055, "Pretrain/Loss (Raw)": 2.33199405670166, "Pretrain/Step": 743, "Pretrain/Step Time": 8.411557516083121} +{"Pretrain/Learning Rate": 4.998933783563076e-05, "Pretrain/Loss": 2.1623425483703613, "Pretrain/Loss (Raw)": 2.2039878368377686, "Pretrain/Step": 744, "Pretrain/Step Time": 8.409740384668112} +{"Pretrain/Learning Rate": 4.998921350551422e-05, "Pretrain/Loss": 2.160688638687134, "Pretrain/Loss (Raw)": 2.196658134460449, "Pretrain/Step": 745, "Pretrain/Step Time": 8.414036372676492} +{"Pretrain/Learning Rate": 4.998908845485133e-05, "Pretrain/Loss": 2.1608071327209473, "Pretrain/Loss (Raw)": 2.0647335052490234, "Pretrain/Step": 746, "Pretrain/Step Time": 8.416171442717314} +{"Pretrain/Learning Rate": 4.998896268364568e-05, "Pretrain/Loss": 2.1618263721466064, "Pretrain/Loss (Raw)": 2.162381649017334, "Pretrain/Step": 747, "Pretrain/Step Time": 8.41086563281715} +{"Pretrain/Learning Rate": 4.9988836191900915e-05, "Pretrain/Loss": 2.161987781524658, "Pretrain/Loss (Raw)": 2.2159500122070312, "Pretrain/Step": 748, "Pretrain/Step Time": 8.408215761184692} +{"Pretrain/Learning Rate": 4.998870897962067e-05, "Pretrain/Loss": 2.161862373352051, "Pretrain/Loss (Raw)": 2.1915483474731445, "Pretrain/Step": 749, "Pretrain/Step Time": 8.409209480509162} +{"Pretrain/Learning Rate": 4.998858104680862e-05, "Pretrain/Loss": 2.1612603664398193, "Pretrain/Loss (Raw)": 2.03045916557312, "Pretrain/Step": 750, "Pretrain/Step Time": 8.40649888291955} +{"Pretrain/Learning Rate": 4.9988452393468454e-05, "Pretrain/Loss": 2.163022518157959, "Pretrain/Loss (Raw)": 2.340792179107666, "Pretrain/Step": 751, "Pretrain/Step Time": 8.408617403358221} +{"Pretrain/Learning Rate": 4.998832301960387e-05, "Pretrain/Loss": 2.162497043609619, "Pretrain/Loss (Raw)": 2.2906532287597656, "Pretrain/Step": 752, "Pretrain/Step Time": 8.409947687759995} +{"Pretrain/Learning Rate": 4.9988192925218617e-05, "Pretrain/Loss": 2.16011118888855, "Pretrain/Loss (Raw)": 2.2317469120025635, "Pretrain/Step": 753, "Pretrain/Step Time": 8.413759101182222} +{"Pretrain/Learning Rate": 4.998806211031643e-05, "Pretrain/Loss": 2.1615800857543945, "Pretrain/Loss (Raw)": 2.7233166694641113, "Pretrain/Step": 754, "Pretrain/Step Time": 8.414242632687092} +{"Pretrain/Learning Rate": 4.998793057490109e-05, "Pretrain/Loss": 2.163729667663574, "Pretrain/Loss (Raw)": 2.509460687637329, "Pretrain/Step": 755, "Pretrain/Step Time": 8.416496051475406} +{"Pretrain/Learning Rate": 4.998779831897639e-05, "Pretrain/Loss": 2.1625170707702637, "Pretrain/Loss (Raw)": 2.1023247241973877, "Pretrain/Step": 756, "Pretrain/Step Time": 8.415802348405123} +{"Pretrain/Learning Rate": 4.998766534254613e-05, "Pretrain/Loss": 2.1652331352233887, "Pretrain/Loss (Raw)": 2.354140281677246, "Pretrain/Step": 757, "Pretrain/Step Time": 8.41573641076684} +{"Pretrain/Learning Rate": 4.9987531645614164e-05, "Pretrain/Loss": 2.16597318649292, "Pretrain/Loss (Raw)": 2.082418441772461, "Pretrain/Step": 758, "Pretrain/Step Time": 8.41919033229351} +{"Pretrain/Learning Rate": 4.998739722818434e-05, "Pretrain/Loss": 2.1684889793395996, "Pretrain/Loss (Raw)": 2.433502197265625, "Pretrain/Step": 759, "Pretrain/Step Time": 8.41671891324222} +{"Pretrain/Learning Rate": 4.9987262090260526e-05, "Pretrain/Loss": 2.1683101654052734, "Pretrain/Loss (Raw)": 2.206317901611328, "Pretrain/Step": 760, "Pretrain/Step Time": 8.415039939805865} +{"Pretrain/Learning Rate": 4.9987126231846625e-05, "Pretrain/Loss": 2.1681346893310547, "Pretrain/Loss (Raw)": 2.1431081295013428, "Pretrain/Step": 761, "Pretrain/Step Time": 8.418435113504529} +{"Pretrain/Learning Rate": 4.998698965294656e-05, "Pretrain/Loss": 2.1658544540405273, "Pretrain/Loss (Raw)": 1.8815759420394897, "Pretrain/Step": 762, "Pretrain/Step Time": 8.414621617645025} +{"Pretrain/Learning Rate": 4.998685235356426e-05, "Pretrain/Loss": 2.1666576862335205, "Pretrain/Loss (Raw)": 2.1391637325286865, "Pretrain/Step": 763, "Pretrain/Step Time": 8.411958772689104} +{"Pretrain/Learning Rate": 4.9986714333703685e-05, "Pretrain/Loss": 2.167036533355713, "Pretrain/Loss (Raw)": 2.071974992752075, "Pretrain/Step": 764, "Pretrain/Step Time": 8.416775008663535} +{"Pretrain/Learning Rate": 4.998657559336882e-05, "Pretrain/Loss": 2.1670148372650146, "Pretrain/Loss (Raw)": 2.1089112758636475, "Pretrain/Step": 765, "Pretrain/Step Time": 8.413918616250157} +{"Pretrain/Learning Rate": 4.9986436132563656e-05, "Pretrain/Loss": 2.1646971702575684, "Pretrain/Loss (Raw)": 2.0298125743865967, "Pretrain/Step": 766, "Pretrain/Step Time": 8.412903813645244} +{"Pretrain/Learning Rate": 4.9986295951292226e-05, "Pretrain/Loss": 2.1641697883605957, "Pretrain/Loss (Raw)": 2.0771844387054443, "Pretrain/Step": 767, "Pretrain/Step Time": 8.415301661938429} +{"Pretrain/Learning Rate": 4.9986155049558566e-05, "Pretrain/Loss": 2.161123037338257, "Pretrain/Loss (Raw)": 2.1334316730499268, "Pretrain/Step": 768, "Pretrain/Step Time": 8.418065583333373} +{"Pretrain/Learning Rate": 4.9986013427366734e-05, "Pretrain/Loss": 2.1615400314331055, "Pretrain/Loss (Raw)": 2.1558926105499268, "Pretrain/Step": 769, "Pretrain/Step Time": 8.419415928423405} +{"Pretrain/Learning Rate": 4.9985871084720824e-05, "Pretrain/Loss": 2.160008430480957, "Pretrain/Loss (Raw)": 2.058558702468872, "Pretrain/Step": 770, "Pretrain/Step Time": 8.420278958976269} +{"Pretrain/Learning Rate": 4.9985728021624936e-05, "Pretrain/Loss": 2.1584126949310303, "Pretrain/Loss (Raw)": 1.986318826675415, "Pretrain/Step": 771, "Pretrain/Step Time": 8.419000197201967} +{"Pretrain/Learning Rate": 4.998558423808319e-05, "Pretrain/Loss": 2.1570608615875244, "Pretrain/Loss (Raw)": 1.9809305667877197, "Pretrain/Step": 772, "Pretrain/Step Time": 8.420457931235433} +{"Pretrain/Learning Rate": 4.9985439734099736e-05, "Pretrain/Loss": 2.15704345703125, "Pretrain/Loss (Raw)": 2.1342525482177734, "Pretrain/Step": 773, "Pretrain/Step Time": 8.422261429950595} +{"Pretrain/Learning Rate": 4.9985294509678746e-05, "Pretrain/Loss": 2.157097578048706, "Pretrain/Loss (Raw)": 2.2091565132141113, "Pretrain/Step": 774, "Pretrain/Step Time": 8.422839615494013} +{"Pretrain/Learning Rate": 4.99851485648244e-05, "Pretrain/Loss": 2.157193660736084, "Pretrain/Loss (Raw)": 2.180363178253174, "Pretrain/Step": 775, "Pretrain/Step Time": 8.418348645791411} +{"Pretrain/Learning Rate": 4.9985001899540905e-05, "Pretrain/Loss": 2.1558618545532227, "Pretrain/Loss (Raw)": 1.9279303550720215, "Pretrain/Step": 776, "Pretrain/Step Time": 8.42148407176137} +{"Pretrain/Learning Rate": 4.99848545138325e-05, "Pretrain/Loss": 2.1573123931884766, "Pretrain/Loss (Raw)": 2.427708864212036, "Pretrain/Step": 777, "Pretrain/Step Time": 8.421738846227527} +{"Pretrain/Learning Rate": 4.998470640770342e-05, "Pretrain/Loss": 2.1572632789611816, "Pretrain/Loss (Raw)": 2.1411101818084717, "Pretrain/Step": 778, "Pretrain/Step Time": 8.4212600402534} +{"Pretrain/Learning Rate": 4.998455758115795e-05, "Pretrain/Loss": 2.1562914848327637, "Pretrain/Loss (Raw)": 1.978609561920166, "Pretrain/Step": 779, "Pretrain/Step Time": 8.420483455061913} +{"Pretrain/Learning Rate": 4.998440803420037e-05, "Pretrain/Loss": 2.1550416946411133, "Pretrain/Loss (Raw)": 2.2116622924804688, "Pretrain/Step": 780, "Pretrain/Step Time": 8.422838198021054} +{"Pretrain/Learning Rate": 4.9984257766835005e-05, "Pretrain/Loss": 2.1543710231781006, "Pretrain/Loss (Raw)": 2.084562301635742, "Pretrain/Step": 781, "Pretrain/Step Time": 8.420944564044476} +{"Pretrain/Learning Rate": 4.9984106779066174e-05, "Pretrain/Loss": 2.153451442718506, "Pretrain/Loss (Raw)": 2.017094135284424, "Pretrain/Step": 782, "Pretrain/Step Time": 8.417650043964386} +{"Pretrain/Learning Rate": 4.9983955070898235e-05, "Pretrain/Loss": 2.154839515686035, "Pretrain/Loss (Raw)": 2.3130626678466797, "Pretrain/Step": 783, "Pretrain/Step Time": 8.419222213327885} +{"Pretrain/Learning Rate": 4.998380264233557e-05, "Pretrain/Loss": 2.1546688079833984, "Pretrain/Loss (Raw)": 2.155515193939209, "Pretrain/Step": 784, "Pretrain/Step Time": 8.423877384513617} +{"Pretrain/Learning Rate": 4.9983649493382564e-05, "Pretrain/Loss": 2.1547460556030273, "Pretrain/Loss (Raw)": 2.2045352458953857, "Pretrain/Step": 785, "Pretrain/Step Time": 8.42374648526311} +{"Pretrain/Learning Rate": 4.998349562404364e-05, "Pretrain/Loss": 2.1539721488952637, "Pretrain/Loss (Raw)": 2.091404438018799, "Pretrain/Step": 786, "Pretrain/Step Time": 8.426812646910548} +{"Pretrain/Learning Rate": 4.998334103432323e-05, "Pretrain/Loss": 2.1517789363861084, "Pretrain/Loss (Raw)": 1.9112608432769775, "Pretrain/Step": 787, "Pretrain/Step Time": 8.428535846993327} +{"Pretrain/Learning Rate": 4.998318572422579e-05, "Pretrain/Loss": 2.1460633277893066, "Pretrain/Loss (Raw)": 1.4721482992172241, "Pretrain/Step": 788, "Pretrain/Step Time": 8.42690620943904} +{"Pretrain/Learning Rate": 4.9983029693755815e-05, "Pretrain/Loss": 2.145246982574463, "Pretrain/Loss (Raw)": 2.1127772331237793, "Pretrain/Step": 789, "Pretrain/Step Time": 8.428175562992692} +{"Pretrain/Learning Rate": 4.998287294291778e-05, "Pretrain/Loss": 2.144056797027588, "Pretrain/Loss (Raw)": 2.2060019969940186, "Pretrain/Step": 790, "Pretrain/Step Time": 8.428319146856666} +{"Pretrain/Learning Rate": 4.998271547171621e-05, "Pretrain/Loss": 2.14505672454834, "Pretrain/Loss (Raw)": 2.1553964614868164, "Pretrain/Step": 791, "Pretrain/Step Time": 8.427623476833105} +{"Pretrain/Learning Rate": 4.998255728015566e-05, "Pretrain/Loss": 2.1443185806274414, "Pretrain/Loss (Raw)": 2.030421018600464, "Pretrain/Step": 792, "Pretrain/Step Time": 8.428395595401525} +{"Pretrain/Learning Rate": 4.998239836824068e-05, "Pretrain/Loss": 2.1417675018310547, "Pretrain/Loss (Raw)": 2.0833141803741455, "Pretrain/Step": 793, "Pretrain/Step Time": 8.428683750331402} +{"Pretrain/Learning Rate": 4.998223873597586e-05, "Pretrain/Loss": 2.1418473720550537, "Pretrain/Loss (Raw)": 1.9651354551315308, "Pretrain/Step": 794, "Pretrain/Step Time": 8.431880816817284} +{"Pretrain/Learning Rate": 4.998207838336579e-05, "Pretrain/Loss": 2.144386053085327, "Pretrain/Loss (Raw)": 2.0817816257476807, "Pretrain/Step": 795, "Pretrain/Step Time": 8.427293365821242} +{"Pretrain/Learning Rate": 4.998191731041511e-05, "Pretrain/Loss": 2.145430326461792, "Pretrain/Loss (Raw)": 2.203716516494751, "Pretrain/Step": 796, "Pretrain/Step Time": 8.429756201803684} +{"Pretrain/Learning Rate": 4.9981755517128434e-05, "Pretrain/Loss": 2.143862724304199, "Pretrain/Loss (Raw)": 2.0105462074279785, "Pretrain/Step": 797, "Pretrain/Step Time": 8.4312663115561} +{"Pretrain/Learning Rate": 4.998159300351047e-05, "Pretrain/Loss": 2.144855499267578, "Pretrain/Loss (Raw)": 2.106227397918701, "Pretrain/Step": 798, "Pretrain/Step Time": 8.427762674167752} +{"Pretrain/Learning Rate": 4.998142976956588e-05, "Pretrain/Loss": 2.144498348236084, "Pretrain/Loss (Raw)": 2.1410393714904785, "Pretrain/Step": 799, "Pretrain/Step Time": 8.42796166613698} +{"Pretrain/Learning Rate": 4.998126581529936e-05, "Pretrain/Loss": 2.1426711082458496, "Pretrain/Loss (Raw)": 2.0741097927093506, "Pretrain/Step": 800, "Pretrain/Step Time": 8.427824784070253} +{"Pretrain/Learning Rate": 4.9981101140715663e-05, "Pretrain/Loss": 2.1431493759155273, "Pretrain/Loss (Raw)": 2.2040066719055176, "Pretrain/Step": 801, "Pretrain/Step Time": 8.427579052746296} +{"Pretrain/Learning Rate": 4.998093574581953e-05, "Pretrain/Loss": 2.142578601837158, "Pretrain/Loss (Raw)": 2.097485303878784, "Pretrain/Step": 802, "Pretrain/Step Time": 8.437077708542347} +{"Pretrain/Learning Rate": 4.998076963061571e-05, "Pretrain/Loss": 2.1450185775756836, "Pretrain/Loss (Raw)": 2.3353631496429443, "Pretrain/Step": 803, "Pretrain/Step Time": 8.43245454877615} +{"Pretrain/Learning Rate": 4.9980602795109014e-05, "Pretrain/Loss": 2.1441802978515625, "Pretrain/Loss (Raw)": 2.0205790996551514, "Pretrain/Step": 804, "Pretrain/Step Time": 8.434045860543847} +{"Pretrain/Learning Rate": 4.9980435239304245e-05, "Pretrain/Loss": 2.1457343101501465, "Pretrain/Loss (Raw)": 2.2877163887023926, "Pretrain/Step": 805, "Pretrain/Step Time": 8.436127444729209} +{"Pretrain/Learning Rate": 4.998026696320625e-05, "Pretrain/Loss": 2.14437198638916, "Pretrain/Loss (Raw)": 2.145188331604004, "Pretrain/Step": 806, "Pretrain/Step Time": 8.437860367819667} +{"Pretrain/Learning Rate": 4.998009796681985e-05, "Pretrain/Loss": 2.1444592475891113, "Pretrain/Loss (Raw)": 2.1781344413757324, "Pretrain/Step": 807, "Pretrain/Step Time": 8.441039009019732} +{"Pretrain/Learning Rate": 4.9979928250149946e-05, "Pretrain/Loss": 2.145664691925049, "Pretrain/Loss (Raw)": 2.300053834915161, "Pretrain/Step": 808, "Pretrain/Step Time": 8.437191674485803} +{"Pretrain/Learning Rate": 4.997975781320141e-05, "Pretrain/Loss": 2.1473939418792725, "Pretrain/Loss (Raw)": 2.2153284549713135, "Pretrain/Step": 809, "Pretrain/Step Time": 8.44076131656766} +{"Pretrain/Learning Rate": 4.997958665597917e-05, "Pretrain/Loss": 2.1471590995788574, "Pretrain/Loss (Raw)": 2.1364705562591553, "Pretrain/Step": 810, "Pretrain/Step Time": 8.435128791257739} +{"Pretrain/Learning Rate": 4.9979414778488164e-05, "Pretrain/Loss": 2.146617889404297, "Pretrain/Loss (Raw)": 2.1737802028656006, "Pretrain/Step": 811, "Pretrain/Step Time": 8.439768584445119} +{"Pretrain/Learning Rate": 4.997924218073334e-05, "Pretrain/Loss": 2.149674654006958, "Pretrain/Loss (Raw)": 2.466984748840332, "Pretrain/Step": 812, "Pretrain/Step Time": 8.439701499417424} +{"Pretrain/Learning Rate": 4.997906886271967e-05, "Pretrain/Loss": 2.1492156982421875, "Pretrain/Loss (Raw)": 2.0533950328826904, "Pretrain/Step": 813, "Pretrain/Step Time": 8.44284214451909} +{"Pretrain/Learning Rate": 4.997889482445217e-05, "Pretrain/Loss": 2.1494812965393066, "Pretrain/Loss (Raw)": 2.2721314430236816, "Pretrain/Step": 814, "Pretrain/Step Time": 8.441418861970305} +{"Pretrain/Learning Rate": 4.9978720065935834e-05, "Pretrain/Loss": 2.146775960922241, "Pretrain/Loss (Raw)": 2.030172109603882, "Pretrain/Step": 815, "Pretrain/Step Time": 8.44194820150733} +{"Pretrain/Learning Rate": 4.9978544587175724e-05, "Pretrain/Loss": 2.1470847129821777, "Pretrain/Loss (Raw)": 2.328860282897949, "Pretrain/Step": 816, "Pretrain/Step Time": 8.440524503588676} +{"Pretrain/Learning Rate": 4.9978368388176885e-05, "Pretrain/Loss": 2.1479926109313965, "Pretrain/Loss (Raw)": 2.174057722091675, "Pretrain/Step": 817, "Pretrain/Step Time": 8.443845957517624} +{"Pretrain/Learning Rate": 4.99781914689444e-05, "Pretrain/Loss": 2.1499791145324707, "Pretrain/Loss (Raw)": 2.388162851333618, "Pretrain/Step": 818, "Pretrain/Step Time": 8.445744201540947} +{"Pretrain/Learning Rate": 4.9978013829483384e-05, "Pretrain/Loss": 2.1501379013061523, "Pretrain/Loss (Raw)": 2.199920654296875, "Pretrain/Step": 819, "Pretrain/Step Time": 8.448295028880239} +{"Pretrain/Learning Rate": 4.9977835469798933e-05, "Pretrain/Loss": 2.1538774967193604, "Pretrain/Loss (Raw)": 2.4046220779418945, "Pretrain/Step": 820, "Pretrain/Step Time": 8.448108488693833} +{"Pretrain/Learning Rate": 4.997765638989621e-05, "Pretrain/Loss": 2.155461311340332, "Pretrain/Loss (Raw)": 2.305859327316284, "Pretrain/Step": 821, "Pretrain/Step Time": 8.450706381350756} +{"Pretrain/Learning Rate": 4.9977476589780376e-05, "Pretrain/Loss": 2.154602289199829, "Pretrain/Loss (Raw)": 2.0798802375793457, "Pretrain/Step": 822, "Pretrain/Step Time": 8.452723167836666} +{"Pretrain/Learning Rate": 4.9977296069456616e-05, "Pretrain/Loss": 2.15746808052063, "Pretrain/Loss (Raw)": 2.365882396697998, "Pretrain/Step": 823, "Pretrain/Step Time": 8.456182925030589} +{"Pretrain/Learning Rate": 4.997711482893012e-05, "Pretrain/Loss": 2.1588096618652344, "Pretrain/Loss (Raw)": 2.178612232208252, "Pretrain/Step": 824, "Pretrain/Step Time": 8.456200895830989} +{"Pretrain/Learning Rate": 4.997693286820613e-05, "Pretrain/Loss": 2.1607351303100586, "Pretrain/Loss (Raw)": 2.2534430027008057, "Pretrain/Step": 825, "Pretrain/Step Time": 8.46509718336165} +{"Pretrain/Learning Rate": 4.997675018728989e-05, "Pretrain/Loss": 2.1607322692871094, "Pretrain/Loss (Raw)": 2.11027455329895, "Pretrain/Step": 826, "Pretrain/Step Time": 8.461710108444095} +{"Pretrain/Learning Rate": 4.9976566786186666e-05, "Pretrain/Loss": 2.1638150215148926, "Pretrain/Loss (Raw)": 2.507981300354004, "Pretrain/Step": 827, "Pretrain/Step Time": 8.459940865635872} +{"Pretrain/Learning Rate": 4.997638266490174e-05, "Pretrain/Loss": 2.1636948585510254, "Pretrain/Loss (Raw)": 2.1175599098205566, "Pretrain/Step": 828, "Pretrain/Step Time": 8.460938043892384} +{"Pretrain/Learning Rate": 4.997619782344044e-05, "Pretrain/Loss": 2.1636412143707275, "Pretrain/Loss (Raw)": 2.230332374572754, "Pretrain/Step": 829, "Pretrain/Step Time": 8.456000985577703} +{"Pretrain/Learning Rate": 4.9976012261808075e-05, "Pretrain/Loss": 2.160508632659912, "Pretrain/Loss (Raw)": 1.9721862077713013, "Pretrain/Step": 830, "Pretrain/Step Time": 8.456002376973629} +{"Pretrain/Learning Rate": 4.9975825980010003e-05, "Pretrain/Loss": 2.160142421722412, "Pretrain/Loss (Raw)": 2.1644139289855957, "Pretrain/Step": 831, "Pretrain/Step Time": 8.449249343946576} +{"Pretrain/Learning Rate": 4.99756389780516e-05, "Pretrain/Loss": 2.1609408855438232, "Pretrain/Loss (Raw)": 2.239607572555542, "Pretrain/Step": 832, "Pretrain/Step Time": 8.443407217040658} +{"Pretrain/Learning Rate": 4.997545125593825e-05, "Pretrain/Loss": 2.1607680320739746, "Pretrain/Loss (Raw)": 2.0335421562194824, "Pretrain/Step": 833, "Pretrain/Step Time": 8.44366362132132} +{"Pretrain/Learning Rate": 4.997526281367537e-05, "Pretrain/Loss": 2.1605095863342285, "Pretrain/Loss (Raw)": 1.986554503440857, "Pretrain/Step": 834, "Pretrain/Step Time": 8.442066928371787} +{"Pretrain/Learning Rate": 4.997507365126839e-05, "Pretrain/Loss": 2.161681890487671, "Pretrain/Loss (Raw)": 2.1602115631103516, "Pretrain/Step": 835, "Pretrain/Step Time": 8.444437354803085} +{"Pretrain/Learning Rate": 4.997488376872277e-05, "Pretrain/Loss": 2.1610817909240723, "Pretrain/Loss (Raw)": 2.076852321624756, "Pretrain/Step": 836, "Pretrain/Step Time": 8.443516368046403} +{"Pretrain/Learning Rate": 4.9974693166043986e-05, "Pretrain/Loss": 2.1611831188201904, "Pretrain/Loss (Raw)": 2.195193290710449, "Pretrain/Step": 837, "Pretrain/Step Time": 8.443172739818692} +{"Pretrain/Learning Rate": 4.9974501843237525e-05, "Pretrain/Loss": 2.163398265838623, "Pretrain/Loss (Raw)": 2.2533063888549805, "Pretrain/Step": 838, "Pretrain/Step Time": 8.443578954786062} +{"Pretrain/Learning Rate": 4.9974309800308914e-05, "Pretrain/Loss": 2.163965940475464, "Pretrain/Loss (Raw)": 2.030672073364258, "Pretrain/Step": 839, "Pretrain/Step Time": 8.440145514905453} +{"Pretrain/Learning Rate": 4.997411703726368e-05, "Pretrain/Loss": 2.163329601287842, "Pretrain/Loss (Raw)": 2.002012252807617, "Pretrain/Step": 840, "Pretrain/Step Time": 8.442330764606595} +{"Pretrain/Learning Rate": 4.9973923554107394e-05, "Pretrain/Loss": 2.1628241539001465, "Pretrain/Loss (Raw)": 2.2669458389282227, "Pretrain/Step": 841, "Pretrain/Step Time": 8.439295906573534} +{"Pretrain/Learning Rate": 4.997372935084562e-05, "Pretrain/Loss": 2.161189556121826, "Pretrain/Loss (Raw)": 2.1494812965393066, "Pretrain/Step": 842, "Pretrain/Step Time": 8.443021219223738} +{"Pretrain/Learning Rate": 4.997353442748397e-05, "Pretrain/Loss": 2.1591579914093018, "Pretrain/Loss (Raw)": 2.049520969390869, "Pretrain/Step": 843, "Pretrain/Step Time": 8.445885663852096} +{"Pretrain/Learning Rate": 4.997333878402807e-05, "Pretrain/Loss": 2.1603879928588867, "Pretrain/Loss (Raw)": 2.2051408290863037, "Pretrain/Step": 844, "Pretrain/Step Time": 8.447585631161928} +{"Pretrain/Learning Rate": 4.997314242048353e-05, "Pretrain/Loss": 2.160426616668701, "Pretrain/Loss (Raw)": 2.05859112739563, "Pretrain/Step": 845, "Pretrain/Step Time": 8.4479901753366} +{"Pretrain/Learning Rate": 4.9972945336856045e-05, "Pretrain/Loss": 2.1581687927246094, "Pretrain/Loss (Raw)": 1.9013454914093018, "Pretrain/Step": 846, "Pretrain/Step Time": 8.447650691494346} +{"Pretrain/Learning Rate": 4.997274753315129e-05, "Pretrain/Loss": 2.1589913368225098, "Pretrain/Loss (Raw)": 2.2116847038269043, "Pretrain/Step": 847, "Pretrain/Step Time": 8.444354135543108} +{"Pretrain/Learning Rate": 4.997254900937496e-05, "Pretrain/Loss": 2.1576685905456543, "Pretrain/Loss (Raw)": 2.0276010036468506, "Pretrain/Step": 848, "Pretrain/Step Time": 8.443640878424048} +{"Pretrain/Learning Rate": 4.997234976553278e-05, "Pretrain/Loss": 2.1609578132629395, "Pretrain/Loss (Raw)": 2.4516260623931885, "Pretrain/Step": 849, "Pretrain/Step Time": 8.446440998464823} +{"Pretrain/Learning Rate": 4.997214980163051e-05, "Pretrain/Loss": 2.1601898670196533, "Pretrain/Loss (Raw)": 2.0687501430511475, "Pretrain/Step": 850, "Pretrain/Step Time": 8.447822520509362} +{"Pretrain/Learning Rate": 4.9971949117673885e-05, "Pretrain/Loss": 2.1600594520568848, "Pretrain/Loss (Raw)": 2.1238291263580322, "Pretrain/Step": 851, "Pretrain/Step Time": 8.451933866366744} +{"Pretrain/Learning Rate": 4.9971747713668724e-05, "Pretrain/Loss": 2.1589431762695312, "Pretrain/Loss (Raw)": 2.0527117252349854, "Pretrain/Step": 852, "Pretrain/Step Time": 8.451587030664086} +{"Pretrain/Learning Rate": 4.9971545589620824e-05, "Pretrain/Loss": 2.1605587005615234, "Pretrain/Loss (Raw)": 2.3293731212615967, "Pretrain/Step": 853, "Pretrain/Step Time": 8.454540353268385} +{"Pretrain/Learning Rate": 4.997134274553601e-05, "Pretrain/Loss": 2.1595566272735596, "Pretrain/Loss (Raw)": 1.9840480089187622, "Pretrain/Step": 854, "Pretrain/Step Time": 8.45374651812017} +{"Pretrain/Learning Rate": 4.997113918142013e-05, "Pretrain/Loss": 2.158205270767212, "Pretrain/Loss (Raw)": 2.014594078063965, "Pretrain/Step": 855, "Pretrain/Step Time": 8.455132020637393} +{"Pretrain/Learning Rate": 4.9970934897279056e-05, "Pretrain/Loss": 2.1592795848846436, "Pretrain/Loss (Raw)": 2.1115951538085938, "Pretrain/Step": 856, "Pretrain/Step Time": 8.454001044854522} +{"Pretrain/Learning Rate": 4.9970729893118673e-05, "Pretrain/Loss": 2.1611008644104004, "Pretrain/Loss (Raw)": 2.0666494369506836, "Pretrain/Step": 857, "Pretrain/Step Time": 8.453297605738044} +{"Pretrain/Learning Rate": 4.99705241689449e-05, "Pretrain/Loss": 2.161019802093506, "Pretrain/Loss (Raw)": 2.15085768699646, "Pretrain/Step": 858, "Pretrain/Step Time": 8.454020459204912} +{"Pretrain/Learning Rate": 4.9970317724763665e-05, "Pretrain/Loss": 2.1620450019836426, "Pretrain/Loss (Raw)": 2.2853620052337646, "Pretrain/Step": 859, "Pretrain/Step Time": 8.457170594483614} +{"Pretrain/Learning Rate": 4.997011056058092e-05, "Pretrain/Loss": 2.1615357398986816, "Pretrain/Loss (Raw)": 2.0343334674835205, "Pretrain/Step": 860, "Pretrain/Step Time": 8.458913011476398} +{"Pretrain/Learning Rate": 4.996990267640265e-05, "Pretrain/Loss": 2.1614127159118652, "Pretrain/Loss (Raw)": 2.154587984085083, "Pretrain/Step": 861, "Pretrain/Step Time": 8.459428254514933} +{"Pretrain/Learning Rate": 4.996969407223482e-05, "Pretrain/Loss": 2.158318281173706, "Pretrain/Loss (Raw)": 1.8292014598846436, "Pretrain/Step": 862, "Pretrain/Step Time": 8.454305255785584} +{"Pretrain/Learning Rate": 4.996948474808348e-05, "Pretrain/Loss": 2.157472848892212, "Pretrain/Loss (Raw)": 2.0489137172698975, "Pretrain/Step": 863, "Pretrain/Step Time": 8.454786069691181} +{"Pretrain/Learning Rate": 4.996927470395464e-05, "Pretrain/Loss": 2.1546244621276855, "Pretrain/Loss (Raw)": 1.9247790575027466, "Pretrain/Step": 864, "Pretrain/Step Time": 8.450377719476819} +{"Pretrain/Learning Rate": 4.996906393985437e-05, "Pretrain/Loss": 2.1534371376037598, "Pretrain/Loss (Raw)": 2.1948232650756836, "Pretrain/Step": 865, "Pretrain/Step Time": 8.450021823868155} +{"Pretrain/Learning Rate": 4.9968852455788745e-05, "Pretrain/Loss": 2.1547913551330566, "Pretrain/Loss (Raw)": 2.329633951187134, "Pretrain/Step": 866, "Pretrain/Step Time": 8.453942788764834} +{"Pretrain/Learning Rate": 4.996864025176386e-05, "Pretrain/Loss": 2.1515774726867676, "Pretrain/Loss (Raw)": 2.0799479484558105, "Pretrain/Step": 867, "Pretrain/Step Time": 8.455872824415565} +{"Pretrain/Learning Rate": 4.9968427327785835e-05, "Pretrain/Loss": 2.150571823120117, "Pretrain/Loss (Raw)": 1.9070442914962769, "Pretrain/Step": 868, "Pretrain/Step Time": 8.459394404664636} +{"Pretrain/Learning Rate": 4.996821368386081e-05, "Pretrain/Loss": 2.1490750312805176, "Pretrain/Loss (Raw)": 2.119471311569214, "Pretrain/Step": 869, "Pretrain/Step Time": 8.459475493058562} +{"Pretrain/Learning Rate": 4.996799931999494e-05, "Pretrain/Loss": 2.147982597351074, "Pretrain/Loss (Raw)": 2.0624399185180664, "Pretrain/Step": 870, "Pretrain/Step Time": 8.460193824023008} +{"Pretrain/Learning Rate": 4.9967784236194415e-05, "Pretrain/Loss": 2.1464016437530518, "Pretrain/Loss (Raw)": 2.1296231746673584, "Pretrain/Step": 871, "Pretrain/Step Time": 8.461034506559372} +{"Pretrain/Learning Rate": 4.9967568432465436e-05, "Pretrain/Loss": 2.1459007263183594, "Pretrain/Loss (Raw)": 2.1398673057556152, "Pretrain/Step": 872, "Pretrain/Step Time": 8.458246720954776} +{"Pretrain/Learning Rate": 4.996735190881422e-05, "Pretrain/Loss": 2.146955966949463, "Pretrain/Loss (Raw)": 2.3317484855651855, "Pretrain/Step": 873, "Pretrain/Step Time": 8.452709825709462} +{"Pretrain/Learning Rate": 4.996713466524701e-05, "Pretrain/Loss": 2.146428108215332, "Pretrain/Loss (Raw)": 1.9971717596054077, "Pretrain/Step": 874, "Pretrain/Step Time": 8.45184156857431} +{"Pretrain/Learning Rate": 4.996691670177007e-05, "Pretrain/Loss": 2.1482174396514893, "Pretrain/Loss (Raw)": 2.3914031982421875, "Pretrain/Step": 875, "Pretrain/Step Time": 8.453631687909365} +{"Pretrain/Learning Rate": 4.9966698018389694e-05, "Pretrain/Loss": 2.146021842956543, "Pretrain/Loss (Raw)": 1.934899926185608, "Pretrain/Step": 876, "Pretrain/Step Time": 8.452517788857222} +{"Pretrain/Learning Rate": 4.996647861511218e-05, "Pretrain/Loss": 2.1472768783569336, "Pretrain/Loss (Raw)": 2.352193832397461, "Pretrain/Step": 877, "Pretrain/Step Time": 8.456252733245492} +{"Pretrain/Learning Rate": 4.996625849194385e-05, "Pretrain/Loss": 2.1467676162719727, "Pretrain/Loss (Raw)": 1.9652992486953735, "Pretrain/Step": 878, "Pretrain/Step Time": 8.456050861626863} +{"Pretrain/Learning Rate": 4.996603764889106e-05, "Pretrain/Loss": 2.1458191871643066, "Pretrain/Loss (Raw)": 2.2193825244903564, "Pretrain/Step": 879, "Pretrain/Step Time": 8.451216842979193} +{"Pretrain/Learning Rate": 4.9965816085960175e-05, "Pretrain/Loss": 2.144486665725708, "Pretrain/Loss (Raw)": 2.1200926303863525, "Pretrain/Step": 880, "Pretrain/Step Time": 8.44954453036189} +{"Pretrain/Learning Rate": 4.9965593803157585e-05, "Pretrain/Loss": 2.1442413330078125, "Pretrain/Loss (Raw)": 2.200317621231079, "Pretrain/Step": 881, "Pretrain/Step Time": 8.444918924942613} +{"Pretrain/Learning Rate": 4.99653708004897e-05, "Pretrain/Loss": 2.1394453048706055, "Pretrain/Loss (Raw)": 2.1094446182250977, "Pretrain/Step": 882, "Pretrain/Step Time": 8.44842735491693} +{"Pretrain/Learning Rate": 4.9965147077962934e-05, "Pretrain/Loss": 2.138180732727051, "Pretrain/Loss (Raw)": 2.347606897354126, "Pretrain/Step": 883, "Pretrain/Step Time": 8.44868789613247} +{"Pretrain/Learning Rate": 4.996492263558377e-05, "Pretrain/Loss": 2.1376450061798096, "Pretrain/Loss (Raw)": 2.033735513687134, "Pretrain/Step": 884, "Pretrain/Step Time": 8.450406974181533} +{"Pretrain/Learning Rate": 4.996469747335865e-05, "Pretrain/Loss": 2.1350114345550537, "Pretrain/Loss (Raw)": 2.017069101333618, "Pretrain/Step": 885, "Pretrain/Step Time": 8.448511390015483} +{"Pretrain/Learning Rate": 4.996447159129407e-05, "Pretrain/Loss": 2.1356868743896484, "Pretrain/Loss (Raw)": 2.1688716411590576, "Pretrain/Step": 886, "Pretrain/Step Time": 8.445407526567578} +{"Pretrain/Learning Rate": 4.996424498939656e-05, "Pretrain/Loss": 2.1303906440734863, "Pretrain/Loss (Raw)": 1.7555902004241943, "Pretrain/Step": 887, "Pretrain/Step Time": 8.445869971066713} +{"Pretrain/Learning Rate": 4.996401766767264e-05, "Pretrain/Loss": 2.1300277709960938, "Pretrain/Loss (Raw)": 2.15984845161438, "Pretrain/Step": 888, "Pretrain/Step Time": 8.44596978649497} +{"Pretrain/Learning Rate": 4.996378962612887e-05, "Pretrain/Loss": 2.128176212310791, "Pretrain/Loss (Raw)": 1.9061251878738403, "Pretrain/Step": 889, "Pretrain/Step Time": 8.440614389255643} +{"Pretrain/Learning Rate": 4.996356086477183e-05, "Pretrain/Loss": 2.130890130996704, "Pretrain/Loss (Raw)": 2.2289531230926514, "Pretrain/Step": 890, "Pretrain/Step Time": 8.439970737323165} +{"Pretrain/Learning Rate": 4.9963331383608104e-05, "Pretrain/Loss": 2.1304163932800293, "Pretrain/Loss (Raw)": 2.07848858833313, "Pretrain/Step": 891, "Pretrain/Step Time": 8.444028846919537} +{"Pretrain/Learning Rate": 4.996310118264432e-05, "Pretrain/Loss": 2.1305809020996094, "Pretrain/Loss (Raw)": 2.0930562019348145, "Pretrain/Step": 892, "Pretrain/Step Time": 8.440561724826694} +{"Pretrain/Learning Rate": 4.9962870261887104e-05, "Pretrain/Loss": 2.131103038787842, "Pretrain/Loss (Raw)": 2.1757633686065674, "Pretrain/Step": 893, "Pretrain/Step Time": 8.443460918962955} +{"Pretrain/Learning Rate": 4.9962638621343125e-05, "Pretrain/Loss": 2.1334519386291504, "Pretrain/Loss (Raw)": 2.3304789066314697, "Pretrain/Step": 894, "Pretrain/Step Time": 8.446532318368554} +{"Pretrain/Learning Rate": 4.996240626101907e-05, "Pretrain/Loss": 2.133964776992798, "Pretrain/Loss (Raw)": 2.1428003311157227, "Pretrain/Step": 895, "Pretrain/Step Time": 8.442825304344296} +{"Pretrain/Learning Rate": 4.996217318092161e-05, "Pretrain/Loss": 2.133269786834717, "Pretrain/Loss (Raw)": 2.0444796085357666, "Pretrain/Step": 896, "Pretrain/Step Time": 8.436096323654056} +{"Pretrain/Learning Rate": 4.99619393810575e-05, "Pretrain/Loss": 2.1325836181640625, "Pretrain/Loss (Raw)": 2.0680739879608154, "Pretrain/Step": 897, "Pretrain/Step Time": 8.432615218684077} +{"Pretrain/Learning Rate": 4.996170486143345e-05, "Pretrain/Loss": 2.134965419769287, "Pretrain/Loss (Raw)": 2.363422155380249, "Pretrain/Step": 898, "Pretrain/Step Time": 8.435232561081648} +{"Pretrain/Learning Rate": 4.996146962205625e-05, "Pretrain/Loss": 2.1358044147491455, "Pretrain/Loss (Raw)": 2.0937063694000244, "Pretrain/Step": 899, "Pretrain/Step Time": 8.44247280061245} +{"Pretrain/Learning Rate": 4.996123366293266e-05, "Pretrain/Loss": 2.137111186981201, "Pretrain/Loss (Raw)": 2.148171901702881, "Pretrain/Step": 900, "Pretrain/Step Time": 8.439702451229095} +{"Pretrain/Learning Rate": 4.99609969840695e-05, "Pretrain/Loss": 2.1378703117370605, "Pretrain/Loss (Raw)": 2.2314670085906982, "Pretrain/Step": 901, "Pretrain/Step Time": 8.43821200542152} +{"Pretrain/Learning Rate": 4.996075958547359e-05, "Pretrain/Loss": 2.13682222366333, "Pretrain/Loss (Raw)": 2.0750012397766113, "Pretrain/Step": 902, "Pretrain/Step Time": 8.441059719771147} +{"Pretrain/Learning Rate": 4.9960521467151763e-05, "Pretrain/Loss": 2.136287212371826, "Pretrain/Loss (Raw)": 2.1118526458740234, "Pretrain/Step": 903, "Pretrain/Step Time": 8.44036147557199} +{"Pretrain/Learning Rate": 4.9960282629110913e-05, "Pretrain/Loss": 2.137744665145874, "Pretrain/Loss (Raw)": 2.1145036220550537, "Pretrain/Step": 904, "Pretrain/Step Time": 8.43770145997405} +{"Pretrain/Learning Rate": 4.996004307135789e-05, "Pretrain/Loss": 2.135371685028076, "Pretrain/Loss (Raw)": 2.1239678859710693, "Pretrain/Step": 905, "Pretrain/Step Time": 8.438682343810797} +{"Pretrain/Learning Rate": 4.9959802793899635e-05, "Pretrain/Loss": 2.133660316467285, "Pretrain/Loss (Raw)": 1.9220750331878662, "Pretrain/Step": 906, "Pretrain/Step Time": 8.436098100617528} +{"Pretrain/Learning Rate": 4.995956179674305e-05, "Pretrain/Loss": 2.134542942047119, "Pretrain/Loss (Raw)": 2.0915420055389404, "Pretrain/Step": 907, "Pretrain/Step Time": 8.443175511434674} +{"Pretrain/Learning Rate": 4.9959320079895105e-05, "Pretrain/Loss": 2.1391658782958984, "Pretrain/Loss (Raw)": 2.8033952713012695, "Pretrain/Step": 908, "Pretrain/Step Time": 8.440977009013295} +{"Pretrain/Learning Rate": 4.995907764336276e-05, "Pretrain/Loss": 2.1393771171569824, "Pretrain/Loss (Raw)": 2.1116397380828857, "Pretrain/Step": 909, "Pretrain/Step Time": 8.440791670233011} +{"Pretrain/Learning Rate": 4.995883448715301e-05, "Pretrain/Loss": 2.1420202255249023, "Pretrain/Loss (Raw)": 2.3554069995880127, "Pretrain/Step": 910, "Pretrain/Step Time": 8.440463330596685} +{"Pretrain/Learning Rate": 4.995859061127285e-05, "Pretrain/Loss": 2.1393074989318848, "Pretrain/Loss (Raw)": 1.9658288955688477, "Pretrain/Step": 911, "Pretrain/Step Time": 8.43999619036913} +{"Pretrain/Learning Rate": 4.995834601572933e-05, "Pretrain/Loss": 2.1387178897857666, "Pretrain/Loss (Raw)": 2.0800256729125977, "Pretrain/Step": 912, "Pretrain/Step Time": 8.434422438964248} +{"Pretrain/Learning Rate": 4.99581007005295e-05, "Pretrain/Loss": 2.1377267837524414, "Pretrain/Loss (Raw)": 2.0776760578155518, "Pretrain/Step": 913, "Pretrain/Step Time": 8.429959174245596} +{"Pretrain/Learning Rate": 4.995785466568043e-05, "Pretrain/Loss": 2.138298749923706, "Pretrain/Loss (Raw)": 2.1646158695220947, "Pretrain/Step": 914, "Pretrain/Step Time": 8.42974928766489} +{"Pretrain/Learning Rate": 4.9957607911189205e-05, "Pretrain/Loss": 2.1395421028137207, "Pretrain/Loss (Raw)": 2.07041072845459, "Pretrain/Step": 915, "Pretrain/Step Time": 8.433730319142342} +{"Pretrain/Learning Rate": 4.9957360437062964e-05, "Pretrain/Loss": 2.143897533416748, "Pretrain/Loss (Raw)": 2.029620409011841, "Pretrain/Step": 916, "Pretrain/Step Time": 8.43353440798819} +{"Pretrain/Learning Rate": 4.995711224330882e-05, "Pretrain/Loss": 2.143944025039673, "Pretrain/Loss (Raw)": 2.118753433227539, "Pretrain/Step": 917, "Pretrain/Step Time": 8.431395435705781} +{"Pretrain/Learning Rate": 4.9956863329933944e-05, "Pretrain/Loss": 2.143035411834717, "Pretrain/Loss (Raw)": 2.0896973609924316, "Pretrain/Step": 918, "Pretrain/Step Time": 8.438010478392243} +{"Pretrain/Learning Rate": 4.99566136969455e-05, "Pretrain/Loss": 2.1412127017974854, "Pretrain/Loss (Raw)": 1.922085165977478, "Pretrain/Step": 919, "Pretrain/Step Time": 8.437429368495941} +{"Pretrain/Learning Rate": 4.99563633443507e-05, "Pretrain/Loss": 2.139813184738159, "Pretrain/Loss (Raw)": 1.8512951135635376, "Pretrain/Step": 920, "Pretrain/Step Time": 8.43652674369514} +{"Pretrain/Learning Rate": 4.9956112272156755e-05, "Pretrain/Loss": 2.1398725509643555, "Pretrain/Loss (Raw)": 2.090928792953491, "Pretrain/Step": 921, "Pretrain/Step Time": 8.436987835913897} +{"Pretrain/Learning Rate": 4.995586048037091e-05, "Pretrain/Loss": 2.141897678375244, "Pretrain/Loss (Raw)": 2.2243247032165527, "Pretrain/Step": 922, "Pretrain/Step Time": 8.435277113690972} +{"Pretrain/Learning Rate": 4.9955607969000405e-05, "Pretrain/Loss": 2.1443347930908203, "Pretrain/Loss (Raw)": 2.3937346935272217, "Pretrain/Step": 923, "Pretrain/Step Time": 8.436574965715408} +{"Pretrain/Learning Rate": 4.995535473805255e-05, "Pretrain/Loss": 2.1463429927825928, "Pretrain/Loss (Raw)": 2.4607646465301514, "Pretrain/Step": 924, "Pretrain/Step Time": 8.439896594733} +{"Pretrain/Learning Rate": 4.995510078753463e-05, "Pretrain/Loss": 2.14905047416687, "Pretrain/Loss (Raw)": 2.3571078777313232, "Pretrain/Step": 925, "Pretrain/Step Time": 8.438388543203473} +{"Pretrain/Learning Rate": 4.995484611745398e-05, "Pretrain/Loss": 2.1498537063598633, "Pretrain/Loss (Raw)": 2.2090585231781006, "Pretrain/Step": 926, "Pretrain/Step Time": 8.434898145496845} +{"Pretrain/Learning Rate": 4.9954590727817916e-05, "Pretrain/Loss": 2.1508305072784424, "Pretrain/Loss (Raw)": 2.266054391860962, "Pretrain/Step": 927, "Pretrain/Step Time": 8.43849079683423} +{"Pretrain/Learning Rate": 4.995433461863384e-05, "Pretrain/Loss": 2.150780439376831, "Pretrain/Loss (Raw)": 2.067701578140259, "Pretrain/Step": 928, "Pretrain/Step Time": 8.439671508967876} +{"Pretrain/Learning Rate": 4.99540777899091e-05, "Pretrain/Loss": 2.1499717235565186, "Pretrain/Loss (Raw)": 2.1004931926727295, "Pretrain/Step": 929, "Pretrain/Step Time": 8.434022404253483} +{"Pretrain/Learning Rate": 4.9953820241651125e-05, "Pretrain/Loss": 2.1504454612731934, "Pretrain/Loss (Raw)": 2.158104419708252, "Pretrain/Step": 930, "Pretrain/Step Time": 8.424547595903277} +{"Pretrain/Learning Rate": 4.995356197386734e-05, "Pretrain/Loss": 2.148423194885254, "Pretrain/Loss (Raw)": 2.076514482498169, "Pretrain/Step": 931, "Pretrain/Step Time": 8.429431235417724} +{"Pretrain/Learning Rate": 4.995330298656517e-05, "Pretrain/Loss": 2.151339530944824, "Pretrain/Loss (Raw)": 2.393866777420044, "Pretrain/Step": 932, "Pretrain/Step Time": 8.431791763752699} +{"Pretrain/Learning Rate": 4.995304327975212e-05, "Pretrain/Loss": 2.150585651397705, "Pretrain/Loss (Raw)": 2.191235303878784, "Pretrain/Step": 933, "Pretrain/Step Time": 8.430022517219186} +{"Pretrain/Learning Rate": 4.995278285343564e-05, "Pretrain/Loss": 2.150865077972412, "Pretrain/Loss (Raw)": 2.1809499263763428, "Pretrain/Step": 934, "Pretrain/Step Time": 8.430843418464065} +{"Pretrain/Learning Rate": 4.995252170762327e-05, "Pretrain/Loss": 2.1501693725585938, "Pretrain/Loss (Raw)": 2.0890748500823975, "Pretrain/Step": 935, "Pretrain/Step Time": 8.43187697418034} +{"Pretrain/Learning Rate": 4.9952259842322516e-05, "Pretrain/Loss": 2.1496591567993164, "Pretrain/Loss (Raw)": 2.2347795963287354, "Pretrain/Step": 936, "Pretrain/Step Time": 8.432481426745653} +{"Pretrain/Learning Rate": 4.995199725754095e-05, "Pretrain/Loss": 2.1495919227600098, "Pretrain/Loss (Raw)": 2.2067205905914307, "Pretrain/Step": 937, "Pretrain/Step Time": 8.430585090070963} +{"Pretrain/Learning Rate": 4.995173395328613e-05, "Pretrain/Loss": 2.150674819946289, "Pretrain/Loss (Raw)": 2.275062322616577, "Pretrain/Step": 938, "Pretrain/Step Time": 8.433857386931777} +{"Pretrain/Learning Rate": 4.995146992956565e-05, "Pretrain/Loss": 2.1504480838775635, "Pretrain/Loss (Raw)": 2.1447627544403076, "Pretrain/Step": 939, "Pretrain/Step Time": 8.431665858253837} +{"Pretrain/Learning Rate": 4.9951205186387124e-05, "Pretrain/Loss": 2.148411989212036, "Pretrain/Loss (Raw)": 2.2063591480255127, "Pretrain/Step": 940, "Pretrain/Step Time": 8.43087749928236} +{"Pretrain/Learning Rate": 4.995093972375818e-05, "Pretrain/Loss": 2.1506881713867188, "Pretrain/Loss (Raw)": 2.3447425365448, "Pretrain/Step": 941, "Pretrain/Step Time": 8.432471817359328} +{"Pretrain/Learning Rate": 4.995067354168649e-05, "Pretrain/Loss": 2.1490421295166016, "Pretrain/Loss (Raw)": 2.0614521503448486, "Pretrain/Step": 942, "Pretrain/Step Time": 8.433510964736342} +{"Pretrain/Learning Rate": 4.9950406640179714e-05, "Pretrain/Loss": 2.1497981548309326, "Pretrain/Loss (Raw)": 2.1269407272338867, "Pretrain/Step": 943, "Pretrain/Step Time": 8.42977574467659} +{"Pretrain/Learning Rate": 4.9950139019245545e-05, "Pretrain/Loss": 2.1475822925567627, "Pretrain/Loss (Raw)": 2.045224666595459, "Pretrain/Step": 944, "Pretrain/Step Time": 8.428622398525476} +{"Pretrain/Learning Rate": 4.994987067889171e-05, "Pretrain/Loss": 2.1479148864746094, "Pretrain/Loss (Raw)": 2.216643810272217, "Pretrain/Step": 945, "Pretrain/Step Time": 8.427328614518046} +{"Pretrain/Learning Rate": 4.994960161912594e-05, "Pretrain/Loss": 2.1456732749938965, "Pretrain/Loss (Raw)": 2.101214647293091, "Pretrain/Step": 946, "Pretrain/Step Time": 8.42287409119308} +{"Pretrain/Learning Rate": 4.9949331839956005e-05, "Pretrain/Loss": 2.1437997817993164, "Pretrain/Loss (Raw)": 1.9601248502731323, "Pretrain/Step": 947, "Pretrain/Step Time": 8.421002211049199} +{"Pretrain/Learning Rate": 4.994906134138967e-05, "Pretrain/Loss": 2.143979549407959, "Pretrain/Loss (Raw)": 2.4276247024536133, "Pretrain/Step": 948, "Pretrain/Step Time": 8.42274833098054} +{"Pretrain/Learning Rate": 4.994879012343473e-05, "Pretrain/Loss": 2.1419990062713623, "Pretrain/Loss (Raw)": 2.052356243133545, "Pretrain/Step": 949, "Pretrain/Step Time": 8.422310747206211} +{"Pretrain/Learning Rate": 4.994851818609903e-05, "Pretrain/Loss": 2.1422367095947266, "Pretrain/Loss (Raw)": 2.1102964878082275, "Pretrain/Step": 950, "Pretrain/Step Time": 8.421235494315624} +{"Pretrain/Learning Rate": 4.994824552939038e-05, "Pretrain/Loss": 2.140376091003418, "Pretrain/Loss (Raw)": 2.1277172565460205, "Pretrain/Step": 951, "Pretrain/Step Time": 8.417363710701466} +{"Pretrain/Learning Rate": 4.994797215331667e-05, "Pretrain/Loss": 2.1401243209838867, "Pretrain/Loss (Raw)": 2.1464295387268066, "Pretrain/Step": 952, "Pretrain/Step Time": 8.419678583741188} +{"Pretrain/Learning Rate": 4.994769805788576e-05, "Pretrain/Loss": 2.1397664546966553, "Pretrain/Loss (Raw)": 2.207611322402954, "Pretrain/Step": 953, "Pretrain/Step Time": 8.40755875222385} +{"Pretrain/Learning Rate": 4.9947423243105576e-05, "Pretrain/Loss": 2.1403751373291016, "Pretrain/Loss (Raw)": 2.1881723403930664, "Pretrain/Step": 954, "Pretrain/Step Time": 8.411832781508565} +{"Pretrain/Learning Rate": 4.994714770898402e-05, "Pretrain/Loss": 2.14142107963562, "Pretrain/Loss (Raw)": 2.6418697834014893, "Pretrain/Step": 955, "Pretrain/Step Time": 8.412151189520955} +{"Pretrain/Learning Rate": 4.994687145552904e-05, "Pretrain/Loss": 2.141510009765625, "Pretrain/Loss (Raw)": 2.1289255619049072, "Pretrain/Step": 956, "Pretrain/Step Time": 8.41267086751759} +{"Pretrain/Learning Rate": 4.994659448274862e-05, "Pretrain/Loss": 2.138026237487793, "Pretrain/Loss (Raw)": 1.7844141721725464, "Pretrain/Step": 957, "Pretrain/Step Time": 8.419051321223378} +{"Pretrain/Learning Rate": 4.994631679065073e-05, "Pretrain/Loss": 2.1393203735351562, "Pretrain/Loss (Raw)": 2.1378393173217773, "Pretrain/Step": 958, "Pretrain/Step Time": 8.423528272658587} +{"Pretrain/Learning Rate": 4.9946038379243386e-05, "Pretrain/Loss": 2.1399035453796387, "Pretrain/Loss (Raw)": 2.2390573024749756, "Pretrain/Step": 959, "Pretrain/Step Time": 8.424856722354889} +{"Pretrain/Learning Rate": 4.9945759248534605e-05, "Pretrain/Loss": 2.1377809047698975, "Pretrain/Loss (Raw)": 1.967935562133789, "Pretrain/Step": 960, "Pretrain/Step Time": 8.425589501857758} +{"Pretrain/Learning Rate": 4.9945479398532445e-05, "Pretrain/Loss": 2.138695240020752, "Pretrain/Loss (Raw)": 2.1505537033081055, "Pretrain/Step": 961, "Pretrain/Step Time": 8.425661005079746} +{"Pretrain/Learning Rate": 4.994519882924497e-05, "Pretrain/Loss": 2.137277126312256, "Pretrain/Loss (Raw)": 1.8050590753555298, "Pretrain/Step": 962, "Pretrain/Step Time": 8.426504965871572} +{"Pretrain/Learning Rate": 4.994491754068027e-05, "Pretrain/Loss": 2.137002944946289, "Pretrain/Loss (Raw)": 2.125110387802124, "Pretrain/Step": 963, "Pretrain/Step Time": 8.42794506624341} +{"Pretrain/Learning Rate": 4.9944635532846464e-05, "Pretrain/Loss": 2.1377110481262207, "Pretrain/Loss (Raw)": 2.1674764156341553, "Pretrain/Step": 964, "Pretrain/Step Time": 8.422670153900981} +{"Pretrain/Learning Rate": 4.994435280575167e-05, "Pretrain/Loss": 2.1363754272460938, "Pretrain/Loss (Raw)": 2.02425217628479, "Pretrain/Step": 965, "Pretrain/Step Time": 8.429622955620289} +{"Pretrain/Learning Rate": 4.994406935940405e-05, "Pretrain/Loss": 2.1344761848449707, "Pretrain/Loss (Raw)": 2.010188341140747, "Pretrain/Step": 966, "Pretrain/Step Time": 8.427164169028401} +{"Pretrain/Learning Rate": 4.994378519381178e-05, "Pretrain/Loss": 2.134294271469116, "Pretrain/Loss (Raw)": 2.0073885917663574, "Pretrain/Step": 967, "Pretrain/Step Time": 8.430328913033009} +{"Pretrain/Learning Rate": 4.9943500308983044e-05, "Pretrain/Loss": 2.1345930099487305, "Pretrain/Loss (Raw)": 2.0402562618255615, "Pretrain/Step": 968, "Pretrain/Step Time": 8.428575249388814} +{"Pretrain/Learning Rate": 4.994321470492606e-05, "Pretrain/Loss": 2.1337649822235107, "Pretrain/Loss (Raw)": 2.1609482765197754, "Pretrain/Step": 969, "Pretrain/Step Time": 8.432913513854146} +{"Pretrain/Learning Rate": 4.994292838164907e-05, "Pretrain/Loss": 2.131835460662842, "Pretrain/Loss (Raw)": 1.9025177955627441, "Pretrain/Step": 970, "Pretrain/Step Time": 8.421691849827766} +{"Pretrain/Learning Rate": 4.994264133916031e-05, "Pretrain/Loss": 2.134148597717285, "Pretrain/Loss (Raw)": 2.3455774784088135, "Pretrain/Step": 971, "Pretrain/Step Time": 8.420146381482482} +{"Pretrain/Learning Rate": 4.994235357746808e-05, "Pretrain/Loss": 2.131143093109131, "Pretrain/Loss (Raw)": 1.8204563856124878, "Pretrain/Step": 972, "Pretrain/Step Time": 8.421656042337418} +{"Pretrain/Learning Rate": 4.994206509658067e-05, "Pretrain/Loss": 2.1323723793029785, "Pretrain/Loss (Raw)": 2.2159371376037598, "Pretrain/Step": 973, "Pretrain/Step Time": 8.424003524705768} +{"Pretrain/Learning Rate": 4.994177589650639e-05, "Pretrain/Loss": 2.1348252296447754, "Pretrain/Loss (Raw)": 2.21532940864563, "Pretrain/Step": 974, "Pretrain/Step Time": 8.424782009795308} +{"Pretrain/Learning Rate": 4.9941485977253585e-05, "Pretrain/Loss": 2.1350455284118652, "Pretrain/Loss (Raw)": 2.239854574203491, "Pretrain/Step": 975, "Pretrain/Step Time": 8.425025088712573} +{"Pretrain/Learning Rate": 4.9941195338830616e-05, "Pretrain/Loss": 2.1344141960144043, "Pretrain/Loss (Raw)": 1.946797251701355, "Pretrain/Step": 976, "Pretrain/Step Time": 8.429054321721196} +{"Pretrain/Learning Rate": 4.994090398124586e-05, "Pretrain/Loss": 2.130709648132324, "Pretrain/Loss (Raw)": 1.977471947669983, "Pretrain/Step": 977, "Pretrain/Step Time": 8.424019165337086} +{"Pretrain/Learning Rate": 4.994061190450773e-05, "Pretrain/Loss": 2.1309309005737305, "Pretrain/Loss (Raw)": 2.09702205657959, "Pretrain/Step": 978, "Pretrain/Step Time": 8.422157483175397} +{"Pretrain/Learning Rate": 4.994031910862462e-05, "Pretrain/Loss": 2.131744146347046, "Pretrain/Loss (Raw)": 2.2279374599456787, "Pretrain/Step": 979, "Pretrain/Step Time": 8.419181736186147} +{"Pretrain/Learning Rate": 4.994002559360501e-05, "Pretrain/Loss": 2.132941246032715, "Pretrain/Loss (Raw)": 2.205960988998413, "Pretrain/Step": 980, "Pretrain/Step Time": 8.414084719493985} +{"Pretrain/Learning Rate": 4.9939731359457334e-05, "Pretrain/Loss": 2.1325113773345947, "Pretrain/Loss (Raw)": 2.274353504180908, "Pretrain/Step": 981, "Pretrain/Step Time": 8.41313523054123} +{"Pretrain/Learning Rate": 4.993943640619008e-05, "Pretrain/Loss": 2.1334147453308105, "Pretrain/Loss (Raw)": 2.099669933319092, "Pretrain/Step": 982, "Pretrain/Step Time": 8.416573867201805} +{"Pretrain/Learning Rate": 4.993914073381176e-05, "Pretrain/Loss": 2.1354713439941406, "Pretrain/Loss (Raw)": 2.277827501296997, "Pretrain/Step": 983, "Pretrain/Step Time": 8.415636183694005} +{"Pretrain/Learning Rate": 4.9938844342330904e-05, "Pretrain/Loss": 2.1369175910949707, "Pretrain/Loss (Raw)": 2.296700954437256, "Pretrain/Step": 984, "Pretrain/Step Time": 8.417969964444637} +{"Pretrain/Learning Rate": 4.993854723175605e-05, "Pretrain/Loss": 2.1360890865325928, "Pretrain/Loss (Raw)": 1.9606287479400635, "Pretrain/Step": 985, "Pretrain/Step Time": 8.420472849160433} +{"Pretrain/Learning Rate": 4.9938249402095766e-05, "Pretrain/Loss": 2.13478946685791, "Pretrain/Loss (Raw)": 1.9844884872436523, "Pretrain/Step": 986, "Pretrain/Step Time": 8.419260812923312} +{"Pretrain/Learning Rate": 4.993795085335864e-05, "Pretrain/Loss": 2.1326394081115723, "Pretrain/Loss (Raw)": 2.010175943374634, "Pretrain/Step": 987, "Pretrain/Step Time": 8.41381223499775} +{"Pretrain/Learning Rate": 4.993765158555328e-05, "Pretrain/Loss": 2.13321590423584, "Pretrain/Loss (Raw)": 2.108097791671753, "Pretrain/Step": 988, "Pretrain/Step Time": 8.41191390901804} +{"Pretrain/Learning Rate": 4.993735159868832e-05, "Pretrain/Loss": 2.1322922706604004, "Pretrain/Loss (Raw)": 2.0363996028900146, "Pretrain/Step": 989, "Pretrain/Step Time": 8.409064929932356} +{"Pretrain/Learning Rate": 4.993705089277241e-05, "Pretrain/Loss": 2.134434223175049, "Pretrain/Loss (Raw)": 2.1033427715301514, "Pretrain/Step": 990, "Pretrain/Step Time": 8.412927478551865} +{"Pretrain/Learning Rate": 4.9936749467814216e-05, "Pretrain/Loss": 2.1349949836730957, "Pretrain/Loss (Raw)": 2.1206843852996826, "Pretrain/Step": 991, "Pretrain/Step Time": 8.414114898070693} +{"Pretrain/Learning Rate": 4.9936447323822424e-05, "Pretrain/Loss": 2.1367008686065674, "Pretrain/Loss (Raw)": 2.1431446075439453, "Pretrain/Step": 992, "Pretrain/Step Time": 8.415439181029797} +{"Pretrain/Learning Rate": 4.9936144460805756e-05, "Pretrain/Loss": 2.134026050567627, "Pretrain/Loss (Raw)": 1.8524396419525146, "Pretrain/Step": 993, "Pretrain/Step Time": 8.41522161476314} +{"Pretrain/Learning Rate": 4.993584087877293e-05, "Pretrain/Loss": 2.1321158409118652, "Pretrain/Loss (Raw)": 2.08514666557312, "Pretrain/Step": 994, "Pretrain/Step Time": 8.412155501544476} +{"Pretrain/Learning Rate": 4.993553657773273e-05, "Pretrain/Loss": 2.133941173553467, "Pretrain/Loss (Raw)": 2.313565254211426, "Pretrain/Step": 995, "Pretrain/Step Time": 8.409182071685791} +{"Pretrain/Learning Rate": 4.99352315576939e-05, "Pretrain/Loss": 2.1389284133911133, "Pretrain/Loss (Raw)": 2.5454161167144775, "Pretrain/Step": 996, "Pretrain/Step Time": 8.40796859189868} +{"Pretrain/Learning Rate": 4.993492581866525e-05, "Pretrain/Loss": 2.1391677856445312, "Pretrain/Loss (Raw)": 2.150123119354248, "Pretrain/Step": 997, "Pretrain/Step Time": 8.407916473224759} +{"Pretrain/Learning Rate": 4.993461936065559e-05, "Pretrain/Loss": 2.140042781829834, "Pretrain/Loss (Raw)": 2.174435615539551, "Pretrain/Step": 998, "Pretrain/Step Time": 8.401537138968706} +{"Pretrain/Learning Rate": 4.993431218367376e-05, "Pretrain/Loss": 2.13859486579895, "Pretrain/Loss (Raw)": 1.9442837238311768, "Pretrain/Step": 999, "Pretrain/Step Time": 8.408749632537365} +{"Pretrain/Learning Rate": 4.993400428772861e-05, "Pretrain/Loss": 2.139108657836914, "Pretrain/Loss (Raw)": 2.205627679824829, "Pretrain/Step": 1000, "Pretrain/Step Time": 8.407818142324686} +{"Pretrain/Learning Rate": 4.9933695672829026e-05, "Pretrain/Loss": 2.1393957138061523, "Pretrain/Loss (Raw)": 2.3685154914855957, "Pretrain/Step": 1001, "Pretrain/Step Time": 8.415218867361546} +{"Pretrain/Learning Rate": 4.9933386338983914e-05, "Pretrain/Loss": 2.141122579574585, "Pretrain/Loss (Raw)": 2.2182040214538574, "Pretrain/Step": 1002, "Pretrain/Step Time": 8.411057827994227} +{"Pretrain/Learning Rate": 4.993307628620217e-05, "Pretrain/Loss": 2.1396982669830322, "Pretrain/Loss (Raw)": 2.2090823650360107, "Pretrain/Step": 1003, "Pretrain/Step Time": 8.414011610671878} +{"Pretrain/Learning Rate": 4.993276551449276e-05, "Pretrain/Loss": 2.141667127609253, "Pretrain/Loss (Raw)": 2.186923027038574, "Pretrain/Step": 1004, "Pretrain/Step Time": 8.415726298466325} +{"Pretrain/Learning Rate": 4.993245402386463e-05, "Pretrain/Loss": 2.1405727863311768, "Pretrain/Loss (Raw)": 2.2121286392211914, "Pretrain/Step": 1005, "Pretrain/Step Time": 8.41307358443737} +{"Pretrain/Learning Rate": 4.9932141814326764e-05, "Pretrain/Loss": 2.141050338745117, "Pretrain/Loss (Raw)": 2.0264065265655518, "Pretrain/Step": 1006, "Pretrain/Step Time": 8.413123393431306} +{"Pretrain/Learning Rate": 4.993182888588816e-05, "Pretrain/Loss": 2.1400060653686523, "Pretrain/Loss (Raw)": 2.0857229232788086, "Pretrain/Step": 1007, "Pretrain/Step Time": 8.418099781498313} +{"Pretrain/Learning Rate": 4.9931515238557847e-05, "Pretrain/Loss": 2.140341281890869, "Pretrain/Loss (Raw)": 2.162985324859619, "Pretrain/Step": 1008, "Pretrain/Step Time": 8.422702306881547} +{"Pretrain/Learning Rate": 4.993120087234487e-05, "Pretrain/Loss": 2.1398167610168457, "Pretrain/Loss (Raw)": 2.1332178115844727, "Pretrain/Step": 1009, "Pretrain/Step Time": 8.421811919659376} +{"Pretrain/Learning Rate": 4.9930885787258285e-05, "Pretrain/Loss": 2.1406965255737305, "Pretrain/Loss (Raw)": 2.2220330238342285, "Pretrain/Step": 1010, "Pretrain/Step Time": 8.4196373578161} +{"Pretrain/Learning Rate": 4.9930569983307194e-05, "Pretrain/Loss": 2.1381256580352783, "Pretrain/Loss (Raw)": 2.01853609085083, "Pretrain/Step": 1011, "Pretrain/Step Time": 8.418507361784577} +{"Pretrain/Learning Rate": 4.993025346050069e-05, "Pretrain/Loss": 2.138700008392334, "Pretrain/Loss (Raw)": 2.107259511947632, "Pretrain/Step": 1012, "Pretrain/Step Time": 8.418156189844012} +{"Pretrain/Learning Rate": 4.992993621884789e-05, "Pretrain/Loss": 2.140435218811035, "Pretrain/Loss (Raw)": 2.2391433715820312, "Pretrain/Step": 1013, "Pretrain/Step Time": 8.417828902602196} +{"Pretrain/Learning Rate": 4.992961825835797e-05, "Pretrain/Loss": 2.140800714492798, "Pretrain/Loss (Raw)": 2.215656042098999, "Pretrain/Step": 1014, "Pretrain/Step Time": 8.416800877079368} +{"Pretrain/Learning Rate": 4.992929957904007e-05, "Pretrain/Loss": 2.1431491374969482, "Pretrain/Loss (Raw)": 2.056201934814453, "Pretrain/Step": 1015, "Pretrain/Step Time": 8.420514976605773} +{"Pretrain/Learning Rate": 4.99289801809034e-05, "Pretrain/Loss": 2.1419479846954346, "Pretrain/Loss (Raw)": 2.006093740463257, "Pretrain/Step": 1016, "Pretrain/Step Time": 8.42680498957634} +{"Pretrain/Learning Rate": 4.992866006395715e-05, "Pretrain/Loss": 2.143686056137085, "Pretrain/Loss (Raw)": 2.1286091804504395, "Pretrain/Step": 1017, "Pretrain/Step Time": 8.426283152773976} +{"Pretrain/Learning Rate": 4.992833922821057e-05, "Pretrain/Loss": 2.141850471496582, "Pretrain/Loss (Raw)": 1.994003176689148, "Pretrain/Step": 1018, "Pretrain/Step Time": 8.42645949870348} +{"Pretrain/Learning Rate": 4.99280176736729e-05, "Pretrain/Loss": 2.1417057514190674, "Pretrain/Loss (Raw)": 2.059966802597046, "Pretrain/Step": 1019, "Pretrain/Step Time": 8.423481537029147} +{"Pretrain/Learning Rate": 4.9927695400353415e-05, "Pretrain/Loss": 2.1413779258728027, "Pretrain/Loss (Raw)": 2.0511014461517334, "Pretrain/Step": 1020, "Pretrain/Step Time": 8.424616355448961} +{"Pretrain/Learning Rate": 4.99273724082614e-05, "Pretrain/Loss": 2.141599655151367, "Pretrain/Loss (Raw)": 2.2041144371032715, "Pretrain/Step": 1021, "Pretrain/Step Time": 8.423031728714705} +{"Pretrain/Learning Rate": 4.992704869740617e-05, "Pretrain/Loss": 2.140723705291748, "Pretrain/Loss (Raw)": 2.2183990478515625, "Pretrain/Step": 1022, "Pretrain/Step Time": 8.424603028222919} +{"Pretrain/Learning Rate": 4.992672426779708e-05, "Pretrain/Loss": 2.1414225101470947, "Pretrain/Loss (Raw)": 2.232229709625244, "Pretrain/Step": 1023, "Pretrain/Step Time": 8.423990104347467} +{"Pretrain/Learning Rate": 4.992639911944346e-05, "Pretrain/Loss": 2.1424195766448975, "Pretrain/Loss (Raw)": 2.1721038818359375, "Pretrain/Step": 1024, "Pretrain/Step Time": 8.428435707464814} +{"Pretrain/Learning Rate": 4.9926073252354685e-05, "Pretrain/Loss": 2.1443514823913574, "Pretrain/Loss (Raw)": 2.3153562545776367, "Pretrain/Step": 1025, "Pretrain/Step Time": 8.432804575189948} +{"Pretrain/Learning Rate": 4.992574666654016e-05, "Pretrain/Loss": 2.1436262130737305, "Pretrain/Loss (Raw)": 2.270601987838745, "Pretrain/Step": 1026, "Pretrain/Step Time": 8.429105227813125} +{"Pretrain/Learning Rate": 4.992541936200931e-05, "Pretrain/Loss": 2.144770622253418, "Pretrain/Loss (Raw)": 2.240184783935547, "Pretrain/Step": 1027, "Pretrain/Step Time": 8.424425274133682} +{"Pretrain/Learning Rate": 4.992509133877156e-05, "Pretrain/Loss": 2.1444859504699707, "Pretrain/Loss (Raw)": 2.1117196083068848, "Pretrain/Step": 1028, "Pretrain/Step Time": 8.42479724995792} +{"Pretrain/Learning Rate": 4.992476259683637e-05, "Pretrain/Loss": 2.1437132358551025, "Pretrain/Loss (Raw)": 2.132551908493042, "Pretrain/Step": 1029, "Pretrain/Step Time": 8.426519799977541} +{"Pretrain/Learning Rate": 4.9924433136213235e-05, "Pretrain/Loss": 2.1453311443328857, "Pretrain/Loss (Raw)": 2.2821121215820312, "Pretrain/Step": 1030, "Pretrain/Step Time": 8.42714317701757} +{"Pretrain/Learning Rate": 4.9924102956911624e-05, "Pretrain/Loss": 2.1450955867767334, "Pretrain/Loss (Raw)": 2.0816760063171387, "Pretrain/Step": 1031, "Pretrain/Step Time": 8.427303973585367} +{"Pretrain/Learning Rate": 4.992377205894109e-05, "Pretrain/Loss": 2.1453630924224854, "Pretrain/Loss (Raw)": 2.148756980895996, "Pretrain/Step": 1032, "Pretrain/Step Time": 8.425755670294166} +{"Pretrain/Learning Rate": 4.9923440442311145e-05, "Pretrain/Loss": 2.1451966762542725, "Pretrain/Loss (Raw)": 2.1026618480682373, "Pretrain/Step": 1033, "Pretrain/Step Time": 8.425637286156416} +{"Pretrain/Learning Rate": 4.9923108107031366e-05, "Pretrain/Loss": 2.146310806274414, "Pretrain/Loss (Raw)": 2.0646982192993164, "Pretrain/Step": 1034, "Pretrain/Step Time": 8.426538726314902} +{"Pretrain/Learning Rate": 4.992277505311134e-05, "Pretrain/Loss": 2.146505355834961, "Pretrain/Loss (Raw)": 2.1164488792419434, "Pretrain/Step": 1035, "Pretrain/Step Time": 8.420645644888282} +{"Pretrain/Learning Rate": 4.9922441280560664e-05, "Pretrain/Loss": 2.1416501998901367, "Pretrain/Loss (Raw)": 2.181920051574707, "Pretrain/Step": 1036, "Pretrain/Step Time": 8.423279237002134} +{"Pretrain/Learning Rate": 4.9922106789388964e-05, "Pretrain/Loss": 2.1418275833129883, "Pretrain/Loss (Raw)": 2.134336471557617, "Pretrain/Step": 1037, "Pretrain/Step Time": 8.425048630684614} +{"Pretrain/Learning Rate": 4.992177157960588e-05, "Pretrain/Loss": 2.1399192810058594, "Pretrain/Loss (Raw)": 2.111171007156372, "Pretrain/Step": 1038, "Pretrain/Step Time": 8.425999658182263} +{"Pretrain/Learning Rate": 4.992143565122108e-05, "Pretrain/Loss": 2.141327381134033, "Pretrain/Loss (Raw)": 2.1460459232330322, "Pretrain/Step": 1039, "Pretrain/Step Time": 8.427303148433566} +{"Pretrain/Learning Rate": 4.9921099004244254e-05, "Pretrain/Loss": 2.1409125328063965, "Pretrain/Loss (Raw)": 2.0269453525543213, "Pretrain/Step": 1040, "Pretrain/Step Time": 8.426656391471624} +{"Pretrain/Learning Rate": 4.992076163868511e-05, "Pretrain/Loss": 2.1413087844848633, "Pretrain/Loss (Raw)": 2.1283624172210693, "Pretrain/Step": 1041, "Pretrain/Step Time": 8.432240864261985} +{"Pretrain/Learning Rate": 4.9920423554553365e-05, "Pretrain/Loss": 2.1401617527008057, "Pretrain/Loss (Raw)": 2.0178167819976807, "Pretrain/Step": 1042, "Pretrain/Step Time": 8.42930118739605} +{"Pretrain/Learning Rate": 4.992008475185877e-05, "Pretrain/Loss": 2.1401281356811523, "Pretrain/Loss (Raw)": 2.0660994052886963, "Pretrain/Step": 1043, "Pretrain/Step Time": 8.423481782898307} +{"Pretrain/Learning Rate": 4.9919745230611116e-05, "Pretrain/Loss": 2.1403961181640625, "Pretrain/Loss (Raw)": 2.063934087753296, "Pretrain/Step": 1044, "Pretrain/Step Time": 8.422721901908517} +{"Pretrain/Learning Rate": 4.9919404990820164e-05, "Pretrain/Loss": 2.1411476135253906, "Pretrain/Loss (Raw)": 2.214928388595581, "Pretrain/Step": 1045, "Pretrain/Step Time": 8.422459110617638} +{"Pretrain/Learning Rate": 4.9919064032495744e-05, "Pretrain/Loss": 2.1416351795196533, "Pretrain/Loss (Raw)": 2.1521341800689697, "Pretrain/Step": 1046, "Pretrain/Step Time": 8.42199899815023} +{"Pretrain/Learning Rate": 4.9918722355647675e-05, "Pretrain/Loss": 2.1432909965515137, "Pretrain/Loss (Raw)": 2.1340203285217285, "Pretrain/Step": 1047, "Pretrain/Step Time": 8.424357684329152} +{"Pretrain/Learning Rate": 4.991837996028581e-05, "Pretrain/Loss": 2.145332098007202, "Pretrain/Loss (Raw)": 2.112546443939209, "Pretrain/Step": 1048, "Pretrain/Step Time": 8.423620451241732} +{"Pretrain/Learning Rate": 4.9918036846420025e-05, "Pretrain/Loss": 2.14521861076355, "Pretrain/Loss (Raw)": 2.0763931274414062, "Pretrain/Step": 1049, "Pretrain/Step Time": 8.423956444486976} +{"Pretrain/Learning Rate": 4.991769301406022e-05, "Pretrain/Loss": 2.144474983215332, "Pretrain/Loss (Raw)": 2.1291778087615967, "Pretrain/Step": 1050, "Pretrain/Step Time": 8.424912324175239} +{"Pretrain/Learning Rate": 4.991734846321629e-05, "Pretrain/Loss": 2.1418776512145996, "Pretrain/Loss (Raw)": 2.0612637996673584, "Pretrain/Step": 1051, "Pretrain/Step Time": 8.427778325974941} +{"Pretrain/Learning Rate": 4.991700319389819e-05, "Pretrain/Loss": 2.1379361152648926, "Pretrain/Loss (Raw)": 1.9562103748321533, "Pretrain/Step": 1052, "Pretrain/Step Time": 8.42693185992539} +{"Pretrain/Learning Rate": 4.991665720611588e-05, "Pretrain/Loss": 2.136277675628662, "Pretrain/Loss (Raw)": 2.1448445320129395, "Pretrain/Step": 1053, "Pretrain/Step Time": 8.427832044661045} +{"Pretrain/Learning Rate": 4.991631049987931e-05, "Pretrain/Loss": 2.136483669281006, "Pretrain/Loss (Raw)": 2.235433578491211, "Pretrain/Step": 1054, "Pretrain/Step Time": 8.424898829311132} +{"Pretrain/Learning Rate": 4.9915963075198494e-05, "Pretrain/Loss": 2.1344780921936035, "Pretrain/Loss (Raw)": 2.0093486309051514, "Pretrain/Step": 1055, "Pretrain/Step Time": 8.426325665786862} +{"Pretrain/Learning Rate": 4.9915614932083456e-05, "Pretrain/Loss": 2.1331093311309814, "Pretrain/Loss (Raw)": 1.892508864402771, "Pretrain/Step": 1056, "Pretrain/Step Time": 8.42548462562263} +{"Pretrain/Learning Rate": 4.991526607054422e-05, "Pretrain/Loss": 2.13413405418396, "Pretrain/Loss (Raw)": 2.2316370010375977, "Pretrain/Step": 1057, "Pretrain/Step Time": 8.428226925432682} +{"Pretrain/Learning Rate": 4.991491649059085e-05, "Pretrain/Loss": 2.1361606121063232, "Pretrain/Loss (Raw)": 2.417520046234131, "Pretrain/Step": 1058, "Pretrain/Step Time": 8.428661299869418} +{"Pretrain/Learning Rate": 4.991456619223342e-05, "Pretrain/Loss": 2.1378180980682373, "Pretrain/Loss (Raw)": 2.2886455059051514, "Pretrain/Step": 1059, "Pretrain/Step Time": 8.428393229842186} +{"Pretrain/Learning Rate": 4.991421517548205e-05, "Pretrain/Loss": 2.136852264404297, "Pretrain/Loss (Raw)": 2.270235776901245, "Pretrain/Step": 1060, "Pretrain/Step Time": 8.424489047378302} +{"Pretrain/Learning Rate": 4.991386344034684e-05, "Pretrain/Loss": 2.1360995769500732, "Pretrain/Loss (Raw)": 2.0948984622955322, "Pretrain/Step": 1061, "Pretrain/Step Time": 8.423379158601165} +{"Pretrain/Learning Rate": 4.991351098683794e-05, "Pretrain/Loss": 2.135535717010498, "Pretrain/Loss (Raw)": 2.1087822914123535, "Pretrain/Step": 1062, "Pretrain/Step Time": 8.420956091955304} +{"Pretrain/Learning Rate": 4.991315781496552e-05, "Pretrain/Loss": 2.1360747814178467, "Pretrain/Loss (Raw)": 2.1580872535705566, "Pretrain/Step": 1063, "Pretrain/Step Time": 8.418301314115524} +{"Pretrain/Learning Rate": 4.991280392473975e-05, "Pretrain/Loss": 2.134127140045166, "Pretrain/Loss (Raw)": 1.9854655265808105, "Pretrain/Step": 1064, "Pretrain/Step Time": 8.419056911021471} +{"Pretrain/Learning Rate": 4.991244931617085e-05, "Pretrain/Loss": 2.1332054138183594, "Pretrain/Loss (Raw)": 2.0887417793273926, "Pretrain/Step": 1065, "Pretrain/Step Time": 8.416686214506626} +{"Pretrain/Learning Rate": 4.9912093989269024e-05, "Pretrain/Loss": 2.134552001953125, "Pretrain/Loss (Raw)": 2.44742751121521, "Pretrain/Step": 1066, "Pretrain/Step Time": 8.416174598038197} +{"Pretrain/Learning Rate": 4.9911737944044545e-05, "Pretrain/Loss": 2.136608123779297, "Pretrain/Loss (Raw)": 2.4079627990722656, "Pretrain/Step": 1067, "Pretrain/Step Time": 8.415462564677} +{"Pretrain/Learning Rate": 4.9911381180507653e-05, "Pretrain/Loss": 2.134615898132324, "Pretrain/Loss (Raw)": 1.951332926750183, "Pretrain/Step": 1068, "Pretrain/Step Time": 8.419297639280558} +{"Pretrain/Learning Rate": 4.9911023698668655e-05, "Pretrain/Loss": 2.133876323699951, "Pretrain/Loss (Raw)": 2.250091552734375, "Pretrain/Step": 1069, "Pretrain/Step Time": 8.414050595834851} +{"Pretrain/Learning Rate": 4.991066549853784e-05, "Pretrain/Loss": 2.1356329917907715, "Pretrain/Loss (Raw)": 2.286320924758911, "Pretrain/Step": 1070, "Pretrain/Step Time": 8.417228359729052} +{"Pretrain/Learning Rate": 4.991030658012555e-05, "Pretrain/Loss": 2.135183095932007, "Pretrain/Loss (Raw)": 2.069342851638794, "Pretrain/Step": 1071, "Pretrain/Step Time": 8.416941734030843} +{"Pretrain/Learning Rate": 4.990994694344213e-05, "Pretrain/Loss": 2.136183738708496, "Pretrain/Loss (Raw)": 2.1733033657073975, "Pretrain/Step": 1072, "Pretrain/Step Time": 8.418651407584548} +{"Pretrain/Learning Rate": 4.9909586588497955e-05, "Pretrain/Loss": 2.1334354877471924, "Pretrain/Loss (Raw)": 1.8648666143417358, "Pretrain/Step": 1073, "Pretrain/Step Time": 8.417358035221696} +{"Pretrain/Learning Rate": 4.9909225515303405e-05, "Pretrain/Loss": 2.1351537704467773, "Pretrain/Loss (Raw)": 2.32116961479187, "Pretrain/Step": 1074, "Pretrain/Step Time": 8.420722605660558} +{"Pretrain/Learning Rate": 4.99088637238689e-05, "Pretrain/Loss": 2.1357510089874268, "Pretrain/Loss (Raw)": 2.036550283432007, "Pretrain/Step": 1075, "Pretrain/Step Time": 8.418380312621593} +{"Pretrain/Learning Rate": 4.990850121420487e-05, "Pretrain/Loss": 2.1333532333374023, "Pretrain/Loss (Raw)": 2.120706081390381, "Pretrain/Step": 1076, "Pretrain/Step Time": 8.41737075150013} +{"Pretrain/Learning Rate": 4.9908137986321754e-05, "Pretrain/Loss": 2.1348581314086914, "Pretrain/Loss (Raw)": 2.2449843883514404, "Pretrain/Step": 1077, "Pretrain/Step Time": 8.416433293372393} +{"Pretrain/Learning Rate": 4.990777404023006e-05, "Pretrain/Loss": 2.1347689628601074, "Pretrain/Loss (Raw)": 2.098884105682373, "Pretrain/Step": 1078, "Pretrain/Step Time": 8.41688391380012} +{"Pretrain/Learning Rate": 4.9907409375940246e-05, "Pretrain/Loss": 2.1341943740844727, "Pretrain/Loss (Raw)": 2.054176092147827, "Pretrain/Step": 1079, "Pretrain/Step Time": 8.418376890942454} +{"Pretrain/Learning Rate": 4.9907043993462846e-05, "Pretrain/Loss": 2.133918285369873, "Pretrain/Loss (Raw)": 2.111077070236206, "Pretrain/Step": 1080, "Pretrain/Step Time": 8.412964187562466} +{"Pretrain/Learning Rate": 4.990667789280838e-05, "Pretrain/Loss": 2.1343791484832764, "Pretrain/Loss (Raw)": 2.266616106033325, "Pretrain/Step": 1081, "Pretrain/Step Time": 8.416936747729778} +{"Pretrain/Learning Rate": 4.990631107398743e-05, "Pretrain/Loss": 2.133538246154785, "Pretrain/Loss (Raw)": 2.080533027648926, "Pretrain/Step": 1082, "Pretrain/Step Time": 8.415123408660293} +{"Pretrain/Learning Rate": 4.990594353701056e-05, "Pretrain/Loss": 2.1291537284851074, "Pretrain/Loss (Raw)": 2.080653667449951, "Pretrain/Step": 1083, "Pretrain/Step Time": 8.412516998127103} +{"Pretrain/Learning Rate": 4.9905575281888354e-05, "Pretrain/Loss": 2.130465269088745, "Pretrain/Loss (Raw)": 2.296818971633911, "Pretrain/Step": 1084, "Pretrain/Step Time": 8.414908859878778} +{"Pretrain/Learning Rate": 4.9905206308631444e-05, "Pretrain/Loss": 2.1343092918395996, "Pretrain/Loss (Raw)": 2.2764227390289307, "Pretrain/Step": 1085, "Pretrain/Step Time": 8.41278494335711} +{"Pretrain/Learning Rate": 4.9904836617250475e-05, "Pretrain/Loss": 2.134427785873413, "Pretrain/Loss (Raw)": 2.1530251502990723, "Pretrain/Step": 1086, "Pretrain/Step Time": 8.409110156819224} +{"Pretrain/Learning Rate": 4.9904466207756084e-05, "Pretrain/Loss": 2.1336779594421387, "Pretrain/Loss (Raw)": 2.1430797576904297, "Pretrain/Step": 1087, "Pretrain/Step Time": 8.41307083889842} +{"Pretrain/Learning Rate": 4.990409508015898e-05, "Pretrain/Loss": 2.1355631351470947, "Pretrain/Loss (Raw)": 2.2092323303222656, "Pretrain/Step": 1088, "Pretrain/Step Time": 8.41353777423501} +{"Pretrain/Learning Rate": 4.9903723234469844e-05, "Pretrain/Loss": 2.1355555057525635, "Pretrain/Loss (Raw)": 2.1495745182037354, "Pretrain/Step": 1089, "Pretrain/Step Time": 8.413379458710551} +{"Pretrain/Learning Rate": 4.9903350670699414e-05, "Pretrain/Loss": 2.1366913318634033, "Pretrain/Loss (Raw)": 1.9504605531692505, "Pretrain/Step": 1090, "Pretrain/Step Time": 8.41626550629735} +{"Pretrain/Learning Rate": 4.990297738885841e-05, "Pretrain/Loss": 2.1366114616394043, "Pretrain/Loss (Raw)": 2.1148746013641357, "Pretrain/Step": 1091, "Pretrain/Step Time": 8.41219499707222} +{"Pretrain/Learning Rate": 4.990260338895761e-05, "Pretrain/Loss": 2.1367597579956055, "Pretrain/Loss (Raw)": 2.186460256576538, "Pretrain/Step": 1092, "Pretrain/Step Time": 8.411180375143886} +{"Pretrain/Learning Rate": 4.9902228671007806e-05, "Pretrain/Loss": 2.136378765106201, "Pretrain/Loss (Raw)": 1.9754588603973389, "Pretrain/Step": 1093, "Pretrain/Step Time": 8.407184638082981} +{"Pretrain/Learning Rate": 4.990185323501978e-05, "Pretrain/Loss": 2.137514352798462, "Pretrain/Loss (Raw)": 2.1555631160736084, "Pretrain/Step": 1094, "Pretrain/Step Time": 8.407760549336672} +{"Pretrain/Learning Rate": 4.990147708100439e-05, "Pretrain/Loss": 2.1385436058044434, "Pretrain/Loss (Raw)": 2.139136791229248, "Pretrain/Step": 1095, "Pretrain/Step Time": 8.40363155119121} +{"Pretrain/Learning Rate": 4.990110020897244e-05, "Pretrain/Loss": 2.1421356201171875, "Pretrain/Loss (Raw)": 2.50001859664917, "Pretrain/Step": 1096, "Pretrain/Step Time": 8.403620744124055} +{"Pretrain/Learning Rate": 4.990072261893484e-05, "Pretrain/Loss": 2.1421821117401123, "Pretrain/Loss (Raw)": 2.1669116020202637, "Pretrain/Step": 1097, "Pretrain/Step Time": 8.40427171625197} +{"Pretrain/Learning Rate": 4.990034431090245e-05, "Pretrain/Loss": 2.144684076309204, "Pretrain/Loss (Raw)": 2.2227745056152344, "Pretrain/Step": 1098, "Pretrain/Step Time": 8.405576381832361} +{"Pretrain/Learning Rate": 4.989996528488617e-05, "Pretrain/Loss": 2.1425724029541016, "Pretrain/Loss (Raw)": 2.0752830505371094, "Pretrain/Step": 1099, "Pretrain/Step Time": 8.4067940171808} +{"Pretrain/Learning Rate": 4.989958554089696e-05, "Pretrain/Loss": 2.145235776901245, "Pretrain/Loss (Raw)": 2.1613876819610596, "Pretrain/Step": 1100, "Pretrain/Step Time": 8.405069390311837} +{"Pretrain/Learning Rate": 4.989920507894575e-05, "Pretrain/Loss": 2.144564151763916, "Pretrain/Loss (Raw)": 2.1299259662628174, "Pretrain/Step": 1101, "Pretrain/Step Time": 8.407067937776446} +{"Pretrain/Learning Rate": 4.989882389904352e-05, "Pretrain/Loss": 2.143167018890381, "Pretrain/Loss (Raw)": 2.036543130874634, "Pretrain/Step": 1102, "Pretrain/Step Time": 8.408024551346898} +{"Pretrain/Learning Rate": 4.9898442001201253e-05, "Pretrain/Loss": 2.14188289642334, "Pretrain/Loss (Raw)": 2.0754497051239014, "Pretrain/Step": 1103, "Pretrain/Step Time": 8.412061957642436} +{"Pretrain/Learning Rate": 4.989805938542996e-05, "Pretrain/Loss": 2.143127202987671, "Pretrain/Loss (Raw)": 2.1060895919799805, "Pretrain/Step": 1104, "Pretrain/Step Time": 8.404712837189436} +{"Pretrain/Learning Rate": 4.9897676051740685e-05, "Pretrain/Loss": 2.143374443054199, "Pretrain/Loss (Raw)": 2.0090839862823486, "Pretrain/Step": 1105, "Pretrain/Step Time": 8.40400843322277} +{"Pretrain/Learning Rate": 4.9897292000144455e-05, "Pretrain/Loss": 2.1421475410461426, "Pretrain/Loss (Raw)": 1.9400140047073364, "Pretrain/Step": 1106, "Pretrain/Step Time": 8.408038590103388} +{"Pretrain/Learning Rate": 4.9896907230652376e-05, "Pretrain/Loss": 2.1385116577148438, "Pretrain/Loss (Raw)": 1.7625290155410767, "Pretrain/Step": 1107, "Pretrain/Step Time": 8.407417353242636} +{"Pretrain/Learning Rate": 4.989652174327553e-05, "Pretrain/Loss": 2.1367125511169434, "Pretrain/Loss (Raw)": 1.9756895303726196, "Pretrain/Step": 1108, "Pretrain/Step Time": 8.408281244337559} +{"Pretrain/Learning Rate": 4.989613553802502e-05, "Pretrain/Loss": 2.1353659629821777, "Pretrain/Loss (Raw)": 2.101947784423828, "Pretrain/Step": 1109, "Pretrain/Step Time": 8.407992742955685} +{"Pretrain/Learning Rate": 4.9895748614912e-05, "Pretrain/Loss": 2.1366422176361084, "Pretrain/Loss (Raw)": 2.263054132461548, "Pretrain/Step": 1110, "Pretrain/Step Time": 8.405133282765746} +{"Pretrain/Learning Rate": 4.9895360973947615e-05, "Pretrain/Loss": 2.134838819503784, "Pretrain/Loss (Raw)": 2.0469963550567627, "Pretrain/Step": 1111, "Pretrain/Step Time": 8.409606056287885} +{"Pretrain/Learning Rate": 4.989497261514305e-05, "Pretrain/Loss": 2.1335787773132324, "Pretrain/Loss (Raw)": 2.135418653488159, "Pretrain/Step": 1112, "Pretrain/Step Time": 8.402680266648531} +{"Pretrain/Learning Rate": 4.98945835385095e-05, "Pretrain/Loss": 2.134915828704834, "Pretrain/Loss (Raw)": 2.131774425506592, "Pretrain/Step": 1113, "Pretrain/Step Time": 8.406347962096334} +{"Pretrain/Learning Rate": 4.989419374405818e-05, "Pretrain/Loss": 2.136047840118408, "Pretrain/Loss (Raw)": 2.129399061203003, "Pretrain/Step": 1114, "Pretrain/Step Time": 8.406358940526843} +{"Pretrain/Learning Rate": 4.989380323180033e-05, "Pretrain/Loss": 2.1362571716308594, "Pretrain/Loss (Raw)": 2.036965847015381, "Pretrain/Step": 1115, "Pretrain/Step Time": 8.408774573355913} +{"Pretrain/Learning Rate": 4.989341200174722e-05, "Pretrain/Loss": 2.135953664779663, "Pretrain/Loss (Raw)": 2.0692458152770996, "Pretrain/Step": 1116, "Pretrain/Step Time": 8.412271950393915} +{"Pretrain/Learning Rate": 4.9893020053910116e-05, "Pretrain/Loss": 2.1378636360168457, "Pretrain/Loss (Raw)": 2.2808573246002197, "Pretrain/Step": 1117, "Pretrain/Step Time": 8.413583448156714} +{"Pretrain/Learning Rate": 4.989262738830033e-05, "Pretrain/Loss": 2.137646436691284, "Pretrain/Loss (Raw)": 2.075549840927124, "Pretrain/Step": 1118, "Pretrain/Step Time": 8.41236906312406} +{"Pretrain/Learning Rate": 4.9892234004929186e-05, "Pretrain/Loss": 2.1360278129577637, "Pretrain/Loss (Raw)": 1.9134846925735474, "Pretrain/Step": 1119, "Pretrain/Step Time": 8.417472144588828} +{"Pretrain/Learning Rate": 4.9891839903808016e-05, "Pretrain/Loss": 2.1349611282348633, "Pretrain/Loss (Raw)": 2.006617307662964, "Pretrain/Step": 1120, "Pretrain/Step Time": 8.417392877861857} +{"Pretrain/Learning Rate": 4.9891445084948193e-05, "Pretrain/Loss": 2.136505603790283, "Pretrain/Loss (Raw)": 2.0501303672790527, "Pretrain/Step": 1121, "Pretrain/Step Time": 8.4166564848274} +{"Pretrain/Learning Rate": 4.9891049548361095e-05, "Pretrain/Loss": 2.1368844509124756, "Pretrain/Loss (Raw)": 2.133652687072754, "Pretrain/Step": 1122, "Pretrain/Step Time": 8.419564072042704} +{"Pretrain/Learning Rate": 4.989065329405813e-05, "Pretrain/Loss": 2.133695125579834, "Pretrain/Loss (Raw)": 1.9053250551223755, "Pretrain/Step": 1123, "Pretrain/Step Time": 8.420244317501783} +{"Pretrain/Learning Rate": 4.9890256322050734e-05, "Pretrain/Loss": 2.132279634475708, "Pretrain/Loss (Raw)": 2.364239454269409, "Pretrain/Step": 1124, "Pretrain/Step Time": 8.416695700958371} +{"Pretrain/Learning Rate": 4.9889858632350336e-05, "Pretrain/Loss": 2.1325368881225586, "Pretrain/Loss (Raw)": 2.1830594539642334, "Pretrain/Step": 1125, "Pretrain/Step Time": 8.421598456799984} +{"Pretrain/Learning Rate": 4.988946022496841e-05, "Pretrain/Loss": 2.131622076034546, "Pretrain/Loss (Raw)": 2.057309150695801, "Pretrain/Step": 1126, "Pretrain/Step Time": 8.425425300374627} +{"Pretrain/Learning Rate": 4.988906109991644e-05, "Pretrain/Loss": 2.1321964263916016, "Pretrain/Loss (Raw)": 2.017829656600952, "Pretrain/Step": 1127, "Pretrain/Step Time": 8.418058758601546} +{"Pretrain/Learning Rate": 4.988866125720595e-05, "Pretrain/Loss": 2.1315505504608154, "Pretrain/Loss (Raw)": 2.1229381561279297, "Pretrain/Step": 1128, "Pretrain/Step Time": 8.419750714674592} +{"Pretrain/Learning Rate": 4.988826069684845e-05, "Pretrain/Loss": 2.130601644515991, "Pretrain/Loss (Raw)": 2.247076988220215, "Pretrain/Step": 1129, "Pretrain/Step Time": 8.413705984130502} +{"Pretrain/Learning Rate": 4.98878594188555e-05, "Pretrain/Loss": 2.12955379486084, "Pretrain/Loss (Raw)": 2.0840466022491455, "Pretrain/Step": 1130, "Pretrain/Step Time": 8.418045761063695} +{"Pretrain/Learning Rate": 4.988745742323867e-05, "Pretrain/Loss": 2.1288537979125977, "Pretrain/Loss (Raw)": 2.1194825172424316, "Pretrain/Step": 1131, "Pretrain/Step Time": 8.413352254778147} +{"Pretrain/Learning Rate": 4.9887054710009545e-05, "Pretrain/Loss": 2.1281769275665283, "Pretrain/Loss (Raw)": 2.1003129482269287, "Pretrain/Step": 1132, "Pretrain/Step Time": 8.411371130496264} +{"Pretrain/Learning Rate": 4.9886651279179746e-05, "Pretrain/Loss": 2.1271114349365234, "Pretrain/Loss (Raw)": 2.075723171234131, "Pretrain/Step": 1133, "Pretrain/Step Time": 8.415250789374113} +{"Pretrain/Learning Rate": 4.98862471307609e-05, "Pretrain/Loss": 2.1268177032470703, "Pretrain/Loss (Raw)": 1.9888280630111694, "Pretrain/Step": 1134, "Pretrain/Step Time": 8.419254254549742} +{"Pretrain/Learning Rate": 4.988584226476466e-05, "Pretrain/Loss": 2.1265459060668945, "Pretrain/Loss (Raw)": 2.050938129425049, "Pretrain/Step": 1135, "Pretrain/Step Time": 8.415233973413706} +{"Pretrain/Learning Rate": 4.98854366812027e-05, "Pretrain/Loss": 2.1258692741394043, "Pretrain/Loss (Raw)": 2.0763442516326904, "Pretrain/Step": 1136, "Pretrain/Step Time": 8.415310963988304} +{"Pretrain/Learning Rate": 4.9885030380086726e-05, "Pretrain/Loss": 2.1241214275360107, "Pretrain/Loss (Raw)": 1.9095113277435303, "Pretrain/Step": 1137, "Pretrain/Step Time": 8.416201904416084} +{"Pretrain/Learning Rate": 4.988462336142844e-05, "Pretrain/Loss": 2.1230320930480957, "Pretrain/Loss (Raw)": 2.0826046466827393, "Pretrain/Step": 1138, "Pretrain/Step Time": 8.415635660290718} +{"Pretrain/Learning Rate": 4.988421562523958e-05, "Pretrain/Loss": 2.1235272884368896, "Pretrain/Loss (Raw)": 2.081913948059082, "Pretrain/Step": 1139, "Pretrain/Step Time": 8.415120534598827} +{"Pretrain/Learning Rate": 4.988380717153191e-05, "Pretrain/Loss": 2.1241631507873535, "Pretrain/Loss (Raw)": 2.188645362854004, "Pretrain/Step": 1140, "Pretrain/Step Time": 8.420314321294427} +{"Pretrain/Learning Rate": 4.988339800031718e-05, "Pretrain/Loss": 2.1238009929656982, "Pretrain/Loss (Raw)": 2.192789077758789, "Pretrain/Step": 1141, "Pretrain/Step Time": 8.420229900628328} +{"Pretrain/Learning Rate": 4.9882988111607233e-05, "Pretrain/Loss": 2.1236045360565186, "Pretrain/Loss (Raw)": 2.1904921531677246, "Pretrain/Step": 1142, "Pretrain/Step Time": 8.42172434926033} +{"Pretrain/Learning Rate": 4.988257750541386e-05, "Pretrain/Loss": 2.124072790145874, "Pretrain/Loss (Raw)": 2.116154670715332, "Pretrain/Step": 1143, "Pretrain/Step Time": 8.420072291046381} +{"Pretrain/Learning Rate": 4.9882166181748905e-05, "Pretrain/Loss": 2.125469446182251, "Pretrain/Loss (Raw)": 2.184872627258301, "Pretrain/Step": 1144, "Pretrain/Step Time": 8.415458917617798} +{"Pretrain/Learning Rate": 4.988175414062423e-05, "Pretrain/Loss": 2.1249446868896484, "Pretrain/Loss (Raw)": 2.0614213943481445, "Pretrain/Step": 1145, "Pretrain/Step Time": 8.412128260359168} +{"Pretrain/Learning Rate": 4.988134138205171e-05, "Pretrain/Loss": 2.128021478652954, "Pretrain/Loss (Raw)": 2.3878426551818848, "Pretrain/Step": 1146, "Pretrain/Step Time": 8.416502868756652} +{"Pretrain/Learning Rate": 4.988092790604325e-05, "Pretrain/Loss": 2.129793167114258, "Pretrain/Loss (Raw)": 2.2867329120635986, "Pretrain/Step": 1147, "Pretrain/Step Time": 8.417691184207797} +{"Pretrain/Learning Rate": 4.9880513712610784e-05, "Pretrain/Loss": 2.12939453125, "Pretrain/Loss (Raw)": 2.000110387802124, "Pretrain/Step": 1148, "Pretrain/Step Time": 8.414446368813515} +{"Pretrain/Learning Rate": 4.988009880176624e-05, "Pretrain/Loss": 2.1275038719177246, "Pretrain/Loss (Raw)": 1.9620813131332397, "Pretrain/Step": 1149, "Pretrain/Step Time": 8.415161930024624} +{"Pretrain/Learning Rate": 4.987968317352159e-05, "Pretrain/Loss": 2.1262917518615723, "Pretrain/Loss (Raw)": 2.0632588863372803, "Pretrain/Step": 1150, "Pretrain/Step Time": 8.41687024012208} +{"Pretrain/Learning Rate": 4.9879266827888806e-05, "Pretrain/Loss": 2.1243369579315186, "Pretrain/Loss (Raw)": 1.9820092916488647, "Pretrain/Step": 1151, "Pretrain/Step Time": 8.416328938677907} +{"Pretrain/Learning Rate": 4.98788497648799e-05, "Pretrain/Loss": 2.1214659214019775, "Pretrain/Loss (Raw)": 1.8046239614486694, "Pretrain/Step": 1152, "Pretrain/Step Time": 8.413342099636793} +{"Pretrain/Learning Rate": 4.9878431984506915e-05, "Pretrain/Loss": 2.1216650009155273, "Pretrain/Loss (Raw)": 2.3408045768737793, "Pretrain/Step": 1153, "Pretrain/Step Time": 8.416037932038307} +{"Pretrain/Learning Rate": 4.987801348678187e-05, "Pretrain/Loss": 2.121330976486206, "Pretrain/Loss (Raw)": 2.227872371673584, "Pretrain/Step": 1154, "Pretrain/Step Time": 8.418563418090343} +{"Pretrain/Learning Rate": 4.987759427171684e-05, "Pretrain/Loss": 2.1202902793884277, "Pretrain/Loss (Raw)": 2.10697603225708, "Pretrain/Step": 1155, "Pretrain/Step Time": 8.416852064430714} +{"Pretrain/Learning Rate": 4.9877174339323926e-05, "Pretrain/Loss": 2.1209850311279297, "Pretrain/Loss (Raw)": 2.2006540298461914, "Pretrain/Step": 1156, "Pretrain/Step Time": 8.421883147209883} +{"Pretrain/Learning Rate": 4.9876753689615216e-05, "Pretrain/Loss": 2.1221320629119873, "Pretrain/Loss (Raw)": 2.2793524265289307, "Pretrain/Step": 1157, "Pretrain/Step Time": 8.42033169977367} +{"Pretrain/Learning Rate": 4.987633232260286e-05, "Pretrain/Loss": 2.1213443279266357, "Pretrain/Loss (Raw)": 2.1812844276428223, "Pretrain/Step": 1158, "Pretrain/Step Time": 8.421905322000384} +{"Pretrain/Learning Rate": 4.9875910238299e-05, "Pretrain/Loss": 2.121075391769409, "Pretrain/Loss (Raw)": 2.047255516052246, "Pretrain/Step": 1159, "Pretrain/Step Time": 8.42100266739726} +{"Pretrain/Learning Rate": 4.9875487436715807e-05, "Pretrain/Loss": 2.1214160919189453, "Pretrain/Loss (Raw)": 2.192394256591797, "Pretrain/Step": 1160, "Pretrain/Step Time": 8.423285610973835} +{"Pretrain/Learning Rate": 4.987506391786546e-05, "Pretrain/Loss": 2.1195592880249023, "Pretrain/Loss (Raw)": 1.864974856376648, "Pretrain/Step": 1161, "Pretrain/Step Time": 8.424449432641268} +{"Pretrain/Learning Rate": 4.987463968176018e-05, "Pretrain/Loss": 2.1199727058410645, "Pretrain/Loss (Raw)": 2.117622137069702, "Pretrain/Step": 1162, "Pretrain/Step Time": 8.422713266685605} +{"Pretrain/Learning Rate": 4.9874214728412206e-05, "Pretrain/Loss": 2.1199705600738525, "Pretrain/Loss (Raw)": 2.1161656379699707, "Pretrain/Step": 1163, "Pretrain/Step Time": 8.425200428813696} +{"Pretrain/Learning Rate": 4.987378905783378e-05, "Pretrain/Loss": 2.1183106899261475, "Pretrain/Loss (Raw)": 1.9694480895996094, "Pretrain/Step": 1164, "Pretrain/Step Time": 8.423535326495767} +{"Pretrain/Learning Rate": 4.987336267003719e-05, "Pretrain/Loss": 2.1175050735473633, "Pretrain/Loss (Raw)": 2.03122615814209, "Pretrain/Step": 1165, "Pretrain/Step Time": 8.421365350484848} +{"Pretrain/Learning Rate": 4.987293556503472e-05, "Pretrain/Loss": 2.1189913749694824, "Pretrain/Loss (Raw)": 2.301408529281616, "Pretrain/Step": 1166, "Pretrain/Step Time": 8.419774258509278} +{"Pretrain/Learning Rate": 4.9872507742838686e-05, "Pretrain/Loss": 2.1188011169433594, "Pretrain/Loss (Raw)": 2.121683120727539, "Pretrain/Step": 1167, "Pretrain/Step Time": 8.417674919590354} +{"Pretrain/Learning Rate": 4.987207920346142e-05, "Pretrain/Loss": 2.1194396018981934, "Pretrain/Loss (Raw)": 2.108696699142456, "Pretrain/Step": 1168, "Pretrain/Step Time": 8.421960402280092} +{"Pretrain/Learning Rate": 4.987164994691529e-05, "Pretrain/Loss": 2.1196703910827637, "Pretrain/Loss (Raw)": 2.1579201221466064, "Pretrain/Step": 1169, "Pretrain/Step Time": 8.420860316604376} +{"Pretrain/Learning Rate": 4.987121997321267e-05, "Pretrain/Loss": 2.122021198272705, "Pretrain/Loss (Raw)": 2.318676710128784, "Pretrain/Step": 1170, "Pretrain/Step Time": 8.420115729793906} +{"Pretrain/Learning Rate": 4.987078928236595e-05, "Pretrain/Loss": 2.1218957901000977, "Pretrain/Loss (Raw)": 2.050076961517334, "Pretrain/Step": 1171, "Pretrain/Step Time": 8.422791315242648} +{"Pretrain/Learning Rate": 4.987035787438755e-05, "Pretrain/Loss": 2.1228389739990234, "Pretrain/Loss (Raw)": 2.1846539974212646, "Pretrain/Step": 1172, "Pretrain/Step Time": 8.424057576805353} +{"Pretrain/Learning Rate": 4.986992574928992e-05, "Pretrain/Loss": 2.120291233062744, "Pretrain/Loss (Raw)": 1.8887900114059448, "Pretrain/Step": 1173, "Pretrain/Step Time": 8.426711857318878} +{"Pretrain/Learning Rate": 4.9869492907085515e-05, "Pretrain/Loss": 2.121440887451172, "Pretrain/Loss (Raw)": 2.299297571182251, "Pretrain/Step": 1174, "Pretrain/Step Time": 8.429089637473226} +{"Pretrain/Learning Rate": 4.98690593477868e-05, "Pretrain/Loss": 2.1218085289001465, "Pretrain/Loss (Raw)": 2.1811065673828125, "Pretrain/Step": 1175, "Pretrain/Step Time": 8.427251879125834} +{"Pretrain/Learning Rate": 4.986862507140631e-05, "Pretrain/Loss": 2.121366024017334, "Pretrain/Loss (Raw)": 2.0559043884277344, "Pretrain/Step": 1176, "Pretrain/Step Time": 8.425403594970703} +{"Pretrain/Learning Rate": 4.986819007795653e-05, "Pretrain/Loss": 2.1226987838745117, "Pretrain/Loss (Raw)": 2.2469494342803955, "Pretrain/Step": 1177, "Pretrain/Step Time": 8.426101872697473} +{"Pretrain/Learning Rate": 4.9867754367450026e-05, "Pretrain/Loss": 2.1220130920410156, "Pretrain/Loss (Raw)": 2.0414135456085205, "Pretrain/Step": 1178, "Pretrain/Step Time": 8.422901559621096} +{"Pretrain/Learning Rate": 4.986731793989936e-05, "Pretrain/Loss": 2.1230034828186035, "Pretrain/Loss (Raw)": 2.18804931640625, "Pretrain/Step": 1179, "Pretrain/Step Time": 8.419512785971165} +{"Pretrain/Learning Rate": 4.986688079531711e-05, "Pretrain/Loss": 2.1239795684814453, "Pretrain/Loss (Raw)": 2.0811378955841064, "Pretrain/Step": 1180, "Pretrain/Step Time": 8.420017693191767} +{"Pretrain/Learning Rate": 4.9866442933715876e-05, "Pretrain/Loss": 2.122220754623413, "Pretrain/Loss (Raw)": 1.9197232723236084, "Pretrain/Step": 1181, "Pretrain/Step Time": 8.421178685501218} +{"Pretrain/Learning Rate": 4.9866004355108295e-05, "Pretrain/Loss": 2.121572732925415, "Pretrain/Loss (Raw)": 2.152512550354004, "Pretrain/Step": 1182, "Pretrain/Step Time": 8.423621091991663} +{"Pretrain/Learning Rate": 4.9865565059507e-05, "Pretrain/Loss": 2.123403549194336, "Pretrain/Loss (Raw)": 2.2436633110046387, "Pretrain/Step": 1183, "Pretrain/Step Time": 8.420296311378479} +{"Pretrain/Learning Rate": 4.9865125046924676e-05, "Pretrain/Loss": 2.1246001720428467, "Pretrain/Loss (Raw)": 2.0456838607788086, "Pretrain/Step": 1184, "Pretrain/Step Time": 8.418475937098265} +{"Pretrain/Learning Rate": 4.9864684317374e-05, "Pretrain/Loss": 2.123723030090332, "Pretrain/Loss (Raw)": 2.1193747520446777, "Pretrain/Step": 1185, "Pretrain/Step Time": 8.419690957292914} +{"Pretrain/Learning Rate": 4.986424287086767e-05, "Pretrain/Loss": 2.119198799133301, "Pretrain/Loss (Raw)": 1.8383902311325073, "Pretrain/Step": 1186, "Pretrain/Step Time": 8.423909993842244} +{"Pretrain/Learning Rate": 4.986380070741843e-05, "Pretrain/Loss": 2.1172618865966797, "Pretrain/Loss (Raw)": 2.040733575820923, "Pretrain/Step": 1187, "Pretrain/Step Time": 8.420571299269795} +{"Pretrain/Learning Rate": 4.986335782703903e-05, "Pretrain/Loss": 2.1154286861419678, "Pretrain/Loss (Raw)": 2.0355896949768066, "Pretrain/Step": 1188, "Pretrain/Step Time": 8.422940392047167} +{"Pretrain/Learning Rate": 4.986291422974223e-05, "Pretrain/Loss": 2.1147167682647705, "Pretrain/Loss (Raw)": 2.0037593841552734, "Pretrain/Step": 1189, "Pretrain/Step Time": 8.426722086966038} +{"Pretrain/Learning Rate": 4.9862469915540824e-05, "Pretrain/Loss": 2.113515853881836, "Pretrain/Loss (Raw)": 1.9550988674163818, "Pretrain/Step": 1190, "Pretrain/Step Time": 8.427085222676396} +{"Pretrain/Learning Rate": 4.986202488444763e-05, "Pretrain/Loss": 2.111628532409668, "Pretrain/Loss (Raw)": 1.9164817333221436, "Pretrain/Step": 1191, "Pretrain/Step Time": 8.42566797696054} +{"Pretrain/Learning Rate": 4.9861579136475466e-05, "Pretrain/Loss": 2.1120944023132324, "Pretrain/Loss (Raw)": 2.045107841491699, "Pretrain/Step": 1192, "Pretrain/Step Time": 8.42925094999373} +{"Pretrain/Learning Rate": 4.98611326716372e-05, "Pretrain/Loss": 2.1126794815063477, "Pretrain/Loss (Raw)": 2.1636390686035156, "Pretrain/Step": 1193, "Pretrain/Step Time": 8.427614022046328} +{"Pretrain/Learning Rate": 4.9860685489945704e-05, "Pretrain/Loss": 2.1089558601379395, "Pretrain/Loss (Raw)": 1.9707956314086914, "Pretrain/Step": 1194, "Pretrain/Step Time": 8.428538605570793} +{"Pretrain/Learning Rate": 4.986023759141386e-05, "Pretrain/Loss": 2.105388641357422, "Pretrain/Loss (Raw)": 1.9513795375823975, "Pretrain/Step": 1195, "Pretrain/Step Time": 8.427867835387588} +{"Pretrain/Learning Rate": 4.985978897605459e-05, "Pretrain/Loss": 2.106280565261841, "Pretrain/Loss (Raw)": 2.0654714107513428, "Pretrain/Step": 1196, "Pretrain/Step Time": 8.423282880336046} +{"Pretrain/Learning Rate": 4.985933964388083e-05, "Pretrain/Loss": 2.1054739952087402, "Pretrain/Loss (Raw)": 2.1468701362609863, "Pretrain/Step": 1197, "Pretrain/Step Time": 8.423134382814169} +{"Pretrain/Learning Rate": 4.985888959490554e-05, "Pretrain/Loss": 2.102029800415039, "Pretrain/Loss (Raw)": 1.8454707860946655, "Pretrain/Step": 1198, "Pretrain/Step Time": 8.423228431493044} +{"Pretrain/Learning Rate": 4.9858438829141695e-05, "Pretrain/Loss": 2.103135108947754, "Pretrain/Loss (Raw)": 2.2108380794525146, "Pretrain/Step": 1199, "Pretrain/Step Time": 8.425473030656576} +{"Pretrain/Learning Rate": 4.9857987346602284e-05, "Pretrain/Loss": 2.1015427112579346, "Pretrain/Loss (Raw)": 1.9694299697875977, "Pretrain/Step": 1200, "Pretrain/Step Time": 8.422098210081458} +{"Pretrain/Learning Rate": 4.985753514730034e-05, "Pretrain/Loss": 2.104637622833252, "Pretrain/Loss (Raw)": 2.261039972305298, "Pretrain/Step": 1201, "Pretrain/Step Time": 8.424522394314408} +{"Pretrain/Learning Rate": 4.985708223124888e-05, "Pretrain/Loss": 2.1015310287475586, "Pretrain/Loss (Raw)": 1.9235020875930786, "Pretrain/Step": 1202, "Pretrain/Step Time": 8.425525980070233} +{"Pretrain/Learning Rate": 4.9856628598460995e-05, "Pretrain/Loss": 2.1029133796691895, "Pretrain/Loss (Raw)": 2.213526964187622, "Pretrain/Step": 1203, "Pretrain/Step Time": 8.426952637732029} +{"Pretrain/Learning Rate": 4.9856174248949733e-05, "Pretrain/Loss": 2.1034576892852783, "Pretrain/Loss (Raw)": 2.1903514862060547, "Pretrain/Step": 1204, "Pretrain/Step Time": 8.42585995234549} +{"Pretrain/Learning Rate": 4.985571918272821e-05, "Pretrain/Loss": 2.1007206439971924, "Pretrain/Loss (Raw)": 1.8946458101272583, "Pretrain/Step": 1205, "Pretrain/Step Time": 8.427189430221915} +{"Pretrain/Learning Rate": 4.985526339980955e-05, "Pretrain/Loss": 2.10085391998291, "Pretrain/Loss (Raw)": 2.1159238815307617, "Pretrain/Step": 1206, "Pretrain/Step Time": 8.43021371588111} +{"Pretrain/Learning Rate": 4.9854806900206896e-05, "Pretrain/Loss": 2.1009371280670166, "Pretrain/Loss (Raw)": 2.0648560523986816, "Pretrain/Step": 1207, "Pretrain/Step Time": 8.429750232025981} +{"Pretrain/Learning Rate": 4.98543496839334e-05, "Pretrain/Loss": 2.1010849475860596, "Pretrain/Loss (Raw)": 2.129976987838745, "Pretrain/Step": 1208, "Pretrain/Step Time": 8.429684415459633} +{"Pretrain/Learning Rate": 4.985389175100225e-05, "Pretrain/Loss": 2.101924419403076, "Pretrain/Loss (Raw)": 2.374072551727295, "Pretrain/Step": 1209, "Pretrain/Step Time": 8.428478512912989} +{"Pretrain/Learning Rate": 4.985343310142666e-05, "Pretrain/Loss": 2.103503704071045, "Pretrain/Loss (Raw)": 2.2827043533325195, "Pretrain/Step": 1210, "Pretrain/Step Time": 8.42899720557034} +{"Pretrain/Learning Rate": 4.9852973735219846e-05, "Pretrain/Loss": 2.104307174682617, "Pretrain/Loss (Raw)": 2.1834967136383057, "Pretrain/Step": 1211, "Pretrain/Step Time": 8.433363636955619} +{"Pretrain/Learning Rate": 4.985251365239505e-05, "Pretrain/Loss": 2.1032357215881348, "Pretrain/Loss (Raw)": 2.159660577774048, "Pretrain/Step": 1212, "Pretrain/Step Time": 8.429781267419457} +{"Pretrain/Learning Rate": 4.9852052852965544e-05, "Pretrain/Loss": 2.1023166179656982, "Pretrain/Loss (Raw)": 2.15879225730896, "Pretrain/Step": 1213, "Pretrain/Step Time": 8.426207691431046} +{"Pretrain/Learning Rate": 4.9851591336944615e-05, "Pretrain/Loss": 2.103926420211792, "Pretrain/Loss (Raw)": 2.3590710163116455, "Pretrain/Step": 1214, "Pretrain/Step Time": 8.43183751963079} +{"Pretrain/Learning Rate": 4.985112910434556e-05, "Pretrain/Loss": 2.103886365890503, "Pretrain/Loss (Raw)": 2.137972116470337, "Pretrain/Step": 1215, "Pretrain/Step Time": 8.428211631253362} +{"Pretrain/Learning Rate": 4.985066615518172e-05, "Pretrain/Loss": 2.1022706031799316, "Pretrain/Loss (Raw)": 2.002366781234741, "Pretrain/Step": 1216, "Pretrain/Step Time": 8.426415218040347} +{"Pretrain/Learning Rate": 4.985020248946645e-05, "Pretrain/Loss": 2.1035714149475098, "Pretrain/Loss (Raw)": 2.3160929679870605, "Pretrain/Step": 1217, "Pretrain/Step Time": 8.426813391968608} +{"Pretrain/Learning Rate": 4.984973810721311e-05, "Pretrain/Loss": 2.104888916015625, "Pretrain/Loss (Raw)": 2.1191251277923584, "Pretrain/Step": 1218, "Pretrain/Step Time": 8.423400204628706} +{"Pretrain/Learning Rate": 4.9849273008435076e-05, "Pretrain/Loss": 2.1042702198028564, "Pretrain/Loss (Raw)": 2.0356826782226562, "Pretrain/Step": 1219, "Pretrain/Step Time": 8.427629239857197} +{"Pretrain/Learning Rate": 4.984880719314578e-05, "Pretrain/Loss": 2.104548454284668, "Pretrain/Loss (Raw)": 2.2220401763916016, "Pretrain/Step": 1220, "Pretrain/Step Time": 8.428426811471581} +{"Pretrain/Learning Rate": 4.984834066135865e-05, "Pretrain/Loss": 2.105931282043457, "Pretrain/Loss (Raw)": 2.1524879932403564, "Pretrain/Step": 1221, "Pretrain/Step Time": 8.431089002639055} +{"Pretrain/Learning Rate": 4.984787341308712e-05, "Pretrain/Loss": 2.1033568382263184, "Pretrain/Loss (Raw)": 1.8260473012924194, "Pretrain/Step": 1222, "Pretrain/Step Time": 8.431639265269041} +{"Pretrain/Learning Rate": 4.984740544834469e-05, "Pretrain/Loss": 2.1028223037719727, "Pretrain/Loss (Raw)": 2.0706844329833984, "Pretrain/Step": 1223, "Pretrain/Step Time": 8.436014726758003} +{"Pretrain/Learning Rate": 4.9846936767144836e-05, "Pretrain/Loss": 2.1006295680999756, "Pretrain/Loss (Raw)": 2.219350576400757, "Pretrain/Step": 1224, "Pretrain/Step Time": 8.435513336211443} +{"Pretrain/Learning Rate": 4.9846467369501075e-05, "Pretrain/Loss": 2.0982003211975098, "Pretrain/Loss (Raw)": 1.8559931516647339, "Pretrain/Step": 1225, "Pretrain/Step Time": 8.43387727625668} +{"Pretrain/Learning Rate": 4.984599725542695e-05, "Pretrain/Loss": 2.098271369934082, "Pretrain/Loss (Raw)": 2.2318646907806396, "Pretrain/Step": 1226, "Pretrain/Step Time": 8.437317434698343} +{"Pretrain/Learning Rate": 4.9845526424936e-05, "Pretrain/Loss": 2.098085403442383, "Pretrain/Loss (Raw)": 2.051466464996338, "Pretrain/Step": 1227, "Pretrain/Step Time": 8.436327805742621} +{"Pretrain/Learning Rate": 4.9845054878041816e-05, "Pretrain/Loss": 2.097942352294922, "Pretrain/Loss (Raw)": 2.1430647373199463, "Pretrain/Step": 1228, "Pretrain/Step Time": 8.433971159160137} +{"Pretrain/Learning Rate": 4.9844582614757985e-05, "Pretrain/Loss": 2.0949220657348633, "Pretrain/Loss (Raw)": 1.7433249950408936, "Pretrain/Step": 1229, "Pretrain/Step Time": 8.428420383483171} +{"Pretrain/Learning Rate": 4.984410963509813e-05, "Pretrain/Loss": 2.095045328140259, "Pretrain/Loss (Raw)": 2.052339553833008, "Pretrain/Step": 1230, "Pretrain/Step Time": 8.428337596356869} +{"Pretrain/Learning Rate": 4.984363593907589e-05, "Pretrain/Loss": 2.095104694366455, "Pretrain/Loss (Raw)": 2.083038330078125, "Pretrain/Step": 1231, "Pretrain/Step Time": 8.424327950924635} +{"Pretrain/Learning Rate": 4.984316152670492e-05, "Pretrain/Loss": 2.0936665534973145, "Pretrain/Loss (Raw)": 1.9220123291015625, "Pretrain/Step": 1232, "Pretrain/Step Time": 8.426302945241332} +{"Pretrain/Learning Rate": 4.98426863979989e-05, "Pretrain/Loss": 2.094364643096924, "Pretrain/Loss (Raw)": 2.098432779312134, "Pretrain/Step": 1233, "Pretrain/Step Time": 8.431463651359081} +{"Pretrain/Learning Rate": 4.984221055297153e-05, "Pretrain/Loss": 2.094963550567627, "Pretrain/Loss (Raw)": 2.0167031288146973, "Pretrain/Step": 1234, "Pretrain/Step Time": 8.428617924451828} +{"Pretrain/Learning Rate": 4.984173399163653e-05, "Pretrain/Loss": 2.098850965499878, "Pretrain/Loss (Raw)": 2.2601096630096436, "Pretrain/Step": 1235, "Pretrain/Step Time": 8.428764555603266} +{"Pretrain/Learning Rate": 4.984125671400764e-05, "Pretrain/Loss": 2.098776340484619, "Pretrain/Loss (Raw)": 1.966145634651184, "Pretrain/Step": 1236, "Pretrain/Step Time": 8.437088621780276} +{"Pretrain/Learning Rate": 4.9840778720098635e-05, "Pretrain/Loss": 2.099928379058838, "Pretrain/Loss (Raw)": 2.2494125366210938, "Pretrain/Step": 1237, "Pretrain/Step Time": 8.43851651251316} +{"Pretrain/Learning Rate": 4.984030000992329e-05, "Pretrain/Loss": 2.0996012687683105, "Pretrain/Loss (Raw)": 2.221170663833618, "Pretrain/Step": 1238, "Pretrain/Step Time": 8.436402993276715} +{"Pretrain/Learning Rate": 4.983982058349539e-05, "Pretrain/Loss": 2.1010305881500244, "Pretrain/Loss (Raw)": 2.2299392223358154, "Pretrain/Step": 1239, "Pretrain/Step Time": 8.434490928426385} +{"Pretrain/Learning Rate": 4.983934044082879e-05, "Pretrain/Loss": 2.1000404357910156, "Pretrain/Loss (Raw)": 2.008697271347046, "Pretrain/Step": 1240, "Pretrain/Step Time": 8.440389178693295} +{"Pretrain/Learning Rate": 4.9838859581937306e-05, "Pretrain/Loss": 2.099964141845703, "Pretrain/Loss (Raw)": 2.1220054626464844, "Pretrain/Step": 1241, "Pretrain/Step Time": 8.437458273023367} +{"Pretrain/Learning Rate": 4.983837800683482e-05, "Pretrain/Loss": 2.098743438720703, "Pretrain/Loss (Raw)": 1.973149299621582, "Pretrain/Step": 1242, "Pretrain/Step Time": 8.437366053462029} +{"Pretrain/Learning Rate": 4.9837895715535215e-05, "Pretrain/Loss": 2.099377393722534, "Pretrain/Loss (Raw)": 2.1180999279022217, "Pretrain/Step": 1243, "Pretrain/Step Time": 8.435706736519933} +{"Pretrain/Learning Rate": 4.98374127080524e-05, "Pretrain/Loss": 2.100261688232422, "Pretrain/Loss (Raw)": 2.182438373565674, "Pretrain/Step": 1244, "Pretrain/Step Time": 8.43489152751863} +{"Pretrain/Learning Rate": 4.9836928984400286e-05, "Pretrain/Loss": 2.0973598957061768, "Pretrain/Loss (Raw)": 1.9094196557998657, "Pretrain/Step": 1245, "Pretrain/Step Time": 8.433636063709855} +{"Pretrain/Learning Rate": 4.983644454459285e-05, "Pretrain/Loss": 2.0972096920013428, "Pretrain/Loss (Raw)": 2.0563418865203857, "Pretrain/Step": 1246, "Pretrain/Step Time": 8.43202000297606} +{"Pretrain/Learning Rate": 4.9835959388644035e-05, "Pretrain/Loss": 2.0993337631225586, "Pretrain/Loss (Raw)": 2.1853418350219727, "Pretrain/Step": 1247, "Pretrain/Step Time": 8.425026850774884} +{"Pretrain/Learning Rate": 4.983547351656784e-05, "Pretrain/Loss": 2.101803779602051, "Pretrain/Loss (Raw)": 2.3227896690368652, "Pretrain/Step": 1248, "Pretrain/Step Time": 8.430131427943707} +{"Pretrain/Learning Rate": 4.983498692837828e-05, "Pretrain/Loss": 2.10105562210083, "Pretrain/Loss (Raw)": 1.954365849494934, "Pretrain/Step": 1249, "Pretrain/Step Time": 8.430815618485212} +{"Pretrain/Learning Rate": 4.983449962408937e-05, "Pretrain/Loss": 2.100536823272705, "Pretrain/Loss (Raw)": 2.0672366619110107, "Pretrain/Step": 1250, "Pretrain/Step Time": 8.428817378357053} +{"Pretrain/Learning Rate": 4.983401160371518e-05, "Pretrain/Loss": 2.101952314376831, "Pretrain/Loss (Raw)": 2.0865304470062256, "Pretrain/Step": 1251, "Pretrain/Step Time": 8.42711540311575} +{"Pretrain/Learning Rate": 4.983352286726977e-05, "Pretrain/Loss": 2.0995917320251465, "Pretrain/Loss (Raw)": 2.062082052230835, "Pretrain/Step": 1252, "Pretrain/Step Time": 8.43277787975967} +{"Pretrain/Learning Rate": 4.9833033414767225e-05, "Pretrain/Loss": 2.0984997749328613, "Pretrain/Loss (Raw)": 2.043290376663208, "Pretrain/Step": 1253, "Pretrain/Step Time": 8.42787397839129} +{"Pretrain/Learning Rate": 4.9832543246221675e-05, "Pretrain/Loss": 2.0977368354797363, "Pretrain/Loss (Raw)": 1.9596426486968994, "Pretrain/Step": 1254, "Pretrain/Step Time": 8.427509270608425} +{"Pretrain/Learning Rate": 4.983205236164725e-05, "Pretrain/Loss": 2.098318099975586, "Pretrain/Loss (Raw)": 2.0922000408172607, "Pretrain/Step": 1255, "Pretrain/Step Time": 8.430895643308759} +{"Pretrain/Learning Rate": 4.9831560761058096e-05, "Pretrain/Loss": 2.0981431007385254, "Pretrain/Loss (Raw)": 2.100590705871582, "Pretrain/Step": 1256, "Pretrain/Step Time": 8.432492101565003} +{"Pretrain/Learning Rate": 4.983106844446839e-05, "Pretrain/Loss": 2.0944056510925293, "Pretrain/Loss (Raw)": 1.7686407566070557, "Pretrain/Step": 1257, "Pretrain/Step Time": 8.438028384000063} +{"Pretrain/Learning Rate": 4.983057541189233e-05, "Pretrain/Loss": 2.094414710998535, "Pretrain/Loss (Raw)": 2.0852253437042236, "Pretrain/Step": 1258, "Pretrain/Step Time": 8.435808578506112} +{"Pretrain/Learning Rate": 4.983008166334414e-05, "Pretrain/Loss": 2.0920052528381348, "Pretrain/Loss (Raw)": 1.811082363128662, "Pretrain/Step": 1259, "Pretrain/Step Time": 8.436673203483224} +{"Pretrain/Learning Rate": 4.982958719883804e-05, "Pretrain/Loss": 2.09196138381958, "Pretrain/Loss (Raw)": 2.094667434692383, "Pretrain/Step": 1260, "Pretrain/Step Time": 8.43689920194447} +{"Pretrain/Learning Rate": 4.982909201838831e-05, "Pretrain/Loss": 2.092362403869629, "Pretrain/Loss (Raw)": 2.1270768642425537, "Pretrain/Step": 1261, "Pretrain/Step Time": 8.43002450466156} +{"Pretrain/Learning Rate": 4.982859612200921e-05, "Pretrain/Loss": 2.094937324523926, "Pretrain/Loss (Raw)": 2.318432569503784, "Pretrain/Step": 1262, "Pretrain/Step Time": 8.429374653846025} +{"Pretrain/Learning Rate": 4.9828099509715034e-05, "Pretrain/Loss": 2.095430850982666, "Pretrain/Loss (Raw)": 2.114078998565674, "Pretrain/Step": 1263, "Pretrain/Step Time": 8.430857775732875} +{"Pretrain/Learning Rate": 4.982760218152012e-05, "Pretrain/Loss": 2.095431089401245, "Pretrain/Loss (Raw)": 2.0763914585113525, "Pretrain/Step": 1264, "Pretrain/Step Time": 8.430463572964072} +{"Pretrain/Learning Rate": 4.9827104137438794e-05, "Pretrain/Loss": 2.0975418090820312, "Pretrain/Loss (Raw)": 2.179659843444824, "Pretrain/Step": 1265, "Pretrain/Step Time": 8.429221533238888} +{"Pretrain/Learning Rate": 4.982660537748543e-05, "Pretrain/Loss": 2.0966973304748535, "Pretrain/Loss (Raw)": 1.9745434522628784, "Pretrain/Step": 1266, "Pretrain/Step Time": 8.433150205761194} +{"Pretrain/Learning Rate": 4.98261059016744e-05, "Pretrain/Loss": 2.0953636169433594, "Pretrain/Loss (Raw)": 1.9111934900283813, "Pretrain/Step": 1267, "Pretrain/Step Time": 8.432453526183963} +{"Pretrain/Learning Rate": 4.98256057100201e-05, "Pretrain/Loss": 2.0955114364624023, "Pretrain/Loss (Raw)": 2.207540988922119, "Pretrain/Step": 1268, "Pretrain/Step Time": 8.428824612870812} +{"Pretrain/Learning Rate": 4.982510480253697e-05, "Pretrain/Loss": 2.095412492752075, "Pretrain/Loss (Raw)": 2.1801366806030273, "Pretrain/Step": 1269, "Pretrain/Step Time": 8.42934825271368} +{"Pretrain/Learning Rate": 4.9824603179239435e-05, "Pretrain/Loss": 2.094578266143799, "Pretrain/Loss (Raw)": 2.083702325820923, "Pretrain/Step": 1270, "Pretrain/Step Time": 8.431507049128413} +{"Pretrain/Learning Rate": 4.982410084014197e-05, "Pretrain/Loss": 2.0966358184814453, "Pretrain/Loss (Raw)": 2.3795406818389893, "Pretrain/Step": 1271, "Pretrain/Step Time": 8.430420562624931} +{"Pretrain/Learning Rate": 4.982359778525906e-05, "Pretrain/Loss": 2.095612049102783, "Pretrain/Loss (Raw)": 2.0538177490234375, "Pretrain/Step": 1272, "Pretrain/Step Time": 8.435394991189241} +{"Pretrain/Learning Rate": 4.9823094014605204e-05, "Pretrain/Loss": 2.097224473953247, "Pretrain/Loss (Raw)": 2.2678122520446777, "Pretrain/Step": 1273, "Pretrain/Step Time": 8.437213715165854} +{"Pretrain/Learning Rate": 4.982258952819493e-05, "Pretrain/Loss": 2.093991756439209, "Pretrain/Loss (Raw)": 1.9740604162216187, "Pretrain/Step": 1274, "Pretrain/Step Time": 8.43340802937746} +{"Pretrain/Learning Rate": 4.98220843260428e-05, "Pretrain/Loss": 2.0939698219299316, "Pretrain/Loss (Raw)": 2.2839407920837402, "Pretrain/Step": 1275, "Pretrain/Step Time": 8.433154305443168} +{"Pretrain/Learning Rate": 4.982157840816335e-05, "Pretrain/Loss": 2.0932765007019043, "Pretrain/Loss (Raw)": 1.9113657474517822, "Pretrain/Step": 1276, "Pretrain/Step Time": 8.435902088880539} +{"Pretrain/Learning Rate": 4.9821071774571187e-05, "Pretrain/Loss": 2.0956552028656006, "Pretrain/Loss (Raw)": 2.266535997390747, "Pretrain/Step": 1277, "Pretrain/Step Time": 8.434189639985561} +{"Pretrain/Learning Rate": 4.982056442528092e-05, "Pretrain/Loss": 2.095500946044922, "Pretrain/Loss (Raw)": 2.043515205383301, "Pretrain/Step": 1278, "Pretrain/Step Time": 8.42838509939611} +{"Pretrain/Learning Rate": 4.9820056360307176e-05, "Pretrain/Loss": 2.096127986907959, "Pretrain/Loss (Raw)": 2.062279224395752, "Pretrain/Step": 1279, "Pretrain/Step Time": 8.429363071918488} +{"Pretrain/Learning Rate": 4.981954757966461e-05, "Pretrain/Loss": 2.0993947982788086, "Pretrain/Loss (Raw)": 2.2227911949157715, "Pretrain/Step": 1280, "Pretrain/Step Time": 8.432221569120884} +{"Pretrain/Learning Rate": 4.981903808336787e-05, "Pretrain/Loss": 2.0977067947387695, "Pretrain/Loss (Raw)": 2.1247124671936035, "Pretrain/Step": 1281, "Pretrain/Step Time": 8.426482059061527} +{"Pretrain/Learning Rate": 4.9818527871431675e-05, "Pretrain/Loss": 2.095808506011963, "Pretrain/Loss (Raw)": 1.984899878501892, "Pretrain/Step": 1282, "Pretrain/Step Time": 8.42952237650752} +{"Pretrain/Learning Rate": 4.981801694387072e-05, "Pretrain/Loss": 2.0953097343444824, "Pretrain/Loss (Raw)": 2.043121337890625, "Pretrain/Step": 1283, "Pretrain/Step Time": 8.43023395165801} +{"Pretrain/Learning Rate": 4.981750530069975e-05, "Pretrain/Loss": 2.0950348377227783, "Pretrain/Loss (Raw)": 2.165489435195923, "Pretrain/Step": 1284, "Pretrain/Step Time": 8.424058863893151} +{"Pretrain/Learning Rate": 4.98169929419335e-05, "Pretrain/Loss": 2.093113899230957, "Pretrain/Loss (Raw)": 2.03346848487854, "Pretrain/Step": 1285, "Pretrain/Step Time": 8.424112293869257} +{"Pretrain/Learning Rate": 4.981647986758676e-05, "Pretrain/Loss": 2.093663454055786, "Pretrain/Loss (Raw)": 2.25162672996521, "Pretrain/Step": 1286, "Pretrain/Step Time": 8.421842865645885} +{"Pretrain/Learning Rate": 4.9815966077674316e-05, "Pretrain/Loss": 2.0942835807800293, "Pretrain/Loss (Raw)": 2.126596689224243, "Pretrain/Step": 1287, "Pretrain/Step Time": 8.42077718488872} +{"Pretrain/Learning Rate": 4.9815451572210983e-05, "Pretrain/Loss": 2.0924482345581055, "Pretrain/Loss (Raw)": 1.9574986696243286, "Pretrain/Step": 1288, "Pretrain/Step Time": 8.424325095489621} +{"Pretrain/Learning Rate": 4.9814936351211595e-05, "Pretrain/Loss": 2.096036434173584, "Pretrain/Loss (Raw)": 2.3242666721343994, "Pretrain/Step": 1289, "Pretrain/Step Time": 8.421835279092193} +{"Pretrain/Learning Rate": 4.981442041469101e-05, "Pretrain/Loss": 2.0964012145996094, "Pretrain/Loss (Raw)": 2.164302349090576, "Pretrain/Step": 1290, "Pretrain/Step Time": 8.423057673498988} +{"Pretrain/Learning Rate": 4.981390376266411e-05, "Pretrain/Loss": 2.096045732498169, "Pretrain/Loss (Raw)": 2.0706727504730225, "Pretrain/Step": 1291, "Pretrain/Step Time": 8.425549272447824} +{"Pretrain/Learning Rate": 4.981338639514579e-05, "Pretrain/Loss": 2.0991945266723633, "Pretrain/Loss (Raw)": 2.372514486312866, "Pretrain/Step": 1292, "Pretrain/Step Time": 8.423494843766093} +{"Pretrain/Learning Rate": 4.981286831215096e-05, "Pretrain/Loss": 2.101353168487549, "Pretrain/Loss (Raw)": 2.307511329650879, "Pretrain/Step": 1293, "Pretrain/Step Time": 8.424211511388421} +{"Pretrain/Learning Rate": 4.981234951369457e-05, "Pretrain/Loss": 2.1001815795898438, "Pretrain/Loss (Raw)": 2.151470899581909, "Pretrain/Step": 1294, "Pretrain/Step Time": 8.426613545045257} +{"Pretrain/Learning Rate": 4.981182999979156e-05, "Pretrain/Loss": 2.098942279815674, "Pretrain/Loss (Raw)": 1.9630088806152344, "Pretrain/Step": 1295, "Pretrain/Step Time": 8.42815044336021} +{"Pretrain/Learning Rate": 4.981130977045694e-05, "Pretrain/Loss": 2.0996389389038086, "Pretrain/Loss (Raw)": 2.19789981842041, "Pretrain/Step": 1296, "Pretrain/Step Time": 8.422857193276286} +{"Pretrain/Learning Rate": 4.9810788825705675e-05, "Pretrain/Loss": 2.1007347106933594, "Pretrain/Loss (Raw)": 2.298166513442993, "Pretrain/Step": 1297, "Pretrain/Step Time": 8.424098052084446} +{"Pretrain/Learning Rate": 4.981026716555283e-05, "Pretrain/Loss": 2.1004881858825684, "Pretrain/Loss (Raw)": 2.2871158123016357, "Pretrain/Step": 1298, "Pretrain/Step Time": 8.42326612956822} +{"Pretrain/Learning Rate": 4.98097447900134e-05, "Pretrain/Loss": 2.1007819175720215, "Pretrain/Loss (Raw)": 2.087665319442749, "Pretrain/Step": 1299, "Pretrain/Step Time": 8.424146626144648} +{"Pretrain/Learning Rate": 4.980922169910247e-05, "Pretrain/Loss": 2.1018807888031006, "Pretrain/Loss (Raw)": 2.325334072113037, "Pretrain/Step": 1300, "Pretrain/Step Time": 8.421527612954378} +{"Pretrain/Learning Rate": 4.980869789283513e-05, "Pretrain/Loss": 2.1032028198242188, "Pretrain/Loss (Raw)": 2.0579848289489746, "Pretrain/Step": 1301, "Pretrain/Step Time": 8.420358169823885} +{"Pretrain/Learning Rate": 4.9808173371226475e-05, "Pretrain/Loss": 2.0999197959899902, "Pretrain/Loss (Raw)": 1.8791110515594482, "Pretrain/Step": 1302, "Pretrain/Step Time": 8.41280478052795} +{"Pretrain/Learning Rate": 4.980764813429163e-05, "Pretrain/Loss": 2.0991785526275635, "Pretrain/Loss (Raw)": 2.0861823558807373, "Pretrain/Step": 1303, "Pretrain/Step Time": 8.418077053502202} +{"Pretrain/Learning Rate": 4.980712218204574e-05, "Pretrain/Loss": 2.100038528442383, "Pretrain/Loss (Raw)": 2.1660001277923584, "Pretrain/Step": 1304, "Pretrain/Step Time": 8.419151354581118} +{"Pretrain/Learning Rate": 4.9806595514503965e-05, "Pretrain/Loss": 2.0993294715881348, "Pretrain/Loss (Raw)": 2.15620493888855, "Pretrain/Step": 1305, "Pretrain/Step Time": 8.421219045296311} +{"Pretrain/Learning Rate": 4.9806068131681494e-05, "Pretrain/Loss": 2.098851203918457, "Pretrain/Loss (Raw)": 1.9801876544952393, "Pretrain/Step": 1306, "Pretrain/Step Time": 8.421571968123317} +{"Pretrain/Learning Rate": 4.980554003359354e-05, "Pretrain/Loss": 2.0963408946990967, "Pretrain/Loss (Raw)": 1.8667110204696655, "Pretrain/Step": 1307, "Pretrain/Step Time": 8.423072190955281} +{"Pretrain/Learning Rate": 4.9805011220255324e-05, "Pretrain/Loss": 2.0976333618164062, "Pretrain/Loss (Raw)": 2.246565818786621, "Pretrain/Step": 1308, "Pretrain/Step Time": 8.421429274603724} +{"Pretrain/Learning Rate": 4.980448169168209e-05, "Pretrain/Loss": 2.0993967056274414, "Pretrain/Loss (Raw)": 2.145447015762329, "Pretrain/Step": 1309, "Pretrain/Step Time": 8.42109976708889} +{"Pretrain/Learning Rate": 4.980395144788913e-05, "Pretrain/Loss": 2.100221872329712, "Pretrain/Loss (Raw)": 2.2581443786621094, "Pretrain/Step": 1310, "Pretrain/Step Time": 8.425066221505404} +{"Pretrain/Learning Rate": 4.9803420488891696e-05, "Pretrain/Loss": 2.100353717803955, "Pretrain/Loss (Raw)": 2.260549545288086, "Pretrain/Step": 1311, "Pretrain/Step Time": 8.42524142190814} +{"Pretrain/Learning Rate": 4.9802888814705126e-05, "Pretrain/Loss": 2.1002464294433594, "Pretrain/Loss (Raw)": 2.0319347381591797, "Pretrain/Step": 1312, "Pretrain/Step Time": 8.427459644153714} +{"Pretrain/Learning Rate": 4.9802356425344746e-05, "Pretrain/Loss": 2.099669933319092, "Pretrain/Loss (Raw)": 2.0455875396728516, "Pretrain/Step": 1313, "Pretrain/Step Time": 8.422741424292326} +{"Pretrain/Learning Rate": 4.9801823320825897e-05, "Pretrain/Loss": 2.101254940032959, "Pretrain/Loss (Raw)": 2.0412683486938477, "Pretrain/Step": 1314, "Pretrain/Step Time": 8.418423287570477} +{"Pretrain/Learning Rate": 4.980128950116396e-05, "Pretrain/Loss": 2.101386547088623, "Pretrain/Loss (Raw)": 2.057579517364502, "Pretrain/Step": 1315, "Pretrain/Step Time": 8.42127594165504} +{"Pretrain/Learning Rate": 4.980075496637432e-05, "Pretrain/Loss": 2.1017942428588867, "Pretrain/Loss (Raw)": 2.0877835750579834, "Pretrain/Step": 1316, "Pretrain/Step Time": 8.418333245441318} +{"Pretrain/Learning Rate": 4.98002197164724e-05, "Pretrain/Loss": 2.102762222290039, "Pretrain/Loss (Raw)": 2.127652168273926, "Pretrain/Step": 1317, "Pretrain/Step Time": 8.419109094887972} +{"Pretrain/Learning Rate": 4.979968375147363e-05, "Pretrain/Loss": 2.102527379989624, "Pretrain/Loss (Raw)": 1.9250375032424927, "Pretrain/Step": 1318, "Pretrain/Step Time": 8.417815808206797} +{"Pretrain/Learning Rate": 4.979914707139345e-05, "Pretrain/Loss": 2.103691577911377, "Pretrain/Loss (Raw)": 2.065483808517456, "Pretrain/Step": 1319, "Pretrain/Step Time": 8.416856344789267} +{"Pretrain/Learning Rate": 4.979860967624735e-05, "Pretrain/Loss": 2.10410737991333, "Pretrain/Loss (Raw)": 2.098344326019287, "Pretrain/Step": 1320, "Pretrain/Step Time": 8.419724589213729} +{"Pretrain/Learning Rate": 4.979807156605082e-05, "Pretrain/Loss": 2.1041741371154785, "Pretrain/Loss (Raw)": 2.172206401824951, "Pretrain/Step": 1321, "Pretrain/Step Time": 8.421912349760532} +{"Pretrain/Learning Rate": 4.9797532740819386e-05, "Pretrain/Loss": 2.1013879776000977, "Pretrain/Loss (Raw)": 1.6141409873962402, "Pretrain/Step": 1322, "Pretrain/Step Time": 8.427860915660858} +{"Pretrain/Learning Rate": 4.979699320056857e-05, "Pretrain/Loss": 2.1029839515686035, "Pretrain/Loss (Raw)": 2.1556570529937744, "Pretrain/Step": 1323, "Pretrain/Step Time": 8.427094398066401} +{"Pretrain/Learning Rate": 4.979645294531394e-05, "Pretrain/Loss": 2.1063005924224854, "Pretrain/Loss (Raw)": 2.4899954795837402, "Pretrain/Step": 1324, "Pretrain/Step Time": 8.431505618616939} +{"Pretrain/Learning Rate": 4.979591197507106e-05, "Pretrain/Loss": 2.1055994033813477, "Pretrain/Loss (Raw)": 2.057128429412842, "Pretrain/Step": 1325, "Pretrain/Step Time": 8.433490291237831} +{"Pretrain/Learning Rate": 4.9795370289855554e-05, "Pretrain/Loss": 2.1062450408935547, "Pretrain/Loss (Raw)": 1.9281164407730103, "Pretrain/Step": 1326, "Pretrain/Step Time": 8.431964004412293} +{"Pretrain/Learning Rate": 4.9794827889683015e-05, "Pretrain/Loss": 2.108672618865967, "Pretrain/Loss (Raw)": 2.52156400680542, "Pretrain/Step": 1327, "Pretrain/Step Time": 8.427725553512573} +{"Pretrain/Learning Rate": 4.97942847745691e-05, "Pretrain/Loss": 2.1093010902404785, "Pretrain/Loss (Raw)": 2.049879312515259, "Pretrain/Step": 1328, "Pretrain/Step Time": 8.429502058774233} +{"Pretrain/Learning Rate": 4.9793740944529455e-05, "Pretrain/Loss": 2.1073172092437744, "Pretrain/Loss (Raw)": 2.007096290588379, "Pretrain/Step": 1329, "Pretrain/Step Time": 8.427055491134524} +{"Pretrain/Learning Rate": 4.979319639957977e-05, "Pretrain/Loss": 2.1092820167541504, "Pretrain/Loss (Raw)": 2.17501163482666, "Pretrain/Step": 1330, "Pretrain/Step Time": 8.428236439824104} +{"Pretrain/Learning Rate": 4.9792651139735745e-05, "Pretrain/Loss": 2.109050750732422, "Pretrain/Loss (Raw)": 2.183927536010742, "Pretrain/Step": 1331, "Pretrain/Step Time": 8.425407189875841} +{"Pretrain/Learning Rate": 4.9792105165013105e-05, "Pretrain/Loss": 2.1073832511901855, "Pretrain/Loss (Raw)": 1.9769107103347778, "Pretrain/Step": 1332, "Pretrain/Step Time": 8.42927892319858} +{"Pretrain/Learning Rate": 4.9791558475427584e-05, "Pretrain/Loss": 2.109344244003296, "Pretrain/Loss (Raw)": 2.1456589698791504, "Pretrain/Step": 1333, "Pretrain/Step Time": 8.425026746466756} +{"Pretrain/Learning Rate": 4.9791011070994956e-05, "Pretrain/Loss": 2.110790252685547, "Pretrain/Loss (Raw)": 2.301013469696045, "Pretrain/Step": 1334, "Pretrain/Step Time": 8.42330039665103} +{"Pretrain/Learning Rate": 4.9790462951730997e-05, "Pretrain/Loss": 2.112518310546875, "Pretrain/Loss (Raw)": 2.286017656326294, "Pretrain/Step": 1335, "Pretrain/Step Time": 8.422134436666965} +{"Pretrain/Learning Rate": 4.978991411765152e-05, "Pretrain/Loss": 2.1116714477539062, "Pretrain/Loss (Raw)": 2.0216007232666016, "Pretrain/Step": 1336, "Pretrain/Step Time": 8.42050639912486} +{"Pretrain/Learning Rate": 4.978936456877235e-05, "Pretrain/Loss": 2.108999490737915, "Pretrain/Loss (Raw)": 2.0320565700531006, "Pretrain/Step": 1337, "Pretrain/Step Time": 8.422781851142645} +{"Pretrain/Learning Rate": 4.978881430510931e-05, "Pretrain/Loss": 2.1080145835876465, "Pretrain/Loss (Raw)": 2.156625747680664, "Pretrain/Step": 1338, "Pretrain/Step Time": 8.42249270528555} +{"Pretrain/Learning Rate": 4.97882633266783e-05, "Pretrain/Loss": 2.1110548973083496, "Pretrain/Loss (Raw)": 2.5726473331451416, "Pretrain/Step": 1339, "Pretrain/Step Time": 8.422617219388485} +{"Pretrain/Learning Rate": 4.9787711633495183e-05, "Pretrain/Loss": 2.1109278202056885, "Pretrain/Loss (Raw)": 2.1434056758880615, "Pretrain/Step": 1340, "Pretrain/Step Time": 8.423945249989629} +{"Pretrain/Learning Rate": 4.9787159225575876e-05, "Pretrain/Loss": 2.111598014831543, "Pretrain/Loss (Raw)": 2.244611978530884, "Pretrain/Step": 1341, "Pretrain/Step Time": 8.426029516384006} +{"Pretrain/Learning Rate": 4.9786606102936314e-05, "Pretrain/Loss": 2.1101388931274414, "Pretrain/Loss (Raw)": 2.172283411026001, "Pretrain/Step": 1342, "Pretrain/Step Time": 8.423052679747343} +{"Pretrain/Learning Rate": 4.978605226559243e-05, "Pretrain/Loss": 2.1111230850219727, "Pretrain/Loss (Raw)": 2.263951063156128, "Pretrain/Step": 1343, "Pretrain/Step Time": 8.421088695526123} +{"Pretrain/Learning Rate": 4.9785497713560204e-05, "Pretrain/Loss": 2.110128402709961, "Pretrain/Loss (Raw)": 1.875031590461731, "Pretrain/Step": 1344, "Pretrain/Step Time": 8.423466021195054} +{"Pretrain/Learning Rate": 4.978494244685563e-05, "Pretrain/Loss": 2.1091504096984863, "Pretrain/Loss (Raw)": 2.190904140472412, "Pretrain/Step": 1345, "Pretrain/Step Time": 8.422252869233489} +{"Pretrain/Learning Rate": 4.97843864654947e-05, "Pretrain/Loss": 2.1102309226989746, "Pretrain/Loss (Raw)": 2.257422685623169, "Pretrain/Step": 1346, "Pretrain/Step Time": 8.42857675999403} +{"Pretrain/Learning Rate": 4.978382976949347e-05, "Pretrain/Loss": 2.108673334121704, "Pretrain/Loss (Raw)": 1.8363287448883057, "Pretrain/Step": 1347, "Pretrain/Step Time": 8.42639396339655} +{"Pretrain/Learning Rate": 4.978327235886798e-05, "Pretrain/Loss": 2.107612133026123, "Pretrain/Loss (Raw)": 2.086207151412964, "Pretrain/Step": 1348, "Pretrain/Step Time": 8.425819288939238} +{"Pretrain/Learning Rate": 4.97827142336343e-05, "Pretrain/Loss": 2.106110095977783, "Pretrain/Loss (Raw)": 1.9602538347244263, "Pretrain/Step": 1349, "Pretrain/Step Time": 8.424920355901122} +{"Pretrain/Learning Rate": 4.9782155393808524e-05, "Pretrain/Loss": 2.109706401824951, "Pretrain/Loss (Raw)": 2.2863237857818604, "Pretrain/Step": 1350, "Pretrain/Step Time": 8.423081863671541} +{"Pretrain/Learning Rate": 4.978159583940677e-05, "Pretrain/Loss": 2.109160900115967, "Pretrain/Loss (Raw)": 2.0009191036224365, "Pretrain/Step": 1351, "Pretrain/Step Time": 8.421020464971662} +{"Pretrain/Learning Rate": 4.9781035570445166e-05, "Pretrain/Loss": 2.109403133392334, "Pretrain/Loss (Raw)": 2.2503347396850586, "Pretrain/Step": 1352, "Pretrain/Step Time": 8.423424012959003} +{"Pretrain/Learning Rate": 4.978047458693987e-05, "Pretrain/Loss": 2.110912561416626, "Pretrain/Loss (Raw)": 2.0491878986358643, "Pretrain/Step": 1353, "Pretrain/Step Time": 8.424074435606599} +{"Pretrain/Learning Rate": 4.9779912888907065e-05, "Pretrain/Loss": 2.110278606414795, "Pretrain/Loss (Raw)": 2.150688886642456, "Pretrain/Step": 1354, "Pretrain/Step Time": 8.424297841265798} +{"Pretrain/Learning Rate": 4.977935047636294e-05, "Pretrain/Loss": 2.110950469970703, "Pretrain/Loss (Raw)": 2.1374847888946533, "Pretrain/Step": 1355, "Pretrain/Step Time": 8.424762275069952} +{"Pretrain/Learning Rate": 4.977878734932371e-05, "Pretrain/Loss": 2.111786365509033, "Pretrain/Loss (Raw)": 2.2500650882720947, "Pretrain/Step": 1356, "Pretrain/Step Time": 8.426251044496894} +{"Pretrain/Learning Rate": 4.977822350780561e-05, "Pretrain/Loss": 2.114417552947998, "Pretrain/Loss (Raw)": 2.0801124572753906, "Pretrain/Step": 1357, "Pretrain/Step Time": 8.42962284013629} +{"Pretrain/Learning Rate": 4.9777658951824904e-05, "Pretrain/Loss": 2.1145970821380615, "Pretrain/Loss (Raw)": 2.075331211090088, "Pretrain/Step": 1358, "Pretrain/Step Time": 8.433145733550191} +{"Pretrain/Learning Rate": 4.9777093681397866e-05, "Pretrain/Loss": 2.116314649581909, "Pretrain/Loss (Raw)": 2.302910804748535, "Pretrain/Step": 1359, "Pretrain/Step Time": 8.433925371617079} +{"Pretrain/Learning Rate": 4.977652769654081e-05, "Pretrain/Loss": 2.1187667846679688, "Pretrain/Loss (Raw)": 2.23587703704834, "Pretrain/Step": 1360, "Pretrain/Step Time": 8.438177207484841} +{"Pretrain/Learning Rate": 4.977596099727004e-05, "Pretrain/Loss": 2.1201858520507812, "Pretrain/Loss (Raw)": 2.280052423477173, "Pretrain/Step": 1361, "Pretrain/Step Time": 8.436600172892213} +{"Pretrain/Learning Rate": 4.977539358360189e-05, "Pretrain/Loss": 2.120577335357666, "Pretrain/Loss (Raw)": 2.0667879581451416, "Pretrain/Step": 1362, "Pretrain/Step Time": 8.435613874346018} +{"Pretrain/Learning Rate": 4.977482545555275e-05, "Pretrain/Loss": 2.1194872856140137, "Pretrain/Loss (Raw)": 2.120598077774048, "Pretrain/Step": 1363, "Pretrain/Step Time": 8.439962172880769} +{"Pretrain/Learning Rate": 4.977425661313897e-05, "Pretrain/Loss": 2.1206326484680176, "Pretrain/Loss (Raw)": 2.112779378890991, "Pretrain/Step": 1364, "Pretrain/Step Time": 8.430447019636631} +{"Pretrain/Learning Rate": 4.977368705637697e-05, "Pretrain/Loss": 2.119337558746338, "Pretrain/Loss (Raw)": 2.0836493968963623, "Pretrain/Step": 1365, "Pretrain/Step Time": 8.429180240258574} +{"Pretrain/Learning Rate": 4.977311678528317e-05, "Pretrain/Loss": 2.1182947158813477, "Pretrain/Loss (Raw)": 2.087648868560791, "Pretrain/Step": 1366, "Pretrain/Step Time": 8.43018158338964} +{"Pretrain/Learning Rate": 4.9772545799874e-05, "Pretrain/Loss": 2.1188888549804688, "Pretrain/Loss (Raw)": 2.3060100078582764, "Pretrain/Step": 1367, "Pretrain/Step Time": 8.430607384070754} +{"Pretrain/Learning Rate": 4.977197410016595e-05, "Pretrain/Loss": 2.120129108428955, "Pretrain/Loss (Raw)": 2.1674296855926514, "Pretrain/Step": 1368, "Pretrain/Step Time": 8.428042320534587} +{"Pretrain/Learning Rate": 4.977140168617548e-05, "Pretrain/Loss": 2.121164321899414, "Pretrain/Loss (Raw)": 2.2545223236083984, "Pretrain/Step": 1369, "Pretrain/Step Time": 8.426663564518094} +{"Pretrain/Learning Rate": 4.9770828557919106e-05, "Pretrain/Loss": 2.1225426197052, "Pretrain/Loss (Raw)": 2.1495680809020996, "Pretrain/Step": 1370, "Pretrain/Step Time": 8.425559038296342} +{"Pretrain/Learning Rate": 4.977025471541336e-05, "Pretrain/Loss": 2.12235426902771, "Pretrain/Loss (Raw)": 2.094021797180176, "Pretrain/Step": 1371, "Pretrain/Step Time": 8.425046544522047} +{"Pretrain/Learning Rate": 4.9769680158674774e-05, "Pretrain/Loss": 2.121947765350342, "Pretrain/Loss (Raw)": 2.130373477935791, "Pretrain/Step": 1372, "Pretrain/Step Time": 8.424342572689056} +{"Pretrain/Learning Rate": 4.9769104887719926e-05, "Pretrain/Loss": 2.122835874557495, "Pretrain/Loss (Raw)": 2.023106813430786, "Pretrain/Step": 1373, "Pretrain/Step Time": 8.428469760343432} +{"Pretrain/Learning Rate": 4.9768528902565396e-05, "Pretrain/Loss": 2.1209919452667236, "Pretrain/Loss (Raw)": 1.8203060626983643, "Pretrain/Step": 1374, "Pretrain/Step Time": 8.426237555220723} +{"Pretrain/Learning Rate": 4.97679522032278e-05, "Pretrain/Loss": 2.118582248687744, "Pretrain/Loss (Raw)": 1.876918077468872, "Pretrain/Step": 1375, "Pretrain/Step Time": 8.429296251386404} +{"Pretrain/Learning Rate": 4.976737478972376e-05, "Pretrain/Loss": 2.1169044971466064, "Pretrain/Loss (Raw)": 2.108041524887085, "Pretrain/Step": 1376, "Pretrain/Step Time": 8.422068359330297} +{"Pretrain/Learning Rate": 4.976679666206993e-05, "Pretrain/Loss": 2.1184277534484863, "Pretrain/Loss (Raw)": 2.1493453979492188, "Pretrain/Step": 1377, "Pretrain/Step Time": 8.425764316692948} +{"Pretrain/Learning Rate": 4.9766217820282974e-05, "Pretrain/Loss": 2.119779586791992, "Pretrain/Loss (Raw)": 2.2402312755584717, "Pretrain/Step": 1378, "Pretrain/Step Time": 8.424085447564721} +{"Pretrain/Learning Rate": 4.976563826437959e-05, "Pretrain/Loss": 2.118863582611084, "Pretrain/Loss (Raw)": 1.9693076610565186, "Pretrain/Step": 1379, "Pretrain/Step Time": 8.428598836064339} +{"Pretrain/Learning Rate": 4.976505799437648e-05, "Pretrain/Loss": 2.118096351623535, "Pretrain/Loss (Raw)": 1.9638937711715698, "Pretrain/Step": 1380, "Pretrain/Step Time": 8.428086668252945} +{"Pretrain/Learning Rate": 4.9764477010290384e-05, "Pretrain/Loss": 2.1215949058532715, "Pretrain/Loss (Raw)": 2.491079807281494, "Pretrain/Step": 1381, "Pretrain/Step Time": 8.4278326574713} +{"Pretrain/Learning Rate": 4.976389531213805e-05, "Pretrain/Loss": 2.120316505432129, "Pretrain/Loss (Raw)": 1.7960128784179688, "Pretrain/Step": 1382, "Pretrain/Step Time": 8.425235003232956} +{"Pretrain/Learning Rate": 4.976331289993625e-05, "Pretrain/Loss": 2.121480941772461, "Pretrain/Loss (Raw)": 2.2412657737731934, "Pretrain/Step": 1383, "Pretrain/Step Time": 8.423858422785997} +{"Pretrain/Learning Rate": 4.976272977370179e-05, "Pretrain/Loss": 2.122520685195923, "Pretrain/Loss (Raw)": 2.2336714267730713, "Pretrain/Step": 1384, "Pretrain/Step Time": 8.422972831875086} +{"Pretrain/Learning Rate": 4.976214593345146e-05, "Pretrain/Loss": 2.1265392303466797, "Pretrain/Loss (Raw)": 2.2830207347869873, "Pretrain/Step": 1385, "Pretrain/Step Time": 8.417728574946523} +{"Pretrain/Learning Rate": 4.9761561379202124e-05, "Pretrain/Loss": 2.12990665435791, "Pretrain/Loss (Raw)": 2.5162436962127686, "Pretrain/Step": 1386, "Pretrain/Step Time": 8.417177207767963} +{"Pretrain/Learning Rate": 4.976097611097061e-05, "Pretrain/Loss": 2.131707191467285, "Pretrain/Loss (Raw)": 2.0415520668029785, "Pretrain/Step": 1387, "Pretrain/Step Time": 8.421226512640715} +{"Pretrain/Learning Rate": 4.976039012877381e-05, "Pretrain/Loss": 2.1302690505981445, "Pretrain/Loss (Raw)": 1.9106184244155884, "Pretrain/Step": 1388, "Pretrain/Step Time": 8.42259780690074} +{"Pretrain/Learning Rate": 4.97598034326286e-05, "Pretrain/Loss": 2.1306352615356445, "Pretrain/Loss (Raw)": 2.17392897605896, "Pretrain/Step": 1389, "Pretrain/Step Time": 8.42340406961739} +{"Pretrain/Learning Rate": 4.9759216022551934e-05, "Pretrain/Loss": 2.127931833267212, "Pretrain/Loss (Raw)": 1.97238028049469, "Pretrain/Step": 1390, "Pretrain/Step Time": 8.425971675664186} +{"Pretrain/Learning Rate": 4.9758627898560715e-05, "Pretrain/Loss": 2.1286230087280273, "Pretrain/Loss (Raw)": 2.2025434970855713, "Pretrain/Step": 1391, "Pretrain/Step Time": 8.425421113148332} +{"Pretrain/Learning Rate": 4.975803906067193e-05, "Pretrain/Loss": 2.129495620727539, "Pretrain/Loss (Raw)": 2.1881208419799805, "Pretrain/Step": 1392, "Pretrain/Step Time": 8.42339038476348} +{"Pretrain/Learning Rate": 4.975744950890252e-05, "Pretrain/Loss": 2.1290907859802246, "Pretrain/Loss (Raw)": 2.127837896347046, "Pretrain/Step": 1393, "Pretrain/Step Time": 8.422545835375786} +{"Pretrain/Learning Rate": 4.975685924326952e-05, "Pretrain/Loss": 2.1312131881713867, "Pretrain/Loss (Raw)": 2.246185779571533, "Pretrain/Step": 1394, "Pretrain/Step Time": 8.423568814992905} +{"Pretrain/Learning Rate": 4.9756268263789935e-05, "Pretrain/Loss": 2.1316418647766113, "Pretrain/Loss (Raw)": 1.9660745859146118, "Pretrain/Step": 1395, "Pretrain/Step Time": 8.434529360383749} +{"Pretrain/Learning Rate": 4.97556765704808e-05, "Pretrain/Loss": 2.1349363327026367, "Pretrain/Loss (Raw)": 2.6292595863342285, "Pretrain/Step": 1396, "Pretrain/Step Time": 8.431436194106936} +{"Pretrain/Learning Rate": 4.975508416335919e-05, "Pretrain/Loss": 2.135676145553589, "Pretrain/Loss (Raw)": 2.27480411529541, "Pretrain/Step": 1397, "Pretrain/Step Time": 8.434073695912957} +{"Pretrain/Learning Rate": 4.975449104244217e-05, "Pretrain/Loss": 2.1350345611572266, "Pretrain/Loss (Raw)": 2.001594305038452, "Pretrain/Step": 1398, "Pretrain/Step Time": 8.434661777690053} +{"Pretrain/Learning Rate": 4.975389720774687e-05, "Pretrain/Loss": 2.1326258182525635, "Pretrain/Loss (Raw)": 2.071218967437744, "Pretrain/Step": 1399, "Pretrain/Step Time": 8.435450207442045} +{"Pretrain/Learning Rate": 4.975330265929038e-05, "Pretrain/Loss": 2.134040355682373, "Pretrain/Loss (Raw)": 2.234891891479492, "Pretrain/Step": 1400, "Pretrain/Step Time": 8.428310574963689} +{"Pretrain/Learning Rate": 4.975270739708986e-05, "Pretrain/Loss": 2.1322243213653564, "Pretrain/Loss (Raw)": 2.035313844680786, "Pretrain/Step": 1401, "Pretrain/Step Time": 8.43125137500465} +{"Pretrain/Learning Rate": 4.975211142116247e-05, "Pretrain/Loss": 2.132399559020996, "Pretrain/Loss (Raw)": 1.9965250492095947, "Pretrain/Step": 1402, "Pretrain/Step Time": 8.42909804545343} +{"Pretrain/Learning Rate": 4.97515147315254e-05, "Pretrain/Loss": 2.1308064460754395, "Pretrain/Loss (Raw)": 2.079996109008789, "Pretrain/Step": 1403, "Pretrain/Step Time": 8.434672677889466} +{"Pretrain/Learning Rate": 4.975091732819585e-05, "Pretrain/Loss": 2.1327552795410156, "Pretrain/Loss (Raw)": 2.1608567237854004, "Pretrain/Step": 1404, "Pretrain/Step Time": 8.431181589141488} +{"Pretrain/Learning Rate": 4.9750319211191046e-05, "Pretrain/Loss": 2.1309423446655273, "Pretrain/Loss (Raw)": 2.034449338912964, "Pretrain/Step": 1405, "Pretrain/Step Time": 8.432496080175042} +{"Pretrain/Learning Rate": 4.9749720380528234e-05, "Pretrain/Loss": 2.131897449493408, "Pretrain/Loss (Raw)": 2.1657776832580566, "Pretrain/Step": 1406, "Pretrain/Step Time": 8.436122229322791} +{"Pretrain/Learning Rate": 4.974912083622469e-05, "Pretrain/Loss": 2.13149094581604, "Pretrain/Loss (Raw)": 2.0102572441101074, "Pretrain/Step": 1407, "Pretrain/Step Time": 8.433825112879276} +{"Pretrain/Learning Rate": 4.9748520578297685e-05, "Pretrain/Loss": 2.1305127143859863, "Pretrain/Loss (Raw)": 2.09755802154541, "Pretrain/Step": 1408, "Pretrain/Step Time": 8.434086019173265} +{"Pretrain/Learning Rate": 4.9747919606764534e-05, "Pretrain/Loss": 2.130131244659424, "Pretrain/Loss (Raw)": 2.0759098529815674, "Pretrain/Step": 1409, "Pretrain/Step Time": 8.436212169006467} +{"Pretrain/Learning Rate": 4.974731792164258e-05, "Pretrain/Loss": 2.1332931518554688, "Pretrain/Loss (Raw)": 2.389618396759033, "Pretrain/Step": 1410, "Pretrain/Step Time": 8.43332345597446} +{"Pretrain/Learning Rate": 4.974671552294915e-05, "Pretrain/Loss": 2.1333770751953125, "Pretrain/Loss (Raw)": 2.053858757019043, "Pretrain/Step": 1411, "Pretrain/Step Time": 8.436932371929288} +{"Pretrain/Learning Rate": 4.9746112410701625e-05, "Pretrain/Loss": 2.1329569816589355, "Pretrain/Loss (Raw)": 2.1117255687713623, "Pretrain/Step": 1412, "Pretrain/Step Time": 8.443157818168402} +{"Pretrain/Learning Rate": 4.974550858491739e-05, "Pretrain/Loss": 2.1330368518829346, "Pretrain/Loss (Raw)": 2.043684720993042, "Pretrain/Step": 1413, "Pretrain/Step Time": 8.44273497723043} +{"Pretrain/Learning Rate": 4.9744904045613866e-05, "Pretrain/Loss": 2.1319477558135986, "Pretrain/Loss (Raw)": 2.1122050285339355, "Pretrain/Step": 1414, "Pretrain/Step Time": 8.442341014742851} +{"Pretrain/Learning Rate": 4.974429879280847e-05, "Pretrain/Loss": 2.131922721862793, "Pretrain/Loss (Raw)": 2.1234140396118164, "Pretrain/Step": 1415, "Pretrain/Step Time": 8.443703467026353} +{"Pretrain/Learning Rate": 4.974369282651867e-05, "Pretrain/Loss": 2.132587432861328, "Pretrain/Loss (Raw)": 2.042548656463623, "Pretrain/Step": 1416, "Pretrain/Step Time": 8.43621813878417} +{"Pretrain/Learning Rate": 4.974308614676193e-05, "Pretrain/Loss": 2.1311168670654297, "Pretrain/Loss (Raw)": 2.1360373497009277, "Pretrain/Step": 1417, "Pretrain/Step Time": 8.44395374134183} +{"Pretrain/Learning Rate": 4.974247875355574e-05, "Pretrain/Loss": 2.1311376094818115, "Pretrain/Loss (Raw)": 2.166961193084717, "Pretrain/Step": 1418, "Pretrain/Step Time": 8.444828055799007} +{"Pretrain/Learning Rate": 4.9741870646917616e-05, "Pretrain/Loss": 2.1319797039031982, "Pretrain/Loss (Raw)": 2.1784827709198, "Pretrain/Step": 1419, "Pretrain/Step Time": 8.442433755844831} +{"Pretrain/Learning Rate": 4.974126182686509e-05, "Pretrain/Loss": 2.1299290657043457, "Pretrain/Loss (Raw)": 2.1100244522094727, "Pretrain/Step": 1420, "Pretrain/Step Time": 8.446344485506415} +{"Pretrain/Learning Rate": 4.9740652293415735e-05, "Pretrain/Loss": 2.1279585361480713, "Pretrain/Loss (Raw)": 2.0552914142608643, "Pretrain/Step": 1421, "Pretrain/Step Time": 8.445304322987795} +{"Pretrain/Learning Rate": 4.97400420465871e-05, "Pretrain/Loss": 2.1295127868652344, "Pretrain/Loss (Raw)": 2.3503921031951904, "Pretrain/Step": 1422, "Pretrain/Step Time": 8.442504098638892} +{"Pretrain/Learning Rate": 4.973943108639679e-05, "Pretrain/Loss": 2.1305060386657715, "Pretrain/Loss (Raw)": 2.090181827545166, "Pretrain/Step": 1423, "Pretrain/Step Time": 8.444811580702662} +{"Pretrain/Learning Rate": 4.9738819412862436e-05, "Pretrain/Loss": 2.129448652267456, "Pretrain/Loss (Raw)": 2.0625290870666504, "Pretrain/Step": 1424, "Pretrain/Step Time": 8.444653514772654} +{"Pretrain/Learning Rate": 4.973820702600166e-05, "Pretrain/Loss": 2.1288139820098877, "Pretrain/Loss (Raw)": 2.2169511318206787, "Pretrain/Step": 1425, "Pretrain/Step Time": 8.442852789536119} +{"Pretrain/Learning Rate": 4.973759392583213e-05, "Pretrain/Loss": 2.1272454261779785, "Pretrain/Loss (Raw)": 2.086308479309082, "Pretrain/Step": 1426, "Pretrain/Step Time": 8.441417841240764} +{"Pretrain/Learning Rate": 4.9736980112371504e-05, "Pretrain/Loss": 2.127230644226074, "Pretrain/Loss (Raw)": 2.0857994556427, "Pretrain/Step": 1427, "Pretrain/Step Time": 8.441501051187515} +{"Pretrain/Learning Rate": 4.97363655856375e-05, "Pretrain/Loss": 2.1258907318115234, "Pretrain/Loss (Raw)": 2.153822660446167, "Pretrain/Step": 1428, "Pretrain/Step Time": 8.446792533621192} +{"Pretrain/Learning Rate": 4.9735750345647836e-05, "Pretrain/Loss": 2.12581729888916, "Pretrain/Loss (Raw)": 2.048574209213257, "Pretrain/Step": 1429, "Pretrain/Step Time": 8.447466596961021} +{"Pretrain/Learning Rate": 4.9735134392420245e-05, "Pretrain/Loss": 2.1287355422973633, "Pretrain/Loss (Raw)": 2.2526280879974365, "Pretrain/Step": 1430, "Pretrain/Step Time": 8.445945439860225} +{"Pretrain/Learning Rate": 4.9734517725972494e-05, "Pretrain/Loss": 2.1309027671813965, "Pretrain/Loss (Raw)": 2.3636043071746826, "Pretrain/Step": 1431, "Pretrain/Step Time": 8.438948983326554} +{"Pretrain/Learning Rate": 4.973390034632236e-05, "Pretrain/Loss": 2.1288959980010986, "Pretrain/Loss (Raw)": 1.9091325998306274, "Pretrain/Step": 1432, "Pretrain/Step Time": 8.441417302936316} +{"Pretrain/Learning Rate": 4.9733282253487645e-05, "Pretrain/Loss": 2.1306777000427246, "Pretrain/Loss (Raw)": 2.384286880493164, "Pretrain/Step": 1433, "Pretrain/Step Time": 8.434907246381044} +{"Pretrain/Learning Rate": 4.973266344748617e-05, "Pretrain/Loss": 2.1305525302886963, "Pretrain/Loss (Raw)": 1.96412992477417, "Pretrain/Step": 1434, "Pretrain/Step Time": 8.43669936619699} +{"Pretrain/Learning Rate": 4.973204392833579e-05, "Pretrain/Loss": 2.1310219764709473, "Pretrain/Loss (Raw)": 1.9268169403076172, "Pretrain/Step": 1435, "Pretrain/Step Time": 8.444693718105555} +{"Pretrain/Learning Rate": 4.9731423696054345e-05, "Pretrain/Loss": 2.128139019012451, "Pretrain/Loss (Raw)": 1.877524733543396, "Pretrain/Step": 1436, "Pretrain/Step Time": 8.441818989813328} +{"Pretrain/Learning Rate": 4.973080275065974e-05, "Pretrain/Loss": 2.1280884742736816, "Pretrain/Loss (Raw)": 2.1390185356140137, "Pretrain/Step": 1437, "Pretrain/Step Time": 8.444098360836506} +{"Pretrain/Learning Rate": 4.973018109216987e-05, "Pretrain/Loss": 2.1257195472717285, "Pretrain/Loss (Raw)": 1.9549027681350708, "Pretrain/Step": 1438, "Pretrain/Step Time": 8.439200600609183} +{"Pretrain/Learning Rate": 4.9729558720602666e-05, "Pretrain/Loss": 2.125411033630371, "Pretrain/Loss (Raw)": 2.221053123474121, "Pretrain/Step": 1439, "Pretrain/Step Time": 8.440508391708136} +{"Pretrain/Learning Rate": 4.972893563597606e-05, "Pretrain/Loss": 2.126112937927246, "Pretrain/Loss (Raw)": 2.1217713356018066, "Pretrain/Step": 1440, "Pretrain/Step Time": 8.441841635853052} +{"Pretrain/Learning Rate": 4.972831183830803e-05, "Pretrain/Loss": 2.1248984336853027, "Pretrain/Loss (Raw)": 1.890142560005188, "Pretrain/Step": 1441, "Pretrain/Step Time": 8.446899056434631} +{"Pretrain/Learning Rate": 4.972768732761657e-05, "Pretrain/Loss": 2.1255273818969727, "Pretrain/Loss (Raw)": 2.121760845184326, "Pretrain/Step": 1442, "Pretrain/Step Time": 8.447694165632129} +{"Pretrain/Learning Rate": 4.972706210391967e-05, "Pretrain/Loss": 2.1258389949798584, "Pretrain/Loss (Raw)": 2.097491979598999, "Pretrain/Step": 1443, "Pretrain/Step Time": 8.446990622207522} +{"Pretrain/Learning Rate": 4.972643616723537e-05, "Pretrain/Loss": 2.1256446838378906, "Pretrain/Loss (Raw)": 2.0628836154937744, "Pretrain/Step": 1444, "Pretrain/Step Time": 8.447367878630757} +{"Pretrain/Learning Rate": 4.972580951758171e-05, "Pretrain/Loss": 2.125354528427124, "Pretrain/Loss (Raw)": 2.0905253887176514, "Pretrain/Step": 1445, "Pretrain/Step Time": 8.448481488972902} +{"Pretrain/Learning Rate": 4.972518215497676e-05, "Pretrain/Loss": 2.1268982887268066, "Pretrain/Loss (Raw)": 2.122645139694214, "Pretrain/Step": 1446, "Pretrain/Step Time": 8.447334883734584} +{"Pretrain/Learning Rate": 4.9724554079438615e-05, "Pretrain/Loss": 2.1265549659729004, "Pretrain/Loss (Raw)": 2.0215585231781006, "Pretrain/Step": 1447, "Pretrain/Step Time": 8.447683053091168} +{"Pretrain/Learning Rate": 4.9723925290985384e-05, "Pretrain/Loss": 2.1269004344940186, "Pretrain/Loss (Raw)": 2.1425578594207764, "Pretrain/Step": 1448, "Pretrain/Step Time": 8.441890772432089} +{"Pretrain/Learning Rate": 4.97232957896352e-05, "Pretrain/Loss": 2.1265368461608887, "Pretrain/Loss (Raw)": 2.12565541267395, "Pretrain/Step": 1449, "Pretrain/Step Time": 8.443881900981069} +{"Pretrain/Learning Rate": 4.97226655754062e-05, "Pretrain/Loss": 2.1324195861816406, "Pretrain/Loss (Raw)": 2.3671183586120605, "Pretrain/Step": 1450, "Pretrain/Step Time": 8.439462579786777} +{"Pretrain/Learning Rate": 4.972203464831658e-05, "Pretrain/Loss": 2.13106107711792, "Pretrain/Loss (Raw)": 1.9818007946014404, "Pretrain/Step": 1451, "Pretrain/Step Time": 8.443462377414107} +{"Pretrain/Learning Rate": 4.972140300838452e-05, "Pretrain/Loss": 2.1284780502319336, "Pretrain/Loss (Raw)": 2.159336566925049, "Pretrain/Step": 1452, "Pretrain/Step Time": 8.438375128433108} +{"Pretrain/Learning Rate": 4.972077065562821e-05, "Pretrain/Loss": 2.128025770187378, "Pretrain/Loss (Raw)": 1.9992412328720093, "Pretrain/Step": 1453, "Pretrain/Step Time": 8.443667678162456} +{"Pretrain/Learning Rate": 4.972013759006593e-05, "Pretrain/Loss": 2.130183219909668, "Pretrain/Loss (Raw)": 2.2042529582977295, "Pretrain/Step": 1454, "Pretrain/Step Time": 8.44368682987988} +{"Pretrain/Learning Rate": 4.9719503811715894e-05, "Pretrain/Loss": 2.127444267272949, "Pretrain/Loss (Raw)": 2.1710009574890137, "Pretrain/Step": 1455, "Pretrain/Step Time": 8.443001620471478} +{"Pretrain/Learning Rate": 4.97188693205964e-05, "Pretrain/Loss": 2.1292476654052734, "Pretrain/Loss (Raw)": 2.280719041824341, "Pretrain/Step": 1456, "Pretrain/Step Time": 8.444364380091429} +{"Pretrain/Learning Rate": 4.971823411672573e-05, "Pretrain/Loss": 2.1304924488067627, "Pretrain/Loss (Raw)": 2.1664011478424072, "Pretrain/Step": 1457, "Pretrain/Step Time": 8.44483644515276} +{"Pretrain/Learning Rate": 4.971759820012221e-05, "Pretrain/Loss": 2.128910779953003, "Pretrain/Loss (Raw)": 1.9725828170776367, "Pretrain/Step": 1458, "Pretrain/Step Time": 8.444354124367237} +{"Pretrain/Learning Rate": 4.971696157080416e-05, "Pretrain/Loss": 2.1277642250061035, "Pretrain/Loss (Raw)": 2.037184953689575, "Pretrain/Step": 1459, "Pretrain/Step Time": 8.449454864487052} +{"Pretrain/Learning Rate": 4.971632422878996e-05, "Pretrain/Loss": 2.1295995712280273, "Pretrain/Loss (Raw)": 2.2117981910705566, "Pretrain/Step": 1460, "Pretrain/Step Time": 8.444710960611701} +{"Pretrain/Learning Rate": 4.9715686174097964e-05, "Pretrain/Loss": 2.1302099227905273, "Pretrain/Loss (Raw)": 2.223790168762207, "Pretrain/Step": 1461, "Pretrain/Step Time": 8.45037410594523} +{"Pretrain/Learning Rate": 4.9715047406746586e-05, "Pretrain/Loss": 2.1301193237304688, "Pretrain/Loss (Raw)": 2.2894163131713867, "Pretrain/Step": 1462, "Pretrain/Step Time": 8.447574593126774} +{"Pretrain/Learning Rate": 4.971440792675424e-05, "Pretrain/Loss": 2.1285014152526855, "Pretrain/Loss (Raw)": 2.078930377960205, "Pretrain/Step": 1463, "Pretrain/Step Time": 8.448946891352534} +{"Pretrain/Learning Rate": 4.9713767734139354e-05, "Pretrain/Loss": 2.1340551376342773, "Pretrain/Loss (Raw)": 2.7324681282043457, "Pretrain/Step": 1464, "Pretrain/Step Time": 8.454206056892872} +{"Pretrain/Learning Rate": 4.971312682892041e-05, "Pretrain/Loss": 2.1328978538513184, "Pretrain/Loss (Raw)": 1.883941411972046, "Pretrain/Step": 1465, "Pretrain/Step Time": 8.451021837070584} +{"Pretrain/Learning Rate": 4.971248521111587e-05, "Pretrain/Loss": 2.136870861053467, "Pretrain/Loss (Raw)": 2.665163993835449, "Pretrain/Step": 1466, "Pretrain/Step Time": 8.450180273503065} +{"Pretrain/Learning Rate": 4.9711842880744244e-05, "Pretrain/Loss": 2.1346795558929443, "Pretrain/Loss (Raw)": 2.2921535968780518, "Pretrain/Step": 1467, "Pretrain/Step Time": 8.453431319445372} +{"Pretrain/Learning Rate": 4.971119983782404e-05, "Pretrain/Loss": 2.1334078311920166, "Pretrain/Loss (Raw)": 1.9806249141693115, "Pretrain/Step": 1468, "Pretrain/Step Time": 8.450739994645119} +{"Pretrain/Learning Rate": 4.9710556082373816e-05, "Pretrain/Loss": 2.13247013092041, "Pretrain/Loss (Raw)": 2.1246092319488525, "Pretrain/Step": 1469, "Pretrain/Step Time": 8.451805852353573} +{"Pretrain/Learning Rate": 4.970991161441213e-05, "Pretrain/Loss": 2.1315927505493164, "Pretrain/Loss (Raw)": 2.059967279434204, "Pretrain/Step": 1470, "Pretrain/Step Time": 8.453194446861744} +{"Pretrain/Learning Rate": 4.970926643395756e-05, "Pretrain/Loss": 2.1319947242736816, "Pretrain/Loss (Raw)": 2.3153834342956543, "Pretrain/Step": 1471, "Pretrain/Step Time": 8.454151513054967} +{"Pretrain/Learning Rate": 4.9708620541028704e-05, "Pretrain/Loss": 2.1340293884277344, "Pretrain/Loss (Raw)": 2.1354923248291016, "Pretrain/Step": 1472, "Pretrain/Step Time": 8.4530612770468} +{"Pretrain/Learning Rate": 4.97079739356442e-05, "Pretrain/Loss": 2.134366512298584, "Pretrain/Loss (Raw)": 2.234025716781616, "Pretrain/Step": 1473, "Pretrain/Step Time": 8.454612735658884} +{"Pretrain/Learning Rate": 4.970732661782268e-05, "Pretrain/Loss": 2.132983446121216, "Pretrain/Loss (Raw)": 2.0804100036621094, "Pretrain/Step": 1474, "Pretrain/Step Time": 8.450303219258785} +{"Pretrain/Learning Rate": 4.970667858758282e-05, "Pretrain/Loss": 2.134713888168335, "Pretrain/Loss (Raw)": 2.0578272342681885, "Pretrain/Step": 1475, "Pretrain/Step Time": 8.45207779482007} +{"Pretrain/Learning Rate": 4.9706029844943304e-05, "Pretrain/Loss": 2.134122133255005, "Pretrain/Loss (Raw)": 2.0104727745056152, "Pretrain/Step": 1476, "Pretrain/Step Time": 8.455724550411105} +{"Pretrain/Learning Rate": 4.970538038992283e-05, "Pretrain/Loss": 2.13869571685791, "Pretrain/Loss (Raw)": 2.5456602573394775, "Pretrain/Step": 1477, "Pretrain/Step Time": 8.453027555719018} +{"Pretrain/Learning Rate": 4.970473022254012e-05, "Pretrain/Loss": 2.142937660217285, "Pretrain/Loss (Raw)": 2.829291582107544, "Pretrain/Step": 1478, "Pretrain/Step Time": 8.451560592278838} +{"Pretrain/Learning Rate": 4.970407934281394e-05, "Pretrain/Loss": 2.1437575817108154, "Pretrain/Loss (Raw)": 2.1058530807495117, "Pretrain/Step": 1479, "Pretrain/Step Time": 8.450122337788343} +{"Pretrain/Learning Rate": 4.970342775076304e-05, "Pretrain/Loss": 2.146000862121582, "Pretrain/Loss (Raw)": 2.537475109100342, "Pretrain/Step": 1480, "Pretrain/Step Time": 8.449669156223536} +{"Pretrain/Learning Rate": 4.9702775446406224e-05, "Pretrain/Loss": 2.1464498043060303, "Pretrain/Loss (Raw)": 2.106663227081299, "Pretrain/Step": 1481, "Pretrain/Step Time": 8.44682564586401} +{"Pretrain/Learning Rate": 4.970212242976229e-05, "Pretrain/Loss": 2.1444125175476074, "Pretrain/Loss (Raw)": 1.8899399042129517, "Pretrain/Step": 1482, "Pretrain/Step Time": 8.449064031243324} +{"Pretrain/Learning Rate": 4.970146870085006e-05, "Pretrain/Loss": 2.145113468170166, "Pretrain/Loss (Raw)": 2.2271974086761475, "Pretrain/Step": 1483, "Pretrain/Step Time": 8.449940649792552} +{"Pretrain/Learning Rate": 4.9700814259688404e-05, "Pretrain/Loss": 2.142648696899414, "Pretrain/Loss (Raw)": 1.9345877170562744, "Pretrain/Step": 1484, "Pretrain/Step Time": 8.446388663724065} +{"Pretrain/Learning Rate": 4.970015910629619e-05, "Pretrain/Loss": 2.1430835723876953, "Pretrain/Loss (Raw)": 2.135754346847534, "Pretrain/Step": 1485, "Pretrain/Step Time": 8.443946059793234} +{"Pretrain/Learning Rate": 4.969950324069228e-05, "Pretrain/Loss": 2.144211769104004, "Pretrain/Loss (Raw)": 2.219722032546997, "Pretrain/Step": 1486, "Pretrain/Step Time": 8.439435932785273} +{"Pretrain/Learning Rate": 4.969884666289561e-05, "Pretrain/Loss": 2.143951654434204, "Pretrain/Loss (Raw)": 2.269634485244751, "Pretrain/Step": 1487, "Pretrain/Step Time": 8.44357779994607} +{"Pretrain/Learning Rate": 4.969818937292512e-05, "Pretrain/Loss": 2.1426408290863037, "Pretrain/Loss (Raw)": 2.0680959224700928, "Pretrain/Step": 1488, "Pretrain/Step Time": 8.439826365560293} +{"Pretrain/Learning Rate": 4.9697531370799746e-05, "Pretrain/Loss": 2.140730857849121, "Pretrain/Loss (Raw)": 2.0355594158172607, "Pretrain/Step": 1489, "Pretrain/Step Time": 8.4438263643533} +{"Pretrain/Learning Rate": 4.969687265653846e-05, "Pretrain/Loss": 2.1423375606536865, "Pretrain/Loss (Raw)": 2.272458553314209, "Pretrain/Step": 1490, "Pretrain/Step Time": 8.44474259763956} +{"Pretrain/Learning Rate": 4.969621323016027e-05, "Pretrain/Loss": 2.141517400741577, "Pretrain/Loss (Raw)": 2.015615701675415, "Pretrain/Step": 1491, "Pretrain/Step Time": 8.441721424460411} +{"Pretrain/Learning Rate": 4.969555309168417e-05, "Pretrain/Loss": 2.1448681354522705, "Pretrain/Loss (Raw)": 2.5416948795318604, "Pretrain/Step": 1492, "Pretrain/Step Time": 8.447046149522066} +{"Pretrain/Learning Rate": 4.9694892241129215e-05, "Pretrain/Loss": 2.145085334777832, "Pretrain/Loss (Raw)": 2.1114258766174316, "Pretrain/Step": 1493, "Pretrain/Step Time": 8.448688443750143} +{"Pretrain/Learning Rate": 4.9694230678514446e-05, "Pretrain/Loss": 2.146521806716919, "Pretrain/Loss (Raw)": 2.271517753601074, "Pretrain/Step": 1494, "Pretrain/Step Time": 8.447165034711361} +{"Pretrain/Learning Rate": 4.969356840385895e-05, "Pretrain/Loss": 2.1434097290039062, "Pretrain/Loss (Raw)": 1.907676100730896, "Pretrain/Step": 1495, "Pretrain/Step Time": 8.447312287986279} +{"Pretrain/Learning Rate": 4.969290541718181e-05, "Pretrain/Loss": 2.1429600715637207, "Pretrain/Loss (Raw)": 2.10986590385437, "Pretrain/Step": 1496, "Pretrain/Step Time": 8.449244696646929} +{"Pretrain/Learning Rate": 4.969224171850215e-05, "Pretrain/Loss": 2.140623092651367, "Pretrain/Loss (Raw)": 1.9553618431091309, "Pretrain/Step": 1497, "Pretrain/Step Time": 8.445898696780205} +{"Pretrain/Learning Rate": 4.969157730783911e-05, "Pretrain/Loss": 2.1387875080108643, "Pretrain/Loss (Raw)": 1.9146591424942017, "Pretrain/Step": 1498, "Pretrain/Step Time": 8.447889691218734} +{"Pretrain/Learning Rate": 4.9690912185211847e-05, "Pretrain/Loss": 2.1391983032226562, "Pretrain/Loss (Raw)": 2.1465988159179688, "Pretrain/Step": 1499, "Pretrain/Step Time": 8.448888886719942} +{"Pretrain/Learning Rate": 4.969024635063953e-05, "Pretrain/Loss": 2.1385278701782227, "Pretrain/Loss (Raw)": 2.0445609092712402, "Pretrain/Step": 1500, "Pretrain/Step Time": 8.448199689388275} +{"Pretrain/Learning Rate": 4.9689579804141376e-05, "Pretrain/Loss": 2.1402621269226074, "Pretrain/Loss (Raw)": 2.2450761795043945, "Pretrain/Step": 1501, "Pretrain/Step Time": 8.442276062443852} +{"Pretrain/Learning Rate": 4.9688912545736576e-05, "Pretrain/Loss": 2.143105983734131, "Pretrain/Loss (Raw)": 2.184298038482666, "Pretrain/Step": 1502, "Pretrain/Step Time": 8.445645997300744} +{"Pretrain/Learning Rate": 4.96882445754444e-05, "Pretrain/Loss": 2.1472041606903076, "Pretrain/Loss (Raw)": 2.401498794555664, "Pretrain/Step": 1503, "Pretrain/Step Time": 8.44566485285759} +{"Pretrain/Learning Rate": 4.96875758932841e-05, "Pretrain/Loss": 2.1436774730682373, "Pretrain/Loss (Raw)": 1.6566320657730103, "Pretrain/Step": 1504, "Pretrain/Step Time": 8.450949368998408} +{"Pretrain/Learning Rate": 4.968690649927494e-05, "Pretrain/Loss": 2.146467447280884, "Pretrain/Loss (Raw)": 2.5064656734466553, "Pretrain/Step": 1505, "Pretrain/Step Time": 8.449422741308808} +{"Pretrain/Learning Rate": 4.968623639343624e-05, "Pretrain/Loss": 2.1461925506591797, "Pretrain/Loss (Raw)": 2.2050490379333496, "Pretrain/Step": 1506, "Pretrain/Step Time": 8.448249725624919} +{"Pretrain/Learning Rate": 4.968556557578732e-05, "Pretrain/Loss": 2.1489038467407227, "Pretrain/Loss (Raw)": 2.3163230419158936, "Pretrain/Step": 1507, "Pretrain/Step Time": 8.447653463110328} +{"Pretrain/Learning Rate": 4.968489404634751e-05, "Pretrain/Loss": 2.149869441986084, "Pretrain/Loss (Raw)": 2.0875132083892822, "Pretrain/Step": 1508, "Pretrain/Step Time": 8.445831732824445} +{"Pretrain/Learning Rate": 4.968422180513619e-05, "Pretrain/Loss": 2.1469244956970215, "Pretrain/Loss (Raw)": 2.114107847213745, "Pretrain/Step": 1509, "Pretrain/Step Time": 8.444880787283182} +{"Pretrain/Learning Rate": 4.9683548852172734e-05, "Pretrain/Loss": 2.147904396057129, "Pretrain/Loss (Raw)": 1.92146635055542, "Pretrain/Step": 1510, "Pretrain/Step Time": 8.455663751810789} +{"Pretrain/Learning Rate": 4.968287518747654e-05, "Pretrain/Loss": 2.1469736099243164, "Pretrain/Loss (Raw)": 2.122087240219116, "Pretrain/Step": 1511, "Pretrain/Step Time": 8.45518346130848} +{"Pretrain/Learning Rate": 4.968220081106705e-05, "Pretrain/Loss": 2.1472983360290527, "Pretrain/Loss (Raw)": 2.275259017944336, "Pretrain/Step": 1512, "Pretrain/Step Time": 8.452410923317075} +{"Pretrain/Learning Rate": 4.96815257229637e-05, "Pretrain/Loss": 2.146374464035034, "Pretrain/Loss (Raw)": 2.1647651195526123, "Pretrain/Step": 1513, "Pretrain/Step Time": 8.450872395187616} +{"Pretrain/Learning Rate": 4.968084992318595e-05, "Pretrain/Loss": 2.1445491313934326, "Pretrain/Loss (Raw)": 2.282609462738037, "Pretrain/Step": 1514, "Pretrain/Step Time": 8.456517539918423} +{"Pretrain/Learning Rate": 4.968017341175329e-05, "Pretrain/Loss": 2.144157886505127, "Pretrain/Loss (Raw)": 1.9914507865905762, "Pretrain/Step": 1515, "Pretrain/Step Time": 8.451454270631075} +{"Pretrain/Learning Rate": 4.967949618868523e-05, "Pretrain/Loss": 2.145153045654297, "Pretrain/Loss (Raw)": 2.0380501747131348, "Pretrain/Step": 1516, "Pretrain/Step Time": 8.450489103794098} +{"Pretrain/Learning Rate": 4.967881825400129e-05, "Pretrain/Loss": 2.1433916091918945, "Pretrain/Loss (Raw)": 1.9484515190124512, "Pretrain/Step": 1517, "Pretrain/Step Time": 8.451828382909298} +{"Pretrain/Learning Rate": 4.967813960772103e-05, "Pretrain/Loss": 2.144127607345581, "Pretrain/Loss (Raw)": 2.0665628910064697, "Pretrain/Step": 1518, "Pretrain/Step Time": 8.446033278480172} +{"Pretrain/Learning Rate": 4.967746024986402e-05, "Pretrain/Loss": 2.1437504291534424, "Pretrain/Loss (Raw)": 2.154266834259033, "Pretrain/Step": 1519, "Pretrain/Step Time": 8.45041075348854} +{"Pretrain/Learning Rate": 4.967678018044982e-05, "Pretrain/Loss": 2.1421945095062256, "Pretrain/Loss (Raw)": 1.988964557647705, "Pretrain/Step": 1520, "Pretrain/Step Time": 8.45147510804236} +{"Pretrain/Learning Rate": 4.967609939949807e-05, "Pretrain/Loss": 2.1402742862701416, "Pretrain/Loss (Raw)": 1.8820561170578003, "Pretrain/Step": 1521, "Pretrain/Step Time": 8.454909887164831} +{"Pretrain/Learning Rate": 4.967541790702839e-05, "Pretrain/Loss": 2.137458324432373, "Pretrain/Loss (Raw)": 1.8857331275939941, "Pretrain/Step": 1522, "Pretrain/Step Time": 8.450165355578065} +{"Pretrain/Learning Rate": 4.967473570306043e-05, "Pretrain/Loss": 2.1395201683044434, "Pretrain/Loss (Raw)": 2.229987144470215, "Pretrain/Step": 1523, "Pretrain/Step Time": 8.44040035456419} +{"Pretrain/Learning Rate": 4.967405278761386e-05, "Pretrain/Loss": 2.135469913482666, "Pretrain/Loss (Raw)": 2.1108663082122803, "Pretrain/Step": 1524, "Pretrain/Step Time": 8.445348355919123} +{"Pretrain/Learning Rate": 4.9673369160708374e-05, "Pretrain/Loss": 2.135359048843384, "Pretrain/Loss (Raw)": 2.2605957984924316, "Pretrain/Step": 1525, "Pretrain/Step Time": 8.44090879894793} +{"Pretrain/Learning Rate": 4.9672684822363674e-05, "Pretrain/Loss": 2.1362783908843994, "Pretrain/Loss (Raw)": 2.1192538738250732, "Pretrain/Step": 1526, "Pretrain/Step Time": 8.439530540257692} +{"Pretrain/Learning Rate": 4.967199977259951e-05, "Pretrain/Loss": 2.1353611946105957, "Pretrain/Loss (Raw)": 1.9537943601608276, "Pretrain/Step": 1527, "Pretrain/Step Time": 8.440063731744885} +{"Pretrain/Learning Rate": 4.9671314011435614e-05, "Pretrain/Loss": 2.1343774795532227, "Pretrain/Loss (Raw)": 2.108994722366333, "Pretrain/Step": 1528, "Pretrain/Step Time": 8.442926231771708} +{"Pretrain/Learning Rate": 4.967062753889178e-05, "Pretrain/Loss": 2.136004686355591, "Pretrain/Loss (Raw)": 2.2436001300811768, "Pretrain/Step": 1529, "Pretrain/Step Time": 8.439155232161283} +{"Pretrain/Learning Rate": 4.966994035498779e-05, "Pretrain/Loss": 2.1345162391662598, "Pretrain/Loss (Raw)": 1.8060132265090942, "Pretrain/Step": 1530, "Pretrain/Step Time": 8.440814819186926} +{"Pretrain/Learning Rate": 4.966925245974346e-05, "Pretrain/Loss": 2.135101318359375, "Pretrain/Loss (Raw)": 2.1548783779144287, "Pretrain/Step": 1531, "Pretrain/Step Time": 8.43850121088326} +{"Pretrain/Learning Rate": 4.966856385317863e-05, "Pretrain/Loss": 2.133885145187378, "Pretrain/Loss (Raw)": 2.0052051544189453, "Pretrain/Step": 1532, "Pretrain/Step Time": 8.438521163538098} +{"Pretrain/Learning Rate": 4.966787453531314e-05, "Pretrain/Loss": 2.134211540222168, "Pretrain/Loss (Raw)": 2.076237678527832, "Pretrain/Step": 1533, "Pretrain/Step Time": 8.43605219759047} +{"Pretrain/Learning Rate": 4.9667184506166886e-05, "Pretrain/Loss": 2.1334228515625, "Pretrain/Loss (Raw)": 2.064824104309082, "Pretrain/Step": 1534, "Pretrain/Step Time": 8.4355848133564} +{"Pretrain/Learning Rate": 4.966649376575976e-05, "Pretrain/Loss": 2.1343655586242676, "Pretrain/Loss (Raw)": 2.1308817863464355, "Pretrain/Step": 1535, "Pretrain/Step Time": 8.439826060086489} +{"Pretrain/Learning Rate": 4.9665802314111665e-05, "Pretrain/Loss": 2.1343655586242676, "Pretrain/Loss (Raw)": 2.0975873470306396, "Pretrain/Step": 1536, "Pretrain/Step Time": 8.43785211071372} +{"Pretrain/Learning Rate": 4.966511015124256e-05, "Pretrain/Loss": 2.134525775909424, "Pretrain/Loss (Raw)": 2.096409797668457, "Pretrain/Step": 1537, "Pretrain/Step Time": 8.43559549190104} +{"Pretrain/Learning Rate": 4.966441727717238e-05, "Pretrain/Loss": 2.1329994201660156, "Pretrain/Loss (Raw)": 2.1942660808563232, "Pretrain/Step": 1538, "Pretrain/Step Time": 8.439392805099487} +{"Pretrain/Learning Rate": 4.966372369192113e-05, "Pretrain/Loss": 2.133415460586548, "Pretrain/Loss (Raw)": 2.1070685386657715, "Pretrain/Step": 1539, "Pretrain/Step Time": 8.434264250099659} +{"Pretrain/Learning Rate": 4.9663029395508775e-05, "Pretrain/Loss": 2.132532835006714, "Pretrain/Loss (Raw)": 1.998782753944397, "Pretrain/Step": 1540, "Pretrain/Step Time": 8.431470239534974} +{"Pretrain/Learning Rate": 4.966233438795537e-05, "Pretrain/Loss": 2.1315841674804688, "Pretrain/Loss (Raw)": 1.9222365617752075, "Pretrain/Step": 1541, "Pretrain/Step Time": 8.429580848664045} +{"Pretrain/Learning Rate": 4.966163866928093e-05, "Pretrain/Loss": 2.1305227279663086, "Pretrain/Loss (Raw)": 1.9763349294662476, "Pretrain/Step": 1542, "Pretrain/Step Time": 8.431114438921213} +{"Pretrain/Learning Rate": 4.9660942239505524e-05, "Pretrain/Loss": 2.1318697929382324, "Pretrain/Loss (Raw)": 2.29581880569458, "Pretrain/Step": 1543, "Pretrain/Step Time": 8.435684463009238} +{"Pretrain/Learning Rate": 4.966024509864924e-05, "Pretrain/Loss": 2.130707263946533, "Pretrain/Loss (Raw)": 1.8937604427337646, "Pretrain/Step": 1544, "Pretrain/Step Time": 8.442853853106499} +{"Pretrain/Learning Rate": 4.965954724673216e-05, "Pretrain/Loss": 2.130836009979248, "Pretrain/Loss (Raw)": 2.152519702911377, "Pretrain/Step": 1545, "Pretrain/Step Time": 8.434499772265553} +{"Pretrain/Learning Rate": 4.965884868377443e-05, "Pretrain/Loss": 2.1294126510620117, "Pretrain/Loss (Raw)": 1.9847815036773682, "Pretrain/Step": 1546, "Pretrain/Step Time": 8.433930123224854} +{"Pretrain/Learning Rate": 4.9658149409796185e-05, "Pretrain/Loss": 2.1280314922332764, "Pretrain/Loss (Raw)": 2.0016729831695557, "Pretrain/Step": 1547, "Pretrain/Step Time": 8.431153589859605} +{"Pretrain/Learning Rate": 4.9657449424817575e-05, "Pretrain/Loss": 2.1270101070404053, "Pretrain/Loss (Raw)": 1.9793230295181274, "Pretrain/Step": 1548, "Pretrain/Step Time": 8.431881181895733} +{"Pretrain/Learning Rate": 4.96567487288588e-05, "Pretrain/Loss": 2.126677989959717, "Pretrain/Loss (Raw)": 2.012793779373169, "Pretrain/Step": 1549, "Pretrain/Step Time": 8.431107729673386} +{"Pretrain/Learning Rate": 4.9656047321940054e-05, "Pretrain/Loss": 2.1248111724853516, "Pretrain/Loss (Raw)": 2.1114256381988525, "Pretrain/Step": 1550, "Pretrain/Step Time": 8.431738631799817} +{"Pretrain/Learning Rate": 4.965534520408156e-05, "Pretrain/Loss": 2.12662935256958, "Pretrain/Loss (Raw)": 2.3228843212127686, "Pretrain/Step": 1551, "Pretrain/Step Time": 8.431721931323409} +{"Pretrain/Learning Rate": 4.965464237530358e-05, "Pretrain/Loss": 2.126695156097412, "Pretrain/Loss (Raw)": 2.0709710121154785, "Pretrain/Step": 1552, "Pretrain/Step Time": 8.435453018173575} +{"Pretrain/Learning Rate": 4.9653938835626354e-05, "Pretrain/Loss": 2.125688314437866, "Pretrain/Loss (Raw)": 2.088078022003174, "Pretrain/Step": 1553, "Pretrain/Step Time": 8.433264562860131} +{"Pretrain/Learning Rate": 4.9653234585070194e-05, "Pretrain/Loss": 2.124985694885254, "Pretrain/Loss (Raw)": 1.996385931968689, "Pretrain/Step": 1554, "Pretrain/Step Time": 8.440016832202673} +{"Pretrain/Learning Rate": 4.965252962365539e-05, "Pretrain/Loss": 2.1260476112365723, "Pretrain/Loss (Raw)": 2.2217111587524414, "Pretrain/Step": 1555, "Pretrain/Step Time": 8.43934484757483} +{"Pretrain/Learning Rate": 4.965182395140227e-05, "Pretrain/Loss": 2.1261541843414307, "Pretrain/Loss (Raw)": 2.167461633682251, "Pretrain/Step": 1556, "Pretrain/Step Time": 8.436923136934638} +{"Pretrain/Learning Rate": 4.9651117568331186e-05, "Pretrain/Loss": 2.1255154609680176, "Pretrain/Loss (Raw)": 1.9667887687683105, "Pretrain/Step": 1557, "Pretrain/Step Time": 8.434347555041313} +{"Pretrain/Learning Rate": 4.9650410474462506e-05, "Pretrain/Loss": 2.1264896392822266, "Pretrain/Loss (Raw)": 2.377338409423828, "Pretrain/Step": 1558, "Pretrain/Step Time": 8.435085836797953} +{"Pretrain/Learning Rate": 4.964970266981661e-05, "Pretrain/Loss": 2.1250505447387695, "Pretrain/Loss (Raw)": 2.1793813705444336, "Pretrain/Step": 1559, "Pretrain/Step Time": 8.441199192777276} +{"Pretrain/Learning Rate": 4.9648994154413925e-05, "Pretrain/Loss": 2.1260416507720947, "Pretrain/Loss (Raw)": 2.0360050201416016, "Pretrain/Step": 1560, "Pretrain/Step Time": 8.44021662324667} +{"Pretrain/Learning Rate": 4.9648284928274865e-05, "Pretrain/Loss": 2.123023509979248, "Pretrain/Loss (Raw)": 1.998000144958496, "Pretrain/Step": 1561, "Pretrain/Step Time": 8.441138196736574} +{"Pretrain/Learning Rate": 4.964757499141989e-05, "Pretrain/Loss": 2.124199390411377, "Pretrain/Loss (Raw)": 2.1145994663238525, "Pretrain/Step": 1562, "Pretrain/Step Time": 8.440846655517817} +{"Pretrain/Learning Rate": 4.964686434386946e-05, "Pretrain/Loss": 2.1267428398132324, "Pretrain/Loss (Raw)": 2.2523839473724365, "Pretrain/Step": 1563, "Pretrain/Step Time": 8.433796893805265} +{"Pretrain/Learning Rate": 4.964615298564407e-05, "Pretrain/Loss": 2.1288669109344482, "Pretrain/Loss (Raw)": 2.1494109630584717, "Pretrain/Step": 1564, "Pretrain/Step Time": 8.434493204578757} +{"Pretrain/Learning Rate": 4.964544091676424e-05, "Pretrain/Loss": 2.129348039627075, "Pretrain/Loss (Raw)": 2.2006278038024902, "Pretrain/Step": 1565, "Pretrain/Step Time": 8.430935364216566} +{"Pretrain/Learning Rate": 4.964472813725049e-05, "Pretrain/Loss": 2.1297905445098877, "Pretrain/Loss (Raw)": 2.0115249156951904, "Pretrain/Step": 1566, "Pretrain/Step Time": 8.432804506272078} +{"Pretrain/Learning Rate": 4.964401464712337e-05, "Pretrain/Loss": 2.128727912902832, "Pretrain/Loss (Raw)": 2.0850443840026855, "Pretrain/Step": 1567, "Pretrain/Step Time": 8.431433824822307} +{"Pretrain/Learning Rate": 4.964330044640347e-05, "Pretrain/Loss": 2.12703800201416, "Pretrain/Loss (Raw)": 1.9054638147354126, "Pretrain/Step": 1568, "Pretrain/Step Time": 8.432935370132327} +{"Pretrain/Learning Rate": 4.9642585535111374e-05, "Pretrain/Loss": 2.1287124156951904, "Pretrain/Loss (Raw)": 2.1044790744781494, "Pretrain/Step": 1569, "Pretrain/Step Time": 8.43410800024867} +{"Pretrain/Learning Rate": 4.9641869913267697e-05, "Pretrain/Loss": 2.129274845123291, "Pretrain/Loss (Raw)": 2.1937060356140137, "Pretrain/Step": 1570, "Pretrain/Step Time": 8.433378303423524} +{"Pretrain/Learning Rate": 4.9641153580893074e-05, "Pretrain/Loss": 2.1280972957611084, "Pretrain/Loss (Raw)": 1.9468011856079102, "Pretrain/Step": 1571, "Pretrain/Step Time": 8.434171561151743} +{"Pretrain/Learning Rate": 4.9640436538008154e-05, "Pretrain/Loss": 2.128370761871338, "Pretrain/Loss (Raw)": 2.0978615283966064, "Pretrain/Step": 1572, "Pretrain/Step Time": 8.435107545927167} +{"Pretrain/Learning Rate": 4.963971878463362e-05, "Pretrain/Loss": 2.1292452812194824, "Pretrain/Loss (Raw)": 2.2024974822998047, "Pretrain/Step": 1573, "Pretrain/Step Time": 8.430662808939815} +{"Pretrain/Learning Rate": 4.963900032079016e-05, "Pretrain/Loss": 2.1282958984375, "Pretrain/Loss (Raw)": 2.0010833740234375, "Pretrain/Step": 1574, "Pretrain/Step Time": 8.43213495053351} +{"Pretrain/Learning Rate": 4.963828114649849e-05, "Pretrain/Loss": 2.1285600662231445, "Pretrain/Loss (Raw)": 2.0554163455963135, "Pretrain/Step": 1575, "Pretrain/Step Time": 8.432798953726888} +{"Pretrain/Learning Rate": 4.963756126177936e-05, "Pretrain/Loss": 2.1321122646331787, "Pretrain/Loss (Raw)": 2.5972156524658203, "Pretrain/Step": 1576, "Pretrain/Step Time": 8.435909386724234} +{"Pretrain/Learning Rate": 4.963684066665352e-05, "Pretrain/Loss": 2.130509614944458, "Pretrain/Loss (Raw)": 1.920540690422058, "Pretrain/Step": 1577, "Pretrain/Step Time": 8.431236131116748} +{"Pretrain/Learning Rate": 4.963611936114175e-05, "Pretrain/Loss": 2.1280441284179688, "Pretrain/Loss (Raw)": 2.051506996154785, "Pretrain/Step": 1578, "Pretrain/Step Time": 8.430021608248353} +{"Pretrain/Learning Rate": 4.963539734526484e-05, "Pretrain/Loss": 2.1291251182556152, "Pretrain/Loss (Raw)": 2.120164155960083, "Pretrain/Step": 1579, "Pretrain/Step Time": 8.430503824725747} +{"Pretrain/Learning Rate": 4.963467461904361e-05, "Pretrain/Loss": 2.1286487579345703, "Pretrain/Loss (Raw)": 2.0983502864837646, "Pretrain/Step": 1580, "Pretrain/Step Time": 8.43101742118597} +{"Pretrain/Learning Rate": 4.963395118249892e-05, "Pretrain/Loss": 2.131114959716797, "Pretrain/Loss (Raw)": 2.314964532852173, "Pretrain/Step": 1581, "Pretrain/Step Time": 8.423469057306647} +{"Pretrain/Learning Rate": 4.9633227035651595e-05, "Pretrain/Loss": 2.129455327987671, "Pretrain/Loss (Raw)": 1.9917775392532349, "Pretrain/Step": 1582, "Pretrain/Step Time": 8.42251881211996} +{"Pretrain/Learning Rate": 4.963250217852254e-05, "Pretrain/Loss": 2.128666877746582, "Pretrain/Loss (Raw)": 2.070096969604492, "Pretrain/Step": 1583, "Pretrain/Step Time": 8.422943070530891} +{"Pretrain/Learning Rate": 4.9631776611132654e-05, "Pretrain/Loss": 2.1273088455200195, "Pretrain/Loss (Raw)": 2.1068718433380127, "Pretrain/Step": 1584, "Pretrain/Step Time": 8.422325124964118} +{"Pretrain/Learning Rate": 4.963105033350285e-05, "Pretrain/Loss": 2.1273903846740723, "Pretrain/Loss (Raw)": 2.1768627166748047, "Pretrain/Step": 1585, "Pretrain/Step Time": 8.426697572693229} +{"Pretrain/Learning Rate": 4.9630323345654076e-05, "Pretrain/Loss": 2.128143787384033, "Pretrain/Loss (Raw)": 2.0689947605133057, "Pretrain/Step": 1586, "Pretrain/Step Time": 8.425747606903315} +{"Pretrain/Learning Rate": 4.962959564760729e-05, "Pretrain/Loss": 2.1275458335876465, "Pretrain/Loss (Raw)": 1.96064293384552, "Pretrain/Step": 1587, "Pretrain/Step Time": 8.424173757433891} +{"Pretrain/Learning Rate": 4.9628867239383476e-05, "Pretrain/Loss": 2.127798557281494, "Pretrain/Loss (Raw)": 2.2441699504852295, "Pretrain/Step": 1588, "Pretrain/Step Time": 8.426718689501286} +{"Pretrain/Learning Rate": 4.9628138121003634e-05, "Pretrain/Loss": 2.125359058380127, "Pretrain/Loss (Raw)": 1.911516785621643, "Pretrain/Step": 1589, "Pretrain/Step Time": 8.428312841802835} +{"Pretrain/Learning Rate": 4.96274082924888e-05, "Pretrain/Loss": 2.124420404434204, "Pretrain/Loss (Raw)": 2.169268846511841, "Pretrain/Step": 1590, "Pretrain/Step Time": 8.426038330420852} +{"Pretrain/Learning Rate": 4.962667775386e-05, "Pretrain/Loss": 2.12542724609375, "Pretrain/Loss (Raw)": 2.207807779312134, "Pretrain/Step": 1591, "Pretrain/Step Time": 8.42768650688231} +{"Pretrain/Learning Rate": 4.962594650513831e-05, "Pretrain/Loss": 2.1212713718414307, "Pretrain/Loss (Raw)": 2.2005348205566406, "Pretrain/Step": 1592, "Pretrain/Step Time": 8.429139249026775} +{"Pretrain/Learning Rate": 4.962521454634481e-05, "Pretrain/Loss": 2.121776580810547, "Pretrain/Loss (Raw)": 1.9486079216003418, "Pretrain/Step": 1593, "Pretrain/Step Time": 8.428438751026988} +{"Pretrain/Learning Rate": 4.9624481877500614e-05, "Pretrain/Loss": 2.1164040565490723, "Pretrain/Loss (Raw)": 1.9774953126907349, "Pretrain/Step": 1594, "Pretrain/Step Time": 8.428294952958822} +{"Pretrain/Learning Rate": 4.9623748498626844e-05, "Pretrain/Loss": 2.1137757301330566, "Pretrain/Loss (Raw)": 1.9557116031646729, "Pretrain/Step": 1595, "Pretrain/Step Time": 8.423288272693753} +{"Pretrain/Learning Rate": 4.962301440974464e-05, "Pretrain/Loss": 2.1134042739868164, "Pretrain/Loss (Raw)": 1.933063268661499, "Pretrain/Step": 1596, "Pretrain/Step Time": 8.424475306645036} +{"Pretrain/Learning Rate": 4.962227961087518e-05, "Pretrain/Loss": 2.111722469329834, "Pretrain/Loss (Raw)": 1.9093672037124634, "Pretrain/Step": 1597, "Pretrain/Step Time": 8.421786153689027} +{"Pretrain/Learning Rate": 4.962154410203963e-05, "Pretrain/Loss": 2.111398696899414, "Pretrain/Loss (Raw)": 2.0184969902038574, "Pretrain/Step": 1598, "Pretrain/Step Time": 8.417096640914679} +{"Pretrain/Learning Rate": 4.962080788325922e-05, "Pretrain/Loss": 2.1056089401245117, "Pretrain/Loss (Raw)": 1.5742993354797363, "Pretrain/Step": 1599, "Pretrain/Step Time": 8.416502704843879} +{"Pretrain/Learning Rate": 4.9620070954555175e-05, "Pretrain/Loss": 2.1049070358276367, "Pretrain/Loss (Raw)": 2.0456721782684326, "Pretrain/Step": 1600, "Pretrain/Step Time": 8.415268948301673} +{"Pretrain/Learning Rate": 4.961933331594874e-05, "Pretrain/Loss": 2.103368043899536, "Pretrain/Loss (Raw)": 2.0370187759399414, "Pretrain/Step": 1601, "Pretrain/Step Time": 8.41238073259592} +{"Pretrain/Learning Rate": 4.961859496746119e-05, "Pretrain/Loss": 2.1048989295959473, "Pretrain/Loss (Raw)": 2.2763421535491943, "Pretrain/Step": 1602, "Pretrain/Step Time": 8.418304573744535} +{"Pretrain/Learning Rate": 4.9617855909113796e-05, "Pretrain/Loss": 2.105562686920166, "Pretrain/Loss (Raw)": 2.142805576324463, "Pretrain/Step": 1603, "Pretrain/Step Time": 8.415503151714802} +{"Pretrain/Learning Rate": 4.961711614092789e-05, "Pretrain/Loss": 2.1055638790130615, "Pretrain/Loss (Raw)": 2.0106348991394043, "Pretrain/Step": 1604, "Pretrain/Step Time": 8.414062175899744} +{"Pretrain/Learning Rate": 4.9616375662924786e-05, "Pretrain/Loss": 2.103705883026123, "Pretrain/Loss (Raw)": 2.3078207969665527, "Pretrain/Step": 1605, "Pretrain/Step Time": 8.414995227009058} +{"Pretrain/Learning Rate": 4.961563447512585e-05, "Pretrain/Loss": 2.098778247833252, "Pretrain/Loss (Raw)": 2.198578357696533, "Pretrain/Step": 1606, "Pretrain/Step Time": 8.420310219749808} +{"Pretrain/Learning Rate": 4.961489257755245e-05, "Pretrain/Loss": 2.0981383323669434, "Pretrain/Loss (Raw)": 2.023930072784424, "Pretrain/Step": 1607, "Pretrain/Step Time": 8.419383512809873} +{"Pretrain/Learning Rate": 4.9614149970225965e-05, "Pretrain/Loss": 2.096557378768921, "Pretrain/Loss (Raw)": 2.335123300552368, "Pretrain/Step": 1608, "Pretrain/Step Time": 8.422634491696954} +{"Pretrain/Learning Rate": 4.961340665316782e-05, "Pretrain/Loss": 2.095787525177002, "Pretrain/Loss (Raw)": 2.0081076622009277, "Pretrain/Step": 1609, "Pretrain/Step Time": 8.420865833759308} +{"Pretrain/Learning Rate": 4.9612662626399455e-05, "Pretrain/Loss": 2.1005797386169434, "Pretrain/Loss (Raw)": 2.5033624172210693, "Pretrain/Step": 1610, "Pretrain/Step Time": 8.415212476626039} +{"Pretrain/Learning Rate": 4.9611917889942306e-05, "Pretrain/Loss": 2.100104570388794, "Pretrain/Loss (Raw)": 2.1663806438446045, "Pretrain/Step": 1611, "Pretrain/Step Time": 8.4148277528584} +{"Pretrain/Learning Rate": 4.9611172443817855e-05, "Pretrain/Loss": 2.1020708084106445, "Pretrain/Loss (Raw)": 2.1862258911132812, "Pretrain/Step": 1612, "Pretrain/Step Time": 8.418985184282064} +{"Pretrain/Learning Rate": 4.9610426288047594e-05, "Pretrain/Loss": 2.1030051708221436, "Pretrain/Loss (Raw)": 2.255361318588257, "Pretrain/Step": 1613, "Pretrain/Step Time": 8.422699538990855} +{"Pretrain/Learning Rate": 4.9609679422653045e-05, "Pretrain/Loss": 2.101881742477417, "Pretrain/Loss (Raw)": 2.0759406089782715, "Pretrain/Step": 1614, "Pretrain/Step Time": 8.421429060399532} +{"Pretrain/Learning Rate": 4.960893184765574e-05, "Pretrain/Loss": 2.103372097015381, "Pretrain/Loss (Raw)": 2.460404396057129, "Pretrain/Step": 1615, "Pretrain/Step Time": 8.417862368747592} +{"Pretrain/Learning Rate": 4.9608183563077224e-05, "Pretrain/Loss": 2.10379695892334, "Pretrain/Loss (Raw)": 2.122497797012329, "Pretrain/Step": 1616, "Pretrain/Step Time": 8.417746001854539} +{"Pretrain/Learning Rate": 4.960743456893909e-05, "Pretrain/Loss": 2.1050539016723633, "Pretrain/Loss (Raw)": 2.1964218616485596, "Pretrain/Step": 1617, "Pretrain/Step Time": 8.413653349503875} +{"Pretrain/Learning Rate": 4.960668486526292e-05, "Pretrain/Loss": 2.105738401412964, "Pretrain/Loss (Raw)": 2.3600640296936035, "Pretrain/Step": 1618, "Pretrain/Step Time": 8.416762923821807} +{"Pretrain/Learning Rate": 4.9605934452070346e-05, "Pretrain/Loss": 2.1065664291381836, "Pretrain/Loss (Raw)": 2.1216037273406982, "Pretrain/Step": 1619, "Pretrain/Step Time": 8.416835378855467} +{"Pretrain/Learning Rate": 4.9605183329382996e-05, "Pretrain/Loss": 2.1008810997009277, "Pretrain/Loss (Raw)": 1.8139557838439941, "Pretrain/Step": 1620, "Pretrain/Step Time": 8.416485922411084} +{"Pretrain/Learning Rate": 4.960443149722254e-05, "Pretrain/Loss": 2.099331855773926, "Pretrain/Loss (Raw)": 1.9131227731704712, "Pretrain/Step": 1621, "Pretrain/Step Time": 8.412626391276717} +{"Pretrain/Learning Rate": 4.960367895561063e-05, "Pretrain/Loss": 2.098853588104248, "Pretrain/Loss (Raw)": 2.2103211879730225, "Pretrain/Step": 1622, "Pretrain/Step Time": 8.417893139645457} +{"Pretrain/Learning Rate": 4.960292570456899e-05, "Pretrain/Loss": 2.1022098064422607, "Pretrain/Loss (Raw)": 2.337296485900879, "Pretrain/Step": 1623, "Pretrain/Step Time": 8.418664943426847} +{"Pretrain/Learning Rate": 4.960217174411933e-05, "Pretrain/Loss": 2.1005136966705322, "Pretrain/Loss (Raw)": 1.8927466869354248, "Pretrain/Step": 1624, "Pretrain/Step Time": 8.414753446355462} +{"Pretrain/Learning Rate": 4.9601417074283396e-05, "Pretrain/Loss": 2.1046085357666016, "Pretrain/Loss (Raw)": 2.479508876800537, "Pretrain/Step": 1625, "Pretrain/Step Time": 8.422231208533049} +{"Pretrain/Learning Rate": 4.960066169508294e-05, "Pretrain/Loss": 2.103342056274414, "Pretrain/Loss (Raw)": 1.7525404691696167, "Pretrain/Step": 1626, "Pretrain/Step Time": 8.422703053802252} +{"Pretrain/Learning Rate": 4.959990560653974e-05, "Pretrain/Loss": 2.104222297668457, "Pretrain/Loss (Raw)": 2.2592599391937256, "Pretrain/Step": 1627, "Pretrain/Step Time": 8.420475387945771} +{"Pretrain/Learning Rate": 4.959914880867561e-05, "Pretrain/Loss": 2.1050925254821777, "Pretrain/Loss (Raw)": 2.155928134918213, "Pretrain/Step": 1628, "Pretrain/Step Time": 8.418424762785435} +{"Pretrain/Learning Rate": 4.959839130151237e-05, "Pretrain/Loss": 2.104851484298706, "Pretrain/Loss (Raw)": 2.214245319366455, "Pretrain/Step": 1629, "Pretrain/Step Time": 8.421580784022808} +{"Pretrain/Learning Rate": 4.959763308507185e-05, "Pretrain/Loss": 2.1048145294189453, "Pretrain/Loss (Raw)": 2.1795506477355957, "Pretrain/Step": 1630, "Pretrain/Step Time": 8.421734139323235} +{"Pretrain/Learning Rate": 4.959687415937592e-05, "Pretrain/Loss": 2.1017773151397705, "Pretrain/Loss (Raw)": 2.012763261795044, "Pretrain/Step": 1631, "Pretrain/Step Time": 8.417837457731366} +{"Pretrain/Learning Rate": 4.959611452444647e-05, "Pretrain/Loss": 2.105806827545166, "Pretrain/Loss (Raw)": 2.172398567199707, "Pretrain/Step": 1632, "Pretrain/Step Time": 8.414292570203543} +{"Pretrain/Learning Rate": 4.9595354180305386e-05, "Pretrain/Loss": 2.1043689250946045, "Pretrain/Loss (Raw)": 2.322420835494995, "Pretrain/Step": 1633, "Pretrain/Step Time": 8.412417717278004} +{"Pretrain/Learning Rate": 4.959459312697461e-05, "Pretrain/Loss": 2.1039626598358154, "Pretrain/Loss (Raw)": 2.1530370712280273, "Pretrain/Step": 1634, "Pretrain/Step Time": 8.421661101281643} +{"Pretrain/Learning Rate": 4.959383136447608e-05, "Pretrain/Loss": 2.1025137901306152, "Pretrain/Loss (Raw)": 2.130884885787964, "Pretrain/Step": 1635, "Pretrain/Step Time": 8.41991888731718} +{"Pretrain/Learning Rate": 4.959306889283176e-05, "Pretrain/Loss": 2.1022372245788574, "Pretrain/Loss (Raw)": 2.052074432373047, "Pretrain/Step": 1636, "Pretrain/Step Time": 8.421327199786901} +{"Pretrain/Learning Rate": 4.959230571206363e-05, "Pretrain/Loss": 2.102283000946045, "Pretrain/Loss (Raw)": 2.1199951171875, "Pretrain/Step": 1637, "Pretrain/Step Time": 8.42554958537221} +{"Pretrain/Learning Rate": 4.9591541822193706e-05, "Pretrain/Loss": 2.104458808898926, "Pretrain/Loss (Raw)": 2.199986457824707, "Pretrain/Step": 1638, "Pretrain/Step Time": 8.415954744443297} +{"Pretrain/Learning Rate": 4.9590777223244014e-05, "Pretrain/Loss": 2.1042258739471436, "Pretrain/Loss (Raw)": 2.092273712158203, "Pretrain/Step": 1639, "Pretrain/Step Time": 8.413577634841204} +{"Pretrain/Learning Rate": 4.9590011915236584e-05, "Pretrain/Loss": 2.104088306427002, "Pretrain/Loss (Raw)": 2.2576308250427246, "Pretrain/Step": 1640, "Pretrain/Step Time": 8.418859094381332} +{"Pretrain/Learning Rate": 4.9589245898193506e-05, "Pretrain/Loss": 2.1042582988739014, "Pretrain/Loss (Raw)": 2.186528205871582, "Pretrain/Step": 1641, "Pretrain/Step Time": 8.422710044309497} +{"Pretrain/Learning Rate": 4.9588479172136845e-05, "Pretrain/Loss": 2.1044235229492188, "Pretrain/Loss (Raw)": 2.303776502609253, "Pretrain/Step": 1642, "Pretrain/Step Time": 8.416697021573782} +{"Pretrain/Learning Rate": 4.958771173708873e-05, "Pretrain/Loss": 2.1051864624023438, "Pretrain/Loss (Raw)": 2.089102268218994, "Pretrain/Step": 1643, "Pretrain/Step Time": 8.420217016711831} +{"Pretrain/Learning Rate": 4.9586943593071276e-05, "Pretrain/Loss": 2.1041014194488525, "Pretrain/Loss (Raw)": 1.8991376161575317, "Pretrain/Step": 1644, "Pretrain/Step Time": 8.418776689097285} +{"Pretrain/Learning Rate": 4.9586174740106644e-05, "Pretrain/Loss": 2.1059012413024902, "Pretrain/Loss (Raw)": 2.1788434982299805, "Pretrain/Step": 1645, "Pretrain/Step Time": 8.416636357083917} +{"Pretrain/Learning Rate": 4.9585405178216994e-05, "Pretrain/Loss": 2.105309009552002, "Pretrain/Loss (Raw)": 1.9907587766647339, "Pretrain/Step": 1646, "Pretrain/Step Time": 8.420536821708083} +{"Pretrain/Learning Rate": 4.958463490742451e-05, "Pretrain/Loss": 2.1044979095458984, "Pretrain/Loss (Raw)": 2.050426483154297, "Pretrain/Step": 1647, "Pretrain/Step Time": 8.412575881928205} +{"Pretrain/Learning Rate": 4.9583863927751416e-05, "Pretrain/Loss": 2.1049551963806152, "Pretrain/Loss (Raw)": 2.0474941730499268, "Pretrain/Step": 1648, "Pretrain/Step Time": 8.413366759195924} +{"Pretrain/Learning Rate": 4.9583092239219934e-05, "Pretrain/Loss": 2.109168529510498, "Pretrain/Loss (Raw)": 2.421391010284424, "Pretrain/Step": 1649, "Pretrain/Step Time": 8.412705877795815} +{"Pretrain/Learning Rate": 4.958231984185231e-05, "Pretrain/Loss": 2.112323760986328, "Pretrain/Loss (Raw)": 2.2896156311035156, "Pretrain/Step": 1650, "Pretrain/Step Time": 8.41817701049149} +{"Pretrain/Learning Rate": 4.9581546735670834e-05, "Pretrain/Loss": 2.112290859222412, "Pretrain/Loss (Raw)": 2.225767135620117, "Pretrain/Step": 1651, "Pretrain/Step Time": 8.418695064261556} +{"Pretrain/Learning Rate": 4.9580772920697785e-05, "Pretrain/Loss": 2.1127612590789795, "Pretrain/Loss (Raw)": 2.171063184738159, "Pretrain/Step": 1652, "Pretrain/Step Time": 8.418037509545684} +{"Pretrain/Learning Rate": 4.9579998396955476e-05, "Pretrain/Loss": 2.112492084503174, "Pretrain/Loss (Raw)": 2.2261128425598145, "Pretrain/Step": 1653, "Pretrain/Step Time": 8.41828453168273} +{"Pretrain/Learning Rate": 4.957922316446623e-05, "Pretrain/Loss": 2.113342046737671, "Pretrain/Loss (Raw)": 2.228095293045044, "Pretrain/Step": 1654, "Pretrain/Step Time": 8.41926595568657} +{"Pretrain/Learning Rate": 4.957844722325242e-05, "Pretrain/Loss": 2.1140294075012207, "Pretrain/Loss (Raw)": 2.0417604446411133, "Pretrain/Step": 1655, "Pretrain/Step Time": 8.41934323310852} +{"Pretrain/Learning Rate": 4.957767057333642e-05, "Pretrain/Loss": 2.114157199859619, "Pretrain/Loss (Raw)": 2.125335693359375, "Pretrain/Step": 1656, "Pretrain/Step Time": 8.416742410510778} +{"Pretrain/Learning Rate": 4.9576893214740596e-05, "Pretrain/Loss": 2.112973690032959, "Pretrain/Loss (Raw)": 2.092142343521118, "Pretrain/Step": 1657, "Pretrain/Step Time": 8.4201335106045} +{"Pretrain/Learning Rate": 4.95761151474874e-05, "Pretrain/Loss": 2.114952564239502, "Pretrain/Loss (Raw)": 2.059300422668457, "Pretrain/Step": 1658, "Pretrain/Step Time": 8.420288261026144} +{"Pretrain/Learning Rate": 4.9575336371599234e-05, "Pretrain/Loss": 2.1141982078552246, "Pretrain/Loss (Raw)": 2.0582990646362305, "Pretrain/Step": 1659, "Pretrain/Step Time": 8.418209623545408} +{"Pretrain/Learning Rate": 4.957455688709858e-05, "Pretrain/Loss": 2.1144003868103027, "Pretrain/Loss (Raw)": 2.0310897827148438, "Pretrain/Step": 1660, "Pretrain/Step Time": 8.42173427157104} +{"Pretrain/Learning Rate": 4.95737766940079e-05, "Pretrain/Loss": 2.114759922027588, "Pretrain/Loss (Raw)": 2.1222760677337646, "Pretrain/Step": 1661, "Pretrain/Step Time": 8.420087456703186} +{"Pretrain/Learning Rate": 4.957299579234969e-05, "Pretrain/Loss": 2.11462664604187, "Pretrain/Loss (Raw)": 2.0477588176727295, "Pretrain/Step": 1662, "Pretrain/Step Time": 8.416648954153061} +{"Pretrain/Learning Rate": 4.9572214182146464e-05, "Pretrain/Loss": 2.1142749786376953, "Pretrain/Loss (Raw)": 2.0858569145202637, "Pretrain/Step": 1663, "Pretrain/Step Time": 8.417852217331529} +{"Pretrain/Learning Rate": 4.957143186342077e-05, "Pretrain/Loss": 2.1137356758117676, "Pretrain/Loss (Raw)": 2.028557538986206, "Pretrain/Step": 1664, "Pretrain/Step Time": 8.415554951876402} +{"Pretrain/Learning Rate": 4.9570648836195155e-05, "Pretrain/Loss": 2.116072177886963, "Pretrain/Loss (Raw)": 2.3954813480377197, "Pretrain/Step": 1665, "Pretrain/Step Time": 8.417770573869348} +{"Pretrain/Learning Rate": 4.9569865100492204e-05, "Pretrain/Loss": 2.1154072284698486, "Pretrain/Loss (Raw)": 2.109182834625244, "Pretrain/Step": 1666, "Pretrain/Step Time": 8.418397387489676} +{"Pretrain/Learning Rate": 4.956908065633452e-05, "Pretrain/Loss": 2.117534875869751, "Pretrain/Loss (Raw)": 2.3793742656707764, "Pretrain/Step": 1667, "Pretrain/Step Time": 8.420128934085369} +{"Pretrain/Learning Rate": 4.956829550374471e-05, "Pretrain/Loss": 2.1178245544433594, "Pretrain/Loss (Raw)": 2.03587007522583, "Pretrain/Step": 1668, "Pretrain/Step Time": 8.41819248907268} +{"Pretrain/Learning Rate": 4.9567509642745426e-05, "Pretrain/Loss": 2.1192383766174316, "Pretrain/Loss (Raw)": 2.1031877994537354, "Pretrain/Step": 1669, "Pretrain/Step Time": 8.419219709932804} +{"Pretrain/Learning Rate": 4.956672307335931e-05, "Pretrain/Loss": 2.120366334915161, "Pretrain/Loss (Raw)": 2.1207640171051025, "Pretrain/Step": 1670, "Pretrain/Step Time": 8.419797468930483} +{"Pretrain/Learning Rate": 4.956593579560905e-05, "Pretrain/Loss": 2.1224606037139893, "Pretrain/Loss (Raw)": 2.563851833343506, "Pretrain/Step": 1671, "Pretrain/Step Time": 8.415912259370089} +{"Pretrain/Learning Rate": 4.956514780951736e-05, "Pretrain/Loss": 2.1226749420166016, "Pretrain/Loss (Raw)": 1.9212251901626587, "Pretrain/Step": 1672, "Pretrain/Step Time": 8.409911159425974} +{"Pretrain/Learning Rate": 4.956435911510695e-05, "Pretrain/Loss": 2.1220600605010986, "Pretrain/Loss (Raw)": 2.073789119720459, "Pretrain/Step": 1673, "Pretrain/Step Time": 8.411832908168435} +{"Pretrain/Learning Rate": 4.956356971240055e-05, "Pretrain/Loss": 2.123577117919922, "Pretrain/Loss (Raw)": 2.178971529006958, "Pretrain/Step": 1674, "Pretrain/Step Time": 8.414118496701121} +{"Pretrain/Learning Rate": 4.956277960142095e-05, "Pretrain/Loss": 2.124052047729492, "Pretrain/Loss (Raw)": 2.062460422515869, "Pretrain/Step": 1675, "Pretrain/Step Time": 8.416098050773144} +{"Pretrain/Learning Rate": 4.9561988782190906e-05, "Pretrain/Loss": 2.12548828125, "Pretrain/Loss (Raw)": 2.163151502609253, "Pretrain/Step": 1676, "Pretrain/Step Time": 8.412895746529102} +{"Pretrain/Learning Rate": 4.956119725473323e-05, "Pretrain/Loss": 2.128405809402466, "Pretrain/Loss (Raw)": 2.3862428665161133, "Pretrain/Step": 1677, "Pretrain/Step Time": 8.41500593163073} +{"Pretrain/Learning Rate": 4.9560405019070745e-05, "Pretrain/Loss": 2.129089832305908, "Pretrain/Loss (Raw)": 2.198981761932373, "Pretrain/Step": 1678, "Pretrain/Step Time": 8.413250517100096} +{"Pretrain/Learning Rate": 4.9559612075226296e-05, "Pretrain/Loss": 2.127668857574463, "Pretrain/Loss (Raw)": 2.140977382659912, "Pretrain/Step": 1679, "Pretrain/Step Time": 8.413895847275853} +{"Pretrain/Learning Rate": 4.955881842322275e-05, "Pretrain/Loss": 2.1262404918670654, "Pretrain/Loss (Raw)": 1.88815438747406, "Pretrain/Step": 1680, "Pretrain/Step Time": 8.409427560865879} +{"Pretrain/Learning Rate": 4.955802406308298e-05, "Pretrain/Loss": 2.1285834312438965, "Pretrain/Loss (Raw)": 2.3879919052124023, "Pretrain/Step": 1681, "Pretrain/Step Time": 8.408613193780184} +{"Pretrain/Learning Rate": 4.955722899482991e-05, "Pretrain/Loss": 2.1301350593566895, "Pretrain/Loss (Raw)": 2.195004463195801, "Pretrain/Step": 1682, "Pretrain/Step Time": 8.407218595966697} +{"Pretrain/Learning Rate": 4.9556433218486446e-05, "Pretrain/Loss": 2.1281180381774902, "Pretrain/Loss (Raw)": 1.96351957321167, "Pretrain/Step": 1683, "Pretrain/Step Time": 8.414359118789434} +{"Pretrain/Learning Rate": 4.9555636734075536e-05, "Pretrain/Loss": 2.1269376277923584, "Pretrain/Loss (Raw)": 2.0163817405700684, "Pretrain/Step": 1684, "Pretrain/Step Time": 8.414165439084172} +{"Pretrain/Learning Rate": 4.955483954162016e-05, "Pretrain/Loss": 2.1291637420654297, "Pretrain/Loss (Raw)": 2.251708507537842, "Pretrain/Step": 1685, "Pretrain/Step Time": 8.417862318456173} +{"Pretrain/Learning Rate": 4.955404164114329e-05, "Pretrain/Loss": 2.1267895698547363, "Pretrain/Loss (Raw)": 2.0734386444091797, "Pretrain/Step": 1686, "Pretrain/Step Time": 8.419460503384471} +{"Pretrain/Learning Rate": 4.955324303266795e-05, "Pretrain/Loss": 2.1247718334198, "Pretrain/Loss (Raw)": 1.921126365661621, "Pretrain/Step": 1687, "Pretrain/Step Time": 8.416860776022077} +{"Pretrain/Learning Rate": 4.9552443716217146e-05, "Pretrain/Loss": 2.125185966491699, "Pretrain/Loss (Raw)": 2.089010000228882, "Pretrain/Step": 1688, "Pretrain/Step Time": 8.416227325797081} +{"Pretrain/Learning Rate": 4.9551643691813935e-05, "Pretrain/Loss": 2.125368595123291, "Pretrain/Loss (Raw)": 2.0213656425476074, "Pretrain/Step": 1689, "Pretrain/Step Time": 8.421151842921972} +{"Pretrain/Learning Rate": 4.955084295948139e-05, "Pretrain/Loss": 2.125028133392334, "Pretrain/Loss (Raw)": 2.0710177421569824, "Pretrain/Step": 1690, "Pretrain/Step Time": 8.419845400378108} +{"Pretrain/Learning Rate": 4.95500415192426e-05, "Pretrain/Loss": 2.125035524368286, "Pretrain/Loss (Raw)": 2.253343343734741, "Pretrain/Step": 1691, "Pretrain/Step Time": 8.419435227289796} +{"Pretrain/Learning Rate": 4.954923937112066e-05, "Pretrain/Loss": 2.1251072883605957, "Pretrain/Loss (Raw)": 2.1585845947265625, "Pretrain/Step": 1692, "Pretrain/Step Time": 8.421454215422273} +{"Pretrain/Learning Rate": 4.954843651513871e-05, "Pretrain/Loss": 2.126575469970703, "Pretrain/Loss (Raw)": 2.3885767459869385, "Pretrain/Step": 1693, "Pretrain/Step Time": 8.419219812378287} +{"Pretrain/Learning Rate": 4.954763295131991e-05, "Pretrain/Loss": 2.12735652923584, "Pretrain/Loss (Raw)": 2.111497163772583, "Pretrain/Step": 1694, "Pretrain/Step Time": 8.418828221037984} +{"Pretrain/Learning Rate": 4.954682867968741e-05, "Pretrain/Loss": 2.1269240379333496, "Pretrain/Loss (Raw)": 2.0296831130981445, "Pretrain/Step": 1695, "Pretrain/Step Time": 8.420463429763913} +{"Pretrain/Learning Rate": 4.9546023700264404e-05, "Pretrain/Loss": 2.1306324005126953, "Pretrain/Loss (Raw)": 2.3801252841949463, "Pretrain/Step": 1696, "Pretrain/Step Time": 8.4199188221246} +{"Pretrain/Learning Rate": 4.954521801307411e-05, "Pretrain/Loss": 2.12931489944458, "Pretrain/Loss (Raw)": 1.9358326196670532, "Pretrain/Step": 1697, "Pretrain/Step Time": 8.414625057950616} +{"Pretrain/Learning Rate": 4.9544411618139765e-05, "Pretrain/Loss": 2.1290698051452637, "Pretrain/Loss (Raw)": 2.1623525619506836, "Pretrain/Step": 1698, "Pretrain/Step Time": 8.415328111499548} +{"Pretrain/Learning Rate": 4.954360451548461e-05, "Pretrain/Loss": 2.12977933883667, "Pretrain/Loss (Raw)": 2.0376057624816895, "Pretrain/Step": 1699, "Pretrain/Step Time": 8.415592201054096} +{"Pretrain/Learning Rate": 4.954279670513192e-05, "Pretrain/Loss": 2.1279826164245605, "Pretrain/Loss (Raw)": 1.8678979873657227, "Pretrain/Step": 1700, "Pretrain/Step Time": 8.416686767712235} +{"Pretrain/Learning Rate": 4.954198818710499e-05, "Pretrain/Loss": 2.1278388500213623, "Pretrain/Loss (Raw)": 2.1840949058532715, "Pretrain/Step": 1701, "Pretrain/Step Time": 8.41928131878376} +{"Pretrain/Learning Rate": 4.954117896142714e-05, "Pretrain/Loss": 2.130194664001465, "Pretrain/Loss (Raw)": 2.302588939666748, "Pretrain/Step": 1702, "Pretrain/Step Time": 8.421255379915237} +{"Pretrain/Learning Rate": 4.954036902812168e-05, "Pretrain/Loss": 2.1322436332702637, "Pretrain/Loss (Raw)": 2.317725419998169, "Pretrain/Step": 1703, "Pretrain/Step Time": 8.42241151817143} +{"Pretrain/Learning Rate": 4.9539558387211985e-05, "Pretrain/Loss": 2.1279795169830322, "Pretrain/Loss (Raw)": 2.0513978004455566, "Pretrain/Step": 1704, "Pretrain/Step Time": 8.419552698731422} +{"Pretrain/Learning Rate": 4.953874703872142e-05, "Pretrain/Loss": 2.1301722526550293, "Pretrain/Loss (Raw)": 2.201212167739868, "Pretrain/Step": 1705, "Pretrain/Step Time": 8.421915374696255} +{"Pretrain/Learning Rate": 4.9537934982673393e-05, "Pretrain/Loss": 2.131568431854248, "Pretrain/Loss (Raw)": 2.230234384536743, "Pretrain/Step": 1706, "Pretrain/Step Time": 8.41985596343875} +{"Pretrain/Learning Rate": 4.95371222190913e-05, "Pretrain/Loss": 2.131464719772339, "Pretrain/Loss (Raw)": 2.1068766117095947, "Pretrain/Step": 1707, "Pretrain/Step Time": 8.419237280264497} +{"Pretrain/Learning Rate": 4.953630874799859e-05, "Pretrain/Loss": 2.1317086219787598, "Pretrain/Loss (Raw)": 2.1295559406280518, "Pretrain/Step": 1708, "Pretrain/Step Time": 8.419177304953337} +{"Pretrain/Learning Rate": 4.95354945694187e-05, "Pretrain/Loss": 2.1294658184051514, "Pretrain/Loss (Raw)": 2.027909278869629, "Pretrain/Step": 1709, "Pretrain/Step Time": 8.422144344076514} +{"Pretrain/Learning Rate": 4.953467968337514e-05, "Pretrain/Loss": 2.130955696105957, "Pretrain/Loss (Raw)": 2.182469129562378, "Pretrain/Step": 1710, "Pretrain/Step Time": 8.42154104448855} +{"Pretrain/Learning Rate": 4.953386408989138e-05, "Pretrain/Loss": 2.130652904510498, "Pretrain/Loss (Raw)": 2.0313165187835693, "Pretrain/Step": 1711, "Pretrain/Step Time": 8.421463942155242} +{"Pretrain/Learning Rate": 4.9533047788990946e-05, "Pretrain/Loss": 2.131340503692627, "Pretrain/Loss (Raw)": 2.194899797439575, "Pretrain/Step": 1712, "Pretrain/Step Time": 8.42031947337091} +{"Pretrain/Learning Rate": 4.953223078069737e-05, "Pretrain/Loss": 2.1304397583007812, "Pretrain/Loss (Raw)": 2.0615813732147217, "Pretrain/Step": 1713, "Pretrain/Step Time": 8.4179857224226} +{"Pretrain/Learning Rate": 4.9531413065034214e-05, "Pretrain/Loss": 2.132507085800171, "Pretrain/Loss (Raw)": 2.3336169719696045, "Pretrain/Step": 1714, "Pretrain/Step Time": 8.417937656864524} +{"Pretrain/Learning Rate": 4.9530594642025055e-05, "Pretrain/Loss": 2.1340227127075195, "Pretrain/Loss (Raw)": 2.1546521186828613, "Pretrain/Step": 1715, "Pretrain/Step Time": 8.4201057869941} +{"Pretrain/Learning Rate": 4.95297755116935e-05, "Pretrain/Loss": 2.135035276412964, "Pretrain/Loss (Raw)": 2.37375807762146, "Pretrain/Step": 1716, "Pretrain/Step Time": 8.419217802584171} +{"Pretrain/Learning Rate": 4.952895567406315e-05, "Pretrain/Loss": 2.1353988647460938, "Pretrain/Loss (Raw)": 1.958065152168274, "Pretrain/Step": 1717, "Pretrain/Step Time": 8.416032709181309} +{"Pretrain/Learning Rate": 4.952813512915766e-05, "Pretrain/Loss": 2.1352736949920654, "Pretrain/Loss (Raw)": 2.1532368659973145, "Pretrain/Step": 1718, "Pretrain/Step Time": 8.419217847287655} +{"Pretrain/Learning Rate": 4.952731387700068e-05, "Pretrain/Loss": 2.13346529006958, "Pretrain/Loss (Raw)": 1.9763373136520386, "Pretrain/Step": 1719, "Pretrain/Step Time": 8.422110550105572} +{"Pretrain/Learning Rate": 4.95264919176159e-05, "Pretrain/Loss": 2.1328659057617188, "Pretrain/Loss (Raw)": 2.123814105987549, "Pretrain/Step": 1720, "Pretrain/Step Time": 8.415311358869076} +{"Pretrain/Learning Rate": 4.952566925102702e-05, "Pretrain/Loss": 2.1349856853485107, "Pretrain/Loss (Raw)": 2.2199485301971436, "Pretrain/Step": 1721, "Pretrain/Step Time": 8.419422106817365} +{"Pretrain/Learning Rate": 4.952484587725775e-05, "Pretrain/Loss": 2.135748863220215, "Pretrain/Loss (Raw)": 2.0752029418945312, "Pretrain/Step": 1722, "Pretrain/Step Time": 8.424126025289297} +{"Pretrain/Learning Rate": 4.9524021796331845e-05, "Pretrain/Loss": 2.136577606201172, "Pretrain/Loss (Raw)": 2.0617387294769287, "Pretrain/Step": 1723, "Pretrain/Step Time": 8.427697559818625} +{"Pretrain/Learning Rate": 4.952319700827305e-05, "Pretrain/Loss": 2.138526439666748, "Pretrain/Loss (Raw)": 2.1825156211853027, "Pretrain/Step": 1724, "Pretrain/Step Time": 8.428484847769141} +{"Pretrain/Learning Rate": 4.952237151310516e-05, "Pretrain/Loss": 2.1384854316711426, "Pretrain/Loss (Raw)": 1.9041252136230469, "Pretrain/Step": 1725, "Pretrain/Step Time": 8.427450945600867} +{"Pretrain/Learning Rate": 4.952154531085198e-05, "Pretrain/Loss": 2.137593984603882, "Pretrain/Loss (Raw)": 1.9044103622436523, "Pretrain/Step": 1726, "Pretrain/Step Time": 8.432574396952987} +{"Pretrain/Learning Rate": 4.952071840153732e-05, "Pretrain/Loss": 2.141507625579834, "Pretrain/Loss (Raw)": 2.0752527713775635, "Pretrain/Step": 1727, "Pretrain/Step Time": 8.431427754461765} +{"Pretrain/Learning Rate": 4.9519890785185033e-05, "Pretrain/Loss": 2.1455111503601074, "Pretrain/Loss (Raw)": 2.55810546875, "Pretrain/Step": 1728, "Pretrain/Step Time": 8.430274095386267} +{"Pretrain/Learning Rate": 4.951906246181898e-05, "Pretrain/Loss": 2.1463561058044434, "Pretrain/Loss (Raw)": 2.1451942920684814, "Pretrain/Step": 1729, "Pretrain/Step Time": 8.432616762816906} +{"Pretrain/Learning Rate": 4.9518233431463045e-05, "Pretrain/Loss": 2.144615650177002, "Pretrain/Loss (Raw)": 2.0535519123077393, "Pretrain/Step": 1730, "Pretrain/Step Time": 8.425737783312798} +{"Pretrain/Learning Rate": 4.951740369414114e-05, "Pretrain/Loss": 2.1449642181396484, "Pretrain/Loss (Raw)": 2.1874196529388428, "Pretrain/Step": 1731, "Pretrain/Step Time": 8.427014695480466} +{"Pretrain/Learning Rate": 4.951657324987717e-05, "Pretrain/Loss": 2.1443333625793457, "Pretrain/Loss (Raw)": 1.929886817932129, "Pretrain/Step": 1732, "Pretrain/Step Time": 8.430961292237043} +{"Pretrain/Learning Rate": 4.9515742098695106e-05, "Pretrain/Loss": 2.1414268016815186, "Pretrain/Loss (Raw)": 1.9357690811157227, "Pretrain/Step": 1733, "Pretrain/Step Time": 8.427938168868423} +{"Pretrain/Learning Rate": 4.95149102406189e-05, "Pretrain/Loss": 2.1397252082824707, "Pretrain/Loss (Raw)": 1.980785608291626, "Pretrain/Step": 1734, "Pretrain/Step Time": 8.427297433838248} +{"Pretrain/Learning Rate": 4.9514077675672535e-05, "Pretrain/Loss": 2.138495922088623, "Pretrain/Loss (Raw)": 1.8665684461593628, "Pretrain/Step": 1735, "Pretrain/Step Time": 8.430490216240287} +{"Pretrain/Learning Rate": 4.951324440388002e-05, "Pretrain/Loss": 2.1355855464935303, "Pretrain/Loss (Raw)": 1.9625968933105469, "Pretrain/Step": 1736, "Pretrain/Step Time": 8.424637461081147} +{"Pretrain/Learning Rate": 4.9512410425265384e-05, "Pretrain/Loss": 2.13742995262146, "Pretrain/Loss (Raw)": 2.244192361831665, "Pretrain/Step": 1737, "Pretrain/Step Time": 8.4302449952811} +{"Pretrain/Learning Rate": 4.9511575739852685e-05, "Pretrain/Loss": 2.134627103805542, "Pretrain/Loss (Raw)": 2.1446101665496826, "Pretrain/Step": 1738, "Pretrain/Step Time": 8.432147013023496} +{"Pretrain/Learning Rate": 4.951074034766597e-05, "Pretrain/Loss": 2.133655071258545, "Pretrain/Loss (Raw)": 2.041964292526245, "Pretrain/Step": 1739, "Pretrain/Step Time": 8.430821113288403} +{"Pretrain/Learning Rate": 4.950990424872933e-05, "Pretrain/Loss": 2.132556438446045, "Pretrain/Loss (Raw)": 2.0455615520477295, "Pretrain/Step": 1740, "Pretrain/Step Time": 8.429107876494527} +{"Pretrain/Learning Rate": 4.950906744306689e-05, "Pretrain/Loss": 2.13187837600708, "Pretrain/Loss (Raw)": 2.168609380722046, "Pretrain/Step": 1741, "Pretrain/Step Time": 8.425378043204546} +{"Pretrain/Learning Rate": 4.950822993070276e-05, "Pretrain/Loss": 2.135334014892578, "Pretrain/Loss (Raw)": 2.518261671066284, "Pretrain/Step": 1742, "Pretrain/Step Time": 8.424437705427408} +{"Pretrain/Learning Rate": 4.95073917116611e-05, "Pretrain/Loss": 2.1335983276367188, "Pretrain/Loss (Raw)": 2.238245725631714, "Pretrain/Step": 1743, "Pretrain/Step Time": 8.428075412288308} +{"Pretrain/Learning Rate": 4.950655278596607e-05, "Pretrain/Loss": 2.1346652507781982, "Pretrain/Loss (Raw)": 2.259044885635376, "Pretrain/Step": 1744, "Pretrain/Step Time": 8.429483272135258} +{"Pretrain/Learning Rate": 4.950571315364188e-05, "Pretrain/Loss": 2.1346797943115234, "Pretrain/Loss (Raw)": 2.1982882022857666, "Pretrain/Step": 1745, "Pretrain/Step Time": 8.427762949839234} +{"Pretrain/Learning Rate": 4.950487281471272e-05, "Pretrain/Loss": 2.1338682174682617, "Pretrain/Loss (Raw)": 2.256176710128784, "Pretrain/Step": 1746, "Pretrain/Step Time": 8.424251781776547} +{"Pretrain/Learning Rate": 4.950403176920283e-05, "Pretrain/Loss": 2.1331655979156494, "Pretrain/Loss (Raw)": 2.0316624641418457, "Pretrain/Step": 1747, "Pretrain/Step Time": 8.424243193119764} +{"Pretrain/Learning Rate": 4.9503190017136456e-05, "Pretrain/Loss": 2.135504722595215, "Pretrain/Loss (Raw)": 2.1133649349212646, "Pretrain/Step": 1748, "Pretrain/Step Time": 8.424313120543957} +{"Pretrain/Learning Rate": 4.9502347558537866e-05, "Pretrain/Loss": 2.137627363204956, "Pretrain/Loss (Raw)": 2.1848204135894775, "Pretrain/Step": 1749, "Pretrain/Step Time": 8.422885684296489} +{"Pretrain/Learning Rate": 4.9501504393431366e-05, "Pretrain/Loss": 2.1379027366638184, "Pretrain/Loss (Raw)": 2.2455923557281494, "Pretrain/Step": 1750, "Pretrain/Step Time": 8.42175755649805} +{"Pretrain/Learning Rate": 4.950066052184125e-05, "Pretrain/Loss": 2.1366443634033203, "Pretrain/Loss (Raw)": 2.176210641860962, "Pretrain/Step": 1751, "Pretrain/Step Time": 8.422631807625294} +{"Pretrain/Learning Rate": 4.949981594379186e-05, "Pretrain/Loss": 2.137732744216919, "Pretrain/Loss (Raw)": 2.0320425033569336, "Pretrain/Step": 1752, "Pretrain/Step Time": 8.428162591531873} +{"Pretrain/Learning Rate": 4.9498970659307555e-05, "Pretrain/Loss": 2.1341633796691895, "Pretrain/Loss (Raw)": 2.0226151943206787, "Pretrain/Step": 1753, "Pretrain/Step Time": 8.422764839604497} +{"Pretrain/Learning Rate": 4.9498124668412705e-05, "Pretrain/Loss": 2.1366872787475586, "Pretrain/Loss (Raw)": 2.075646162033081, "Pretrain/Step": 1754, "Pretrain/Step Time": 8.425741633400321} +{"Pretrain/Learning Rate": 4.949727797113169e-05, "Pretrain/Loss": 2.139491558074951, "Pretrain/Loss (Raw)": 2.6181859970092773, "Pretrain/Step": 1755, "Pretrain/Step Time": 8.427741015329957} +{"Pretrain/Learning Rate": 4.949643056748894e-05, "Pretrain/Loss": 2.1380488872528076, "Pretrain/Loss (Raw)": 1.9712629318237305, "Pretrain/Step": 1756, "Pretrain/Step Time": 8.42830092459917} +{"Pretrain/Learning Rate": 4.949558245750888e-05, "Pretrain/Loss": 2.1376280784606934, "Pretrain/Loss (Raw)": 2.1603877544403076, "Pretrain/Step": 1757, "Pretrain/Step Time": 8.428037613630295} +{"Pretrain/Learning Rate": 4.949473364121597e-05, "Pretrain/Loss": 2.1362967491149902, "Pretrain/Loss (Raw)": 2.009140729904175, "Pretrain/Step": 1758, "Pretrain/Step Time": 8.427609087899327} +{"Pretrain/Learning Rate": 4.949388411863469e-05, "Pretrain/Loss": 2.1367669105529785, "Pretrain/Loss (Raw)": 2.072939872741699, "Pretrain/Step": 1759, "Pretrain/Step Time": 8.430178737267852} +{"Pretrain/Learning Rate": 4.949303388978952e-05, "Pretrain/Loss": 2.1350300312042236, "Pretrain/Loss (Raw)": 1.9500738382339478, "Pretrain/Step": 1760, "Pretrain/Step Time": 8.42787597514689} +{"Pretrain/Learning Rate": 4.949218295470499e-05, "Pretrain/Loss": 2.133607864379883, "Pretrain/Loss (Raw)": 2.1403939723968506, "Pretrain/Step": 1761, "Pretrain/Step Time": 8.430359387770295} +{"Pretrain/Learning Rate": 4.949133131340562e-05, "Pretrain/Loss": 2.1327364444732666, "Pretrain/Loss (Raw)": 2.0414934158325195, "Pretrain/Step": 1762, "Pretrain/Step Time": 8.422243852168322} +{"Pretrain/Learning Rate": 4.949047896591599e-05, "Pretrain/Loss": 2.132113456726074, "Pretrain/Loss (Raw)": 2.051163673400879, "Pretrain/Step": 1763, "Pretrain/Step Time": 8.421998832374811} +{"Pretrain/Learning Rate": 4.9489625912260654e-05, "Pretrain/Loss": 2.1319456100463867, "Pretrain/Loss (Raw)": 2.0305633544921875, "Pretrain/Step": 1764, "Pretrain/Step Time": 8.42253452539444} +{"Pretrain/Learning Rate": 4.9488772152464226e-05, "Pretrain/Loss": 2.1323182582855225, "Pretrain/Loss (Raw)": 2.1677026748657227, "Pretrain/Step": 1765, "Pretrain/Step Time": 8.420893114060163} +{"Pretrain/Learning Rate": 4.948791768655131e-05, "Pretrain/Loss": 2.13150691986084, "Pretrain/Loss (Raw)": 2.096134901046753, "Pretrain/Step": 1766, "Pretrain/Step Time": 8.42544505186379} +{"Pretrain/Learning Rate": 4.9487062514546554e-05, "Pretrain/Loss": 2.1317009925842285, "Pretrain/Loss (Raw)": 2.1171305179595947, "Pretrain/Step": 1767, "Pretrain/Step Time": 8.424920661374927} +{"Pretrain/Learning Rate": 4.948620663647461e-05, "Pretrain/Loss": 2.1318299770355225, "Pretrain/Loss (Raw)": 2.274122476577759, "Pretrain/Step": 1768, "Pretrain/Step Time": 8.421317737549543} +{"Pretrain/Learning Rate": 4.9485350052360164e-05, "Pretrain/Loss": 2.1320924758911133, "Pretrain/Loss (Raw)": 2.220123052597046, "Pretrain/Step": 1769, "Pretrain/Step Time": 8.421023949980736} +{"Pretrain/Learning Rate": 4.948449276222791e-05, "Pretrain/Loss": 2.1293230056762695, "Pretrain/Loss (Raw)": 1.949306607246399, "Pretrain/Step": 1770, "Pretrain/Step Time": 8.423674678429961} +{"Pretrain/Learning Rate": 4.948363476610256e-05, "Pretrain/Loss": 2.130312204360962, "Pretrain/Loss (Raw)": 2.2157161235809326, "Pretrain/Step": 1771, "Pretrain/Step Time": 8.424636200070381} +{"Pretrain/Learning Rate": 4.9482776064008865e-05, "Pretrain/Loss": 2.1304261684417725, "Pretrain/Loss (Raw)": 1.913722038269043, "Pretrain/Step": 1772, "Pretrain/Step Time": 8.426098080351949} +{"Pretrain/Learning Rate": 4.948191665597158e-05, "Pretrain/Loss": 2.128988265991211, "Pretrain/Loss (Raw)": 1.994802713394165, "Pretrain/Step": 1773, "Pretrain/Step Time": 8.426421090960503} +{"Pretrain/Learning Rate": 4.948105654201549e-05, "Pretrain/Loss": 2.128420829772949, "Pretrain/Loss (Raw)": 1.9181246757507324, "Pretrain/Step": 1774, "Pretrain/Step Time": 8.421426689252257} +{"Pretrain/Learning Rate": 4.94801957221654e-05, "Pretrain/Loss": 2.1284067630767822, "Pretrain/Loss (Raw)": 2.048617124557495, "Pretrain/Step": 1775, "Pretrain/Step Time": 8.423134999349713} +{"Pretrain/Learning Rate": 4.9479334196446116e-05, "Pretrain/Loss": 2.1285877227783203, "Pretrain/Loss (Raw)": 2.0706350803375244, "Pretrain/Step": 1776, "Pretrain/Step Time": 8.419328013435006} +{"Pretrain/Learning Rate": 4.9478471964882476e-05, "Pretrain/Loss": 2.1252541542053223, "Pretrain/Loss (Raw)": 1.9946802854537964, "Pretrain/Step": 1777, "Pretrain/Step Time": 8.417047668248415} +{"Pretrain/Learning Rate": 4.947760902749937e-05, "Pretrain/Loss": 2.1256017684936523, "Pretrain/Loss (Raw)": 2.334118127822876, "Pretrain/Step": 1778, "Pretrain/Step Time": 8.41754605807364} +{"Pretrain/Learning Rate": 4.9476745384321654e-05, "Pretrain/Loss": 2.123624086380005, "Pretrain/Loss (Raw)": 1.972646951675415, "Pretrain/Step": 1779, "Pretrain/Step Time": 8.416179273277521} +{"Pretrain/Learning Rate": 4.947588103537425e-05, "Pretrain/Loss": 2.1245763301849365, "Pretrain/Loss (Raw)": 2.2929599285125732, "Pretrain/Step": 1780, "Pretrain/Step Time": 8.413387769833207} +{"Pretrain/Learning Rate": 4.947501598068206e-05, "Pretrain/Loss": 2.1237435340881348, "Pretrain/Loss (Raw)": 2.1195168495178223, "Pretrain/Step": 1781, "Pretrain/Step Time": 8.413448302075267} +{"Pretrain/Learning Rate": 4.947415022027004e-05, "Pretrain/Loss": 2.1223223209381104, "Pretrain/Loss (Raw)": 2.046163320541382, "Pretrain/Step": 1782, "Pretrain/Step Time": 8.411526767536998} +{"Pretrain/Learning Rate": 4.947328375416316e-05, "Pretrain/Loss": 2.123523712158203, "Pretrain/Loss (Raw)": 2.1955292224884033, "Pretrain/Step": 1783, "Pretrain/Step Time": 8.415416525676847} +{"Pretrain/Learning Rate": 4.947241658238638e-05, "Pretrain/Loss": 2.1226048469543457, "Pretrain/Loss (Raw)": 2.0077250003814697, "Pretrain/Step": 1784, "Pretrain/Step Time": 8.417959613725543} +{"Pretrain/Learning Rate": 4.947154870496473e-05, "Pretrain/Loss": 2.122953414916992, "Pretrain/Loss (Raw)": 2.136739730834961, "Pretrain/Step": 1785, "Pretrain/Step Time": 8.420142233371735} +{"Pretrain/Learning Rate": 4.947068012192323e-05, "Pretrain/Loss": 2.124223232269287, "Pretrain/Loss (Raw)": 2.2218315601348877, "Pretrain/Step": 1786, "Pretrain/Step Time": 8.42094500362873} +{"Pretrain/Learning Rate": 4.946981083328691e-05, "Pretrain/Loss": 2.1230809688568115, "Pretrain/Loss (Raw)": 1.912114143371582, "Pretrain/Step": 1787, "Pretrain/Step Time": 8.420039048418403} +{"Pretrain/Learning Rate": 4.9468940839080845e-05, "Pretrain/Loss": 2.123391628265381, "Pretrain/Loss (Raw)": 2.0708696842193604, "Pretrain/Step": 1788, "Pretrain/Step Time": 8.419127967208624} +{"Pretrain/Learning Rate": 4.946807013933012e-05, "Pretrain/Loss": 2.1243414878845215, "Pretrain/Loss (Raw)": 2.243870973587036, "Pretrain/Step": 1789, "Pretrain/Step Time": 8.420059066265821} +{"Pretrain/Learning Rate": 4.946719873405985e-05, "Pretrain/Loss": 2.128904342651367, "Pretrain/Loss (Raw)": 2.631784677505493, "Pretrain/Step": 1790, "Pretrain/Step Time": 8.423786943778396} +{"Pretrain/Learning Rate": 4.9466326623295146e-05, "Pretrain/Loss": 2.127779006958008, "Pretrain/Loss (Raw)": 1.9418002367019653, "Pretrain/Step": 1791, "Pretrain/Step Time": 8.418923418968916} +{"Pretrain/Learning Rate": 4.946545380706116e-05, "Pretrain/Loss": 2.128352165222168, "Pretrain/Loss (Raw)": 2.1019279956817627, "Pretrain/Step": 1792, "Pretrain/Step Time": 8.420052276924253} +{"Pretrain/Learning Rate": 4.946458028538306e-05, "Pretrain/Loss": 2.126178741455078, "Pretrain/Loss (Raw)": 2.1172916889190674, "Pretrain/Step": 1793, "Pretrain/Step Time": 8.417881896719337} +{"Pretrain/Learning Rate": 4.946370605828604e-05, "Pretrain/Loss": 2.126347064971924, "Pretrain/Loss (Raw)": 2.1306984424591064, "Pretrain/Step": 1794, "Pretrain/Step Time": 8.415147641673684} +{"Pretrain/Learning Rate": 4.94628311257953e-05, "Pretrain/Loss": 2.1226449012756348, "Pretrain/Loss (Raw)": 1.9055346250534058, "Pretrain/Step": 1795, "Pretrain/Step Time": 8.415059695020318} +{"Pretrain/Learning Rate": 4.9461955487936066e-05, "Pretrain/Loss": 2.1228861808776855, "Pretrain/Loss (Raw)": 2.0667521953582764, "Pretrain/Step": 1796, "Pretrain/Step Time": 8.413497449830174} +{"Pretrain/Learning Rate": 4.946107914473359e-05, "Pretrain/Loss": 2.12237811088562, "Pretrain/Loss (Raw)": 2.0381507873535156, "Pretrain/Step": 1797, "Pretrain/Step Time": 8.417468501254916} +{"Pretrain/Learning Rate": 4.946020209621314e-05, "Pretrain/Loss": 2.123075008392334, "Pretrain/Loss (Raw)": 2.2099616527557373, "Pretrain/Step": 1798, "Pretrain/Step Time": 8.413111180067062} +{"Pretrain/Learning Rate": 4.945932434240001e-05, "Pretrain/Loss": 2.1199512481689453, "Pretrain/Loss (Raw)": 2.164000988006592, "Pretrain/Step": 1799, "Pretrain/Step Time": 8.414759170264006} +{"Pretrain/Learning Rate": 4.9458445883319504e-05, "Pretrain/Loss": 2.1212596893310547, "Pretrain/Loss (Raw)": 2.088691473007202, "Pretrain/Step": 1800, "Pretrain/Step Time": 8.41352429986} +{"Pretrain/Learning Rate": 4.945756671899695e-05, "Pretrain/Loss": 2.1219654083251953, "Pretrain/Loss (Raw)": 2.164139986038208, "Pretrain/Step": 1801, "Pretrain/Step Time": 8.422268712893128} +{"Pretrain/Learning Rate": 4.94566868494577e-05, "Pretrain/Loss": 2.1217355728149414, "Pretrain/Loss (Raw)": 2.149552822113037, "Pretrain/Step": 1802, "Pretrain/Step Time": 8.421546561643481} +{"Pretrain/Learning Rate": 4.945580627472713e-05, "Pretrain/Loss": 2.1216816902160645, "Pretrain/Loss (Raw)": 2.055556058883667, "Pretrain/Step": 1803, "Pretrain/Step Time": 8.421659864485264} +{"Pretrain/Learning Rate": 4.9454924994830634e-05, "Pretrain/Loss": 2.121371030807495, "Pretrain/Loss (Raw)": 2.123401641845703, "Pretrain/Step": 1804, "Pretrain/Step Time": 8.425907969474792} +{"Pretrain/Learning Rate": 4.945404300979361e-05, "Pretrain/Loss": 2.1181273460388184, "Pretrain/Loss (Raw)": 1.9710533618927002, "Pretrain/Step": 1805, "Pretrain/Step Time": 8.42627184279263} +{"Pretrain/Learning Rate": 4.945316031964149e-05, "Pretrain/Loss": 2.1174986362457275, "Pretrain/Loss (Raw)": 2.1184887886047363, "Pretrain/Step": 1806, "Pretrain/Step Time": 8.426564894616604} +{"Pretrain/Learning Rate": 4.945227692439973e-05, "Pretrain/Loss": 2.116300106048584, "Pretrain/Loss (Raw)": 1.9875503778457642, "Pretrain/Step": 1807, "Pretrain/Step Time": 8.421518743038177} +{"Pretrain/Learning Rate": 4.94513928240938e-05, "Pretrain/Loss": 2.1198854446411133, "Pretrain/Loss (Raw)": 2.347107410430908, "Pretrain/Step": 1808, "Pretrain/Step Time": 8.423258112743497} +{"Pretrain/Learning Rate": 4.94505080187492e-05, "Pretrain/Loss": 2.1193430423736572, "Pretrain/Loss (Raw)": 2.318563222885132, "Pretrain/Step": 1809, "Pretrain/Step Time": 8.42611857317388} +{"Pretrain/Learning Rate": 4.944962250839144e-05, "Pretrain/Loss": 2.1196579933166504, "Pretrain/Loss (Raw)": 2.2353193759918213, "Pretrain/Step": 1810, "Pretrain/Step Time": 8.425521364435554} +{"Pretrain/Learning Rate": 4.944873629304605e-05, "Pretrain/Loss": 2.1204018592834473, "Pretrain/Loss (Raw)": 2.058716058731079, "Pretrain/Step": 1811, "Pretrain/Step Time": 8.419093001633883} +{"Pretrain/Learning Rate": 4.944784937273858e-05, "Pretrain/Loss": 2.1230554580688477, "Pretrain/Loss (Raw)": 2.356048822402954, "Pretrain/Step": 1812, "Pretrain/Step Time": 8.418908605352044} +{"Pretrain/Learning Rate": 4.944696174749461e-05, "Pretrain/Loss": 2.122669219970703, "Pretrain/Loss (Raw)": 2.2023062705993652, "Pretrain/Step": 1813, "Pretrain/Step Time": 8.420281941071153} +{"Pretrain/Learning Rate": 4.9446073417339733e-05, "Pretrain/Loss": 2.1229419708251953, "Pretrain/Loss (Raw)": 2.10829758644104, "Pretrain/Step": 1814, "Pretrain/Step Time": 8.417502630501986} +{"Pretrain/Learning Rate": 4.944518438229956e-05, "Pretrain/Loss": 2.124560832977295, "Pretrain/Loss (Raw)": 2.128389358520508, "Pretrain/Step": 1815, "Pretrain/Step Time": 8.418680584058166} +{"Pretrain/Learning Rate": 4.9444294642399735e-05, "Pretrain/Loss": 2.124246835708618, "Pretrain/Loss (Raw)": 2.0487797260284424, "Pretrain/Step": 1816, "Pretrain/Step Time": 8.418475328013301} +{"Pretrain/Learning Rate": 4.94434041976659e-05, "Pretrain/Loss": 2.1249279975891113, "Pretrain/Loss (Raw)": 2.108546495437622, "Pretrain/Step": 1817, "Pretrain/Step Time": 8.413689943030477} +{"Pretrain/Learning Rate": 4.944251304812374e-05, "Pretrain/Loss": 2.1244959831237793, "Pretrain/Loss (Raw)": 2.015734910964966, "Pretrain/Step": 1818, "Pretrain/Step Time": 8.419714640825987} +{"Pretrain/Learning Rate": 4.9441621193798945e-05, "Pretrain/Loss": 2.1220550537109375, "Pretrain/Loss (Raw)": 1.9409167766571045, "Pretrain/Step": 1819, "Pretrain/Step Time": 8.420967858284712} +{"Pretrain/Learning Rate": 4.9440728634717226e-05, "Pretrain/Loss": 2.121988534927368, "Pretrain/Loss (Raw)": 2.1500794887542725, "Pretrain/Step": 1820, "Pretrain/Step Time": 8.418704444542527} +{"Pretrain/Learning Rate": 4.943983537090433e-05, "Pretrain/Loss": 2.119717836380005, "Pretrain/Loss (Raw)": 2.0979177951812744, "Pretrain/Step": 1821, "Pretrain/Step Time": 8.421391120180488} +{"Pretrain/Learning Rate": 4.943894140238602e-05, "Pretrain/Loss": 2.120344638824463, "Pretrain/Loss (Raw)": 2.191725254058838, "Pretrain/Step": 1822, "Pretrain/Step Time": 8.419423321262002} +{"Pretrain/Learning Rate": 4.943804672918806e-05, "Pretrain/Loss": 2.121857166290283, "Pretrain/Loss (Raw)": 2.2232656478881836, "Pretrain/Step": 1823, "Pretrain/Step Time": 8.41727307997644} +{"Pretrain/Learning Rate": 4.9437151351336243e-05, "Pretrain/Loss": 2.1198527812957764, "Pretrain/Loss (Raw)": 2.123579978942871, "Pretrain/Step": 1824, "Pretrain/Step Time": 8.414102487266064} +{"Pretrain/Learning Rate": 4.94362552688564e-05, "Pretrain/Loss": 2.1218185424804688, "Pretrain/Loss (Raw)": 2.1874444484710693, "Pretrain/Step": 1825, "Pretrain/Step Time": 8.417148953303695} +{"Pretrain/Learning Rate": 4.943535848177435e-05, "Pretrain/Loss": 2.1215453147888184, "Pretrain/Loss (Raw)": 2.1273751258850098, "Pretrain/Step": 1826, "Pretrain/Step Time": 8.4187904689461} +{"Pretrain/Learning Rate": 4.943446099011598e-05, "Pretrain/Loss": 2.1214518547058105, "Pretrain/Loss (Raw)": 2.025658369064331, "Pretrain/Step": 1827, "Pretrain/Step Time": 8.418364392593503} +{"Pretrain/Learning Rate": 4.9433562793907146e-05, "Pretrain/Loss": 2.1209726333618164, "Pretrain/Loss (Raw)": 1.8065871000289917, "Pretrain/Step": 1828, "Pretrain/Step Time": 8.417192036285996} +{"Pretrain/Learning Rate": 4.9432663893173757e-05, "Pretrain/Loss": 2.120722532272339, "Pretrain/Loss (Raw)": 2.1520607471466064, "Pretrain/Step": 1829, "Pretrain/Step Time": 8.41710201650858} +{"Pretrain/Learning Rate": 4.943176428794172e-05, "Pretrain/Loss": 2.1190199851989746, "Pretrain/Loss (Raw)": 2.084642171859741, "Pretrain/Step": 1830, "Pretrain/Step Time": 8.41524388641119} +{"Pretrain/Learning Rate": 4.943086397823699e-05, "Pretrain/Loss": 2.1183695793151855, "Pretrain/Loss (Raw)": 2.234480142593384, "Pretrain/Step": 1831, "Pretrain/Step Time": 8.413499457761645} +{"Pretrain/Learning Rate": 4.9429962964085517e-05, "Pretrain/Loss": 2.1183688640594482, "Pretrain/Loss (Raw)": 2.0512940883636475, "Pretrain/Step": 1832, "Pretrain/Step Time": 8.414164053276181} +{"Pretrain/Learning Rate": 4.942906124551328e-05, "Pretrain/Loss": 2.11747407913208, "Pretrain/Loss (Raw)": 2.0867111682891846, "Pretrain/Step": 1833, "Pretrain/Step Time": 8.412967571988702} +{"Pretrain/Learning Rate": 4.9428158822546296e-05, "Pretrain/Loss": 2.116950035095215, "Pretrain/Loss (Raw)": 2.1631276607513428, "Pretrain/Step": 1834, "Pretrain/Step Time": 8.417270205914974} +{"Pretrain/Learning Rate": 4.942725569521056e-05, "Pretrain/Loss": 2.118091583251953, "Pretrain/Loss (Raw)": 2.252997875213623, "Pretrain/Step": 1835, "Pretrain/Step Time": 8.415130136534572} +{"Pretrain/Learning Rate": 4.942635186353214e-05, "Pretrain/Loss": 2.117527961730957, "Pretrain/Loss (Raw)": 2.0574164390563965, "Pretrain/Step": 1836, "Pretrain/Step Time": 8.415398467332125} +{"Pretrain/Learning Rate": 4.9425447327537075e-05, "Pretrain/Loss": 2.1180319786071777, "Pretrain/Loss (Raw)": 2.0924463272094727, "Pretrain/Step": 1837, "Pretrain/Step Time": 8.416520241647959} +{"Pretrain/Learning Rate": 4.942454208725145e-05, "Pretrain/Loss": 2.1186249256134033, "Pretrain/Loss (Raw)": 2.258345127105713, "Pretrain/Step": 1838, "Pretrain/Step Time": 8.414191158488393} +{"Pretrain/Learning Rate": 4.942363614270138e-05, "Pretrain/Loss": 2.1209540367126465, "Pretrain/Loss (Raw)": 2.3294405937194824, "Pretrain/Step": 1839, "Pretrain/Step Time": 8.418486893177032} +{"Pretrain/Learning Rate": 4.942272949391298e-05, "Pretrain/Loss": 2.120007276535034, "Pretrain/Loss (Raw)": 2.073719024658203, "Pretrain/Step": 1840, "Pretrain/Step Time": 8.418537503108382} +{"Pretrain/Learning Rate": 4.942182214091238e-05, "Pretrain/Loss": 2.1207103729248047, "Pretrain/Loss (Raw)": 2.1515958309173584, "Pretrain/Step": 1841, "Pretrain/Step Time": 8.416729023680091} +{"Pretrain/Learning Rate": 4.942091408372577e-05, "Pretrain/Loss": 2.1196346282958984, "Pretrain/Loss (Raw)": 2.1958954334259033, "Pretrain/Step": 1842, "Pretrain/Step Time": 8.417321629822254} +{"Pretrain/Learning Rate": 4.942000532237931e-05, "Pretrain/Loss": 2.1173696517944336, "Pretrain/Loss (Raw)": 1.864759087562561, "Pretrain/Step": 1843, "Pretrain/Step Time": 8.413431445136666} +{"Pretrain/Learning Rate": 4.941909585689921e-05, "Pretrain/Loss": 2.1139931678771973, "Pretrain/Loss (Raw)": 1.941575288772583, "Pretrain/Step": 1844, "Pretrain/Step Time": 8.413020448759198} +{"Pretrain/Learning Rate": 4.9418185687311705e-05, "Pretrain/Loss": 2.1157822608947754, "Pretrain/Loss (Raw)": 2.187059164047241, "Pretrain/Step": 1845, "Pretrain/Step Time": 8.414396420121193} +{"Pretrain/Learning Rate": 4.941727481364302e-05, "Pretrain/Loss": 2.114328622817993, "Pretrain/Loss (Raw)": 1.9671695232391357, "Pretrain/Step": 1846, "Pretrain/Step Time": 8.413655450567603} +{"Pretrain/Learning Rate": 4.941636323591943e-05, "Pretrain/Loss": 2.114055633544922, "Pretrain/Loss (Raw)": 1.9413822889328003, "Pretrain/Step": 1847, "Pretrain/Step Time": 8.412644566968083} +{"Pretrain/Learning Rate": 4.941545095416722e-05, "Pretrain/Loss": 2.1139445304870605, "Pretrain/Loss (Raw)": 2.109570026397705, "Pretrain/Step": 1848, "Pretrain/Step Time": 8.417904855683446} +{"Pretrain/Learning Rate": 4.941453796841269e-05, "Pretrain/Loss": 2.1111326217651367, "Pretrain/Loss (Raw)": 1.8600645065307617, "Pretrain/Step": 1849, "Pretrain/Step Time": 8.41581672616303} +{"Pretrain/Learning Rate": 4.941362427868218e-05, "Pretrain/Loss": 2.114760160446167, "Pretrain/Loss (Raw)": 2.5395185947418213, "Pretrain/Step": 1850, "Pretrain/Step Time": 8.410982014611363} +{"Pretrain/Learning Rate": 4.9412709885002006e-05, "Pretrain/Loss": 2.113649845123291, "Pretrain/Loss (Raw)": 1.91960871219635, "Pretrain/Step": 1851, "Pretrain/Step Time": 8.411228159442544} +{"Pretrain/Learning Rate": 4.9411794787398565e-05, "Pretrain/Loss": 2.112670660018921, "Pretrain/Loss (Raw)": 2.0571820735931396, "Pretrain/Step": 1852, "Pretrain/Step Time": 8.412832245230675} +{"Pretrain/Learning Rate": 4.941087898589824e-05, "Pretrain/Loss": 2.113241195678711, "Pretrain/Loss (Raw)": 1.9771485328674316, "Pretrain/Step": 1853, "Pretrain/Step Time": 8.415561221539974} +{"Pretrain/Learning Rate": 4.940996248052741e-05, "Pretrain/Loss": 2.1152350902557373, "Pretrain/Loss (Raw)": 2.159635305404663, "Pretrain/Step": 1854, "Pretrain/Step Time": 8.411977723240852} +{"Pretrain/Learning Rate": 4.9409045271312524e-05, "Pretrain/Loss": 2.115501880645752, "Pretrain/Loss (Raw)": 2.1094112396240234, "Pretrain/Step": 1855, "Pretrain/Step Time": 8.414932185783982} +{"Pretrain/Learning Rate": 4.940812735828003e-05, "Pretrain/Loss": 2.111363410949707, "Pretrain/Loss (Raw)": 2.0283608436584473, "Pretrain/Step": 1856, "Pretrain/Step Time": 8.415466289967299} +{"Pretrain/Learning Rate": 4.940720874145638e-05, "Pretrain/Loss": 2.109030246734619, "Pretrain/Loss (Raw)": 1.8465631008148193, "Pretrain/Step": 1857, "Pretrain/Step Time": 8.414178788661957} +{"Pretrain/Learning Rate": 4.940628942086808e-05, "Pretrain/Loss": 2.1096363067626953, "Pretrain/Loss (Raw)": 2.131098508834839, "Pretrain/Step": 1858, "Pretrain/Step Time": 8.4169398304075} +{"Pretrain/Learning Rate": 4.9405369396541634e-05, "Pretrain/Loss": 2.108181953430176, "Pretrain/Loss (Raw)": 2.0012829303741455, "Pretrain/Step": 1859, "Pretrain/Step Time": 8.41356036812067} +{"Pretrain/Learning Rate": 4.940444866850356e-05, "Pretrain/Loss": 2.1103241443634033, "Pretrain/Loss (Raw)": 2.2040913105010986, "Pretrain/Step": 1860, "Pretrain/Step Time": 8.408089641481638} +{"Pretrain/Learning Rate": 4.940352723678041e-05, "Pretrain/Loss": 2.1115167140960693, "Pretrain/Loss (Raw)": 2.088435411453247, "Pretrain/Step": 1861, "Pretrain/Step Time": 8.413585375994444} +{"Pretrain/Learning Rate": 4.9402605101398755e-05, "Pretrain/Loss": 2.1128101348876953, "Pretrain/Loss (Raw)": 2.14634370803833, "Pretrain/Step": 1862, "Pretrain/Step Time": 8.41152854077518} +{"Pretrain/Learning Rate": 4.9401682262385195e-05, "Pretrain/Loss": 2.1144065856933594, "Pretrain/Loss (Raw)": 2.070873498916626, "Pretrain/Step": 1863, "Pretrain/Step Time": 8.409246133640409} +{"Pretrain/Learning Rate": 4.940075871976632e-05, "Pretrain/Loss": 2.1170554161071777, "Pretrain/Loss (Raw)": 2.301661729812622, "Pretrain/Step": 1864, "Pretrain/Step Time": 8.41449628956616} +{"Pretrain/Learning Rate": 4.9399834473568776e-05, "Pretrain/Loss": 2.11545729637146, "Pretrain/Loss (Raw)": 2.039630651473999, "Pretrain/Step": 1865, "Pretrain/Step Time": 8.411663230508566} +{"Pretrain/Learning Rate": 4.93989095238192e-05, "Pretrain/Loss": 2.1143786907196045, "Pretrain/Loss (Raw)": 2.006556510925293, "Pretrain/Step": 1866, "Pretrain/Step Time": 8.41158395446837} +{"Pretrain/Learning Rate": 4.939798387054427e-05, "Pretrain/Loss": 2.1161327362060547, "Pretrain/Loss (Raw)": 2.266469717025757, "Pretrain/Step": 1867, "Pretrain/Step Time": 8.416213134303689} +{"Pretrain/Learning Rate": 4.939705751377067e-05, "Pretrain/Loss": 2.1163978576660156, "Pretrain/Loss (Raw)": 2.0795352458953857, "Pretrain/Step": 1868, "Pretrain/Step Time": 8.417099645361304} +{"Pretrain/Learning Rate": 4.939613045352512e-05, "Pretrain/Loss": 2.1153812408447266, "Pretrain/Loss (Raw)": 2.038456678390503, "Pretrain/Step": 1869, "Pretrain/Step Time": 8.419067364186049} +{"Pretrain/Learning Rate": 4.939520268983435e-05, "Pretrain/Loss": 2.1130716800689697, "Pretrain/Loss (Raw)": 2.2226486206054688, "Pretrain/Step": 1870, "Pretrain/Step Time": 8.419336382299662} +{"Pretrain/Learning Rate": 4.93942742227251e-05, "Pretrain/Loss": 2.1136081218719482, "Pretrain/Loss (Raw)": 2.306896924972534, "Pretrain/Step": 1871, "Pretrain/Step Time": 8.414396181702614} +{"Pretrain/Learning Rate": 4.939334505222415e-05, "Pretrain/Loss": 2.1104369163513184, "Pretrain/Loss (Raw)": 1.8531650304794312, "Pretrain/Step": 1872, "Pretrain/Step Time": 8.416846729815006} +{"Pretrain/Learning Rate": 4.93924151783583e-05, "Pretrain/Loss": 2.1076951026916504, "Pretrain/Loss (Raw)": 1.8473076820373535, "Pretrain/Step": 1873, "Pretrain/Step Time": 8.418281247839332} +{"Pretrain/Learning Rate": 4.9391484601154346e-05, "Pretrain/Loss": 2.1075754165649414, "Pretrain/Loss (Raw)": 2.2408413887023926, "Pretrain/Step": 1874, "Pretrain/Step Time": 8.417672779411077} +{"Pretrain/Learning Rate": 4.939055332063913e-05, "Pretrain/Loss": 2.108915090560913, "Pretrain/Loss (Raw)": 2.2031474113464355, "Pretrain/Step": 1875, "Pretrain/Step Time": 8.418083366006613} +{"Pretrain/Learning Rate": 4.938962133683951e-05, "Pretrain/Loss": 2.109445333480835, "Pretrain/Loss (Raw)": 2.1812562942504883, "Pretrain/Step": 1876, "Pretrain/Step Time": 8.415211727842689} +{"Pretrain/Learning Rate": 4.938868864978234e-05, "Pretrain/Loss": 2.1121630668640137, "Pretrain/Loss (Raw)": 2.5326950550079346, "Pretrain/Step": 1877, "Pretrain/Step Time": 8.415901325643063} +{"Pretrain/Learning Rate": 4.938775525949453e-05, "Pretrain/Loss": 2.1098811626434326, "Pretrain/Loss (Raw)": 1.953491449356079, "Pretrain/Step": 1878, "Pretrain/Step Time": 8.415748804807663} +{"Pretrain/Learning Rate": 4.938682116600299e-05, "Pretrain/Loss": 2.109145164489746, "Pretrain/Loss (Raw)": 2.0820178985595703, "Pretrain/Step": 1879, "Pretrain/Step Time": 8.414580069482327} +{"Pretrain/Learning Rate": 4.938588636933466e-05, "Pretrain/Loss": 2.110572338104248, "Pretrain/Loss (Raw)": 2.2147111892700195, "Pretrain/Step": 1880, "Pretrain/Step Time": 8.411159371957183} +{"Pretrain/Learning Rate": 4.938495086951648e-05, "Pretrain/Loss": 2.1113970279693604, "Pretrain/Loss (Raw)": 2.1281609535217285, "Pretrain/Step": 1881, "Pretrain/Step Time": 8.408822169527411} +{"Pretrain/Learning Rate": 4.938401466657544e-05, "Pretrain/Loss": 2.1100497245788574, "Pretrain/Loss (Raw)": 1.9032065868377686, "Pretrain/Step": 1882, "Pretrain/Step Time": 8.40817173756659} +{"Pretrain/Learning Rate": 4.938307776053852e-05, "Pretrain/Loss": 2.106288433074951, "Pretrain/Loss (Raw)": 2.136763095855713, "Pretrain/Step": 1883, "Pretrain/Step Time": 8.405831085518003} +{"Pretrain/Learning Rate": 4.9382140151432746e-05, "Pretrain/Loss": 2.106489419937134, "Pretrain/Loss (Raw)": 1.996981143951416, "Pretrain/Step": 1884, "Pretrain/Step Time": 8.409815011546016} +{"Pretrain/Learning Rate": 4.938120183928514e-05, "Pretrain/Loss": 2.104670524597168, "Pretrain/Loss (Raw)": 1.9275431632995605, "Pretrain/Step": 1885, "Pretrain/Step Time": 8.407938990741968} +{"Pretrain/Learning Rate": 4.938026282412277e-05, "Pretrain/Loss": 2.105133056640625, "Pretrain/Loss (Raw)": 2.068369150161743, "Pretrain/Step": 1886, "Pretrain/Step Time": 8.406525425612926} +{"Pretrain/Learning Rate": 4.9379323105972705e-05, "Pretrain/Loss": 2.1044836044311523, "Pretrain/Loss (Raw)": 1.9898101091384888, "Pretrain/Step": 1887, "Pretrain/Step Time": 8.407270099967718} +{"Pretrain/Learning Rate": 4.937838268486206e-05, "Pretrain/Loss": 2.1038174629211426, "Pretrain/Loss (Raw)": 1.8647983074188232, "Pretrain/Step": 1888, "Pretrain/Step Time": 8.412741407752037} +{"Pretrain/Learning Rate": 4.9377441560817924e-05, "Pretrain/Loss": 2.101557731628418, "Pretrain/Loss (Raw)": 1.8511114120483398, "Pretrain/Step": 1889, "Pretrain/Step Time": 8.41195142827928} +{"Pretrain/Learning Rate": 4.937649973386744e-05, "Pretrain/Loss": 2.1031527519226074, "Pretrain/Loss (Raw)": 2.245708465576172, "Pretrain/Step": 1890, "Pretrain/Step Time": 8.413080910220742} +{"Pretrain/Learning Rate": 4.937555720403778e-05, "Pretrain/Loss": 2.105164051055908, "Pretrain/Loss (Raw)": 2.308579683303833, "Pretrain/Step": 1891, "Pretrain/Step Time": 8.411963889375329} +{"Pretrain/Learning Rate": 4.9374613971356115e-05, "Pretrain/Loss": 2.1064491271972656, "Pretrain/Loss (Raw)": 2.1950669288635254, "Pretrain/Step": 1892, "Pretrain/Step Time": 8.411177456378937} +{"Pretrain/Learning Rate": 4.9373670035849635e-05, "Pretrain/Loss": 2.1048269271850586, "Pretrain/Loss (Raw)": 1.9600632190704346, "Pretrain/Step": 1893, "Pretrain/Step Time": 8.415013335645199} +{"Pretrain/Learning Rate": 4.937272539754556e-05, "Pretrain/Loss": 2.101968765258789, "Pretrain/Loss (Raw)": 1.7302708625793457, "Pretrain/Step": 1894, "Pretrain/Step Time": 8.41277945227921} +{"Pretrain/Learning Rate": 4.937178005647113e-05, "Pretrain/Loss": 2.1017231941223145, "Pretrain/Loss (Raw)": 2.085686683654785, "Pretrain/Step": 1895, "Pretrain/Step Time": 8.416522802785039} +{"Pretrain/Learning Rate": 4.93708340126536e-05, "Pretrain/Loss": 2.1007113456726074, "Pretrain/Loss (Raw)": 2.1446356773376465, "Pretrain/Step": 1896, "Pretrain/Step Time": 8.414447732269764} +{"Pretrain/Learning Rate": 4.9369887266120257e-05, "Pretrain/Loss": 2.1007518768310547, "Pretrain/Loss (Raw)": 2.2252931594848633, "Pretrain/Step": 1897, "Pretrain/Step Time": 8.415652042254806} +{"Pretrain/Learning Rate": 4.9368939816898396e-05, "Pretrain/Loss": 2.1024889945983887, "Pretrain/Loss (Raw)": 2.171684741973877, "Pretrain/Step": 1898, "Pretrain/Step Time": 8.416695604100823} +{"Pretrain/Learning Rate": 4.9367991665015326e-05, "Pretrain/Loss": 2.100940704345703, "Pretrain/Loss (Raw)": 2.017540454864502, "Pretrain/Step": 1899, "Pretrain/Step Time": 8.418342174962163} +{"Pretrain/Learning Rate": 4.9367042810498395e-05, "Pretrain/Loss": 2.1036148071289062, "Pretrain/Loss (Raw)": 2.2559924125671387, "Pretrain/Step": 1900, "Pretrain/Step Time": 8.41688460111618} +{"Pretrain/Learning Rate": 4.936609325337497e-05, "Pretrain/Loss": 2.1040828227996826, "Pretrain/Loss (Raw)": 2.05470609664917, "Pretrain/Step": 1901, "Pretrain/Step Time": 8.416388472542167} +{"Pretrain/Learning Rate": 4.936514299367242e-05, "Pretrain/Loss": 2.105983257293701, "Pretrain/Loss (Raw)": 2.1613576412200928, "Pretrain/Step": 1902, "Pretrain/Step Time": 8.419653231278062} +{"Pretrain/Learning Rate": 4.936419203141815e-05, "Pretrain/Loss": 2.1052088737487793, "Pretrain/Loss (Raw)": 1.949509620666504, "Pretrain/Step": 1903, "Pretrain/Step Time": 8.421773234382272} +{"Pretrain/Learning Rate": 4.936324036663957e-05, "Pretrain/Loss": 2.104269504547119, "Pretrain/Loss (Raw)": 1.9503899812698364, "Pretrain/Step": 1904, "Pretrain/Step Time": 8.424958415329456} +{"Pretrain/Learning Rate": 4.936228799936414e-05, "Pretrain/Loss": 2.106712818145752, "Pretrain/Loss (Raw)": 2.3074300289154053, "Pretrain/Step": 1905, "Pretrain/Step Time": 8.424164477735758} +{"Pretrain/Learning Rate": 4.936133492961931e-05, "Pretrain/Loss": 2.1043074131011963, "Pretrain/Loss (Raw)": 2.026226043701172, "Pretrain/Step": 1906, "Pretrain/Step Time": 8.420320179313421} +{"Pretrain/Learning Rate": 4.936038115743255e-05, "Pretrain/Loss": 2.105525493621826, "Pretrain/Loss (Raw)": 2.128572702407837, "Pretrain/Step": 1907, "Pretrain/Step Time": 8.423504499718547} +{"Pretrain/Learning Rate": 4.935942668283138e-05, "Pretrain/Loss": 2.1053237915039062, "Pretrain/Loss (Raw)": 2.2671163082122803, "Pretrain/Step": 1908, "Pretrain/Step Time": 8.423146402463317} +{"Pretrain/Learning Rate": 4.9358471505843305e-05, "Pretrain/Loss": 2.1048460006713867, "Pretrain/Loss (Raw)": 2.0583629608154297, "Pretrain/Step": 1909, "Pretrain/Step Time": 8.423544207587838} +{"Pretrain/Learning Rate": 4.935751562649589e-05, "Pretrain/Loss": 2.1044867038726807, "Pretrain/Loss (Raw)": 2.0001962184906006, "Pretrain/Step": 1910, "Pretrain/Step Time": 8.424632543697953} +{"Pretrain/Learning Rate": 4.935655904481668e-05, "Pretrain/Loss": 2.1036367416381836, "Pretrain/Loss (Raw)": 2.0867271423339844, "Pretrain/Step": 1911, "Pretrain/Step Time": 8.419743075966835} +{"Pretrain/Learning Rate": 4.9355601760833245e-05, "Pretrain/Loss": 2.1050333976745605, "Pretrain/Loss (Raw)": 2.186525583267212, "Pretrain/Step": 1912, "Pretrain/Step Time": 8.417140362784266} +{"Pretrain/Learning Rate": 4.935464377457322e-05, "Pretrain/Loss": 2.1048614978790283, "Pretrain/Loss (Raw)": 2.114708662033081, "Pretrain/Step": 1913, "Pretrain/Step Time": 8.416510239243507} +{"Pretrain/Learning Rate": 4.9353685086064206e-05, "Pretrain/Loss": 2.104304075241089, "Pretrain/Loss (Raw)": 2.1504719257354736, "Pretrain/Step": 1914, "Pretrain/Step Time": 8.41770552098751} +{"Pretrain/Learning Rate": 4.935272569533385e-05, "Pretrain/Loss": 2.106501579284668, "Pretrain/Loss (Raw)": 2.193406105041504, "Pretrain/Step": 1915, "Pretrain/Step Time": 8.417556462809443} +{"Pretrain/Learning Rate": 4.935176560240981e-05, "Pretrain/Loss": 2.1064398288726807, "Pretrain/Loss (Raw)": 2.0629587173461914, "Pretrain/Step": 1916, "Pretrain/Step Time": 8.420521022751927} +{"Pretrain/Learning Rate": 4.935080480731979e-05, "Pretrain/Loss": 2.1054439544677734, "Pretrain/Loss (Raw)": 2.1163978576660156, "Pretrain/Step": 1917, "Pretrain/Step Time": 8.422067038714886} +{"Pretrain/Learning Rate": 4.934984331009146e-05, "Pretrain/Loss": 2.1022772789001465, "Pretrain/Loss (Raw)": 2.2264392375946045, "Pretrain/Step": 1918, "Pretrain/Step Time": 8.42022480815649} +{"Pretrain/Learning Rate": 4.934888111075258e-05, "Pretrain/Loss": 2.102832078933716, "Pretrain/Loss (Raw)": 2.0128157138824463, "Pretrain/Step": 1919, "Pretrain/Step Time": 8.422844571992755} +{"Pretrain/Learning Rate": 4.934791820933087e-05, "Pretrain/Loss": 2.102433204650879, "Pretrain/Loss (Raw)": 2.05088472366333, "Pretrain/Step": 1920, "Pretrain/Step Time": 8.423215877264738} +{"Pretrain/Learning Rate": 4.93469546058541e-05, "Pretrain/Loss": 2.1011548042297363, "Pretrain/Loss (Raw)": 1.9536551237106323, "Pretrain/Step": 1921, "Pretrain/Step Time": 8.423699891194701} +{"Pretrain/Learning Rate": 4.934599030035007e-05, "Pretrain/Loss": 2.098787784576416, "Pretrain/Loss (Raw)": 1.8277010917663574, "Pretrain/Step": 1922, "Pretrain/Step Time": 8.420604137703776} +{"Pretrain/Learning Rate": 4.9345025292846555e-05, "Pretrain/Loss": 2.0999372005462646, "Pretrain/Loss (Raw)": 2.052692413330078, "Pretrain/Step": 1923, "Pretrain/Step Time": 8.422098070383072} +{"Pretrain/Learning Rate": 4.9344059583371407e-05, "Pretrain/Loss": 2.1001169681549072, "Pretrain/Loss (Raw)": 2.089735507965088, "Pretrain/Step": 1924, "Pretrain/Step Time": 8.423799054697156} +{"Pretrain/Learning Rate": 4.9343093171952465e-05, "Pretrain/Loss": 2.100505828857422, "Pretrain/Loss (Raw)": 2.0879170894622803, "Pretrain/Step": 1925, "Pretrain/Step Time": 8.420732637867332} +{"Pretrain/Learning Rate": 4.934212605861759e-05, "Pretrain/Loss": 2.098809242248535, "Pretrain/Loss (Raw)": 1.9928112030029297, "Pretrain/Step": 1926, "Pretrain/Step Time": 8.420302351936698} +{"Pretrain/Learning Rate": 4.9341158243394666e-05, "Pretrain/Loss": 2.09763240814209, "Pretrain/Loss (Raw)": 2.0133838653564453, "Pretrain/Step": 1927, "Pretrain/Step Time": 8.425197510048747} +{"Pretrain/Learning Rate": 4.934018972631161e-05, "Pretrain/Loss": 2.099945545196533, "Pretrain/Loss (Raw)": 2.3847463130950928, "Pretrain/Step": 1928, "Pretrain/Step Time": 8.425126161426306} +{"Pretrain/Learning Rate": 4.933922050739634e-05, "Pretrain/Loss": 2.098552703857422, "Pretrain/Loss (Raw)": 1.9858582019805908, "Pretrain/Step": 1929, "Pretrain/Step Time": 8.415745932608843} +{"Pretrain/Learning Rate": 4.93382505866768e-05, "Pretrain/Loss": 2.0993571281433105, "Pretrain/Loss (Raw)": 2.2525060176849365, "Pretrain/Step": 1930, "Pretrain/Step Time": 8.415223302319646} +{"Pretrain/Learning Rate": 4.9337279964180974e-05, "Pretrain/Loss": 2.099207639694214, "Pretrain/Loss (Raw)": 2.036452531814575, "Pretrain/Step": 1931, "Pretrain/Step Time": 8.416623594239354} +{"Pretrain/Learning Rate": 4.9336308639936826e-05, "Pretrain/Loss": 2.0981831550598145, "Pretrain/Loss (Raw)": 1.9922661781311035, "Pretrain/Step": 1932, "Pretrain/Step Time": 8.411113703623414} +{"Pretrain/Learning Rate": 4.9335336613972374e-05, "Pretrain/Loss": 2.0974860191345215, "Pretrain/Loss (Raw)": 1.8818256855010986, "Pretrain/Step": 1933, "Pretrain/Step Time": 8.417475800961256} +{"Pretrain/Learning Rate": 4.933436388631565e-05, "Pretrain/Loss": 2.0980823040008545, "Pretrain/Loss (Raw)": 2.1947944164276123, "Pretrain/Step": 1934, "Pretrain/Step Time": 8.419497355818748} +{"Pretrain/Learning Rate": 4.93333904569947e-05, "Pretrain/Loss": 2.1000514030456543, "Pretrain/Loss (Raw)": 2.2396044731140137, "Pretrain/Step": 1935, "Pretrain/Step Time": 8.419309118762612} +{"Pretrain/Learning Rate": 4.933241632603758e-05, "Pretrain/Loss": 2.096001386642456, "Pretrain/Loss (Raw)": 1.8287266492843628, "Pretrain/Step": 1936, "Pretrain/Step Time": 8.422763312235475} +{"Pretrain/Learning Rate": 4.9331441493472395e-05, "Pretrain/Loss": 2.093039035797119, "Pretrain/Loss (Raw)": 1.939335584640503, "Pretrain/Step": 1937, "Pretrain/Step Time": 8.420699527487159} +{"Pretrain/Learning Rate": 4.933046595932725e-05, "Pretrain/Loss": 2.0923244953155518, "Pretrain/Loss (Raw)": 2.143880605697632, "Pretrain/Step": 1938, "Pretrain/Step Time": 8.421007694676518} +{"Pretrain/Learning Rate": 4.932948972363027e-05, "Pretrain/Loss": 2.092837333679199, "Pretrain/Loss (Raw)": 2.1243796348571777, "Pretrain/Step": 1939, "Pretrain/Step Time": 8.420593965798616} +{"Pretrain/Learning Rate": 4.93285127864096e-05, "Pretrain/Loss": 2.0910911560058594, "Pretrain/Loss (Raw)": 2.1324946880340576, "Pretrain/Step": 1940, "Pretrain/Step Time": 8.418486770242453} +{"Pretrain/Learning Rate": 4.9327535147693416e-05, "Pretrain/Loss": 2.0872740745544434, "Pretrain/Loss (Raw)": 1.7137426137924194, "Pretrain/Step": 1941, "Pretrain/Step Time": 8.419066494330764} +{"Pretrain/Learning Rate": 4.932655680750991e-05, "Pretrain/Loss": 2.0870370864868164, "Pretrain/Loss (Raw)": 2.0779778957366943, "Pretrain/Step": 1942, "Pretrain/Step Time": 8.418121822178364} +{"Pretrain/Learning Rate": 4.932557776588729e-05, "Pretrain/Loss": 2.0881526470184326, "Pretrain/Loss (Raw)": 2.2711706161499023, "Pretrain/Step": 1943, "Pretrain/Step Time": 8.416608437895775} +{"Pretrain/Learning Rate": 4.9324598022853776e-05, "Pretrain/Loss": 2.089341878890991, "Pretrain/Loss (Raw)": 2.2010107040405273, "Pretrain/Step": 1944, "Pretrain/Step Time": 8.415077362209558} +{"Pretrain/Learning Rate": 4.9323617578437624e-05, "Pretrain/Loss": 2.088517189025879, "Pretrain/Loss (Raw)": 2.002997398376465, "Pretrain/Step": 1945, "Pretrain/Step Time": 8.420563170686364} +{"Pretrain/Learning Rate": 4.932263643266711e-05, "Pretrain/Loss": 2.0894811153411865, "Pretrain/Loss (Raw)": 2.1390767097473145, "Pretrain/Step": 1946, "Pretrain/Step Time": 8.414423309266567} +{"Pretrain/Learning Rate": 4.932165458557052e-05, "Pretrain/Loss": 2.089613437652588, "Pretrain/Loss (Raw)": 1.9578930139541626, "Pretrain/Step": 1947, "Pretrain/Step Time": 8.416728666052222} +{"Pretrain/Learning Rate": 4.932067203717617e-05, "Pretrain/Loss": 2.0896975994110107, "Pretrain/Loss (Raw)": 2.1608407497406006, "Pretrain/Step": 1948, "Pretrain/Step Time": 8.41729768551886} +{"Pretrain/Learning Rate": 4.9319688787512384e-05, "Pretrain/Loss": 2.0900092124938965, "Pretrain/Loss (Raw)": 2.137814998626709, "Pretrain/Step": 1949, "Pretrain/Step Time": 8.417556464672089} +{"Pretrain/Learning Rate": 4.9318704836607514e-05, "Pretrain/Loss": 2.089385747909546, "Pretrain/Loss (Raw)": 2.1119067668914795, "Pretrain/Step": 1950, "Pretrain/Step Time": 8.42243187688291} +{"Pretrain/Learning Rate": 4.9317720184489934e-05, "Pretrain/Loss": 2.089578628540039, "Pretrain/Loss (Raw)": 2.24798321723938, "Pretrain/Step": 1951, "Pretrain/Step Time": 8.4220234695822} +{"Pretrain/Learning Rate": 4.931673483118804e-05, "Pretrain/Loss": 2.0895321369171143, "Pretrain/Loss (Raw)": 2.117614984512329, "Pretrain/Step": 1952, "Pretrain/Step Time": 8.422782460227609} +{"Pretrain/Learning Rate": 4.931574877673023e-05, "Pretrain/Loss": 2.0899648666381836, "Pretrain/Loss (Raw)": 2.2428228855133057, "Pretrain/Step": 1953, "Pretrain/Step Time": 8.42047051154077} +{"Pretrain/Learning Rate": 4.931476202114496e-05, "Pretrain/Loss": 2.088128089904785, "Pretrain/Loss (Raw)": 1.8922747373580933, "Pretrain/Step": 1954, "Pretrain/Step Time": 8.421079961583018} +{"Pretrain/Learning Rate": 4.931377456446066e-05, "Pretrain/Loss": 2.0890884399414062, "Pretrain/Loss (Raw)": 2.1485791206359863, "Pretrain/Step": 1955, "Pretrain/Step Time": 8.416136842221022} +{"Pretrain/Learning Rate": 4.9312786406705805e-05, "Pretrain/Loss": 2.091597557067871, "Pretrain/Loss (Raw)": 2.127748966217041, "Pretrain/Step": 1956, "Pretrain/Step Time": 8.419470623135567} +{"Pretrain/Learning Rate": 4.93117975479089e-05, "Pretrain/Loss": 2.090303897857666, "Pretrain/Loss (Raw)": 1.9864580631256104, "Pretrain/Step": 1957, "Pretrain/Step Time": 8.416239377111197} +{"Pretrain/Learning Rate": 4.9310807988098446e-05, "Pretrain/Loss": 2.0906472206115723, "Pretrain/Loss (Raw)": 2.1285979747772217, "Pretrain/Step": 1958, "Pretrain/Step Time": 8.417194763198495} +{"Pretrain/Learning Rate": 4.930981772730299e-05, "Pretrain/Loss": 2.0914530754089355, "Pretrain/Loss (Raw)": 2.3376216888427734, "Pretrain/Step": 1959, "Pretrain/Step Time": 8.418555043637753} +{"Pretrain/Learning Rate": 4.9308826765551064e-05, "Pretrain/Loss": 2.091980457305908, "Pretrain/Loss (Raw)": 2.118842840194702, "Pretrain/Step": 1960, "Pretrain/Step Time": 8.418899988755584} +{"Pretrain/Learning Rate": 4.930783510287127e-05, "Pretrain/Loss": 2.09151554107666, "Pretrain/Loss (Raw)": 2.0271756649017334, "Pretrain/Step": 1961, "Pretrain/Step Time": 8.417780585587025} +{"Pretrain/Learning Rate": 4.930684273929218e-05, "Pretrain/Loss": 2.0908560752868652, "Pretrain/Loss (Raw)": 2.078721523284912, "Pretrain/Step": 1962, "Pretrain/Step Time": 8.419279873371124} +{"Pretrain/Learning Rate": 4.930584967484241e-05, "Pretrain/Loss": 2.088623285293579, "Pretrain/Loss (Raw)": 1.9672037363052368, "Pretrain/Step": 1963, "Pretrain/Step Time": 8.420317156240344} +{"Pretrain/Learning Rate": 4.9304855909550606e-05, "Pretrain/Loss": 2.08921480178833, "Pretrain/Loss (Raw)": 2.1331400871276855, "Pretrain/Step": 1964, "Pretrain/Step Time": 8.420823451131582} +{"Pretrain/Learning Rate": 4.930386144344541e-05, "Pretrain/Loss": 2.092250347137451, "Pretrain/Loss (Raw)": 2.480984687805176, "Pretrain/Step": 1965, "Pretrain/Step Time": 8.41927282139659} +{"Pretrain/Learning Rate": 4.930286627655551e-05, "Pretrain/Loss": 2.0904035568237305, "Pretrain/Loss (Raw)": 2.0219545364379883, "Pretrain/Step": 1966, "Pretrain/Step Time": 8.42193604260683} +{"Pretrain/Learning Rate": 4.930187040890959e-05, "Pretrain/Loss": 2.088212728500366, "Pretrain/Loss (Raw)": 2.0490105152130127, "Pretrain/Step": 1967, "Pretrain/Step Time": 8.42388921417296} +{"Pretrain/Learning Rate": 4.930087384053637e-05, "Pretrain/Loss": 2.0883543491363525, "Pretrain/Loss (Raw)": 2.0918500423431396, "Pretrain/Step": 1968, "Pretrain/Step Time": 8.42465036176145} +{"Pretrain/Learning Rate": 4.9299876571464574e-05, "Pretrain/Loss": 2.088510513305664, "Pretrain/Loss (Raw)": 2.17158842086792, "Pretrain/Step": 1969, "Pretrain/Step Time": 8.428402289748192} +{"Pretrain/Learning Rate": 4.929887860172297e-05, "Pretrain/Loss": 2.087829113006592, "Pretrain/Loss (Raw)": 2.1086721420288086, "Pretrain/Step": 1970, "Pretrain/Step Time": 8.425478145480156} +{"Pretrain/Learning Rate": 4.929787993134034e-05, "Pretrain/Loss": 2.0892186164855957, "Pretrain/Loss (Raw)": 2.0426270961761475, "Pretrain/Step": 1971, "Pretrain/Step Time": 8.425619592890143} +{"Pretrain/Learning Rate": 4.929688056034547e-05, "Pretrain/Loss": 2.090702772140503, "Pretrain/Loss (Raw)": 2.131530523300171, "Pretrain/Step": 1972, "Pretrain/Step Time": 8.430565802380443} +{"Pretrain/Learning Rate": 4.929588048876718e-05, "Pretrain/Loss": 2.090546131134033, "Pretrain/Loss (Raw)": 2.167001724243164, "Pretrain/Step": 1973, "Pretrain/Step Time": 8.427356034517288} +{"Pretrain/Learning Rate": 4.929487971663429e-05, "Pretrain/Loss": 2.091994047164917, "Pretrain/Loss (Raw)": 2.152510166168213, "Pretrain/Step": 1974, "Pretrain/Step Time": 8.428268482908607} +{"Pretrain/Learning Rate": 4.9293878243975676e-05, "Pretrain/Loss": 2.0923755168914795, "Pretrain/Loss (Raw)": 1.9902095794677734, "Pretrain/Step": 1975, "Pretrain/Step Time": 8.430874632671475} +{"Pretrain/Learning Rate": 4.929287607082021e-05, "Pretrain/Loss": 2.092103958129883, "Pretrain/Loss (Raw)": 2.0748016834259033, "Pretrain/Step": 1976, "Pretrain/Step Time": 8.427406009286642} +{"Pretrain/Learning Rate": 4.929187319719679e-05, "Pretrain/Loss": 2.095393657684326, "Pretrain/Loss (Raw)": 2.2811408042907715, "Pretrain/Step": 1977, "Pretrain/Step Time": 8.429022274911404} +{"Pretrain/Learning Rate": 4.929086962313433e-05, "Pretrain/Loss": 2.092695713043213, "Pretrain/Loss (Raw)": 2.194179058074951, "Pretrain/Step": 1978, "Pretrain/Step Time": 8.431369073688984} +{"Pretrain/Learning Rate": 4.928986534866177e-05, "Pretrain/Loss": 2.0935451984405518, "Pretrain/Loss (Raw)": 2.028352737426758, "Pretrain/Step": 1979, "Pretrain/Step Time": 8.427301667630672} +{"Pretrain/Learning Rate": 4.9288860373808066e-05, "Pretrain/Loss": 2.093413829803467, "Pretrain/Loss (Raw)": 2.040386199951172, "Pretrain/Step": 1980, "Pretrain/Step Time": 8.428565483540297} +{"Pretrain/Learning Rate": 4.928785469860219e-05, "Pretrain/Loss": 2.094635486602783, "Pretrain/Loss (Raw)": 2.133486032485962, "Pretrain/Step": 1981, "Pretrain/Step Time": 8.42639328725636} +{"Pretrain/Learning Rate": 4.928684832307315e-05, "Pretrain/Loss": 2.0931811332702637, "Pretrain/Loss (Raw)": 1.9734854698181152, "Pretrain/Step": 1982, "Pretrain/Step Time": 8.4289495870471} +{"Pretrain/Learning Rate": 4.9285841247249955e-05, "Pretrain/Loss": 2.0941760540008545, "Pretrain/Loss (Raw)": 2.23677134513855, "Pretrain/Step": 1983, "Pretrain/Step Time": 8.428078042343259} +{"Pretrain/Learning Rate": 4.928483347116165e-05, "Pretrain/Loss": 2.0948731899261475, "Pretrain/Loss (Raw)": 2.117615222930908, "Pretrain/Step": 1984, "Pretrain/Step Time": 8.429013663902879} +{"Pretrain/Learning Rate": 4.92838249948373e-05, "Pretrain/Loss": 2.0954132080078125, "Pretrain/Loss (Raw)": 1.9156683683395386, "Pretrain/Step": 1985, "Pretrain/Step Time": 8.427840640768409} +{"Pretrain/Learning Rate": 4.928281581830596e-05, "Pretrain/Loss": 2.0951247215270996, "Pretrain/Loss (Raw)": 2.094177722930908, "Pretrain/Step": 1986, "Pretrain/Step Time": 8.42579760402441} +{"Pretrain/Learning Rate": 4.928180594159676e-05, "Pretrain/Loss": 2.0953733921051025, "Pretrain/Loss (Raw)": 2.033095121383667, "Pretrain/Step": 1987, "Pretrain/Step Time": 8.427604276686907} +{"Pretrain/Learning Rate": 4.9280795364738795e-05, "Pretrain/Loss": 2.09364652633667, "Pretrain/Loss (Raw)": 1.9830626249313354, "Pretrain/Step": 1988, "Pretrain/Step Time": 8.431699953973293} +{"Pretrain/Learning Rate": 4.927978408776122e-05, "Pretrain/Loss": 2.0937225818634033, "Pretrain/Loss (Raw)": 2.0981647968292236, "Pretrain/Step": 1989, "Pretrain/Step Time": 8.426841484382749} +{"Pretrain/Learning Rate": 4.927877211069317e-05, "Pretrain/Loss": 2.0922317504882812, "Pretrain/Loss (Raw)": 1.9555017948150635, "Pretrain/Step": 1990, "Pretrain/Step Time": 8.427497442811728} +{"Pretrain/Learning Rate": 4.9277759433563855e-05, "Pretrain/Loss": 2.0916876792907715, "Pretrain/Loss (Raw)": 2.001251697540283, "Pretrain/Step": 1991, "Pretrain/Step Time": 8.43070768378675} +{"Pretrain/Learning Rate": 4.9276746056402455e-05, "Pretrain/Loss": 2.089770555496216, "Pretrain/Loss (Raw)": 2.0562775135040283, "Pretrain/Step": 1992, "Pretrain/Step Time": 8.424361046403646} +{"Pretrain/Learning Rate": 4.927573197923821e-05, "Pretrain/Loss": 2.0888848304748535, "Pretrain/Loss (Raw)": 1.9262490272521973, "Pretrain/Step": 1993, "Pretrain/Step Time": 8.422673620283604} +{"Pretrain/Learning Rate": 4.927471720210033e-05, "Pretrain/Loss": 2.08894681930542, "Pretrain/Loss (Raw)": 2.01448655128479, "Pretrain/Step": 1994, "Pretrain/Step Time": 8.427075698971748} +{"Pretrain/Learning Rate": 4.9273701725018093e-05, "Pretrain/Loss": 2.0876047611236572, "Pretrain/Loss (Raw)": 2.0946922302246094, "Pretrain/Step": 1995, "Pretrain/Step Time": 8.41933100298047} +{"Pretrain/Learning Rate": 4.927268554802079e-05, "Pretrain/Loss": 2.0885589122772217, "Pretrain/Loss (Raw)": 2.201655626296997, "Pretrain/Step": 1996, "Pretrain/Step Time": 8.421765426173806} +{"Pretrain/Learning Rate": 4.92716686711377e-05, "Pretrain/Loss": 2.089054822921753, "Pretrain/Loss (Raw)": 2.101945400238037, "Pretrain/Step": 1997, "Pretrain/Step Time": 8.428149396553636} +{"Pretrain/Learning Rate": 4.927065109439816e-05, "Pretrain/Loss": 2.0875136852264404, "Pretrain/Loss (Raw)": 2.025367498397827, "Pretrain/Step": 1998, "Pretrain/Step Time": 8.43102409131825} +{"Pretrain/Learning Rate": 4.92696328178315e-05, "Pretrain/Loss": 2.0854239463806152, "Pretrain/Loss (Raw)": 2.039429187774658, "Pretrain/Step": 1999, "Pretrain/Step Time": 8.432427443563938} +{"Pretrain/Learning Rate": 4.9268613841467094e-05, "Pretrain/Loss": 2.0884976387023926, "Pretrain/Loss (Raw)": 2.246600389480591, "Pretrain/Step": 2000, "Pretrain/Step Time": 8.432867838069797} +{"Pretrain/Learning Rate": 4.926759416533431e-05, "Pretrain/Loss": 2.090873956680298, "Pretrain/Loss (Raw)": 2.1514742374420166, "Pretrain/Step": 2001, "Pretrain/Step Time": 8.432298490777612} +{"Pretrain/Learning Rate": 4.9266573789462564e-05, "Pretrain/Loss": 2.088060140609741, "Pretrain/Loss (Raw)": 1.8806463479995728, "Pretrain/Step": 2002, "Pretrain/Step Time": 8.432488527148962} +{"Pretrain/Learning Rate": 4.9265552713881265e-05, "Pretrain/Loss": 2.0862581729888916, "Pretrain/Loss (Raw)": 1.9725048542022705, "Pretrain/Step": 2003, "Pretrain/Step Time": 8.430793611332774} +{"Pretrain/Learning Rate": 4.926453093861986e-05, "Pretrain/Loss": 2.0863609313964844, "Pretrain/Loss (Raw)": 2.194434404373169, "Pretrain/Step": 2004, "Pretrain/Step Time": 8.434781044721603} +{"Pretrain/Learning Rate": 4.926350846370781e-05, "Pretrain/Loss": 2.0820980072021484, "Pretrain/Loss (Raw)": 1.9870414733886719, "Pretrain/Step": 2005, "Pretrain/Step Time": 8.436162080615759} +{"Pretrain/Learning Rate": 4.926248528917459e-05, "Pretrain/Loss": 2.082894802093506, "Pretrain/Loss (Raw)": 2.055476188659668, "Pretrain/Step": 2006, "Pretrain/Step Time": 8.434096181765199} +{"Pretrain/Learning Rate": 4.926146141504972e-05, "Pretrain/Loss": 2.0835161209106445, "Pretrain/Loss (Raw)": 2.1615519523620605, "Pretrain/Step": 2007, "Pretrain/Step Time": 8.430224362760782} +{"Pretrain/Learning Rate": 4.926043684136271e-05, "Pretrain/Loss": 2.0818209648132324, "Pretrain/Loss (Raw)": 1.9977190494537354, "Pretrain/Step": 2008, "Pretrain/Step Time": 8.437078362330794} +{"Pretrain/Learning Rate": 4.925941156814311e-05, "Pretrain/Loss": 2.082533836364746, "Pretrain/Loss (Raw)": 2.2194020748138428, "Pretrain/Step": 2009, "Pretrain/Step Time": 8.437796810641885} +{"Pretrain/Learning Rate": 4.925838559542048e-05, "Pretrain/Loss": 2.0830891132354736, "Pretrain/Loss (Raw)": 1.9742865562438965, "Pretrain/Step": 2010, "Pretrain/Step Time": 8.437476307153702} +{"Pretrain/Learning Rate": 4.925735892322439e-05, "Pretrain/Loss": 2.0826687812805176, "Pretrain/Loss (Raw)": 2.0829432010650635, "Pretrain/Step": 2011, "Pretrain/Step Time": 8.440520457923412} +{"Pretrain/Learning Rate": 4.925633155158447e-05, "Pretrain/Loss": 2.0821919441223145, "Pretrain/Loss (Raw)": 1.9359692335128784, "Pretrain/Step": 2012, "Pretrain/Step Time": 8.437764346599579} +{"Pretrain/Learning Rate": 4.9255303480530326e-05, "Pretrain/Loss": 2.0853281021118164, "Pretrain/Loss (Raw)": 2.3289530277252197, "Pretrain/Step": 2013, "Pretrain/Step Time": 8.441336629912257} +{"Pretrain/Learning Rate": 4.92542747100916e-05, "Pretrain/Loss": 2.085435390472412, "Pretrain/Loss (Raw)": 2.0821139812469482, "Pretrain/Step": 2014, "Pretrain/Step Time": 8.4417217168957} +{"Pretrain/Learning Rate": 4.925324524029797e-05, "Pretrain/Loss": 2.0862388610839844, "Pretrain/Loss (Raw)": 2.092653512954712, "Pretrain/Step": 2015, "Pretrain/Step Time": 8.44256665930152} +{"Pretrain/Learning Rate": 4.92522150711791e-05, "Pretrain/Loss": 2.088212251663208, "Pretrain/Loss (Raw)": 2.117394208908081, "Pretrain/Step": 2016, "Pretrain/Step Time": 8.441226534545422} +{"Pretrain/Learning Rate": 4.925118420276471e-05, "Pretrain/Loss": 2.0891692638397217, "Pretrain/Loss (Raw)": 1.973609447479248, "Pretrain/Step": 2017, "Pretrain/Step Time": 8.441840626299381} +{"Pretrain/Learning Rate": 4.925015263508452e-05, "Pretrain/Loss": 2.0888547897338867, "Pretrain/Loss (Raw)": 2.2054171562194824, "Pretrain/Step": 2018, "Pretrain/Step Time": 8.441343074664474} +{"Pretrain/Learning Rate": 4.9249120368168275e-05, "Pretrain/Loss": 2.08866548538208, "Pretrain/Loss (Raw)": 2.284369945526123, "Pretrain/Step": 2019, "Pretrain/Step Time": 8.443742332980037} +{"Pretrain/Learning Rate": 4.924808740204574e-05, "Pretrain/Loss": 2.0890064239501953, "Pretrain/Loss (Raw)": 2.2387280464172363, "Pretrain/Step": 2020, "Pretrain/Step Time": 8.440730141475797} +{"Pretrain/Learning Rate": 4.924705373674669e-05, "Pretrain/Loss": 2.090203285217285, "Pretrain/Loss (Raw)": 2.113264560699463, "Pretrain/Step": 2021, "Pretrain/Step Time": 8.434228252619505} +{"Pretrain/Learning Rate": 4.9246019372300946e-05, "Pretrain/Loss": 2.093921422958374, "Pretrain/Loss (Raw)": 2.2061843872070312, "Pretrain/Step": 2022, "Pretrain/Step Time": 8.433961398899555} +{"Pretrain/Learning Rate": 4.924498430873833e-05, "Pretrain/Loss": 2.0959339141845703, "Pretrain/Loss (Raw)": 2.3433001041412354, "Pretrain/Step": 2023, "Pretrain/Step Time": 8.432015012949705} +{"Pretrain/Learning Rate": 4.924394854608867e-05, "Pretrain/Loss": 2.0981597900390625, "Pretrain/Loss (Raw)": 2.429534673690796, "Pretrain/Step": 2024, "Pretrain/Step Time": 8.43665250390768} +{"Pretrain/Learning Rate": 4.924291208438185e-05, "Pretrain/Loss": 2.0954766273498535, "Pretrain/Loss (Raw)": 1.8818516731262207, "Pretrain/Step": 2025, "Pretrain/Step Time": 8.433293979614973} +{"Pretrain/Learning Rate": 4.924187492364776e-05, "Pretrain/Loss": 2.0934832096099854, "Pretrain/Loss (Raw)": 1.9165288209915161, "Pretrain/Step": 2026, "Pretrain/Step Time": 8.43461375683546} +{"Pretrain/Learning Rate": 4.9240837063916285e-05, "Pretrain/Loss": 2.0954790115356445, "Pretrain/Loss (Raw)": 2.2730045318603516, "Pretrain/Step": 2027, "Pretrain/Step Time": 8.429400706663728} +{"Pretrain/Learning Rate": 4.9239798505217365e-05, "Pretrain/Loss": 2.0934791564941406, "Pretrain/Loss (Raw)": 1.999974250793457, "Pretrain/Step": 2028, "Pretrain/Step Time": 8.43157185614109} +{"Pretrain/Learning Rate": 4.923875924758095e-05, "Pretrain/Loss": 2.0924572944641113, "Pretrain/Loss (Raw)": 1.9239217042922974, "Pretrain/Step": 2029, "Pretrain/Step Time": 8.438697194680572} +{"Pretrain/Learning Rate": 4.923771929103699e-05, "Pretrain/Loss": 2.091986894607544, "Pretrain/Loss (Raw)": 2.1011545658111572, "Pretrain/Step": 2030, "Pretrain/Step Time": 8.436391346156597} +{"Pretrain/Learning Rate": 4.923667863561548e-05, "Pretrain/Loss": 2.093337059020996, "Pretrain/Loss (Raw)": 2.122318983078003, "Pretrain/Step": 2031, "Pretrain/Step Time": 8.435496356338263} +{"Pretrain/Learning Rate": 4.9235637281346426e-05, "Pretrain/Loss": 2.0968034267425537, "Pretrain/Loss (Raw)": 2.3941032886505127, "Pretrain/Step": 2032, "Pretrain/Step Time": 8.433241751044989} +{"Pretrain/Learning Rate": 4.923459522825986e-05, "Pretrain/Loss": 2.095261812210083, "Pretrain/Loss (Raw)": 2.1100950241088867, "Pretrain/Step": 2033, "Pretrain/Step Time": 8.441409941762686} +{"Pretrain/Learning Rate": 4.923355247638582e-05, "Pretrain/Loss": 2.095796585083008, "Pretrain/Loss (Raw)": 2.0947086811065674, "Pretrain/Step": 2034, "Pretrain/Step Time": 8.442091042175889} +{"Pretrain/Learning Rate": 4.9232509025754394e-05, "Pretrain/Loss": 2.095095634460449, "Pretrain/Loss (Raw)": 2.0388243198394775, "Pretrain/Step": 2035, "Pretrain/Step Time": 8.439424179494381} +{"Pretrain/Learning Rate": 4.923146487639564e-05, "Pretrain/Loss": 2.0945229530334473, "Pretrain/Loss (Raw)": 2.1938364505767822, "Pretrain/Step": 2036, "Pretrain/Step Time": 8.44474665261805} +{"Pretrain/Learning Rate": 4.923042002833967e-05, "Pretrain/Loss": 2.0950303077697754, "Pretrain/Loss (Raw)": 2.1232705116271973, "Pretrain/Step": 2037, "Pretrain/Step Time": 8.44383724220097} +{"Pretrain/Learning Rate": 4.922937448161664e-05, "Pretrain/Loss": 2.094865322113037, "Pretrain/Loss (Raw)": 1.9790890216827393, "Pretrain/Step": 2038, "Pretrain/Step Time": 8.443634506314993} +{"Pretrain/Learning Rate": 4.922832823625667e-05, "Pretrain/Loss": 2.0928092002868652, "Pretrain/Loss (Raw)": 1.8235505819320679, "Pretrain/Step": 2039, "Pretrain/Step Time": 8.44795092009008} +{"Pretrain/Learning Rate": 4.922728129228993e-05, "Pretrain/Loss": 2.089616537094116, "Pretrain/Loss (Raw)": 1.7778520584106445, "Pretrain/Step": 2040, "Pretrain/Step Time": 8.453170513734221} +{"Pretrain/Learning Rate": 4.922623364974661e-05, "Pretrain/Loss": 2.0888843536376953, "Pretrain/Loss (Raw)": 2.0209946632385254, "Pretrain/Step": 2041, "Pretrain/Step Time": 8.448258178308606} +{"Pretrain/Learning Rate": 4.922518530865693e-05, "Pretrain/Loss": 2.0891761779785156, "Pretrain/Loss (Raw)": 2.1878461837768555, "Pretrain/Step": 2042, "Pretrain/Step Time": 8.45136048272252} +{"Pretrain/Learning Rate": 4.9224136269051105e-05, "Pretrain/Loss": 2.08839750289917, "Pretrain/Loss (Raw)": 2.093724012374878, "Pretrain/Step": 2043, "Pretrain/Step Time": 8.45274967700243} +{"Pretrain/Learning Rate": 4.922308653095939e-05, "Pretrain/Loss": 2.088088035583496, "Pretrain/Loss (Raw)": 2.023332118988037, "Pretrain/Step": 2044, "Pretrain/Step Time": 8.449365613982081} +{"Pretrain/Learning Rate": 4.922203609441205e-05, "Pretrain/Loss": 2.088336706161499, "Pretrain/Loss (Raw)": 2.1482045650482178, "Pretrain/Step": 2045, "Pretrain/Step Time": 8.451684160158038} +{"Pretrain/Learning Rate": 4.9220984959439374e-05, "Pretrain/Loss": 2.0868167877197266, "Pretrain/Loss (Raw)": 2.0318944454193115, "Pretrain/Step": 2046, "Pretrain/Step Time": 8.452527550980449} +{"Pretrain/Learning Rate": 4.921993312607167e-05, "Pretrain/Loss": 2.08772611618042, "Pretrain/Loss (Raw)": 2.129220962524414, "Pretrain/Step": 2047, "Pretrain/Step Time": 8.451627003028989} +{"Pretrain/Learning Rate": 4.9218880594339264e-05, "Pretrain/Loss": 2.0875043869018555, "Pretrain/Loss (Raw)": 2.0225131511688232, "Pretrain/Step": 2048, "Pretrain/Step Time": 8.45118484646082} +{"Pretrain/Learning Rate": 4.9217827364272525e-05, "Pretrain/Loss": 2.088427782058716, "Pretrain/Loss (Raw)": 2.0718421936035156, "Pretrain/Step": 2049, "Pretrain/Step Time": 8.451548838987947} +{"Pretrain/Learning Rate": 4.9216773435901795e-05, "Pretrain/Loss": 2.091031074523926, "Pretrain/Loss (Raw)": 2.1609387397766113, "Pretrain/Step": 2050, "Pretrain/Step Time": 8.45197593048215} +{"Pretrain/Learning Rate": 4.921571880925747e-05, "Pretrain/Loss": 2.0906240940093994, "Pretrain/Loss (Raw)": 2.0005874633789062, "Pretrain/Step": 2051, "Pretrain/Step Time": 8.46256403811276} +{"Pretrain/Learning Rate": 4.921466348436997e-05, "Pretrain/Loss": 2.088820457458496, "Pretrain/Loss (Raw)": 1.8588743209838867, "Pretrain/Step": 2052, "Pretrain/Step Time": 8.462420403957367} +{"Pretrain/Learning Rate": 4.921360746126972e-05, "Pretrain/Loss": 2.0890607833862305, "Pretrain/Loss (Raw)": 2.1186821460723877, "Pretrain/Step": 2053, "Pretrain/Step Time": 8.46147484332323} +{"Pretrain/Learning Rate": 4.9212550739987173e-05, "Pretrain/Loss": 2.088909149169922, "Pretrain/Loss (Raw)": 1.9733753204345703, "Pretrain/Step": 2054, "Pretrain/Step Time": 8.466405212879181} +{"Pretrain/Learning Rate": 4.9211493320552784e-05, "Pretrain/Loss": 2.0887718200683594, "Pretrain/Loss (Raw)": 1.9958523511886597, "Pretrain/Step": 2055, "Pretrain/Step Time": 8.459552444517612} +{"Pretrain/Learning Rate": 4.9210435202997065e-05, "Pretrain/Loss": 2.0858702659606934, "Pretrain/Loss (Raw)": 2.0133113861083984, "Pretrain/Step": 2056, "Pretrain/Step Time": 8.462854351848364} +{"Pretrain/Learning Rate": 4.92093763873505e-05, "Pretrain/Loss": 2.085681438446045, "Pretrain/Loss (Raw)": 1.9616882801055908, "Pretrain/Step": 2057, "Pretrain/Step Time": 8.468798050656915} +{"Pretrain/Learning Rate": 4.920831687364364e-05, "Pretrain/Loss": 2.082284450531006, "Pretrain/Loss (Raw)": 1.8177109956741333, "Pretrain/Step": 2058, "Pretrain/Step Time": 8.465122872963548} +{"Pretrain/Learning Rate": 4.920725666190703e-05, "Pretrain/Loss": 2.082467555999756, "Pretrain/Loss (Raw)": 2.0598700046539307, "Pretrain/Step": 2059, "Pretrain/Step Time": 8.465927734971046} +{"Pretrain/Learning Rate": 4.920619575217124e-05, "Pretrain/Loss": 2.084219217300415, "Pretrain/Loss (Raw)": 2.216503858566284, "Pretrain/Step": 2060, "Pretrain/Step Time": 8.467302428558469} +{"Pretrain/Learning Rate": 4.920513414446686e-05, "Pretrain/Loss": 2.086366653442383, "Pretrain/Loss (Raw)": 2.1566760540008545, "Pretrain/Step": 2061, "Pretrain/Step Time": 8.459029633551836} +{"Pretrain/Learning Rate": 4.920407183882449e-05, "Pretrain/Loss": 2.0845484733581543, "Pretrain/Loss (Raw)": 1.962095022201538, "Pretrain/Step": 2062, "Pretrain/Step Time": 8.461157288402319} +{"Pretrain/Learning Rate": 4.9203008835274786e-05, "Pretrain/Loss": 2.0848464965820312, "Pretrain/Loss (Raw)": 2.2777645587921143, "Pretrain/Step": 2063, "Pretrain/Step Time": 8.462617572396994} +{"Pretrain/Learning Rate": 4.9201945133848374e-05, "Pretrain/Loss": 2.086798667907715, "Pretrain/Loss (Raw)": 2.078575372695923, "Pretrain/Step": 2064, "Pretrain/Step Time": 8.458813775330782} +{"Pretrain/Learning Rate": 4.920088073457594e-05, "Pretrain/Loss": 2.0869526863098145, "Pretrain/Loss (Raw)": 1.9590758085250854, "Pretrain/Step": 2065, "Pretrain/Step Time": 8.458776362240314} +{"Pretrain/Learning Rate": 4.919981563748817e-05, "Pretrain/Loss": 2.0867209434509277, "Pretrain/Loss (Raw)": 2.1141958236694336, "Pretrain/Step": 2066, "Pretrain/Step Time": 8.46476224809885} +{"Pretrain/Learning Rate": 4.919874984261578e-05, "Pretrain/Loss": 2.0854601860046387, "Pretrain/Loss (Raw)": 1.9629786014556885, "Pretrain/Step": 2067, "Pretrain/Step Time": 8.463689483702183} +{"Pretrain/Learning Rate": 4.9197683349989486e-05, "Pretrain/Loss": 2.083422899246216, "Pretrain/Loss (Raw)": 1.8717495203018188, "Pretrain/Step": 2068, "Pretrain/Step Time": 8.462549641728401} +{"Pretrain/Learning Rate": 4.9196616159640055e-05, "Pretrain/Loss": 2.0874054431915283, "Pretrain/Loss (Raw)": 2.223510980606079, "Pretrain/Step": 2069, "Pretrain/Step Time": 8.461107330396771} +{"Pretrain/Learning Rate": 4.919554827159826e-05, "Pretrain/Loss": 2.0852432250976562, "Pretrain/Loss (Raw)": 1.8011832237243652, "Pretrain/Step": 2070, "Pretrain/Step Time": 8.46267462708056} +{"Pretrain/Learning Rate": 4.919447968589488e-05, "Pretrain/Loss": 2.083550453186035, "Pretrain/Loss (Raw)": 2.054536819458008, "Pretrain/Step": 2071, "Pretrain/Step Time": 8.463014671579003} +{"Pretrain/Learning Rate": 4.919341040256074e-05, "Pretrain/Loss": 2.0815720558166504, "Pretrain/Loss (Raw)": 1.947778582572937, "Pretrain/Step": 2072, "Pretrain/Step Time": 8.467543326318264} +{"Pretrain/Learning Rate": 4.9192340421626665e-05, "Pretrain/Loss": 2.0815792083740234, "Pretrain/Loss (Raw)": 2.0038857460021973, "Pretrain/Step": 2073, "Pretrain/Step Time": 8.464395193383098} +{"Pretrain/Learning Rate": 4.9191269743123505e-05, "Pretrain/Loss": 2.08311128616333, "Pretrain/Loss (Raw)": 2.3351991176605225, "Pretrain/Step": 2074, "Pretrain/Step Time": 8.469158181920648} +{"Pretrain/Learning Rate": 4.919019836708214e-05, "Pretrain/Loss": 2.0842251777648926, "Pretrain/Loss (Raw)": 2.100451707839966, "Pretrain/Step": 2075, "Pretrain/Step Time": 8.467527171596885} +{"Pretrain/Learning Rate": 4.918912629353346e-05, "Pretrain/Loss": 2.081488609313965, "Pretrain/Loss (Raw)": 1.8105775117874146, "Pretrain/Step": 2076, "Pretrain/Step Time": 8.466208079829812} +{"Pretrain/Learning Rate": 4.918805352250837e-05, "Pretrain/Loss": 2.0808281898498535, "Pretrain/Loss (Raw)": 2.0532820224761963, "Pretrain/Step": 2077, "Pretrain/Step Time": 8.464926166459918} +{"Pretrain/Learning Rate": 4.918698005403781e-05, "Pretrain/Loss": 2.0813632011413574, "Pretrain/Loss (Raw)": 2.1804168224334717, "Pretrain/Step": 2078, "Pretrain/Step Time": 8.465617084875703} +{"Pretrain/Learning Rate": 4.918590588815273e-05, "Pretrain/Loss": 2.0800399780273438, "Pretrain/Loss (Raw)": 2.078573703765869, "Pretrain/Step": 2079, "Pretrain/Step Time": 8.46437131240964} +{"Pretrain/Learning Rate": 4.91848310248841e-05, "Pretrain/Loss": 2.0801968574523926, "Pretrain/Loss (Raw)": 2.1376895904541016, "Pretrain/Step": 2080, "Pretrain/Step Time": 8.46864171512425} +{"Pretrain/Learning Rate": 4.9183755464262924e-05, "Pretrain/Loss": 2.0767149925231934, "Pretrain/Loss (Raw)": 1.797165870666504, "Pretrain/Step": 2081, "Pretrain/Step Time": 8.470394168049097} +{"Pretrain/Learning Rate": 4.9182679206320206e-05, "Pretrain/Loss": 2.0784285068511963, "Pretrain/Loss (Raw)": 2.1116104125976562, "Pretrain/Step": 2082, "Pretrain/Step Time": 8.469038994982839} +{"Pretrain/Learning Rate": 4.918160225108698e-05, "Pretrain/Loss": 2.0790815353393555, "Pretrain/Loss (Raw)": 2.232168674468994, "Pretrain/Step": 2083, "Pretrain/Step Time": 8.472345568239689} +{"Pretrain/Learning Rate": 4.91805245985943e-05, "Pretrain/Loss": 2.0792527198791504, "Pretrain/Loss (Raw)": 2.149632692337036, "Pretrain/Step": 2084, "Pretrain/Step Time": 8.472044307738543} +{"Pretrain/Learning Rate": 4.917944624887324e-05, "Pretrain/Loss": 2.078442096710205, "Pretrain/Loss (Raw)": 1.8827102184295654, "Pretrain/Step": 2085, "Pretrain/Step Time": 8.471987318247557} +{"Pretrain/Learning Rate": 4.9178367201954894e-05, "Pretrain/Loss": 2.0768775939941406, "Pretrain/Loss (Raw)": 1.9283431768417358, "Pretrain/Step": 2086, "Pretrain/Step Time": 8.474353488534689} +{"Pretrain/Learning Rate": 4.9177287457870374e-05, "Pretrain/Loss": 2.0753135681152344, "Pretrain/Loss (Raw)": 2.137401819229126, "Pretrain/Step": 2087, "Pretrain/Step Time": 8.47306570969522} +{"Pretrain/Learning Rate": 4.917620701665081e-05, "Pretrain/Loss": 2.0740890502929688, "Pretrain/Loss (Raw)": 1.962109088897705, "Pretrain/Step": 2088, "Pretrain/Step Time": 8.474305963143706} +{"Pretrain/Learning Rate": 4.9175125878327363e-05, "Pretrain/Loss": 2.07470703125, "Pretrain/Loss (Raw)": 2.1062848567962646, "Pretrain/Step": 2089, "Pretrain/Step Time": 8.475181128829718} +{"Pretrain/Learning Rate": 4.917404404293121e-05, "Pretrain/Loss": 2.07627534866333, "Pretrain/Loss (Raw)": 2.279463529586792, "Pretrain/Step": 2090, "Pretrain/Step Time": 8.469120657071471} +{"Pretrain/Learning Rate": 4.917296151049353e-05, "Pretrain/Loss": 2.0776124000549316, "Pretrain/Loss (Raw)": 2.1383657455444336, "Pretrain/Step": 2091, "Pretrain/Step Time": 8.470619011670351} +{"Pretrain/Learning Rate": 4.917187828104555e-05, "Pretrain/Loss": 2.0769095420837402, "Pretrain/Loss (Raw)": 2.0431883335113525, "Pretrain/Step": 2092, "Pretrain/Step Time": 8.47090102173388} +{"Pretrain/Learning Rate": 4.9170794354618486e-05, "Pretrain/Loss": 2.0748822689056396, "Pretrain/Loss (Raw)": 2.2214760780334473, "Pretrain/Step": 2093, "Pretrain/Step Time": 8.470668217167258} +{"Pretrain/Learning Rate": 4.916970973124362e-05, "Pretrain/Loss": 2.075730800628662, "Pretrain/Loss (Raw)": 2.1305601596832275, "Pretrain/Step": 2094, "Pretrain/Step Time": 8.469656500965357} +{"Pretrain/Learning Rate": 4.916862441095221e-05, "Pretrain/Loss": 2.0770130157470703, "Pretrain/Loss (Raw)": 2.2131125926971436, "Pretrain/Step": 2095, "Pretrain/Step Time": 8.463989689946175} +{"Pretrain/Learning Rate": 4.916753839377555e-05, "Pretrain/Loss": 2.0771701335906982, "Pretrain/Loss (Raw)": 2.1119837760925293, "Pretrain/Step": 2096, "Pretrain/Step Time": 8.463648410513997} +{"Pretrain/Learning Rate": 4.916645167974496e-05, "Pretrain/Loss": 2.076997756958008, "Pretrain/Loss (Raw)": 2.1495361328125, "Pretrain/Step": 2097, "Pretrain/Step Time": 8.46307698637247} +{"Pretrain/Learning Rate": 4.916536426889177e-05, "Pretrain/Loss": 2.0766143798828125, "Pretrain/Loss (Raw)": 2.0595805644989014, "Pretrain/Step": 2098, "Pretrain/Step Time": 8.468810252845287} +{"Pretrain/Learning Rate": 4.916427616124734e-05, "Pretrain/Loss": 2.0761146545410156, "Pretrain/Loss (Raw)": 1.9786503314971924, "Pretrain/Step": 2099, "Pretrain/Step Time": 8.468563616275787} +{"Pretrain/Learning Rate": 4.916318735684304e-05, "Pretrain/Loss": 2.076099395751953, "Pretrain/Loss (Raw)": 2.1295905113220215, "Pretrain/Step": 2100, "Pretrain/Step Time": 8.463817635551095} +{"Pretrain/Learning Rate": 4.9162097855710264e-05, "Pretrain/Loss": 2.0750885009765625, "Pretrain/Loss (Raw)": 2.0376174449920654, "Pretrain/Step": 2101, "Pretrain/Step Time": 8.468758592382073} +{"Pretrain/Learning Rate": 4.916100765788044e-05, "Pretrain/Loss": 2.0747604370117188, "Pretrain/Loss (Raw)": 2.1104979515075684, "Pretrain/Step": 2102, "Pretrain/Step Time": 8.466983361169696} +{"Pretrain/Learning Rate": 4.915991676338498e-05, "Pretrain/Loss": 2.0768442153930664, "Pretrain/Loss (Raw)": 2.2569520473480225, "Pretrain/Step": 2103, "Pretrain/Step Time": 8.463142884895205} +{"Pretrain/Learning Rate": 4.915882517225536e-05, "Pretrain/Loss": 2.075345516204834, "Pretrain/Loss (Raw)": 1.882974624633789, "Pretrain/Step": 2104, "Pretrain/Step Time": 8.466324971988797} +{"Pretrain/Learning Rate": 4.9157732884523045e-05, "Pretrain/Loss": 2.0732476711273193, "Pretrain/Loss (Raw)": 2.0126030445098877, "Pretrain/Step": 2105, "Pretrain/Step Time": 8.463121360167861} +{"Pretrain/Learning Rate": 4.9156639900219525e-05, "Pretrain/Loss": 2.0740678310394287, "Pretrain/Loss (Raw)": 2.2991652488708496, "Pretrain/Step": 2106, "Pretrain/Step Time": 8.462645268067718} +{"Pretrain/Learning Rate": 4.915554621937633e-05, "Pretrain/Loss": 2.073453426361084, "Pretrain/Loss (Raw)": 1.9496870040893555, "Pretrain/Step": 2107, "Pretrain/Step Time": 8.462766572833061} +{"Pretrain/Learning Rate": 4.915445184202498e-05, "Pretrain/Loss": 2.0745387077331543, "Pretrain/Loss (Raw)": 2.1792943477630615, "Pretrain/Step": 2108, "Pretrain/Step Time": 8.461910124868155} +{"Pretrain/Learning Rate": 4.915335676819706e-05, "Pretrain/Loss": 2.075610399246216, "Pretrain/Loss (Raw)": 2.270684003829956, "Pretrain/Step": 2109, "Pretrain/Step Time": 8.463697308674455} +{"Pretrain/Learning Rate": 4.9152260997924106e-05, "Pretrain/Loss": 2.0753350257873535, "Pretrain/Loss (Raw)": 1.938253402709961, "Pretrain/Step": 2110, "Pretrain/Step Time": 8.46360830962658} +{"Pretrain/Learning Rate": 4.915116453123774e-05, "Pretrain/Loss": 2.0735743045806885, "Pretrain/Loss (Raw)": 2.011385202407837, "Pretrain/Step": 2111, "Pretrain/Step Time": 8.459637271240354} +{"Pretrain/Learning Rate": 4.9150067368169564e-05, "Pretrain/Loss": 2.0727105140686035, "Pretrain/Loss (Raw)": 2.007049560546875, "Pretrain/Step": 2112, "Pretrain/Step Time": 8.460763121023774} +{"Pretrain/Learning Rate": 4.914896950875122e-05, "Pretrain/Loss": 2.072610378265381, "Pretrain/Loss (Raw)": 1.90285062789917, "Pretrain/Step": 2113, "Pretrain/Step Time": 8.463399428874254} +{"Pretrain/Learning Rate": 4.914787095301437e-05, "Pretrain/Loss": 2.071381092071533, "Pretrain/Loss (Raw)": 1.9368302822113037, "Pretrain/Step": 2114, "Pretrain/Step Time": 8.463733645156026} +{"Pretrain/Learning Rate": 4.914677170099068e-05, "Pretrain/Loss": 2.0739173889160156, "Pretrain/Loss (Raw)": 2.357752561569214, "Pretrain/Step": 2115, "Pretrain/Step Time": 8.472501059994102} +{"Pretrain/Learning Rate": 4.914567175271185e-05, "Pretrain/Loss": 2.074254035949707, "Pretrain/Loss (Raw)": 2.0261123180389404, "Pretrain/Step": 2116, "Pretrain/Step Time": 8.467320216819644} +{"Pretrain/Learning Rate": 4.91445711082096e-05, "Pretrain/Loss": 2.0741610527038574, "Pretrain/Loss (Raw)": 2.086275339126587, "Pretrain/Step": 2117, "Pretrain/Step Time": 8.47196371667087} +{"Pretrain/Learning Rate": 4.914346976751566e-05, "Pretrain/Loss": 2.0754754543304443, "Pretrain/Loss (Raw)": 2.1237635612487793, "Pretrain/Step": 2118, "Pretrain/Step Time": 8.468807592988014} +{"Pretrain/Learning Rate": 4.914236773066179e-05, "Pretrain/Loss": 2.076038360595703, "Pretrain/Loss (Raw)": 2.073291778564453, "Pretrain/Step": 2119, "Pretrain/Step Time": 8.466742619872093} +{"Pretrain/Learning Rate": 4.914126499767977e-05, "Pretrain/Loss": 2.076241970062256, "Pretrain/Loss (Raw)": 2.0823395252227783, "Pretrain/Step": 2120, "Pretrain/Step Time": 8.4715027064085} +{"Pretrain/Learning Rate": 4.914016156860139e-05, "Pretrain/Loss": 2.0766754150390625, "Pretrain/Loss (Raw)": 1.9817531108856201, "Pretrain/Step": 2121, "Pretrain/Step Time": 8.478752871975303} +{"Pretrain/Learning Rate": 4.9139057443458456e-05, "Pretrain/Loss": 2.0779762268066406, "Pretrain/Loss (Raw)": 2.1809983253479004, "Pretrain/Step": 2122, "Pretrain/Step Time": 8.472200095653534} +{"Pretrain/Learning Rate": 4.9137952622282836e-05, "Pretrain/Loss": 2.0753564834594727, "Pretrain/Loss (Raw)": 1.7593262195587158, "Pretrain/Step": 2123, "Pretrain/Step Time": 8.477101165801287} +{"Pretrain/Learning Rate": 4.913684710510636e-05, "Pretrain/Loss": 2.0738916397094727, "Pretrain/Loss (Raw)": 2.0141477584838867, "Pretrain/Step": 2124, "Pretrain/Step Time": 8.473441423848271} +{"Pretrain/Learning Rate": 4.913574089196091e-05, "Pretrain/Loss": 2.072770595550537, "Pretrain/Loss (Raw)": 1.9584534168243408, "Pretrain/Step": 2125, "Pretrain/Step Time": 8.46705162152648} +{"Pretrain/Learning Rate": 4.9134633982878396e-05, "Pretrain/Loss": 2.073234796524048, "Pretrain/Loss (Raw)": 2.0848236083984375, "Pretrain/Step": 2126, "Pretrain/Step Time": 8.46283502317965} +{"Pretrain/Learning Rate": 4.9133526377890716e-05, "Pretrain/Loss": 2.074337959289551, "Pretrain/Loss (Raw)": 2.1806116104125977, "Pretrain/Step": 2127, "Pretrain/Step Time": 8.46314892731607} +{"Pretrain/Learning Rate": 4.913241807702982e-05, "Pretrain/Loss": 2.0731735229492188, "Pretrain/Loss (Raw)": 2.0975446701049805, "Pretrain/Step": 2128, "Pretrain/Step Time": 8.459206843748689} +{"Pretrain/Learning Rate": 4.913130908032766e-05, "Pretrain/Loss": 2.0728988647460938, "Pretrain/Loss (Raw)": 2.1163437366485596, "Pretrain/Step": 2129, "Pretrain/Step Time": 8.460075398907065} +{"Pretrain/Learning Rate": 4.913019938781621e-05, "Pretrain/Loss": 2.074634313583374, "Pretrain/Loss (Raw)": 2.1027770042419434, "Pretrain/Step": 2130, "Pretrain/Step Time": 8.463772993534803} +{"Pretrain/Learning Rate": 4.9129088999527485e-05, "Pretrain/Loss": 2.0763583183288574, "Pretrain/Loss (Raw)": 2.1931910514831543, "Pretrain/Step": 2131, "Pretrain/Step Time": 8.464775150641799} +{"Pretrain/Learning Rate": 4.9127977915493475e-05, "Pretrain/Loss": 2.0752816200256348, "Pretrain/Loss (Raw)": 2.056598663330078, "Pretrain/Step": 2132, "Pretrain/Step Time": 8.46462875790894} +{"Pretrain/Learning Rate": 4.912686613574624e-05, "Pretrain/Loss": 2.0771753787994385, "Pretrain/Loss (Raw)": 2.22944974899292, "Pretrain/Step": 2133, "Pretrain/Step Time": 8.464810671284795} +{"Pretrain/Learning Rate": 4.912575366031782e-05, "Pretrain/Loss": 2.076524257659912, "Pretrain/Loss (Raw)": 1.9721232652664185, "Pretrain/Step": 2134, "Pretrain/Step Time": 8.466725928708911} +{"Pretrain/Learning Rate": 4.9124640489240304e-05, "Pretrain/Loss": 2.0746378898620605, "Pretrain/Loss (Raw)": 1.9201194047927856, "Pretrain/Step": 2135, "Pretrain/Step Time": 8.468807730823755} +{"Pretrain/Learning Rate": 4.9123526622545787e-05, "Pretrain/Loss": 2.0742249488830566, "Pretrain/Loss (Raw)": 1.9448556900024414, "Pretrain/Step": 2136, "Pretrain/Step Time": 8.463909957557917} +{"Pretrain/Learning Rate": 4.912241206026638e-05, "Pretrain/Loss": 2.0733346939086914, "Pretrain/Loss (Raw)": 2.1054470539093018, "Pretrain/Step": 2137, "Pretrain/Step Time": 8.469369638711214} +{"Pretrain/Learning Rate": 4.912129680243423e-05, "Pretrain/Loss": 2.0712037086486816, "Pretrain/Loss (Raw)": 1.7014925479888916, "Pretrain/Step": 2138, "Pretrain/Step Time": 8.464907631278038} +{"Pretrain/Learning Rate": 4.9120180849081496e-05, "Pretrain/Loss": 2.0732603073120117, "Pretrain/Loss (Raw)": 2.346207618713379, "Pretrain/Step": 2139, "Pretrain/Step Time": 8.464159447699785} +{"Pretrain/Learning Rate": 4.911906420024035e-05, "Pretrain/Loss": 2.075324058532715, "Pretrain/Loss (Raw)": 2.2001090049743652, "Pretrain/Step": 2140, "Pretrain/Step Time": 8.465283814817667} +{"Pretrain/Learning Rate": 4.911794685594299e-05, "Pretrain/Loss": 2.0740742683410645, "Pretrain/Loss (Raw)": 2.1690173149108887, "Pretrain/Step": 2141, "Pretrain/Step Time": 8.464990548789501} +{"Pretrain/Learning Rate": 4.911682881622163e-05, "Pretrain/Loss": 2.0750365257263184, "Pretrain/Loss (Raw)": 2.205291986465454, "Pretrain/Step": 2142, "Pretrain/Step Time": 8.464071907103062} +{"Pretrain/Learning Rate": 4.911571008110851e-05, "Pretrain/Loss": 2.075577735900879, "Pretrain/Loss (Raw)": 2.16188645362854, "Pretrain/Step": 2143, "Pretrain/Step Time": 8.45861840620637} +{"Pretrain/Learning Rate": 4.9114590650635895e-05, "Pretrain/Loss": 2.076380729675293, "Pretrain/Loss (Raw)": 2.220198392868042, "Pretrain/Step": 2144, "Pretrain/Step Time": 8.45786851271987} +{"Pretrain/Learning Rate": 4.9113470524836056e-05, "Pretrain/Loss": 2.0777902603149414, "Pretrain/Loss (Raw)": 2.154017925262451, "Pretrain/Step": 2145, "Pretrain/Step Time": 8.45614948682487} +{"Pretrain/Learning Rate": 4.91123497037413e-05, "Pretrain/Loss": 2.0777552127838135, "Pretrain/Loss (Raw)": 2.200927734375, "Pretrain/Step": 2146, "Pretrain/Step Time": 8.45680645853281} +{"Pretrain/Learning Rate": 4.911122818738394e-05, "Pretrain/Loss": 2.0760550498962402, "Pretrain/Loss (Raw)": 2.0667717456817627, "Pretrain/Step": 2147, "Pretrain/Step Time": 8.46070859581232} +{"Pretrain/Learning Rate": 4.91101059757963e-05, "Pretrain/Loss": 2.0749588012695312, "Pretrain/Loss (Raw)": 2.0983667373657227, "Pretrain/Step": 2148, "Pretrain/Step Time": 8.463280826807022} +{"Pretrain/Learning Rate": 4.910898306901076e-05, "Pretrain/Loss": 2.07533860206604, "Pretrain/Loss (Raw)": 2.161926031112671, "Pretrain/Step": 2149, "Pretrain/Step Time": 8.46496701054275} +{"Pretrain/Learning Rate": 4.910785946705968e-05, "Pretrain/Loss": 2.075145721435547, "Pretrain/Loss (Raw)": 2.1815085411071777, "Pretrain/Step": 2150, "Pretrain/Step Time": 8.464474651962519} +{"Pretrain/Learning Rate": 4.9106735169975475e-05, "Pretrain/Loss": 2.0722973346710205, "Pretrain/Loss (Raw)": 1.9786769151687622, "Pretrain/Step": 2151, "Pretrain/Step Time": 8.466393508017063} +{"Pretrain/Learning Rate": 4.9105610177790556e-05, "Pretrain/Loss": 2.068878650665283, "Pretrain/Loss (Raw)": 1.9919322729110718, "Pretrain/Step": 2152, "Pretrain/Step Time": 8.466521814465523} +{"Pretrain/Learning Rate": 4.910448449053736e-05, "Pretrain/Loss": 2.0706558227539062, "Pretrain/Loss (Raw)": 2.1093461513519287, "Pretrain/Step": 2153, "Pretrain/Step Time": 8.464898079633713} +{"Pretrain/Learning Rate": 4.9103358108248344e-05, "Pretrain/Loss": 2.0710055828094482, "Pretrain/Loss (Raw)": 1.9612901210784912, "Pretrain/Step": 2154, "Pretrain/Step Time": 8.463324392214417} +{"Pretrain/Learning Rate": 4.9102231030955995e-05, "Pretrain/Loss": 2.0714406967163086, "Pretrain/Loss (Raw)": 2.3287155628204346, "Pretrain/Step": 2155, "Pretrain/Step Time": 8.463121945038438} +{"Pretrain/Learning Rate": 4.910110325869279e-05, "Pretrain/Loss": 2.070976972579956, "Pretrain/Loss (Raw)": 1.9405992031097412, "Pretrain/Step": 2156, "Pretrain/Step Time": 8.461449675261974} +{"Pretrain/Learning Rate": 4.909997479149128e-05, "Pretrain/Loss": 2.0716116428375244, "Pretrain/Loss (Raw)": 2.005160331726074, "Pretrain/Step": 2157, "Pretrain/Step Time": 8.45833440311253} +{"Pretrain/Learning Rate": 4.909884562938397e-05, "Pretrain/Loss": 2.0721960067749023, "Pretrain/Loss (Raw)": 2.1759631633758545, "Pretrain/Step": 2158, "Pretrain/Step Time": 8.463231079280376} +{"Pretrain/Learning Rate": 4.9097715772403446e-05, "Pretrain/Loss": 2.0720229148864746, "Pretrain/Loss (Raw)": 2.1001479625701904, "Pretrain/Step": 2159, "Pretrain/Step Time": 8.459782419726253} +{"Pretrain/Learning Rate": 4.909658522058227e-05, "Pretrain/Loss": 2.07008957862854, "Pretrain/Loss (Raw)": 2.146649122238159, "Pretrain/Step": 2160, "Pretrain/Step Time": 8.463024951517582} +{"Pretrain/Learning Rate": 4.909545397395305e-05, "Pretrain/Loss": 2.0710039138793945, "Pretrain/Loss (Raw)": 2.2271156311035156, "Pretrain/Step": 2161, "Pretrain/Step Time": 8.455969167873263} +{"Pretrain/Learning Rate": 4.90943220325484e-05, "Pretrain/Loss": 2.0718674659729004, "Pretrain/Loss (Raw)": 2.2052464485168457, "Pretrain/Step": 2162, "Pretrain/Step Time": 8.455253949388862} +{"Pretrain/Learning Rate": 4.909318939640096e-05, "Pretrain/Loss": 2.0714704990386963, "Pretrain/Loss (Raw)": 1.9880086183547974, "Pretrain/Step": 2163, "Pretrain/Step Time": 8.457892496138811} +{"Pretrain/Learning Rate": 4.909205606554339e-05, "Pretrain/Loss": 2.070970058441162, "Pretrain/Loss (Raw)": 2.1297872066497803, "Pretrain/Step": 2164, "Pretrain/Step Time": 8.452971955761313} +{"Pretrain/Learning Rate": 4.909092204000837e-05, "Pretrain/Loss": 2.06982684135437, "Pretrain/Loss (Raw)": 1.9769611358642578, "Pretrain/Step": 2165, "Pretrain/Step Time": 8.457324720919132} +{"Pretrain/Learning Rate": 4.9089787319828585e-05, "Pretrain/Loss": 2.0707550048828125, "Pretrain/Loss (Raw)": 2.0978684425354004, "Pretrain/Step": 2166, "Pretrain/Step Time": 8.45567773282528} +{"Pretrain/Learning Rate": 4.9088651905036777e-05, "Pretrain/Loss": 2.0731801986694336, "Pretrain/Loss (Raw)": 2.1339874267578125, "Pretrain/Step": 2167, "Pretrain/Step Time": 8.455855451524258} +{"Pretrain/Learning Rate": 4.908751579566566e-05, "Pretrain/Loss": 2.0753307342529297, "Pretrain/Loss (Raw)": 2.0531108379364014, "Pretrain/Step": 2168, "Pretrain/Step Time": 8.456982204690576} +{"Pretrain/Learning Rate": 4.9086378991748016e-05, "Pretrain/Loss": 2.0753560066223145, "Pretrain/Loss (Raw)": 2.024240016937256, "Pretrain/Step": 2169, "Pretrain/Step Time": 8.459785467013717} +{"Pretrain/Learning Rate": 4.908524149331661e-05, "Pretrain/Loss": 2.0748002529144287, "Pretrain/Loss (Raw)": 2.1166915893554688, "Pretrain/Step": 2170, "Pretrain/Step Time": 8.452425161376595} +{"Pretrain/Learning Rate": 4.908410330040424e-05, "Pretrain/Loss": 2.0747294425964355, "Pretrain/Loss (Raw)": 2.0846521854400635, "Pretrain/Step": 2171, "Pretrain/Step Time": 8.450494403019547} +{"Pretrain/Learning Rate": 4.908296441304374e-05, "Pretrain/Loss": 2.0773940086364746, "Pretrain/Loss (Raw)": 2.364428997039795, "Pretrain/Step": 2172, "Pretrain/Step Time": 8.449730826541781} +{"Pretrain/Learning Rate": 4.908182483126793e-05, "Pretrain/Loss": 2.076765298843384, "Pretrain/Loss (Raw)": 2.0677170753479004, "Pretrain/Step": 2173, "Pretrain/Step Time": 8.45061719045043} +{"Pretrain/Learning Rate": 4.908068455510968e-05, "Pretrain/Loss": 2.0794272422790527, "Pretrain/Loss (Raw)": 2.3726208209991455, "Pretrain/Step": 2174, "Pretrain/Step Time": 8.454830758273602} +{"Pretrain/Learning Rate": 4.907954358460186e-05, "Pretrain/Loss": 2.079556465148926, "Pretrain/Loss (Raw)": 2.1457533836364746, "Pretrain/Step": 2175, "Pretrain/Step Time": 8.452773282304406} +{"Pretrain/Learning Rate": 4.907840191977738e-05, "Pretrain/Loss": 2.081401824951172, "Pretrain/Loss (Raw)": 2.2587404251098633, "Pretrain/Step": 2176, "Pretrain/Step Time": 8.451799316331744} +{"Pretrain/Learning Rate": 4.9077259560669166e-05, "Pretrain/Loss": 2.0817439556121826, "Pretrain/Loss (Raw)": 2.115621566772461, "Pretrain/Step": 2177, "Pretrain/Step Time": 8.451727271080017} +{"Pretrain/Learning Rate": 4.907611650731013e-05, "Pretrain/Loss": 2.0811235904693604, "Pretrain/Loss (Raw)": 2.081531524658203, "Pretrain/Step": 2178, "Pretrain/Step Time": 8.456818483769894} +{"Pretrain/Learning Rate": 4.907497275973326e-05, "Pretrain/Loss": 2.08078670501709, "Pretrain/Loss (Raw)": 1.9574785232543945, "Pretrain/Step": 2179, "Pretrain/Step Time": 8.443423207849264} +{"Pretrain/Learning Rate": 4.9073828317971514e-05, "Pretrain/Loss": 2.0821540355682373, "Pretrain/Loss (Raw)": 2.0338664054870605, "Pretrain/Step": 2180, "Pretrain/Step Time": 8.447758562862873} +{"Pretrain/Learning Rate": 4.9072683182057896e-05, "Pretrain/Loss": 2.0807313919067383, "Pretrain/Loss (Raw)": 1.9366227388381958, "Pretrain/Step": 2181, "Pretrain/Step Time": 8.453912742435932} +{"Pretrain/Learning Rate": 4.907153735202544e-05, "Pretrain/Loss": 2.08196759223938, "Pretrain/Loss (Raw)": 2.1315977573394775, "Pretrain/Step": 2182, "Pretrain/Step Time": 8.449670309200883} +{"Pretrain/Learning Rate": 4.907039082790716e-05, "Pretrain/Loss": 2.0835132598876953, "Pretrain/Loss (Raw)": 2.1936991214752197, "Pretrain/Step": 2183, "Pretrain/Step Time": 8.45195621624589} +{"Pretrain/Learning Rate": 4.906924360973615e-05, "Pretrain/Loss": 2.0838966369628906, "Pretrain/Loss (Raw)": 2.062354326248169, "Pretrain/Step": 2184, "Pretrain/Step Time": 8.451083635911345} +{"Pretrain/Learning Rate": 4.906809569754545e-05, "Pretrain/Loss": 2.0848069190979004, "Pretrain/Loss (Raw)": 2.0782270431518555, "Pretrain/Step": 2185, "Pretrain/Step Time": 8.446470035240054} +{"Pretrain/Learning Rate": 4.906694709136818e-05, "Pretrain/Loss": 2.087468147277832, "Pretrain/Loss (Raw)": 2.1583235263824463, "Pretrain/Step": 2186, "Pretrain/Step Time": 8.449779376387596} +{"Pretrain/Learning Rate": 4.906579779123746e-05, "Pretrain/Loss": 2.0886969566345215, "Pretrain/Loss (Raw)": 2.2171614170074463, "Pretrain/Step": 2187, "Pretrain/Step Time": 8.44657970406115} +{"Pretrain/Learning Rate": 4.906464779718643e-05, "Pretrain/Loss": 2.088183641433716, "Pretrain/Loss (Raw)": 2.1508047580718994, "Pretrain/Step": 2188, "Pretrain/Step Time": 8.44498953782022} +{"Pretrain/Learning Rate": 4.9063497109248237e-05, "Pretrain/Loss": 2.0866775512695312, "Pretrain/Loss (Raw)": 1.9638935327529907, "Pretrain/Step": 2189, "Pretrain/Step Time": 8.449439082294703} +{"Pretrain/Learning Rate": 4.906234572745607e-05, "Pretrain/Loss": 2.0879039764404297, "Pretrain/Loss (Raw)": 2.119083881378174, "Pretrain/Step": 2190, "Pretrain/Step Time": 8.448695298284292} +{"Pretrain/Learning Rate": 4.906119365184313e-05, "Pretrain/Loss": 2.08695912361145, "Pretrain/Loss (Raw)": 2.156825065612793, "Pretrain/Step": 2191, "Pretrain/Step Time": 8.44805620238185} +{"Pretrain/Learning Rate": 4.906004088244263e-05, "Pretrain/Loss": 2.086945056915283, "Pretrain/Loss (Raw)": 2.0767745971679688, "Pretrain/Step": 2192, "Pretrain/Step Time": 8.449681710451841} +{"Pretrain/Learning Rate": 4.905888741928781e-05, "Pretrain/Loss": 2.08804988861084, "Pretrain/Loss (Raw)": 2.100487470626831, "Pretrain/Step": 2193, "Pretrain/Step Time": 8.450110722333193} +{"Pretrain/Learning Rate": 4.9057733262411945e-05, "Pretrain/Loss": 2.0873684883117676, "Pretrain/Loss (Raw)": 2.026978015899658, "Pretrain/Step": 2194, "Pretrain/Step Time": 8.442494189366698} +{"Pretrain/Learning Rate": 4.9056578411848283e-05, "Pretrain/Loss": 2.0898985862731934, "Pretrain/Loss (Raw)": 2.2868409156799316, "Pretrain/Step": 2195, "Pretrain/Step Time": 8.443335887044668} +{"Pretrain/Learning Rate": 4.905542286763015e-05, "Pretrain/Loss": 2.089857578277588, "Pretrain/Loss (Raw)": 1.8664966821670532, "Pretrain/Step": 2196, "Pretrain/Step Time": 8.44948017410934} +{"Pretrain/Learning Rate": 4.9054266629790866e-05, "Pretrain/Loss": 2.088960647583008, "Pretrain/Loss (Raw)": 2.108717918395996, "Pretrain/Step": 2197, "Pretrain/Step Time": 8.451999016106129} +{"Pretrain/Learning Rate": 4.905310969836375e-05, "Pretrain/Loss": 2.090409278869629, "Pretrain/Loss (Raw)": 1.9866275787353516, "Pretrain/Step": 2198, "Pretrain/Step Time": 8.454112857580185} +{"Pretrain/Learning Rate": 4.905195207338217e-05, "Pretrain/Loss": 2.0898334980010986, "Pretrain/Loss (Raw)": 1.9808019399642944, "Pretrain/Step": 2199, "Pretrain/Step Time": 8.449864817783237} +{"Pretrain/Learning Rate": 4.905079375487951e-05, "Pretrain/Loss": 2.0910964012145996, "Pretrain/Loss (Raw)": 2.109423875808716, "Pretrain/Step": 2200, "Pretrain/Step Time": 8.447963174432516} +{"Pretrain/Learning Rate": 4.9049634742889174e-05, "Pretrain/Loss": 2.0913212299346924, "Pretrain/Loss (Raw)": 2.0326757431030273, "Pretrain/Step": 2201, "Pretrain/Step Time": 8.44932017289102} +{"Pretrain/Learning Rate": 4.904847503744456e-05, "Pretrain/Loss": 2.091305732727051, "Pretrain/Loss (Raw)": 2.333225727081299, "Pretrain/Step": 2202, "Pretrain/Step Time": 8.447165753692389} +{"Pretrain/Learning Rate": 4.9047314638579134e-05, "Pretrain/Loss": 2.0901565551757812, "Pretrain/Loss (Raw)": 1.953335165977478, "Pretrain/Step": 2203, "Pretrain/Step Time": 8.446379836648703} +{"Pretrain/Learning Rate": 4.9046153546326333e-05, "Pretrain/Loss": 2.090888023376465, "Pretrain/Loss (Raw)": 1.904231071472168, "Pretrain/Step": 2204, "Pretrain/Step Time": 8.444861704483628} +{"Pretrain/Learning Rate": 4.904499176071966e-05, "Pretrain/Loss": 2.090322971343994, "Pretrain/Loss (Raw)": 1.9809571504592896, "Pretrain/Step": 2205, "Pretrain/Step Time": 8.448127711191773} +{"Pretrain/Learning Rate": 4.904382928179259e-05, "Pretrain/Loss": 2.089416742324829, "Pretrain/Loss (Raw)": 2.0644147396087646, "Pretrain/Step": 2206, "Pretrain/Step Time": 8.44752125069499} +{"Pretrain/Learning Rate": 4.904266610957865e-05, "Pretrain/Loss": 2.087188243865967, "Pretrain/Loss (Raw)": 1.7932958602905273, "Pretrain/Step": 2207, "Pretrain/Step Time": 8.447578659281135} +{"Pretrain/Learning Rate": 4.904150224411138e-05, "Pretrain/Loss": 2.0869107246398926, "Pretrain/Loss (Raw)": 2.102219581604004, "Pretrain/Step": 2208, "Pretrain/Step Time": 8.442027773708105} +{"Pretrain/Learning Rate": 4.904033768542435e-05, "Pretrain/Loss": 2.0896289348602295, "Pretrain/Loss (Raw)": 2.145049810409546, "Pretrain/Step": 2209, "Pretrain/Step Time": 8.439451925456524} +{"Pretrain/Learning Rate": 4.903917243355113e-05, "Pretrain/Loss": 2.0894994735717773, "Pretrain/Loss (Raw)": 2.0950608253479004, "Pretrain/Step": 2210, "Pretrain/Step Time": 8.441749773919582} +{"Pretrain/Learning Rate": 4.9038006488525314e-05, "Pretrain/Loss": 2.0884757041931152, "Pretrain/Loss (Raw)": 2.1010921001434326, "Pretrain/Step": 2211, "Pretrain/Step Time": 8.439604513347149} +{"Pretrain/Learning Rate": 4.903683985038052e-05, "Pretrain/Loss": 2.0875179767608643, "Pretrain/Loss (Raw)": 2.027071714401245, "Pretrain/Step": 2212, "Pretrain/Step Time": 8.440311040729284} +{"Pretrain/Learning Rate": 4.903567251915041e-05, "Pretrain/Loss": 2.0889859199523926, "Pretrain/Loss (Raw)": 2.0706028938293457, "Pretrain/Step": 2213, "Pretrain/Step Time": 8.442993922159076} +{"Pretrain/Learning Rate": 4.9034504494868615e-05, "Pretrain/Loss": 2.0910935401916504, "Pretrain/Loss (Raw)": 2.1981022357940674, "Pretrain/Step": 2214, "Pretrain/Step Time": 8.443879486992955} +{"Pretrain/Learning Rate": 4.903333577756883e-05, "Pretrain/Loss": 2.0895237922668457, "Pretrain/Loss (Raw)": 1.93649160861969, "Pretrain/Step": 2215, "Pretrain/Step Time": 8.443646116182208} +{"Pretrain/Learning Rate": 4.903216636728475e-05, "Pretrain/Loss": 2.0911264419555664, "Pretrain/Loss (Raw)": 2.167238712310791, "Pretrain/Step": 2216, "Pretrain/Step Time": 8.439705273136497} +{"Pretrain/Learning Rate": 4.90309962640501e-05, "Pretrain/Loss": 2.091310501098633, "Pretrain/Loss (Raw)": 2.1298701763153076, "Pretrain/Step": 2217, "Pretrain/Step Time": 8.439721882343292} +{"Pretrain/Learning Rate": 4.9029825467898606e-05, "Pretrain/Loss": 2.0882859230041504, "Pretrain/Loss (Raw)": 1.8922996520996094, "Pretrain/Step": 2218, "Pretrain/Step Time": 8.439024010673165} +{"Pretrain/Learning Rate": 4.9028653978864036e-05, "Pretrain/Loss": 2.088836908340454, "Pretrain/Loss (Raw)": 2.2089059352874756, "Pretrain/Step": 2219, "Pretrain/Step Time": 8.44027371890843} +{"Pretrain/Learning Rate": 4.902748179698017e-05, "Pretrain/Loss": 2.08945894241333, "Pretrain/Loss (Raw)": 2.122796058654785, "Pretrain/Step": 2220, "Pretrain/Step Time": 8.437740374356508} +{"Pretrain/Learning Rate": 4.9026308922280803e-05, "Pretrain/Loss": 2.088300943374634, "Pretrain/Loss (Raw)": 2.0732758045196533, "Pretrain/Step": 2221, "Pretrain/Step Time": 8.440556349232793} +{"Pretrain/Learning Rate": 4.9025135354799755e-05, "Pretrain/Loss": 2.088655948638916, "Pretrain/Loss (Raw)": 2.1759605407714844, "Pretrain/Step": 2222, "Pretrain/Step Time": 8.44166786596179} +{"Pretrain/Learning Rate": 4.9023961094570866e-05, "Pretrain/Loss": 2.0883562564849854, "Pretrain/Loss (Raw)": 2.1747689247131348, "Pretrain/Step": 2223, "Pretrain/Step Time": 8.44413592107594} +{"Pretrain/Learning Rate": 4.9022786141628e-05, "Pretrain/Loss": 2.0887105464935303, "Pretrain/Loss (Raw)": 2.1573431491851807, "Pretrain/Step": 2224, "Pretrain/Step Time": 8.44390687532723} +{"Pretrain/Learning Rate": 4.9021610496005024e-05, "Pretrain/Loss": 2.0886125564575195, "Pretrain/Loss (Raw)": 2.136975049972534, "Pretrain/Step": 2225, "Pretrain/Step Time": 8.441099662333727} +{"Pretrain/Learning Rate": 4.902043415773584e-05, "Pretrain/Loss": 2.0874228477478027, "Pretrain/Loss (Raw)": 1.907313346862793, "Pretrain/Step": 2226, "Pretrain/Step Time": 8.433206332847476} +{"Pretrain/Learning Rate": 4.901925712685438e-05, "Pretrain/Loss": 2.0860180854797363, "Pretrain/Loss (Raw)": 1.7988266944885254, "Pretrain/Step": 2227, "Pretrain/Step Time": 8.437633274123073} +{"Pretrain/Learning Rate": 4.901807940339457e-05, "Pretrain/Loss": 2.0857419967651367, "Pretrain/Loss (Raw)": 2.094245195388794, "Pretrain/Step": 2228, "Pretrain/Step Time": 8.441180659458041} +{"Pretrain/Learning Rate": 4.901690098739037e-05, "Pretrain/Loss": 2.085650682449341, "Pretrain/Loss (Raw)": 2.0259437561035156, "Pretrain/Step": 2229, "Pretrain/Step Time": 8.439037531614304} +{"Pretrain/Learning Rate": 4.901572187887575e-05, "Pretrain/Loss": 2.0849151611328125, "Pretrain/Loss (Raw)": 2.0163462162017822, "Pretrain/Step": 2230, "Pretrain/Step Time": 8.44256492331624} +{"Pretrain/Learning Rate": 4.901454207788474e-05, "Pretrain/Loss": 2.082770824432373, "Pretrain/Loss (Raw)": 1.982492208480835, "Pretrain/Step": 2231, "Pretrain/Step Time": 8.441268850117922} +{"Pretrain/Learning Rate": 4.9013361584451325e-05, "Pretrain/Loss": 2.0849711894989014, "Pretrain/Loss (Raw)": 2.1646153926849365, "Pretrain/Step": 2232, "Pretrain/Step Time": 8.440031887963414} +{"Pretrain/Learning Rate": 4.901218039860956e-05, "Pretrain/Loss": 2.087144374847412, "Pretrain/Loss (Raw)": 2.2907752990722656, "Pretrain/Step": 2233, "Pretrain/Step Time": 8.438646456226707} +{"Pretrain/Learning Rate": 4.9010998520393505e-05, "Pretrain/Loss": 2.0843780040740967, "Pretrain/Loss (Raw)": 1.9450587034225464, "Pretrain/Step": 2234, "Pretrain/Step Time": 8.439797505736351} +{"Pretrain/Learning Rate": 4.900981594983723e-05, "Pretrain/Loss": 2.0860354900360107, "Pretrain/Loss (Raw)": 2.1618592739105225, "Pretrain/Step": 2235, "Pretrain/Step Time": 8.44102775119245} +{"Pretrain/Learning Rate": 4.900863268697484e-05, "Pretrain/Loss": 2.084141254425049, "Pretrain/Loss (Raw)": 1.9368220567703247, "Pretrain/Step": 2236, "Pretrain/Step Time": 8.444784028455615} +{"Pretrain/Learning Rate": 4.900744873184045e-05, "Pretrain/Loss": 2.0831573009490967, "Pretrain/Loss (Raw)": 2.144744634628296, "Pretrain/Step": 2237, "Pretrain/Step Time": 8.44183911010623} +{"Pretrain/Learning Rate": 4.90062640844682e-05, "Pretrain/Loss": 2.0861406326293945, "Pretrain/Loss (Raw)": 2.3201093673706055, "Pretrain/Step": 2238, "Pretrain/Step Time": 8.442620042711496} +{"Pretrain/Learning Rate": 4.9005078744892255e-05, "Pretrain/Loss": 2.0873665809631348, "Pretrain/Loss (Raw)": 2.1682779788970947, "Pretrain/Step": 2239, "Pretrain/Step Time": 8.443784082308412} +{"Pretrain/Learning Rate": 4.900389271314677e-05, "Pretrain/Loss": 2.090102195739746, "Pretrain/Loss (Raw)": 2.357252836227417, "Pretrain/Step": 2240, "Pretrain/Step Time": 8.442772613838315} +{"Pretrain/Learning Rate": 4.900270598926597e-05, "Pretrain/Loss": 2.091695785522461, "Pretrain/Loss (Raw)": 2.1067922115325928, "Pretrain/Step": 2241, "Pretrain/Step Time": 8.441142892464995} +{"Pretrain/Learning Rate": 4.9001518573284066e-05, "Pretrain/Loss": 2.0954084396362305, "Pretrain/Loss (Raw)": 2.4120466709136963, "Pretrain/Step": 2242, "Pretrain/Step Time": 8.441065846011043} +{"Pretrain/Learning Rate": 4.90003304652353e-05, "Pretrain/Loss": 2.0945394039154053, "Pretrain/Loss (Raw)": 2.246532440185547, "Pretrain/Step": 2243, "Pretrain/Step Time": 8.431658966466784} +{"Pretrain/Learning Rate": 4.8999141665153915e-05, "Pretrain/Loss": 2.093639850616455, "Pretrain/Loss (Raw)": 1.9109549522399902, "Pretrain/Step": 2244, "Pretrain/Step Time": 8.436951393261552} +{"Pretrain/Learning Rate": 4.8997952173074204e-05, "Pretrain/Loss": 2.094308376312256, "Pretrain/Loss (Raw)": 2.171877861022949, "Pretrain/Step": 2245, "Pretrain/Step Time": 8.433547668159008} +{"Pretrain/Learning Rate": 4.899676198903045e-05, "Pretrain/Loss": 2.094055414199829, "Pretrain/Loss (Raw)": 2.091386556625366, "Pretrain/Step": 2246, "Pretrain/Step Time": 8.437752906233072} +{"Pretrain/Learning Rate": 4.899557111305699e-05, "Pretrain/Loss": 2.0947046279907227, "Pretrain/Loss (Raw)": 2.156373977661133, "Pretrain/Step": 2247, "Pretrain/Step Time": 8.443239141255617} +{"Pretrain/Learning Rate": 4.8994379545188144e-05, "Pretrain/Loss": 2.0956430435180664, "Pretrain/Loss (Raw)": 2.202479600906372, "Pretrain/Step": 2248, "Pretrain/Step Time": 8.438222093507648} +{"Pretrain/Learning Rate": 4.8993187285458284e-05, "Pretrain/Loss": 2.095332145690918, "Pretrain/Loss (Raw)": 1.9419265985488892, "Pretrain/Step": 2249, "Pretrain/Step Time": 8.431652976199985} +{"Pretrain/Learning Rate": 4.899199433390178e-05, "Pretrain/Loss": 2.0945773124694824, "Pretrain/Loss (Raw)": 2.084383487701416, "Pretrain/Step": 2250, "Pretrain/Step Time": 8.433078782632947} +{"Pretrain/Learning Rate": 4.899080069055304e-05, "Pretrain/Loss": 2.096738815307617, "Pretrain/Loss (Raw)": 2.036017417907715, "Pretrain/Step": 2251, "Pretrain/Step Time": 8.432819506153464} +{"Pretrain/Learning Rate": 4.898960635544647e-05, "Pretrain/Loss": 2.097700595855713, "Pretrain/Loss (Raw)": 2.1372480392456055, "Pretrain/Step": 2252, "Pretrain/Step Time": 8.435132393613458} +{"Pretrain/Learning Rate": 4.898841132861651e-05, "Pretrain/Loss": 2.099307060241699, "Pretrain/Loss (Raw)": 2.164076089859009, "Pretrain/Step": 2253, "Pretrain/Step Time": 8.43261617794633} +{"Pretrain/Learning Rate": 4.898721561009762e-05, "Pretrain/Loss": 2.1011147499084473, "Pretrain/Loss (Raw)": 2.316211223602295, "Pretrain/Step": 2254, "Pretrain/Step Time": 8.439762314781547} +{"Pretrain/Learning Rate": 4.8986019199924286e-05, "Pretrain/Loss": 2.100184679031372, "Pretrain/Loss (Raw)": 2.0615601539611816, "Pretrain/Step": 2255, "Pretrain/Step Time": 8.439145365729928} +{"Pretrain/Learning Rate": 4.898482209813099e-05, "Pretrain/Loss": 2.100759983062744, "Pretrain/Loss (Raw)": 2.1711838245391846, "Pretrain/Step": 2256, "Pretrain/Step Time": 8.4418935906142} +{"Pretrain/Learning Rate": 4.898362430475225e-05, "Pretrain/Loss": 2.099936008453369, "Pretrain/Loss (Raw)": 2.010866641998291, "Pretrain/Step": 2257, "Pretrain/Step Time": 8.43943870253861} +{"Pretrain/Learning Rate": 4.898242581982262e-05, "Pretrain/Loss": 2.0999183654785156, "Pretrain/Loss (Raw)": 2.100524663925171, "Pretrain/Step": 2258, "Pretrain/Step Time": 8.435752235352993} +{"Pretrain/Learning Rate": 4.898122664337665e-05, "Pretrain/Loss": 2.099520444869995, "Pretrain/Loss (Raw)": 2.142258644104004, "Pretrain/Step": 2259, "Pretrain/Step Time": 8.436474362388253} +{"Pretrain/Learning Rate": 4.898002677544891e-05, "Pretrain/Loss": 2.101487159729004, "Pretrain/Loss (Raw)": 2.3083226680755615, "Pretrain/Step": 2260, "Pretrain/Step Time": 8.432746179401875} +{"Pretrain/Learning Rate": 4.8978826216074e-05, "Pretrain/Loss": 2.100111722946167, "Pretrain/Loss (Raw)": 2.053436517715454, "Pretrain/Step": 2261, "Pretrain/Step Time": 8.438668798655272} +{"Pretrain/Learning Rate": 4.897762496528655e-05, "Pretrain/Loss": 2.1016764640808105, "Pretrain/Loss (Raw)": 2.172400712966919, "Pretrain/Step": 2262, "Pretrain/Step Time": 8.434331821277738} +{"Pretrain/Learning Rate": 4.8976423023121184e-05, "Pretrain/Loss": 2.103213310241699, "Pretrain/Loss (Raw)": 2.1168148517608643, "Pretrain/Step": 2263, "Pretrain/Step Time": 8.441100228577852} +{"Pretrain/Learning Rate": 4.8975220389612557e-05, "Pretrain/Loss": 2.1031734943389893, "Pretrain/Loss (Raw)": 1.939780354499817, "Pretrain/Step": 2264, "Pretrain/Step Time": 8.441690200939775} +{"Pretrain/Learning Rate": 4.897401706479535e-05, "Pretrain/Loss": 2.102721929550171, "Pretrain/Loss (Raw)": 2.0476233959198, "Pretrain/Step": 2265, "Pretrain/Step Time": 8.436134722083807} +{"Pretrain/Learning Rate": 4.897281304870427e-05, "Pretrain/Loss": 2.104930877685547, "Pretrain/Loss (Raw)": 1.9842562675476074, "Pretrain/Step": 2266, "Pretrain/Step Time": 8.435812750831246} +{"Pretrain/Learning Rate": 4.897160834137402e-05, "Pretrain/Loss": 2.1016221046447754, "Pretrain/Loss (Raw)": 1.9226627349853516, "Pretrain/Step": 2267, "Pretrain/Step Time": 8.439328163862228} +{"Pretrain/Learning Rate": 4.8970402942839346e-05, "Pretrain/Loss": 2.1010096073150635, "Pretrain/Loss (Raw)": 2.12172269821167, "Pretrain/Step": 2268, "Pretrain/Step Time": 8.43882218003273} +{"Pretrain/Learning Rate": 4.8969196853135e-05, "Pretrain/Loss": 2.0992517471313477, "Pretrain/Loss (Raw)": 1.94400954246521, "Pretrain/Step": 2269, "Pretrain/Step Time": 8.437201598659158} +{"Pretrain/Learning Rate": 4.896799007229576e-05, "Pretrain/Loss": 2.0985875129699707, "Pretrain/Loss (Raw)": 2.1202714443206787, "Pretrain/Step": 2270, "Pretrain/Step Time": 8.438870059326291} +{"Pretrain/Learning Rate": 4.896678260035642e-05, "Pretrain/Loss": 2.098837375640869, "Pretrain/Loss (Raw)": 2.193876266479492, "Pretrain/Step": 2271, "Pretrain/Step Time": 8.443712646141648} +{"Pretrain/Learning Rate": 4.89655744373518e-05, "Pretrain/Loss": 2.099379062652588, "Pretrain/Loss (Raw)": 2.289511203765869, "Pretrain/Step": 2272, "Pretrain/Step Time": 8.440382674336433} +{"Pretrain/Learning Rate": 4.896436558331674e-05, "Pretrain/Loss": 2.0988316535949707, "Pretrain/Loss (Raw)": 2.083965539932251, "Pretrain/Step": 2273, "Pretrain/Step Time": 8.44183631055057} +{"Pretrain/Learning Rate": 4.8963156038286084e-05, "Pretrain/Loss": 2.096972942352295, "Pretrain/Loss (Raw)": 1.9630037546157837, "Pretrain/Step": 2274, "Pretrain/Step Time": 8.440056789666414} +{"Pretrain/Learning Rate": 4.8961945802294726e-05, "Pretrain/Loss": 2.0975394248962402, "Pretrain/Loss (Raw)": 2.1393065452575684, "Pretrain/Step": 2275, "Pretrain/Step Time": 8.434590395539999} +{"Pretrain/Learning Rate": 4.896073487537754e-05, "Pretrain/Loss": 2.0990500450134277, "Pretrain/Loss (Raw)": 2.2917091846466064, "Pretrain/Step": 2276, "Pretrain/Step Time": 8.431354854255915} +{"Pretrain/Learning Rate": 4.895952325756947e-05, "Pretrain/Loss": 2.09887957572937, "Pretrain/Loss (Raw)": 2.1401243209838867, "Pretrain/Step": 2277, "Pretrain/Step Time": 8.433157354593277} +{"Pretrain/Learning Rate": 4.8958310948905426e-05, "Pretrain/Loss": 2.0986547470092773, "Pretrain/Loss (Raw)": 2.1527085304260254, "Pretrain/Step": 2278, "Pretrain/Step Time": 8.431815950199962} +{"Pretrain/Learning Rate": 4.8957097949420383e-05, "Pretrain/Loss": 2.1013054847717285, "Pretrain/Loss (Raw)": 2.317976951599121, "Pretrain/Step": 2279, "Pretrain/Step Time": 8.43232267536223} +{"Pretrain/Learning Rate": 4.895588425914931e-05, "Pretrain/Loss": 2.1027116775512695, "Pretrain/Loss (Raw)": 2.1719210147857666, "Pretrain/Step": 2280, "Pretrain/Step Time": 8.43197956122458} +{"Pretrain/Learning Rate": 4.89546698781272e-05, "Pretrain/Loss": 2.1032869815826416, "Pretrain/Loss (Raw)": 2.1829962730407715, "Pretrain/Step": 2281, "Pretrain/Step Time": 8.435761090368032} +{"Pretrain/Learning Rate": 4.8953454806389066e-05, "Pretrain/Loss": 2.104090690612793, "Pretrain/Loss (Raw)": 2.064161539077759, "Pretrain/Step": 2282, "Pretrain/Step Time": 8.435418410226703} +{"Pretrain/Learning Rate": 4.895223904396995e-05, "Pretrain/Loss": 2.0993902683258057, "Pretrain/Loss (Raw)": 1.727057933807373, "Pretrain/Step": 2283, "Pretrain/Step Time": 8.437891649082303} +{"Pretrain/Learning Rate": 4.895102259090491e-05, "Pretrain/Loss": 2.0989723205566406, "Pretrain/Loss (Raw)": 1.8871128559112549, "Pretrain/Step": 2284, "Pretrain/Step Time": 8.437830150127411} +{"Pretrain/Learning Rate": 4.8949805447229016e-05, "Pretrain/Loss": 2.0993194580078125, "Pretrain/Loss (Raw)": 2.049592971801758, "Pretrain/Step": 2285, "Pretrain/Step Time": 8.436931043863297} +{"Pretrain/Learning Rate": 4.894858761297737e-05, "Pretrain/Loss": 2.09875750541687, "Pretrain/Loss (Raw)": 2.104022264480591, "Pretrain/Step": 2286, "Pretrain/Step Time": 8.434445271268487} +{"Pretrain/Learning Rate": 4.8947369088185075e-05, "Pretrain/Loss": 2.1000685691833496, "Pretrain/Loss (Raw)": 2.2679779529571533, "Pretrain/Step": 2287, "Pretrain/Step Time": 8.439051499590278} +{"Pretrain/Learning Rate": 4.894614987288728e-05, "Pretrain/Loss": 2.0988588333129883, "Pretrain/Loss (Raw)": 1.9917986392974854, "Pretrain/Step": 2288, "Pretrain/Step Time": 8.440303571522236} +{"Pretrain/Learning Rate": 4.894492996711913e-05, "Pretrain/Loss": 2.0974347591400146, "Pretrain/Loss (Raw)": 2.0448250770568848, "Pretrain/Step": 2289, "Pretrain/Step Time": 8.438145328313112} +{"Pretrain/Learning Rate": 4.8943709370915804e-05, "Pretrain/Loss": 2.0962820053100586, "Pretrain/Loss (Raw)": 2.057687997817993, "Pretrain/Step": 2290, "Pretrain/Step Time": 8.437038000673056} +{"Pretrain/Learning Rate": 4.8942488084312496e-05, "Pretrain/Loss": 2.097196102142334, "Pretrain/Loss (Raw)": 2.1050350666046143, "Pretrain/Step": 2291, "Pretrain/Step Time": 8.434399789199233} +{"Pretrain/Learning Rate": 4.894126610734443e-05, "Pretrain/Loss": 2.0966103076934814, "Pretrain/Loss (Raw)": 2.054802417755127, "Pretrain/Step": 2292, "Pretrain/Step Time": 8.433553948998451} +{"Pretrain/Learning Rate": 4.8940043440046837e-05, "Pretrain/Loss": 2.096752643585205, "Pretrain/Loss (Raw)": 1.9951533079147339, "Pretrain/Step": 2293, "Pretrain/Step Time": 8.431555459275842} +{"Pretrain/Learning Rate": 4.893882008245496e-05, "Pretrain/Loss": 2.0962905883789062, "Pretrain/Loss (Raw)": 2.0387349128723145, "Pretrain/Step": 2294, "Pretrain/Step Time": 8.432654298841953} +{"Pretrain/Learning Rate": 4.893759603460408e-05, "Pretrain/Loss": 2.0963311195373535, "Pretrain/Loss (Raw)": 2.1391966342926025, "Pretrain/Step": 2295, "Pretrain/Step Time": 8.428765749558806} +{"Pretrain/Learning Rate": 4.893637129652949e-05, "Pretrain/Loss": 2.096571445465088, "Pretrain/Loss (Raw)": 2.0838661193847656, "Pretrain/Step": 2296, "Pretrain/Step Time": 8.426921654492617} +{"Pretrain/Learning Rate": 4.893514586826652e-05, "Pretrain/Loss": 2.097012996673584, "Pretrain/Loss (Raw)": 2.08074688911438, "Pretrain/Step": 2297, "Pretrain/Step Time": 8.4231699090451} +{"Pretrain/Learning Rate": 4.893391974985048e-05, "Pretrain/Loss": 2.0980224609375, "Pretrain/Loss (Raw)": 2.2458906173706055, "Pretrain/Step": 2298, "Pretrain/Step Time": 8.426514968276024} +{"Pretrain/Learning Rate": 4.8932692941316745e-05, "Pretrain/Loss": 2.099846839904785, "Pretrain/Loss (Raw)": 2.3181710243225098, "Pretrain/Step": 2299, "Pretrain/Step Time": 8.431582797318697} +{"Pretrain/Learning Rate": 4.8931465442700674e-05, "Pretrain/Loss": 2.0972185134887695, "Pretrain/Loss (Raw)": 2.028041124343872, "Pretrain/Step": 2300, "Pretrain/Step Time": 8.432788519188762} +{"Pretrain/Learning Rate": 4.893023725403767e-05, "Pretrain/Loss": 2.096268653869629, "Pretrain/Loss (Raw)": 1.946128249168396, "Pretrain/Step": 2301, "Pretrain/Step Time": 8.430001379922032} +{"Pretrain/Learning Rate": 4.892900837536315e-05, "Pretrain/Loss": 2.0947461128234863, "Pretrain/Loss (Raw)": 2.1777114868164062, "Pretrain/Step": 2302, "Pretrain/Step Time": 8.422806926071644} +{"Pretrain/Learning Rate": 4.8927778806712535e-05, "Pretrain/Loss": 2.093113422393799, "Pretrain/Loss (Raw)": 1.9367645978927612, "Pretrain/Step": 2303, "Pretrain/Step Time": 8.427192321047187} +{"Pretrain/Learning Rate": 4.8926548548121286e-05, "Pretrain/Loss": 2.0894007682800293, "Pretrain/Loss (Raw)": 1.7835350036621094, "Pretrain/Step": 2304, "Pretrain/Step Time": 8.431855164468288} +{"Pretrain/Learning Rate": 4.8925317599624886e-05, "Pretrain/Loss": 2.0881683826446533, "Pretrain/Loss (Raw)": 1.9578924179077148, "Pretrain/Step": 2305, "Pretrain/Step Time": 8.429754255339503} +{"Pretrain/Learning Rate": 4.892408596125881e-05, "Pretrain/Loss": 2.0887503623962402, "Pretrain/Loss (Raw)": 2.156017541885376, "Pretrain/Step": 2306, "Pretrain/Step Time": 8.423021357506514} +{"Pretrain/Learning Rate": 4.8922853633058584e-05, "Pretrain/Loss": 2.089378833770752, "Pretrain/Loss (Raw)": 2.0379128456115723, "Pretrain/Step": 2307, "Pretrain/Step Time": 8.42428333684802} +{"Pretrain/Learning Rate": 4.892162061505974e-05, "Pretrain/Loss": 2.089048385620117, "Pretrain/Loss (Raw)": 1.9915683269500732, "Pretrain/Step": 2308, "Pretrain/Step Time": 8.418255887925625} +{"Pretrain/Learning Rate": 4.892038690729782e-05, "Pretrain/Loss": 2.090000629425049, "Pretrain/Loss (Raw)": 2.05853009223938, "Pretrain/Step": 2309, "Pretrain/Step Time": 8.412650104612112} +{"Pretrain/Learning Rate": 4.891915250980842e-05, "Pretrain/Loss": 2.089365005493164, "Pretrain/Loss (Raw)": 2.0502262115478516, "Pretrain/Step": 2310, "Pretrain/Step Time": 8.41942435130477} +{"Pretrain/Learning Rate": 4.891791742262711e-05, "Pretrain/Loss": 2.0856621265411377, "Pretrain/Loss (Raw)": 1.71971595287323, "Pretrain/Step": 2311, "Pretrain/Step Time": 8.421728316694498} +{"Pretrain/Learning Rate": 4.8916681645789507e-05, "Pretrain/Loss": 2.0874314308166504, "Pretrain/Loss (Raw)": 2.288837432861328, "Pretrain/Step": 2312, "Pretrain/Step Time": 8.42084858007729} +{"Pretrain/Learning Rate": 4.891544517933127e-05, "Pretrain/Loss": 2.0856480598449707, "Pretrain/Loss (Raw)": 1.849928617477417, "Pretrain/Step": 2313, "Pretrain/Step Time": 8.42108473367989} +{"Pretrain/Learning Rate": 4.891420802328801e-05, "Pretrain/Loss": 2.0863499641418457, "Pretrain/Loss (Raw)": 2.2481892108917236, "Pretrain/Step": 2314, "Pretrain/Step Time": 8.42016877233982} +{"Pretrain/Learning Rate": 4.8912970177695426e-05, "Pretrain/Loss": 2.0847437381744385, "Pretrain/Loss (Raw)": 2.011558771133423, "Pretrain/Step": 2315, "Pretrain/Step Time": 8.419843923300505} +{"Pretrain/Learning Rate": 4.8911731642589205e-05, "Pretrain/Loss": 2.0831189155578613, "Pretrain/Loss (Raw)": 1.9428279399871826, "Pretrain/Step": 2316, "Pretrain/Step Time": 8.420087041333318} +{"Pretrain/Learning Rate": 4.891049241800506e-05, "Pretrain/Loss": 2.0850698947906494, "Pretrain/Loss (Raw)": 2.2136220932006836, "Pretrain/Step": 2317, "Pretrain/Step Time": 8.417401917278767} +{"Pretrain/Learning Rate": 4.890925250397872e-05, "Pretrain/Loss": 2.0838704109191895, "Pretrain/Loss (Raw)": 1.9655745029449463, "Pretrain/Step": 2318, "Pretrain/Step Time": 8.414291536435485} +{"Pretrain/Learning Rate": 4.890801190054594e-05, "Pretrain/Loss": 2.0836000442504883, "Pretrain/Loss (Raw)": 2.122195243835449, "Pretrain/Step": 2319, "Pretrain/Step Time": 8.416057286784053} +{"Pretrain/Learning Rate": 4.890677060774249e-05, "Pretrain/Loss": 2.084271192550659, "Pretrain/Loss (Raw)": 2.1627023220062256, "Pretrain/Step": 2320, "Pretrain/Step Time": 8.420881340280175} +{"Pretrain/Learning Rate": 4.890552862560416e-05, "Pretrain/Loss": 2.0856611728668213, "Pretrain/Loss (Raw)": 2.2783873081207275, "Pretrain/Step": 2321, "Pretrain/Step Time": 8.42059021256864} +{"Pretrain/Learning Rate": 4.890428595416677e-05, "Pretrain/Loss": 2.0877037048339844, "Pretrain/Loss (Raw)": 2.2884271144866943, "Pretrain/Step": 2322, "Pretrain/Step Time": 8.421202166005969} +{"Pretrain/Learning Rate": 4.8903042593466144e-05, "Pretrain/Loss": 2.085460662841797, "Pretrain/Loss (Raw)": 1.999722957611084, "Pretrain/Step": 2323, "Pretrain/Step Time": 8.417835922911763} +{"Pretrain/Learning Rate": 4.8901798543538136e-05, "Pretrain/Loss": 2.087493419647217, "Pretrain/Loss (Raw)": 2.1266937255859375, "Pretrain/Step": 2324, "Pretrain/Step Time": 8.413447979837656} +{"Pretrain/Learning Rate": 4.8900553804418613e-05, "Pretrain/Loss": 2.0870423316955566, "Pretrain/Loss (Raw)": 2.050968885421753, "Pretrain/Step": 2325, "Pretrain/Step Time": 8.40775441005826} +{"Pretrain/Learning Rate": 4.889930837614347e-05, "Pretrain/Loss": 2.087717056274414, "Pretrain/Loss (Raw)": 2.0730035305023193, "Pretrain/Step": 2326, "Pretrain/Step Time": 8.409117318689823} +{"Pretrain/Learning Rate": 4.8898062258748624e-05, "Pretrain/Loss": 2.0883545875549316, "Pretrain/Loss (Raw)": 2.0623927116394043, "Pretrain/Step": 2327, "Pretrain/Step Time": 8.41027177684009} +{"Pretrain/Learning Rate": 4.889681545226999e-05, "Pretrain/Loss": 2.089315414428711, "Pretrain/Loss (Raw)": 2.232424259185791, "Pretrain/Step": 2328, "Pretrain/Step Time": 8.4149430077523} +{"Pretrain/Learning Rate": 4.889556795674354e-05, "Pretrain/Loss": 2.089235305786133, "Pretrain/Loss (Raw)": 2.0224082469940186, "Pretrain/Step": 2329, "Pretrain/Step Time": 8.415585046634078} +{"Pretrain/Learning Rate": 4.8894319772205226e-05, "Pretrain/Loss": 2.085953712463379, "Pretrain/Loss (Raw)": 1.9131728410720825, "Pretrain/Step": 2330, "Pretrain/Step Time": 8.41347829438746} +{"Pretrain/Learning Rate": 4.889307089869105e-05, "Pretrain/Loss": 2.0877177715301514, "Pretrain/Loss (Raw)": 2.179145574569702, "Pretrain/Step": 2331, "Pretrain/Step Time": 8.412634851410985} +{"Pretrain/Learning Rate": 4.8891821336237015e-05, "Pretrain/Loss": 2.0887274742126465, "Pretrain/Loss (Raw)": 2.0334620475769043, "Pretrain/Step": 2332, "Pretrain/Step Time": 8.415496887639165} +{"Pretrain/Learning Rate": 4.8890571084879155e-05, "Pretrain/Loss": 2.0889205932617188, "Pretrain/Loss (Raw)": 2.0056843757629395, "Pretrain/Step": 2333, "Pretrain/Step Time": 8.41803384386003} +{"Pretrain/Learning Rate": 4.888932014465352e-05, "Pretrain/Loss": 2.0907297134399414, "Pretrain/Loss (Raw)": 2.2959957122802734, "Pretrain/Step": 2334, "Pretrain/Step Time": 8.412814311683178} +{"Pretrain/Learning Rate": 4.888806851559618e-05, "Pretrain/Loss": 2.09098744392395, "Pretrain/Loss (Raw)": 1.8262832164764404, "Pretrain/Step": 2335, "Pretrain/Step Time": 8.413775620982051} +{"Pretrain/Learning Rate": 4.888681619774322e-05, "Pretrain/Loss": 2.091975212097168, "Pretrain/Loss (Raw)": 2.228632926940918, "Pretrain/Step": 2336, "Pretrain/Step Time": 8.416053898632526} +{"Pretrain/Learning Rate": 4.888556319113076e-05, "Pretrain/Loss": 2.090571880340576, "Pretrain/Loss (Raw)": 1.9654245376586914, "Pretrain/Step": 2337, "Pretrain/Step Time": 8.421489706262946} +{"Pretrain/Learning Rate": 4.888430949579492e-05, "Pretrain/Loss": 2.0894713401794434, "Pretrain/Loss (Raw)": 1.9542025327682495, "Pretrain/Step": 2338, "Pretrain/Step Time": 8.419678078964353} +{"Pretrain/Learning Rate": 4.8883055111771855e-05, "Pretrain/Loss": 2.0906004905700684, "Pretrain/Loss (Raw)": 2.2455973625183105, "Pretrain/Step": 2339, "Pretrain/Step Time": 8.41834138520062} +{"Pretrain/Learning Rate": 4.8881800039097737e-05, "Pretrain/Loss": 2.091644525527954, "Pretrain/Loss (Raw)": 2.1607396602630615, "Pretrain/Step": 2340, "Pretrain/Step Time": 8.412919519469142} +{"Pretrain/Learning Rate": 4.8880544277808735e-05, "Pretrain/Loss": 2.0915167331695557, "Pretrain/Loss (Raw)": 2.0542213916778564, "Pretrain/Step": 2341, "Pretrain/Step Time": 8.4115284755826} +{"Pretrain/Learning Rate": 4.887928782794109e-05, "Pretrain/Loss": 2.0914087295532227, "Pretrain/Loss (Raw)": 2.184288501739502, "Pretrain/Step": 2342, "Pretrain/Step Time": 8.40626635029912} +{"Pretrain/Learning Rate": 4.887803068953101e-05, "Pretrain/Loss": 2.092668056488037, "Pretrain/Loss (Raw)": 2.0977046489715576, "Pretrain/Step": 2343, "Pretrain/Step Time": 8.408768989145756} +{"Pretrain/Learning Rate": 4.887677286261474e-05, "Pretrain/Loss": 2.092139482498169, "Pretrain/Loss (Raw)": 2.0995547771453857, "Pretrain/Step": 2344, "Pretrain/Step Time": 8.411006515845656} +{"Pretrain/Learning Rate": 4.887551434722857e-05, "Pretrain/Loss": 2.090867519378662, "Pretrain/Loss (Raw)": 1.9670993089675903, "Pretrain/Step": 2345, "Pretrain/Step Time": 8.413748430088162} +{"Pretrain/Learning Rate": 4.887425514340877e-05, "Pretrain/Loss": 2.0918664932250977, "Pretrain/Loss (Raw)": 2.020153284072876, "Pretrain/Step": 2346, "Pretrain/Step Time": 8.417554905638099} +{"Pretrain/Learning Rate": 4.887299525119164e-05, "Pretrain/Loss": 2.0907626152038574, "Pretrain/Loss (Raw)": 2.0676045417785645, "Pretrain/Step": 2347, "Pretrain/Step Time": 8.41271609812975} +{"Pretrain/Learning Rate": 4.8871734670613536e-05, "Pretrain/Loss": 2.092468738555908, "Pretrain/Loss (Raw)": 2.3411636352539062, "Pretrain/Step": 2348, "Pretrain/Step Time": 8.416378181427717} +{"Pretrain/Learning Rate": 4.887047340171078e-05, "Pretrain/Loss": 2.0934810638427734, "Pretrain/Loss (Raw)": 2.2028563022613525, "Pretrain/Step": 2349, "Pretrain/Step Time": 8.416614521294832} +{"Pretrain/Learning Rate": 4.8869211444519767e-05, "Pretrain/Loss": 2.092095136642456, "Pretrain/Loss (Raw)": 1.9985756874084473, "Pretrain/Step": 2350, "Pretrain/Step Time": 8.416406584903598} +{"Pretrain/Learning Rate": 4.8867948799076854e-05, "Pretrain/Loss": 2.0901873111724854, "Pretrain/Loss (Raw)": 1.9305616617202759, "Pretrain/Step": 2351, "Pretrain/Step Time": 8.415097169578075} +{"Pretrain/Learning Rate": 4.886668546541847e-05, "Pretrain/Loss": 2.090178966522217, "Pretrain/Loss (Raw)": 2.156275987625122, "Pretrain/Step": 2352, "Pretrain/Step Time": 8.413859723135829} +{"Pretrain/Learning Rate": 4.8865421443581036e-05, "Pretrain/Loss": 2.089280128479004, "Pretrain/Loss (Raw)": 2.0219361782073975, "Pretrain/Step": 2353, "Pretrain/Step Time": 8.416231965646148} +{"Pretrain/Learning Rate": 4.8864156733601e-05, "Pretrain/Loss": 2.0877761840820312, "Pretrain/Loss (Raw)": 1.7148038148880005, "Pretrain/Step": 2354, "Pretrain/Step Time": 8.418129369616508} +{"Pretrain/Learning Rate": 4.8862891335514824e-05, "Pretrain/Loss": 2.090087890625, "Pretrain/Loss (Raw)": 2.0947065353393555, "Pretrain/Step": 2355, "Pretrain/Step Time": 8.418070470914245} +{"Pretrain/Learning Rate": 4.886162524935899e-05, "Pretrain/Loss": 2.0892457962036133, "Pretrain/Loss (Raw)": 1.986478567123413, "Pretrain/Step": 2356, "Pretrain/Step Time": 8.415416738018394} +{"Pretrain/Learning Rate": 4.886035847517003e-05, "Pretrain/Loss": 2.0896944999694824, "Pretrain/Loss (Raw)": 2.0833747386932373, "Pretrain/Step": 2357, "Pretrain/Step Time": 8.413235234096646} +{"Pretrain/Learning Rate": 4.885909101298444e-05, "Pretrain/Loss": 2.088319778442383, "Pretrain/Loss (Raw)": 1.840396761894226, "Pretrain/Step": 2358, "Pretrain/Step Time": 8.41054112650454} +{"Pretrain/Learning Rate": 4.8857822862838784e-05, "Pretrain/Loss": 2.0895118713378906, "Pretrain/Loss (Raw)": 2.1350395679473877, "Pretrain/Step": 2359, "Pretrain/Step Time": 8.41272123157978} +{"Pretrain/Learning Rate": 4.885655402476963e-05, "Pretrain/Loss": 2.0875909328460693, "Pretrain/Loss (Raw)": 1.9187486171722412, "Pretrain/Step": 2360, "Pretrain/Step Time": 8.40976413153112} +{"Pretrain/Learning Rate": 4.885528449881356e-05, "Pretrain/Loss": 2.0856528282165527, "Pretrain/Loss (Raw)": 2.0426995754241943, "Pretrain/Step": 2361, "Pretrain/Step Time": 8.41573180258274} +{"Pretrain/Learning Rate": 4.8854014285007175e-05, "Pretrain/Loss": 2.0868959426879883, "Pretrain/Loss (Raw)": 2.1041853427886963, "Pretrain/Step": 2362, "Pretrain/Step Time": 8.418258484452963} +{"Pretrain/Learning Rate": 4.88527433833871e-05, "Pretrain/Loss": 2.0871167182922363, "Pretrain/Loss (Raw)": 2.1901159286499023, "Pretrain/Step": 2363, "Pretrain/Step Time": 8.415162831544876} +{"Pretrain/Learning Rate": 4.885147179398999e-05, "Pretrain/Loss": 2.088592529296875, "Pretrain/Loss (Raw)": 2.125746726989746, "Pretrain/Step": 2364, "Pretrain/Step Time": 8.40940142981708} +{"Pretrain/Learning Rate": 4.8850199516852504e-05, "Pretrain/Loss": 2.087728977203369, "Pretrain/Loss (Raw)": 2.034188985824585, "Pretrain/Step": 2365, "Pretrain/Step Time": 8.414456095546484} +{"Pretrain/Learning Rate": 4.884892655201132e-05, "Pretrain/Loss": 2.0836682319641113, "Pretrain/Loss (Raw)": 1.8003557920455933, "Pretrain/Step": 2366, "Pretrain/Step Time": 8.413583222776651} +{"Pretrain/Learning Rate": 4.884765289950316e-05, "Pretrain/Loss": 2.0843164920806885, "Pretrain/Loss (Raw)": 2.2512168884277344, "Pretrain/Step": 2367, "Pretrain/Step Time": 8.413091786205769} +{"Pretrain/Learning Rate": 4.8846378559364736e-05, "Pretrain/Loss": 2.0811820030212402, "Pretrain/Loss (Raw)": 1.9560635089874268, "Pretrain/Step": 2368, "Pretrain/Step Time": 8.416332671418786} +{"Pretrain/Learning Rate": 4.8845103531632795e-05, "Pretrain/Loss": 2.081465721130371, "Pretrain/Loss (Raw)": 2.1431024074554443, "Pretrain/Step": 2369, "Pretrain/Step Time": 8.418230891227722} +{"Pretrain/Learning Rate": 4.884382781634411e-05, "Pretrain/Loss": 2.078552484512329, "Pretrain/Loss (Raw)": 2.039156913757324, "Pretrain/Step": 2370, "Pretrain/Step Time": 8.41623349301517} +{"Pretrain/Learning Rate": 4.8842551413535456e-05, "Pretrain/Loss": 2.0763614177703857, "Pretrain/Loss (Raw)": 1.9660651683807373, "Pretrain/Step": 2371, "Pretrain/Step Time": 8.417621864005923} +{"Pretrain/Learning Rate": 4.884127432324364e-05, "Pretrain/Loss": 2.0769622325897217, "Pretrain/Loss (Raw)": 1.9878623485565186, "Pretrain/Step": 2372, "Pretrain/Step Time": 8.414564279839396} +{"Pretrain/Learning Rate": 4.8839996545505483e-05, "Pretrain/Loss": 2.0781333446502686, "Pretrain/Loss (Raw)": 2.3217971324920654, "Pretrain/Step": 2373, "Pretrain/Step Time": 8.413540998473763} +{"Pretrain/Learning Rate": 4.883871808035784e-05, "Pretrain/Loss": 2.0791118144989014, "Pretrain/Loss (Raw)": 2.216627836227417, "Pretrain/Step": 2374, "Pretrain/Step Time": 8.412111952900887} +{"Pretrain/Learning Rate": 4.883743892783756e-05, "Pretrain/Loss": 2.079623222351074, "Pretrain/Loss (Raw)": 2.221829414367676, "Pretrain/Step": 2375, "Pretrain/Step Time": 8.407523905858397} +{"Pretrain/Learning Rate": 4.8836159087981535e-05, "Pretrain/Loss": 2.077700138092041, "Pretrain/Loss (Raw)": 1.9563034772872925, "Pretrain/Step": 2376, "Pretrain/Step Time": 8.407365024089813} +{"Pretrain/Learning Rate": 4.883487856082666e-05, "Pretrain/Loss": 2.0793533325195312, "Pretrain/Loss (Raw)": 2.1535544395446777, "Pretrain/Step": 2377, "Pretrain/Step Time": 8.408762017264962} +{"Pretrain/Learning Rate": 4.883359734640987e-05, "Pretrain/Loss": 2.0792016983032227, "Pretrain/Loss (Raw)": 2.06496262550354, "Pretrain/Step": 2378, "Pretrain/Step Time": 8.414645349606872} +{"Pretrain/Learning Rate": 4.883231544476811e-05, "Pretrain/Loss": 2.0817713737487793, "Pretrain/Loss (Raw)": 2.3649423122406006, "Pretrain/Step": 2379, "Pretrain/Step Time": 8.411184197291732} +{"Pretrain/Learning Rate": 4.883103285593832e-05, "Pretrain/Loss": 2.080954074859619, "Pretrain/Loss (Raw)": 2.032639980316162, "Pretrain/Step": 2380, "Pretrain/Step Time": 8.410389063879848} +{"Pretrain/Learning Rate": 4.88297495799575e-05, "Pretrain/Loss": 2.0796589851379395, "Pretrain/Loss (Raw)": 1.9983068704605103, "Pretrain/Step": 2381, "Pretrain/Step Time": 8.41174403950572} +{"Pretrain/Learning Rate": 4.882846561686265e-05, "Pretrain/Loss": 2.0775630474090576, "Pretrain/Loss (Raw)": 2.0479393005371094, "Pretrain/Step": 2382, "Pretrain/Step Time": 8.406361155211926} +{"Pretrain/Learning Rate": 4.88271809666908e-05, "Pretrain/Loss": 2.077139377593994, "Pretrain/Loss (Raw)": 2.00730299949646, "Pretrain/Step": 2383, "Pretrain/Step Time": 8.406841171905398} +{"Pretrain/Learning Rate": 4.882589562947898e-05, "Pretrain/Loss": 2.0754261016845703, "Pretrain/Loss (Raw)": 1.951887845993042, "Pretrain/Step": 2384, "Pretrain/Step Time": 8.405865032225847} +{"Pretrain/Learning Rate": 4.882460960526425e-05, "Pretrain/Loss": 2.075904369354248, "Pretrain/Loss (Raw)": 2.072093963623047, "Pretrain/Step": 2385, "Pretrain/Step Time": 8.407609039917588} +{"Pretrain/Learning Rate": 4.88233228940837e-05, "Pretrain/Loss": 2.073634624481201, "Pretrain/Loss (Raw)": 1.8100157976150513, "Pretrain/Step": 2386, "Pretrain/Step Time": 8.410584408789873} +{"Pretrain/Learning Rate": 4.8822035495974433e-05, "Pretrain/Loss": 2.072676658630371, "Pretrain/Loss (Raw)": 2.0196259021759033, "Pretrain/Step": 2387, "Pretrain/Step Time": 8.410289974883199} +{"Pretrain/Learning Rate": 4.882074741097357e-05, "Pretrain/Loss": 2.070265293121338, "Pretrain/Loss (Raw)": 1.999674677848816, "Pretrain/Step": 2388, "Pretrain/Step Time": 8.410354917868972} +{"Pretrain/Learning Rate": 4.8819458639118235e-05, "Pretrain/Loss": 2.0705008506774902, "Pretrain/Loss (Raw)": 2.083566665649414, "Pretrain/Step": 2389, "Pretrain/Step Time": 8.403917334973812} +{"Pretrain/Learning Rate": 4.8818169180445605e-05, "Pretrain/Loss": 2.0705924034118652, "Pretrain/Loss (Raw)": 2.1841349601745605, "Pretrain/Step": 2390, "Pretrain/Step Time": 8.405480766668916} +{"Pretrain/Learning Rate": 4.881687903499286e-05, "Pretrain/Loss": 2.0709519386291504, "Pretrain/Loss (Raw)": 2.1628403663635254, "Pretrain/Step": 2391, "Pretrain/Step Time": 8.402224529534578} +{"Pretrain/Learning Rate": 4.8815588202797205e-05, "Pretrain/Loss": 2.0722174644470215, "Pretrain/Loss (Raw)": 2.1017565727233887, "Pretrain/Step": 2392, "Pretrain/Step Time": 8.403576165437698} +{"Pretrain/Learning Rate": 4.8814296683895845e-05, "Pretrain/Loss": 2.071812152862549, "Pretrain/Loss (Raw)": 1.9957460165023804, "Pretrain/Step": 2393, "Pretrain/Step Time": 8.405774638056755} +{"Pretrain/Learning Rate": 4.881300447832602e-05, "Pretrain/Loss": 2.072279691696167, "Pretrain/Loss (Raw)": 2.0440897941589355, "Pretrain/Step": 2394, "Pretrain/Step Time": 8.410252435132861} +{"Pretrain/Learning Rate": 4.881171158612501e-05, "Pretrain/Loss": 2.074916362762451, "Pretrain/Loss (Raw)": 2.260162591934204, "Pretrain/Step": 2395, "Pretrain/Step Time": 8.405360909178853} +{"Pretrain/Learning Rate": 4.8810418007330086e-05, "Pretrain/Loss": 2.07293438911438, "Pretrain/Loss (Raw)": 1.8680118322372437, "Pretrain/Step": 2396, "Pretrain/Step Time": 8.404311709105968} +{"Pretrain/Learning Rate": 4.880912374197854e-05, "Pretrain/Loss": 2.0738818645477295, "Pretrain/Loss (Raw)": 2.0653088092803955, "Pretrain/Step": 2397, "Pretrain/Step Time": 8.40330771356821} +{"Pretrain/Learning Rate": 4.880782879010769e-05, "Pretrain/Loss": 2.073993682861328, "Pretrain/Loss (Raw)": 2.134600877761841, "Pretrain/Step": 2398, "Pretrain/Step Time": 8.403480818495154} +{"Pretrain/Learning Rate": 4.880653315175488e-05, "Pretrain/Loss": 2.071275472640991, "Pretrain/Loss (Raw)": 1.8459326028823853, "Pretrain/Step": 2399, "Pretrain/Step Time": 8.401204185560346} +{"Pretrain/Learning Rate": 4.880523682695747e-05, "Pretrain/Loss": 2.070186138153076, "Pretrain/Loss (Raw)": 2.150057315826416, "Pretrain/Step": 2400, "Pretrain/Step Time": 8.40430703945458} +{"Pretrain/Learning Rate": 4.880393981575284e-05, "Pretrain/Loss": 2.0694923400878906, "Pretrain/Loss (Raw)": 1.9952020645141602, "Pretrain/Step": 2401, "Pretrain/Step Time": 8.404644101858139} +{"Pretrain/Learning Rate": 4.880264211817839e-05, "Pretrain/Loss": 2.0705549716949463, "Pretrain/Loss (Raw)": 2.0989913940429688, "Pretrain/Step": 2402, "Pretrain/Step Time": 8.404412798583508} +{"Pretrain/Learning Rate": 4.8801343734271524e-05, "Pretrain/Loss": 2.06854510307312, "Pretrain/Loss (Raw)": 1.8820492029190063, "Pretrain/Step": 2403, "Pretrain/Step Time": 8.410802165046334} +{"Pretrain/Learning Rate": 4.88000446640697e-05, "Pretrain/Loss": 2.066617250442505, "Pretrain/Loss (Raw)": 2.044935703277588, "Pretrain/Step": 2404, "Pretrain/Step Time": 8.41330711171031} +{"Pretrain/Learning Rate": 4.879874490761036e-05, "Pretrain/Loss": 2.066470146179199, "Pretrain/Loss (Raw)": 2.1212947368621826, "Pretrain/Step": 2405, "Pretrain/Step Time": 8.409119768068194} +{"Pretrain/Learning Rate": 4.879744446493099e-05, "Pretrain/Loss": 2.065809488296509, "Pretrain/Loss (Raw)": 2.0681467056274414, "Pretrain/Step": 2406, "Pretrain/Step Time": 8.408374344930053} +{"Pretrain/Learning Rate": 4.8796143336069086e-05, "Pretrain/Loss": 2.0637049674987793, "Pretrain/Loss (Raw)": 2.048612356185913, "Pretrain/Step": 2407, "Pretrain/Step Time": 8.41072759218514} +{"Pretrain/Learning Rate": 4.8794841521062165e-05, "Pretrain/Loss": 2.0612173080444336, "Pretrain/Loss (Raw)": 1.8534713983535767, "Pretrain/Step": 2408, "Pretrain/Step Time": 8.409747553989291} +{"Pretrain/Learning Rate": 4.879353901994777e-05, "Pretrain/Loss": 2.059833526611328, "Pretrain/Loss (Raw)": 2.0058867931365967, "Pretrain/Step": 2409, "Pretrain/Step Time": 8.409793620929122} +{"Pretrain/Learning Rate": 4.8792235832763436e-05, "Pretrain/Loss": 2.0594675540924072, "Pretrain/Loss (Raw)": 2.0173285007476807, "Pretrain/Step": 2410, "Pretrain/Step Time": 8.410226358100772} +{"Pretrain/Learning Rate": 4.879093195954676e-05, "Pretrain/Loss": 2.0615134239196777, "Pretrain/Loss (Raw)": 1.9888981580734253, "Pretrain/Step": 2411, "Pretrain/Step Time": 8.409852348268032} +{"Pretrain/Learning Rate": 4.878962740033533e-05, "Pretrain/Loss": 2.062607765197754, "Pretrain/Loss (Raw)": 2.0271990299224854, "Pretrain/Step": 2412, "Pretrain/Step Time": 8.410213934257627} +{"Pretrain/Learning Rate": 4.878832215516677e-05, "Pretrain/Loss": 2.062710762023926, "Pretrain/Loss (Raw)": 2.062803268432617, "Pretrain/Step": 2413, "Pretrain/Step Time": 8.409085463732481} +{"Pretrain/Learning Rate": 4.8787016224078706e-05, "Pretrain/Loss": 2.0626277923583984, "Pretrain/Loss (Raw)": 2.093358039855957, "Pretrain/Step": 2414, "Pretrain/Step Time": 8.406195625662804} +{"Pretrain/Learning Rate": 4.87857096071088e-05, "Pretrain/Loss": 2.0597481727600098, "Pretrain/Loss (Raw)": 1.8993821144104004, "Pretrain/Step": 2415, "Pretrain/Step Time": 8.408816369250417} +{"Pretrain/Learning Rate": 4.878440230429472e-05, "Pretrain/Loss": 2.0597457885742188, "Pretrain/Loss (Raw)": 1.9914971590042114, "Pretrain/Step": 2416, "Pretrain/Step Time": 8.406528480350971} +{"Pretrain/Learning Rate": 4.878309431567417e-05, "Pretrain/Loss": 2.0606284141540527, "Pretrain/Loss (Raw)": 2.1578471660614014, "Pretrain/Step": 2417, "Pretrain/Step Time": 8.409526288509369} +{"Pretrain/Learning Rate": 4.878178564128486e-05, "Pretrain/Loss": 2.0624988079071045, "Pretrain/Loss (Raw)": 2.2970869541168213, "Pretrain/Step": 2418, "Pretrain/Step Time": 8.411459824070334} +{"Pretrain/Learning Rate": 4.8780476281164536e-05, "Pretrain/Loss": 2.062509298324585, "Pretrain/Loss (Raw)": 2.106367826461792, "Pretrain/Step": 2419, "Pretrain/Step Time": 8.414130685850978} +{"Pretrain/Learning Rate": 4.877916623535094e-05, "Pretrain/Loss": 2.0639383792877197, "Pretrain/Loss (Raw)": 2.2377231121063232, "Pretrain/Step": 2420, "Pretrain/Step Time": 8.414215037599206} +{"Pretrain/Learning Rate": 4.877785550388184e-05, "Pretrain/Loss": 2.0657618045806885, "Pretrain/Loss (Raw)": 2.2285726070404053, "Pretrain/Step": 2421, "Pretrain/Step Time": 8.412290131673217} +{"Pretrain/Learning Rate": 4.877654408679504e-05, "Pretrain/Loss": 2.0652706623077393, "Pretrain/Loss (Raw)": 1.975836992263794, "Pretrain/Step": 2422, "Pretrain/Step Time": 8.411634115502238} +{"Pretrain/Learning Rate": 4.877523198412836e-05, "Pretrain/Loss": 2.064553737640381, "Pretrain/Loss (Raw)": 2.0474252700805664, "Pretrain/Step": 2423, "Pretrain/Step Time": 8.414249243214726} +{"Pretrain/Learning Rate": 4.877391919591962e-05, "Pretrain/Loss": 2.06471848487854, "Pretrain/Loss (Raw)": 2.1049745082855225, "Pretrain/Step": 2424, "Pretrain/Step Time": 8.414012970402837} +{"Pretrain/Learning Rate": 4.877260572220668e-05, "Pretrain/Loss": 2.063699245452881, "Pretrain/Loss (Raw)": 1.9502849578857422, "Pretrain/Step": 2425, "Pretrain/Step Time": 8.417940478771925} +{"Pretrain/Learning Rate": 4.877129156302741e-05, "Pretrain/Loss": 2.0610408782958984, "Pretrain/Loss (Raw)": 1.905640721321106, "Pretrain/Step": 2426, "Pretrain/Step Time": 8.415858570486307} +{"Pretrain/Learning Rate": 4.8769976718419705e-05, "Pretrain/Loss": 2.060070514678955, "Pretrain/Loss (Raw)": 2.1939194202423096, "Pretrain/Step": 2427, "Pretrain/Step Time": 8.415459146723151} +{"Pretrain/Learning Rate": 4.876866118842149e-05, "Pretrain/Loss": 2.063554525375366, "Pretrain/Loss (Raw)": 2.4740214347839355, "Pretrain/Step": 2428, "Pretrain/Step Time": 8.41572642326355} +{"Pretrain/Learning Rate": 4.8767344973070674e-05, "Pretrain/Loss": 2.06449556350708, "Pretrain/Loss (Raw)": 2.066577672958374, "Pretrain/Step": 2429, "Pretrain/Step Time": 8.41804669611156} +{"Pretrain/Learning Rate": 4.876602807240522e-05, "Pretrain/Loss": 2.0636160373687744, "Pretrain/Loss (Raw)": 2.065122127532959, "Pretrain/Step": 2430, "Pretrain/Step Time": 8.417224979028106} +{"Pretrain/Learning Rate": 4.876471048646311e-05, "Pretrain/Loss": 2.0646142959594727, "Pretrain/Loss (Raw)": 2.064558982849121, "Pretrain/Step": 2431, "Pretrain/Step Time": 8.417660588398576} +{"Pretrain/Learning Rate": 4.876339221528232e-05, "Pretrain/Loss": 2.06592059135437, "Pretrain/Loss (Raw)": 1.9507319927215576, "Pretrain/Step": 2432, "Pretrain/Step Time": 8.415692897513509} +{"Pretrain/Learning Rate": 4.876207325890086e-05, "Pretrain/Loss": 2.067279815673828, "Pretrain/Loss (Raw)": 2.131875991821289, "Pretrain/Step": 2433, "Pretrain/Step Time": 8.41551711410284} +{"Pretrain/Learning Rate": 4.8760753617356786e-05, "Pretrain/Loss": 2.06443452835083, "Pretrain/Loss (Raw)": 1.791810393333435, "Pretrain/Step": 2434, "Pretrain/Step Time": 8.41670191846788} +{"Pretrain/Learning Rate": 4.8759433290688124e-05, "Pretrain/Loss": 2.0639092922210693, "Pretrain/Loss (Raw)": 1.9706830978393555, "Pretrain/Step": 2435, "Pretrain/Step Time": 8.417533656582236} +{"Pretrain/Learning Rate": 4.8758112278932946e-05, "Pretrain/Loss": 2.0633163452148438, "Pretrain/Loss (Raw)": 1.9156572818756104, "Pretrain/Step": 2436, "Pretrain/Step Time": 8.420751729980111} +{"Pretrain/Learning Rate": 4.875679058212935e-05, "Pretrain/Loss": 2.0630054473876953, "Pretrain/Loss (Raw)": 2.0187811851501465, "Pretrain/Step": 2437, "Pretrain/Step Time": 8.421118592843413} +{"Pretrain/Learning Rate": 4.8755468200315455e-05, "Pretrain/Loss": 2.0626020431518555, "Pretrain/Loss (Raw)": 1.998564600944519, "Pretrain/Step": 2438, "Pretrain/Step Time": 8.417962342500687} +{"Pretrain/Learning Rate": 4.8754145133529375e-05, "Pretrain/Loss": 2.064451217651367, "Pretrain/Loss (Raw)": 1.9563918113708496, "Pretrain/Step": 2439, "Pretrain/Step Time": 8.413816418498755} +{"Pretrain/Learning Rate": 4.8752821381809265e-05, "Pretrain/Loss": 2.061892032623291, "Pretrain/Loss (Raw)": 1.961276888847351, "Pretrain/Step": 2440, "Pretrain/Step Time": 8.41617733053863} +{"Pretrain/Learning Rate": 4.8751496945193296e-05, "Pretrain/Loss": 2.062324047088623, "Pretrain/Loss (Raw)": 1.9052640199661255, "Pretrain/Step": 2441, "Pretrain/Step Time": 8.416072636842728} +{"Pretrain/Learning Rate": 4.875017182371966e-05, "Pretrain/Loss": 2.061994791030884, "Pretrain/Loss (Raw)": 2.206014633178711, "Pretrain/Step": 2442, "Pretrain/Step Time": 8.414856124669313} +{"Pretrain/Learning Rate": 4.874884601742655e-05, "Pretrain/Loss": 2.0631906986236572, "Pretrain/Loss (Raw)": 2.1646299362182617, "Pretrain/Step": 2443, "Pretrain/Step Time": 8.419124698266387} +{"Pretrain/Learning Rate": 4.874751952635222e-05, "Pretrain/Loss": 2.0646579265594482, "Pretrain/Loss (Raw)": 2.1306307315826416, "Pretrain/Step": 2444, "Pretrain/Step Time": 8.421375520527363} +{"Pretrain/Learning Rate": 4.8746192350534904e-05, "Pretrain/Loss": 2.063047409057617, "Pretrain/Loss (Raw)": 2.007493257522583, "Pretrain/Step": 2445, "Pretrain/Step Time": 8.421089839190245} +{"Pretrain/Learning Rate": 4.8744864490012866e-05, "Pretrain/Loss": 2.0642497539520264, "Pretrain/Loss (Raw)": 2.1194567680358887, "Pretrain/Step": 2446, "Pretrain/Step Time": 8.426756056025624} +{"Pretrain/Learning Rate": 4.87435359448244e-05, "Pretrain/Loss": 2.0623397827148438, "Pretrain/Loss (Raw)": 1.877700924873352, "Pretrain/Step": 2447, "Pretrain/Step Time": 8.424473522230983} +{"Pretrain/Learning Rate": 4.874220671500781e-05, "Pretrain/Loss": 2.062429428100586, "Pretrain/Loss (Raw)": 2.1742148399353027, "Pretrain/Step": 2448, "Pretrain/Step Time": 8.417556092143059} +{"Pretrain/Learning Rate": 4.8740876800601434e-05, "Pretrain/Loss": 2.0605833530426025, "Pretrain/Loss (Raw)": 2.0420892238616943, "Pretrain/Step": 2449, "Pretrain/Step Time": 8.418714562430978} +{"Pretrain/Learning Rate": 4.87395462016436e-05, "Pretrain/Loss": 2.0577027797698975, "Pretrain/Loss (Raw)": 1.9196988344192505, "Pretrain/Step": 2450, "Pretrain/Step Time": 8.416731839999557} +{"Pretrain/Learning Rate": 4.87382149181727e-05, "Pretrain/Loss": 2.0572590827941895, "Pretrain/Loss (Raw)": 1.9429185390472412, "Pretrain/Step": 2451, "Pretrain/Step Time": 8.418475460261106} +{"Pretrain/Learning Rate": 4.87368829502271e-05, "Pretrain/Loss": 2.056994676589966, "Pretrain/Loss (Raw)": 2.0928611755371094, "Pretrain/Step": 2452, "Pretrain/Step Time": 8.420768275856972} +{"Pretrain/Learning Rate": 4.873555029784522e-05, "Pretrain/Loss": 2.057851552963257, "Pretrain/Loss (Raw)": 2.1606733798980713, "Pretrain/Step": 2453, "Pretrain/Step Time": 8.420040432363749} +{"Pretrain/Learning Rate": 4.873421696106548e-05, "Pretrain/Loss": 2.0594675540924072, "Pretrain/Loss (Raw)": 2.2798478603363037, "Pretrain/Step": 2454, "Pretrain/Step Time": 8.417319349944592} +{"Pretrain/Learning Rate": 4.873288293992632e-05, "Pretrain/Loss": 2.0602409839630127, "Pretrain/Loss (Raw)": 2.161360502243042, "Pretrain/Step": 2455, "Pretrain/Step Time": 8.42393884807825} +{"Pretrain/Learning Rate": 4.8731548234466205e-05, "Pretrain/Loss": 2.0613327026367188, "Pretrain/Loss (Raw)": 2.372152090072632, "Pretrain/Step": 2456, "Pretrain/Step Time": 8.41597199626267} +{"Pretrain/Learning Rate": 4.873021284472364e-05, "Pretrain/Loss": 2.0602469444274902, "Pretrain/Loss (Raw)": 1.8834545612335205, "Pretrain/Step": 2457, "Pretrain/Step Time": 8.415079874917865} +{"Pretrain/Learning Rate": 4.8728876770737106e-05, "Pretrain/Loss": 2.0618538856506348, "Pretrain/Loss (Raw)": 2.1188390254974365, "Pretrain/Step": 2458, "Pretrain/Step Time": 8.420727614313364} +{"Pretrain/Learning Rate": 4.872754001254515e-05, "Pretrain/Loss": 2.060171127319336, "Pretrain/Loss (Raw)": 1.963762640953064, "Pretrain/Step": 2459, "Pretrain/Step Time": 8.419652067124844} +{"Pretrain/Learning Rate": 4.872620257018629e-05, "Pretrain/Loss": 2.0600521564483643, "Pretrain/Loss (Raw)": 2.0182604789733887, "Pretrain/Step": 2460, "Pretrain/Step Time": 8.41872962936759} +{"Pretrain/Learning Rate": 4.8724864443699114e-05, "Pretrain/Loss": 2.060116767883301, "Pretrain/Loss (Raw)": 2.0139667987823486, "Pretrain/Step": 2461, "Pretrain/Step Time": 8.41686267964542} +{"Pretrain/Learning Rate": 4.8723525633122193e-05, "Pretrain/Loss": 2.058339834213257, "Pretrain/Loss (Raw)": 2.068528890609741, "Pretrain/Step": 2462, "Pretrain/Step Time": 8.417427675798535} +{"Pretrain/Learning Rate": 4.872218613849413e-05, "Pretrain/Loss": 2.0606179237365723, "Pretrain/Loss (Raw)": 2.117863655090332, "Pretrain/Step": 2463, "Pretrain/Step Time": 8.4177066963166} +{"Pretrain/Learning Rate": 4.872084595985356e-05, "Pretrain/Loss": 2.059232711791992, "Pretrain/Loss (Raw)": 2.05131196975708, "Pretrain/Step": 2464, "Pretrain/Step Time": 8.416310399770737} +{"Pretrain/Learning Rate": 4.871950509723912e-05, "Pretrain/Loss": 2.0605947971343994, "Pretrain/Loss (Raw)": 2.1398074626922607, "Pretrain/Step": 2465, "Pretrain/Step Time": 8.411402150988579} +{"Pretrain/Learning Rate": 4.871816355068947e-05, "Pretrain/Loss": 2.062452793121338, "Pretrain/Loss (Raw)": 2.192007303237915, "Pretrain/Step": 2466, "Pretrain/Step Time": 8.411509035155177} +{"Pretrain/Learning Rate": 4.871682132024329e-05, "Pretrain/Loss": 2.061997413635254, "Pretrain/Loss (Raw)": 2.187321186065674, "Pretrain/Step": 2467, "Pretrain/Step Time": 8.414459386840463} +{"Pretrain/Learning Rate": 4.8715478405939284e-05, "Pretrain/Loss": 2.062593936920166, "Pretrain/Loss (Raw)": 2.237119674682617, "Pretrain/Step": 2468, "Pretrain/Step Time": 8.419250503182411} +{"Pretrain/Learning Rate": 4.8714134807816184e-05, "Pretrain/Loss": 2.061669111251831, "Pretrain/Loss (Raw)": 1.9358209371566772, "Pretrain/Step": 2469, "Pretrain/Step Time": 8.416681313887239} +{"Pretrain/Learning Rate": 4.871279052591272e-05, "Pretrain/Loss": 2.061485528945923, "Pretrain/Loss (Raw)": 2.1607918739318848, "Pretrain/Step": 2470, "Pretrain/Step Time": 8.416799725964665} +{"Pretrain/Learning Rate": 4.871144556026766e-05, "Pretrain/Loss": 2.0621285438537598, "Pretrain/Loss (Raw)": 2.1799941062927246, "Pretrain/Step": 2471, "Pretrain/Step Time": 8.417326092720032} +{"Pretrain/Learning Rate": 4.871009991091978e-05, "Pretrain/Loss": 2.060350179672241, "Pretrain/Loss (Raw)": 1.871928095817566, "Pretrain/Step": 2472, "Pretrain/Step Time": 8.417811209335923} +{"Pretrain/Learning Rate": 4.870875357790789e-05, "Pretrain/Loss": 2.062878370285034, "Pretrain/Loss (Raw)": 2.2907168865203857, "Pretrain/Step": 2473, "Pretrain/Step Time": 8.415305439382792} +{"Pretrain/Learning Rate": 4.8707406561270794e-05, "Pretrain/Loss": 2.066340446472168, "Pretrain/Loss (Raw)": 2.463270664215088, "Pretrain/Step": 2474, "Pretrain/Step Time": 8.416728049516678} +{"Pretrain/Learning Rate": 4.8706058861047354e-05, "Pretrain/Loss": 2.06704044342041, "Pretrain/Loss (Raw)": 2.1572015285491943, "Pretrain/Step": 2475, "Pretrain/Step Time": 8.417755130678415} +{"Pretrain/Learning Rate": 4.870471047727641e-05, "Pretrain/Loss": 2.0654590129852295, "Pretrain/Loss (Raw)": 2.1387784481048584, "Pretrain/Step": 2476, "Pretrain/Step Time": 8.419014185667038} +{"Pretrain/Learning Rate": 4.870336140999685e-05, "Pretrain/Loss": 2.064005136489868, "Pretrain/Loss (Raw)": 2.0167500972747803, "Pretrain/Step": 2477, "Pretrain/Step Time": 8.414418768137693} +{"Pretrain/Learning Rate": 4.8702011659247585e-05, "Pretrain/Loss": 2.062711715698242, "Pretrain/Loss (Raw)": 1.833020806312561, "Pretrain/Step": 2478, "Pretrain/Step Time": 8.417785534635186} +{"Pretrain/Learning Rate": 4.870066122506751e-05, "Pretrain/Loss": 2.06391978263855, "Pretrain/Loss (Raw)": 2.0851762294769287, "Pretrain/Step": 2479, "Pretrain/Step Time": 8.414683757349849} +{"Pretrain/Learning Rate": 4.869931010749558e-05, "Pretrain/Loss": 2.0654053688049316, "Pretrain/Loss (Raw)": 2.3464291095733643, "Pretrain/Step": 2480, "Pretrain/Step Time": 8.419045802205801} +{"Pretrain/Learning Rate": 4.8697958306570747e-05, "Pretrain/Loss": 2.0665478706359863, "Pretrain/Loss (Raw)": 2.1682188510894775, "Pretrain/Step": 2481, "Pretrain/Step Time": 8.415078761056066} +{"Pretrain/Learning Rate": 4.8696605822332e-05, "Pretrain/Loss": 2.068620204925537, "Pretrain/Loss (Raw)": 1.9800364971160889, "Pretrain/Step": 2482, "Pretrain/Step Time": 8.41503675095737} +{"Pretrain/Learning Rate": 4.8695252654818325e-05, "Pretrain/Loss": 2.0682663917541504, "Pretrain/Loss (Raw)": 2.0494344234466553, "Pretrain/Step": 2483, "Pretrain/Step Time": 8.416278148069978} +{"Pretrain/Learning Rate": 4.869389880406874e-05, "Pretrain/Loss": 2.069230079650879, "Pretrain/Loss (Raw)": 2.1098215579986572, "Pretrain/Step": 2484, "Pretrain/Step Time": 8.414944043383002} +{"Pretrain/Learning Rate": 4.8692544270122285e-05, "Pretrain/Loss": 2.0708227157592773, "Pretrain/Loss (Raw)": 2.287226438522339, "Pretrain/Step": 2485, "Pretrain/Step Time": 8.416435521095991} +{"Pretrain/Learning Rate": 4.8691189053018024e-05, "Pretrain/Loss": 2.0714170932769775, "Pretrain/Loss (Raw)": 1.9164832830429077, "Pretrain/Step": 2486, "Pretrain/Step Time": 8.416691599413753} +{"Pretrain/Learning Rate": 4.8689833152795026e-05, "Pretrain/Loss": 2.070345401763916, "Pretrain/Loss (Raw)": 1.9978493452072144, "Pretrain/Step": 2487, "Pretrain/Step Time": 8.415831925347447} +{"Pretrain/Learning Rate": 4.868847656949239e-05, "Pretrain/Loss": 2.072113037109375, "Pretrain/Loss (Raw)": 2.145001173019409, "Pretrain/Step": 2488, "Pretrain/Step Time": 8.424767352640629} +{"Pretrain/Learning Rate": 4.868711930314923e-05, "Pretrain/Loss": 2.071763515472412, "Pretrain/Loss (Raw)": 1.9979724884033203, "Pretrain/Step": 2489, "Pretrain/Step Time": 8.420410379767418} +{"Pretrain/Learning Rate": 4.868576135380469e-05, "Pretrain/Loss": 2.0715715885162354, "Pretrain/Loss (Raw)": 2.0796210765838623, "Pretrain/Step": 2490, "Pretrain/Step Time": 8.416739953681827} +{"Pretrain/Learning Rate": 4.868440272149791e-05, "Pretrain/Loss": 2.069401264190674, "Pretrain/Loss (Raw)": 1.912293791770935, "Pretrain/Step": 2491, "Pretrain/Step Time": 8.4186687823385} +{"Pretrain/Learning Rate": 4.868304340626808e-05, "Pretrain/Loss": 2.068721294403076, "Pretrain/Loss (Raw)": 2.038703680038452, "Pretrain/Step": 2492, "Pretrain/Step Time": 8.419333174824715} +{"Pretrain/Learning Rate": 4.868168340815439e-05, "Pretrain/Loss": 2.0701236724853516, "Pretrain/Loss (Raw)": 2.213728666305542, "Pretrain/Step": 2493, "Pretrain/Step Time": 8.417159844189882} +{"Pretrain/Learning Rate": 4.868032272719604e-05, "Pretrain/Loss": 2.0710575580596924, "Pretrain/Loss (Raw)": 1.919879674911499, "Pretrain/Step": 2494, "Pretrain/Step Time": 8.416571343317628} +{"Pretrain/Learning Rate": 4.867896136343229e-05, "Pretrain/Loss": 2.069805383682251, "Pretrain/Loss (Raw)": 2.090932846069336, "Pretrain/Step": 2495, "Pretrain/Step Time": 8.418653544038534} +{"Pretrain/Learning Rate": 4.8677599316902375e-05, "Pretrain/Loss": 2.069418430328369, "Pretrain/Loss (Raw)": 1.9065587520599365, "Pretrain/Step": 2496, "Pretrain/Step Time": 8.415916418656707} +{"Pretrain/Learning Rate": 4.8676236587645585e-05, "Pretrain/Loss": 2.0702037811279297, "Pretrain/Loss (Raw)": 2.2436234951019287, "Pretrain/Step": 2497, "Pretrain/Step Time": 8.413969960063696} +{"Pretrain/Learning Rate": 4.86748731757012e-05, "Pretrain/Loss": 2.0698821544647217, "Pretrain/Loss (Raw)": 1.9979580640792847, "Pretrain/Step": 2498, "Pretrain/Step Time": 8.414734061807394} +{"Pretrain/Learning Rate": 4.8673509081108526e-05, "Pretrain/Loss": 2.069584608078003, "Pretrain/Loss (Raw)": 1.927995204925537, "Pretrain/Step": 2499, "Pretrain/Step Time": 8.417311714962125} +{"Pretrain/Learning Rate": 4.867214430390692e-05, "Pretrain/Loss": 2.065946340560913, "Pretrain/Loss (Raw)": 1.522147536277771, "Pretrain/Step": 2500, "Pretrain/Step Time": 8.41905502974987} +{"Pretrain/Learning Rate": 4.867077884413571e-05, "Pretrain/Loss": 2.0640065670013428, "Pretrain/Loss (Raw)": 2.073539972305298, "Pretrain/Step": 2501, "Pretrain/Step Time": 8.42009437456727} +{"Pretrain/Learning Rate": 4.8669412701834286e-05, "Pretrain/Loss": 2.0639734268188477, "Pretrain/Loss (Raw)": 2.2123727798461914, "Pretrain/Step": 2502, "Pretrain/Step Time": 8.416934292763472} +{"Pretrain/Learning Rate": 4.8668045877042036e-05, "Pretrain/Loss": 2.0624184608459473, "Pretrain/Loss (Raw)": 2.0227720737457275, "Pretrain/Step": 2503, "Pretrain/Step Time": 8.417371936142445} +{"Pretrain/Learning Rate": 4.8666678369798355e-05, "Pretrain/Loss": 2.0630528926849365, "Pretrain/Loss (Raw)": 2.0375263690948486, "Pretrain/Step": 2504, "Pretrain/Step Time": 8.41946098767221} +{"Pretrain/Learning Rate": 4.8665310180142695e-05, "Pretrain/Loss": 2.0622482299804688, "Pretrain/Loss (Raw)": 2.0505452156066895, "Pretrain/Step": 2505, "Pretrain/Step Time": 8.420065319165587} +{"Pretrain/Learning Rate": 4.86639413081145e-05, "Pretrain/Loss": 2.063197612762451, "Pretrain/Loss (Raw)": 2.1865086555480957, "Pretrain/Step": 2506, "Pretrain/Step Time": 8.415125537663698} +{"Pretrain/Learning Rate": 4.866257175375324e-05, "Pretrain/Loss": 2.060957431793213, "Pretrain/Loss (Raw)": 2.0781948566436768, "Pretrain/Step": 2507, "Pretrain/Step Time": 8.419376105070114} +{"Pretrain/Learning Rate": 4.86612015170984e-05, "Pretrain/Loss": 2.0627591609954834, "Pretrain/Loss (Raw)": 2.263249635696411, "Pretrain/Step": 2508, "Pretrain/Step Time": 8.4213503357023} +{"Pretrain/Learning Rate": 4.86598305981895e-05, "Pretrain/Loss": 2.0645668506622314, "Pretrain/Loss (Raw)": 2.229703426361084, "Pretrain/Step": 2509, "Pretrain/Step Time": 8.420379972085357} +{"Pretrain/Learning Rate": 4.865845899706606e-05, "Pretrain/Loss": 2.0636284351348877, "Pretrain/Loss (Raw)": 1.9278093576431274, "Pretrain/Step": 2510, "Pretrain/Step Time": 8.421314634382725} +{"Pretrain/Learning Rate": 4.865708671376763e-05, "Pretrain/Loss": 2.0645322799682617, "Pretrain/Loss (Raw)": 2.123008966445923, "Pretrain/Step": 2511, "Pretrain/Step Time": 8.422372449189425} +{"Pretrain/Learning Rate": 4.8655713748333786e-05, "Pretrain/Loss": 2.065168619155884, "Pretrain/Loss (Raw)": 2.033323287963867, "Pretrain/Step": 2512, "Pretrain/Step Time": 8.421676171943545} +{"Pretrain/Learning Rate": 4.865434010080411e-05, "Pretrain/Loss": 2.063707113265991, "Pretrain/Loss (Raw)": 1.8850409984588623, "Pretrain/Step": 2513, "Pretrain/Step Time": 8.423437394201756} +{"Pretrain/Learning Rate": 4.865296577121822e-05, "Pretrain/Loss": 2.0645976066589355, "Pretrain/Loss (Raw)": 1.923962116241455, "Pretrain/Step": 2514, "Pretrain/Step Time": 8.419435132294893} +{"Pretrain/Learning Rate": 4.865159075961573e-05, "Pretrain/Loss": 2.0636849403381348, "Pretrain/Loss (Raw)": 1.9028140306472778, "Pretrain/Step": 2515, "Pretrain/Step Time": 8.420324949547648} +{"Pretrain/Learning Rate": 4.865021506603629e-05, "Pretrain/Loss": 2.064894199371338, "Pretrain/Loss (Raw)": 2.154454231262207, "Pretrain/Step": 2516, "Pretrain/Step Time": 8.420970106497407} +{"Pretrain/Learning Rate": 4.864883869051958e-05, "Pretrain/Loss": 2.0637664794921875, "Pretrain/Loss (Raw)": 1.9392279386520386, "Pretrain/Step": 2517, "Pretrain/Step Time": 8.421648418530822} +{"Pretrain/Learning Rate": 4.8647461633105274e-05, "Pretrain/Loss": 2.0625648498535156, "Pretrain/Loss (Raw)": 2.030325174331665, "Pretrain/Step": 2518, "Pretrain/Step Time": 8.42955020815134} +{"Pretrain/Learning Rate": 4.864608389383307e-05, "Pretrain/Loss": 2.061373710632324, "Pretrain/Loss (Raw)": 2.0103864669799805, "Pretrain/Step": 2519, "Pretrain/Step Time": 8.425660718232393} +{"Pretrain/Learning Rate": 4.864470547274273e-05, "Pretrain/Loss": 2.061276912689209, "Pretrain/Loss (Raw)": 2.089362859725952, "Pretrain/Step": 2520, "Pretrain/Step Time": 8.418932281434536} +{"Pretrain/Learning Rate": 4.864332636987395e-05, "Pretrain/Loss": 2.0645856857299805, "Pretrain/Loss (Raw)": 2.4192652702331543, "Pretrain/Step": 2521, "Pretrain/Step Time": 8.428077530115843} +{"Pretrain/Learning Rate": 4.864194658526654e-05, "Pretrain/Loss": 2.064821720123291, "Pretrain/Loss (Raw)": 2.074324131011963, "Pretrain/Step": 2522, "Pretrain/Step Time": 8.425065074115992} +{"Pretrain/Learning Rate": 4.8640566118960265e-05, "Pretrain/Loss": 2.0629100799560547, "Pretrain/Loss (Raw)": 2.01546311378479, "Pretrain/Step": 2523, "Pretrain/Step Time": 8.42431372590363} +{"Pretrain/Learning Rate": 4.863918497099492e-05, "Pretrain/Loss": 2.0638058185577393, "Pretrain/Loss (Raw)": 1.9826600551605225, "Pretrain/Step": 2524, "Pretrain/Step Time": 8.431721616536379} +{"Pretrain/Learning Rate": 4.8637803141410353e-05, "Pretrain/Loss": 2.063232421875, "Pretrain/Loss (Raw)": 1.9919167757034302, "Pretrain/Step": 2525, "Pretrain/Step Time": 8.429394049569964} +{"Pretrain/Learning Rate": 4.863642063024639e-05, "Pretrain/Loss": 2.0648810863494873, "Pretrain/Loss (Raw)": 2.3456153869628906, "Pretrain/Step": 2526, "Pretrain/Step Time": 8.432661214843392} +{"Pretrain/Learning Rate": 4.8635037437542904e-05, "Pretrain/Loss": 2.0678133964538574, "Pretrain/Loss (Raw)": 2.221285104751587, "Pretrain/Step": 2527, "Pretrain/Step Time": 8.434388928115368} +{"Pretrain/Learning Rate": 4.863365356333977e-05, "Pretrain/Loss": 2.067054510116577, "Pretrain/Loss (Raw)": 2.0529184341430664, "Pretrain/Step": 2528, "Pretrain/Step Time": 8.434243872761726} +{"Pretrain/Learning Rate": 4.86322690076769e-05, "Pretrain/Loss": 2.067121982574463, "Pretrain/Loss (Raw)": 2.003840684890747, "Pretrain/Step": 2529, "Pretrain/Step Time": 8.434019956737757} +{"Pretrain/Learning Rate": 4.8630883770594216e-05, "Pretrain/Loss": 2.0675697326660156, "Pretrain/Loss (Raw)": 2.156301259994507, "Pretrain/Step": 2530, "Pretrain/Step Time": 8.434772225096822} +{"Pretrain/Learning Rate": 4.8629497852131656e-05, "Pretrain/Loss": 2.068061590194702, "Pretrain/Loss (Raw)": 1.9449950456619263, "Pretrain/Step": 2531, "Pretrain/Step Time": 8.430316941812634} +{"Pretrain/Learning Rate": 4.8628111252329177e-05, "Pretrain/Loss": 2.067791700363159, "Pretrain/Loss (Raw)": 2.0103847980499268, "Pretrain/Step": 2532, "Pretrain/Step Time": 8.429225876927376} +{"Pretrain/Learning Rate": 4.862672397122677e-05, "Pretrain/Loss": 2.068100690841675, "Pretrain/Loss (Raw)": 2.160851001739502, "Pretrain/Step": 2533, "Pretrain/Step Time": 8.432300545275211} +{"Pretrain/Learning Rate": 4.862533600886444e-05, "Pretrain/Loss": 2.067418336868286, "Pretrain/Loss (Raw)": 1.9807977676391602, "Pretrain/Step": 2534, "Pretrain/Step Time": 8.433199128136039} +{"Pretrain/Learning Rate": 4.862394736528219e-05, "Pretrain/Loss": 2.0655689239501953, "Pretrain/Loss (Raw)": 1.8119019269943237, "Pretrain/Step": 2535, "Pretrain/Step Time": 8.429571745917201} +{"Pretrain/Learning Rate": 4.8622558040520074e-05, "Pretrain/Loss": 2.0664725303649902, "Pretrain/Loss (Raw)": 1.9691565036773682, "Pretrain/Step": 2536, "Pretrain/Step Time": 8.428325621411204} +{"Pretrain/Learning Rate": 4.8621168034618156e-05, "Pretrain/Loss": 2.065311908721924, "Pretrain/Loss (Raw)": 1.8573163747787476, "Pretrain/Step": 2537, "Pretrain/Step Time": 8.428003648295999} +{"Pretrain/Learning Rate": 4.86197773476165e-05, "Pretrain/Loss": 2.065962791442871, "Pretrain/Loss (Raw)": 2.1006126403808594, "Pretrain/Step": 2538, "Pretrain/Step Time": 8.426509285345674} +{"Pretrain/Learning Rate": 4.8618385979555224e-05, "Pretrain/Loss": 2.068110704421997, "Pretrain/Loss (Raw)": 2.2638328075408936, "Pretrain/Step": 2539, "Pretrain/Step Time": 8.424523301422596} +{"Pretrain/Learning Rate": 4.8616993930474434e-05, "Pretrain/Loss": 2.0681862831115723, "Pretrain/Loss (Raw)": 2.0368893146514893, "Pretrain/Step": 2540, "Pretrain/Step Time": 8.425070250406861} +{"Pretrain/Learning Rate": 4.8615601200414275e-05, "Pretrain/Loss": 2.0682592391967773, "Pretrain/Loss (Raw)": 2.0721237659454346, "Pretrain/Step": 2541, "Pretrain/Step Time": 8.426035134121776} +{"Pretrain/Learning Rate": 4.86142077894149e-05, "Pretrain/Loss": 2.0654296875, "Pretrain/Loss (Raw)": 1.7311724424362183, "Pretrain/Step": 2542, "Pretrain/Step Time": 8.428910188376904} +{"Pretrain/Learning Rate": 4.861281369751649e-05, "Pretrain/Loss": 2.066096544265747, "Pretrain/Loss (Raw)": 1.984766960144043, "Pretrain/Step": 2543, "Pretrain/Step Time": 8.422238420695066} +{"Pretrain/Learning Rate": 4.861141892475924e-05, "Pretrain/Loss": 2.066197156906128, "Pretrain/Loss (Raw)": 2.0043723583221436, "Pretrain/Step": 2544, "Pretrain/Step Time": 8.421337358653545} +{"Pretrain/Learning Rate": 4.861002347118338e-05, "Pretrain/Loss": 2.0672225952148438, "Pretrain/Loss (Raw)": 2.289113998413086, "Pretrain/Step": 2545, "Pretrain/Step Time": 8.42067289352417} +{"Pretrain/Learning Rate": 4.860862733682913e-05, "Pretrain/Loss": 2.0649008750915527, "Pretrain/Loss (Raw)": 1.999876856803894, "Pretrain/Step": 2546, "Pretrain/Step Time": 8.419052604585886} +{"Pretrain/Learning Rate": 4.860723052173676e-05, "Pretrain/Loss": 2.065134048461914, "Pretrain/Loss (Raw)": 2.1362245082855225, "Pretrain/Step": 2547, "Pretrain/Step Time": 8.420248350128531} +{"Pretrain/Learning Rate": 4.8605833025946535e-05, "Pretrain/Loss": 2.0627782344818115, "Pretrain/Loss (Raw)": 1.9361838102340698, "Pretrain/Step": 2548, "Pretrain/Step Time": 8.421091729775071} +{"Pretrain/Learning Rate": 4.860443484949876e-05, "Pretrain/Loss": 2.061554431915283, "Pretrain/Loss (Raw)": 2.0719029903411865, "Pretrain/Step": 2549, "Pretrain/Step Time": 8.420480383560061} +{"Pretrain/Learning Rate": 4.860303599243374e-05, "Pretrain/Loss": 2.0617499351501465, "Pretrain/Loss (Raw)": 2.0008704662323, "Pretrain/Step": 2550, "Pretrain/Step Time": 8.420913383364677} +{"Pretrain/Learning Rate": 4.860163645479182e-05, "Pretrain/Loss": 2.06296706199646, "Pretrain/Loss (Raw)": 2.2032394409179688, "Pretrain/Step": 2551, "Pretrain/Step Time": 8.419634049758315} +{"Pretrain/Learning Rate": 4.860023623661335e-05, "Pretrain/Loss": 2.0583863258361816, "Pretrain/Loss (Raw)": 1.518636703491211, "Pretrain/Step": 2552, "Pretrain/Step Time": 8.419790159910917} +{"Pretrain/Learning Rate": 4.8598835337938704e-05, "Pretrain/Loss": 2.058119297027588, "Pretrain/Loss (Raw)": 1.9161014556884766, "Pretrain/Step": 2553, "Pretrain/Step Time": 8.41588919237256} +{"Pretrain/Learning Rate": 4.859743375880827e-05, "Pretrain/Loss": 2.0626275539398193, "Pretrain/Loss (Raw)": 2.4827051162719727, "Pretrain/Step": 2554, "Pretrain/Step Time": 8.423885188996792} +{"Pretrain/Learning Rate": 4.859603149926248e-05, "Pretrain/Loss": 2.061431646347046, "Pretrain/Loss (Raw)": 2.0408310890197754, "Pretrain/Step": 2555, "Pretrain/Step Time": 8.418233936652541} +{"Pretrain/Learning Rate": 4.859462855934176e-05, "Pretrain/Loss": 2.058373212814331, "Pretrain/Loss (Raw)": 2.0825209617614746, "Pretrain/Step": 2556, "Pretrain/Step Time": 8.41843898780644} +{"Pretrain/Learning Rate": 4.859322493908654e-05, "Pretrain/Loss": 2.0569639205932617, "Pretrain/Loss (Raw)": 1.886191964149475, "Pretrain/Step": 2557, "Pretrain/Step Time": 8.420276399701834} +{"Pretrain/Learning Rate": 4.859182063853733e-05, "Pretrain/Loss": 2.056325912475586, "Pretrain/Loss (Raw)": 1.9834810495376587, "Pretrain/Step": 2558, "Pretrain/Step Time": 8.42295926809311} +{"Pretrain/Learning Rate": 4.85904156577346e-05, "Pretrain/Loss": 2.0552175045013428, "Pretrain/Loss (Raw)": 1.9226855039596558, "Pretrain/Step": 2559, "Pretrain/Step Time": 8.419761581346393} +{"Pretrain/Learning Rate": 4.858900999671886e-05, "Pretrain/Loss": 2.056049346923828, "Pretrain/Loss (Raw)": 2.0571908950805664, "Pretrain/Step": 2560, "Pretrain/Step Time": 8.418527198955417} +{"Pretrain/Learning Rate": 4.8587603655530647e-05, "Pretrain/Loss": 2.0547919273376465, "Pretrain/Loss (Raw)": 1.9709426164627075, "Pretrain/Step": 2561, "Pretrain/Step Time": 8.420770345255733} +{"Pretrain/Learning Rate": 4.85861966342105e-05, "Pretrain/Loss": 2.056215286254883, "Pretrain/Loss (Raw)": 1.9740097522735596, "Pretrain/Step": 2562, "Pretrain/Step Time": 8.419982988387346} +{"Pretrain/Learning Rate": 4.8584788932799014e-05, "Pretrain/Loss": 2.056295394897461, "Pretrain/Loss (Raw)": 1.9809128046035767, "Pretrain/Step": 2563, "Pretrain/Step Time": 8.423066018149257} +{"Pretrain/Learning Rate": 4.8583380551336766e-05, "Pretrain/Loss": 2.0572164058685303, "Pretrain/Loss (Raw)": 2.0335612297058105, "Pretrain/Step": 2564, "Pretrain/Step Time": 8.424182346090674} +{"Pretrain/Learning Rate": 4.858197148986435e-05, "Pretrain/Loss": 2.057626724243164, "Pretrain/Loss (Raw)": 2.0712811946868896, "Pretrain/Step": 2565, "Pretrain/Step Time": 8.421871216967702} +{"Pretrain/Learning Rate": 4.858056174842243e-05, "Pretrain/Loss": 2.0582327842712402, "Pretrain/Loss (Raw)": 2.0761430263519287, "Pretrain/Step": 2566, "Pretrain/Step Time": 8.420069366693497} +{"Pretrain/Learning Rate": 4.857915132705162e-05, "Pretrain/Loss": 2.060060739517212, "Pretrain/Loss (Raw)": 2.190392255783081, "Pretrain/Step": 2567, "Pretrain/Step Time": 8.422245332971215} +{"Pretrain/Learning Rate": 4.8577740225792614e-05, "Pretrain/Loss": 2.0605435371398926, "Pretrain/Loss (Raw)": 2.0230588912963867, "Pretrain/Step": 2568, "Pretrain/Step Time": 8.419248851016164} +{"Pretrain/Learning Rate": 4.8576328444686085e-05, "Pretrain/Loss": 2.060713291168213, "Pretrain/Loss (Raw)": 1.9270038604736328, "Pretrain/Step": 2569, "Pretrain/Step Time": 8.42066664621234} +{"Pretrain/Learning Rate": 4.857491598377274e-05, "Pretrain/Loss": 2.059749126434326, "Pretrain/Loss (Raw)": 2.082608222961426, "Pretrain/Step": 2570, "Pretrain/Step Time": 8.423723934218287} +{"Pretrain/Learning Rate": 4.857350284309332e-05, "Pretrain/Loss": 2.0575976371765137, "Pretrain/Loss (Raw)": 1.8892189264297485, "Pretrain/Step": 2571, "Pretrain/Step Time": 8.41886418312788} +{"Pretrain/Learning Rate": 4.857208902268856e-05, "Pretrain/Loss": 2.055253505706787, "Pretrain/Loss (Raw)": 1.830586314201355, "Pretrain/Step": 2572, "Pretrain/Step Time": 8.417225809767842} +{"Pretrain/Learning Rate": 4.857067452259924e-05, "Pretrain/Loss": 2.0566139221191406, "Pretrain/Loss (Raw)": 2.181652784347534, "Pretrain/Step": 2573, "Pretrain/Step Time": 8.420642601326108} +{"Pretrain/Learning Rate": 4.856925934286613e-05, "Pretrain/Loss": 2.0567636489868164, "Pretrain/Loss (Raw)": 2.1385819911956787, "Pretrain/Step": 2574, "Pretrain/Step Time": 8.413107339292765} +{"Pretrain/Learning Rate": 4.856784348353003e-05, "Pretrain/Loss": 2.0594100952148438, "Pretrain/Loss (Raw)": 2.2164595127105713, "Pretrain/Step": 2575, "Pretrain/Step Time": 8.415600668638945} +{"Pretrain/Learning Rate": 4.856642694463179e-05, "Pretrain/Loss": 2.058093309402466, "Pretrain/Loss (Raw)": 2.005674362182617, "Pretrain/Step": 2576, "Pretrain/Step Time": 8.416083749383688} +{"Pretrain/Learning Rate": 4.856500972621224e-05, "Pretrain/Loss": 2.0600008964538574, "Pretrain/Loss (Raw)": 2.2862727642059326, "Pretrain/Step": 2577, "Pretrain/Step Time": 8.415095156058669} +{"Pretrain/Learning Rate": 4.856359182831225e-05, "Pretrain/Loss": 2.060638427734375, "Pretrain/Loss (Raw)": 2.0012784004211426, "Pretrain/Step": 2578, "Pretrain/Step Time": 8.418220147490501} +{"Pretrain/Learning Rate": 4.856217325097269e-05, "Pretrain/Loss": 2.0611355304718018, "Pretrain/Loss (Raw)": 2.0065457820892334, "Pretrain/Step": 2579, "Pretrain/Step Time": 8.41950823366642} +{"Pretrain/Learning Rate": 4.856075399423449e-05, "Pretrain/Loss": 2.0619001388549805, "Pretrain/Loss (Raw)": 2.190762996673584, "Pretrain/Step": 2580, "Pretrain/Step Time": 8.419101471081376} +{"Pretrain/Learning Rate": 4.8559334058138547e-05, "Pretrain/Loss": 2.0596513748168945, "Pretrain/Loss (Raw)": 1.8728479146957397, "Pretrain/Step": 2581, "Pretrain/Step Time": 8.420432832092047} +{"Pretrain/Learning Rate": 4.855791344272581e-05, "Pretrain/Loss": 2.055068254470825, "Pretrain/Loss (Raw)": 1.693169355392456, "Pretrain/Step": 2582, "Pretrain/Step Time": 8.420235522091389} +{"Pretrain/Learning Rate": 4.8556492148037256e-05, "Pretrain/Loss": 2.054440975189209, "Pretrain/Loss (Raw)": 2.08107852935791, "Pretrain/Step": 2583, "Pretrain/Step Time": 8.414740223437548} +{"Pretrain/Learning Rate": 4.855507017411386e-05, "Pretrain/Loss": 2.0516462326049805, "Pretrain/Loss (Raw)": 2.0144221782684326, "Pretrain/Step": 2584, "Pretrain/Step Time": 8.418059291318059} +{"Pretrain/Learning Rate": 4.8553647520996614e-05, "Pretrain/Loss": 2.0531764030456543, "Pretrain/Loss (Raw)": 2.079331636428833, "Pretrain/Step": 2585, "Pretrain/Step Time": 8.41646977327764} +{"Pretrain/Learning Rate": 4.855222418872655e-05, "Pretrain/Loss": 2.053907871246338, "Pretrain/Loss (Raw)": 2.2124297618865967, "Pretrain/Step": 2586, "Pretrain/Step Time": 8.420229077339172} +{"Pretrain/Learning Rate": 4.8550800177344694e-05, "Pretrain/Loss": 2.0539731979370117, "Pretrain/Loss (Raw)": 1.9721722602844238, "Pretrain/Step": 2587, "Pretrain/Step Time": 8.42127250507474} +{"Pretrain/Learning Rate": 4.854937548689213e-05, "Pretrain/Loss": 2.0559635162353516, "Pretrain/Loss (Raw)": 2.273014545440674, "Pretrain/Step": 2588, "Pretrain/Step Time": 8.422179689630866} +{"Pretrain/Learning Rate": 4.854795011740992e-05, "Pretrain/Loss": 2.0568439960479736, "Pretrain/Loss (Raw)": 2.1266531944274902, "Pretrain/Step": 2589, "Pretrain/Step Time": 8.417948627844453} +{"Pretrain/Learning Rate": 4.854652406893917e-05, "Pretrain/Loss": 2.0577008724212646, "Pretrain/Loss (Raw)": 2.1782009601593018, "Pretrain/Step": 2590, "Pretrain/Step Time": 8.421880351379514} +{"Pretrain/Learning Rate": 4.8545097341520996e-05, "Pretrain/Loss": 2.059091806411743, "Pretrain/Loss (Raw)": 2.295891046524048, "Pretrain/Step": 2591, "Pretrain/Step Time": 8.420387767255306} +{"Pretrain/Learning Rate": 4.854366993519654e-05, "Pretrain/Loss": 2.059380531311035, "Pretrain/Loss (Raw)": 2.088291883468628, "Pretrain/Step": 2592, "Pretrain/Step Time": 8.419608514755964} +{"Pretrain/Learning Rate": 4.854224185000695e-05, "Pretrain/Loss": 2.0601892471313477, "Pretrain/Loss (Raw)": 2.243300676345825, "Pretrain/Step": 2593, "Pretrain/Step Time": 8.421954235062003} +{"Pretrain/Learning Rate": 4.8540813085993424e-05, "Pretrain/Loss": 2.060483455657959, "Pretrain/Loss (Raw)": 2.229694366455078, "Pretrain/Step": 2594, "Pretrain/Step Time": 8.42075227946043} +{"Pretrain/Learning Rate": 4.8539383643197143e-05, "Pretrain/Loss": 2.0601730346679688, "Pretrain/Loss (Raw)": 2.147573232650757, "Pretrain/Step": 2595, "Pretrain/Step Time": 8.420020943507552} +{"Pretrain/Learning Rate": 4.853795352165933e-05, "Pretrain/Loss": 2.062689781188965, "Pretrain/Loss (Raw)": 2.5592639446258545, "Pretrain/Step": 2596, "Pretrain/Step Time": 8.419442005455494} +{"Pretrain/Learning Rate": 4.853652272142122e-05, "Pretrain/Loss": 2.0648694038391113, "Pretrain/Loss (Raw)": 2.2148046493530273, "Pretrain/Step": 2597, "Pretrain/Step Time": 8.421695513650775} +{"Pretrain/Learning Rate": 4.8535091242524063e-05, "Pretrain/Loss": 2.0637030601501465, "Pretrain/Loss (Raw)": 2.01151180267334, "Pretrain/Step": 2598, "Pretrain/Step Time": 8.424628362059593} +{"Pretrain/Learning Rate": 4.8533659085009155e-05, "Pretrain/Loss": 2.0622496604919434, "Pretrain/Loss (Raw)": 1.9939677715301514, "Pretrain/Step": 2599, "Pretrain/Step Time": 8.422911256551743} +{"Pretrain/Learning Rate": 4.853222624891777e-05, "Pretrain/Loss": 2.0630197525024414, "Pretrain/Loss (Raw)": 1.9704855680465698, "Pretrain/Step": 2600, "Pretrain/Step Time": 8.421318037435412} +{"Pretrain/Learning Rate": 4.853079273429123e-05, "Pretrain/Loss": 2.062012195587158, "Pretrain/Loss (Raw)": 2.1617510318756104, "Pretrain/Step": 2601, "Pretrain/Step Time": 8.424075162038207} +{"Pretrain/Learning Rate": 4.852935854117087e-05, "Pretrain/Loss": 2.0589451789855957, "Pretrain/Loss (Raw)": 2.070678234100342, "Pretrain/Step": 2602, "Pretrain/Step Time": 8.422775644809008} +{"Pretrain/Learning Rate": 4.852792366959804e-05, "Pretrain/Loss": 2.0582878589630127, "Pretrain/Loss (Raw)": 2.073098659515381, "Pretrain/Step": 2603, "Pretrain/Step Time": 8.425309492275119} +{"Pretrain/Learning Rate": 4.852648811961412e-05, "Pretrain/Loss": 2.0581512451171875, "Pretrain/Loss (Raw)": 2.121277093887329, "Pretrain/Step": 2604, "Pretrain/Step Time": 8.420915707945824} +{"Pretrain/Learning Rate": 4.85250518912605e-05, "Pretrain/Loss": 2.058196544647217, "Pretrain/Loss (Raw)": 2.022536277770996, "Pretrain/Step": 2605, "Pretrain/Step Time": 8.42121359705925} +{"Pretrain/Learning Rate": 4.85236149845786e-05, "Pretrain/Loss": 2.0587496757507324, "Pretrain/Loss (Raw)": 1.9038259983062744, "Pretrain/Step": 2606, "Pretrain/Step Time": 8.418839450925589} +{"Pretrain/Learning Rate": 4.8522177399609834e-05, "Pretrain/Loss": 2.058272123336792, "Pretrain/Loss (Raw)": 2.0240352153778076, "Pretrain/Step": 2607, "Pretrain/Step Time": 8.424792930483818} +{"Pretrain/Learning Rate": 4.8520739136395674e-05, "Pretrain/Loss": 2.056976556777954, "Pretrain/Loss (Raw)": 2.1806089878082275, "Pretrain/Step": 2608, "Pretrain/Step Time": 8.423016890883446} +{"Pretrain/Learning Rate": 4.8519300194977574e-05, "Pretrain/Loss": 2.0552639961242676, "Pretrain/Loss (Raw)": 1.949028491973877, "Pretrain/Step": 2609, "Pretrain/Step Time": 8.42868086695671} +{"Pretrain/Learning Rate": 4.851786057539703e-05, "Pretrain/Loss": 2.0561418533325195, "Pretrain/Loss (Raw)": 2.092357873916626, "Pretrain/Step": 2610, "Pretrain/Step Time": 8.428441606462002} +{"Pretrain/Learning Rate": 4.851642027769557e-05, "Pretrain/Loss": 2.055987596511841, "Pretrain/Loss (Raw)": 2.029742956161499, "Pretrain/Step": 2611, "Pretrain/Step Time": 8.425498083233833} +{"Pretrain/Learning Rate": 4.85149793019147e-05, "Pretrain/Loss": 2.056756019592285, "Pretrain/Loss (Raw)": 2.2081668376922607, "Pretrain/Step": 2612, "Pretrain/Step Time": 8.428378311917186} +{"Pretrain/Learning Rate": 4.8513537648095974e-05, "Pretrain/Loss": 2.0537471771240234, "Pretrain/Loss (Raw)": 1.902080774307251, "Pretrain/Step": 2613, "Pretrain/Step Time": 8.426709773018956} +{"Pretrain/Learning Rate": 4.8512095316280977e-05, "Pretrain/Loss": 2.0544979572296143, "Pretrain/Loss (Raw)": 2.0125954151153564, "Pretrain/Step": 2614, "Pretrain/Step Time": 8.431520756334066} +{"Pretrain/Learning Rate": 4.851065230651128e-05, "Pretrain/Loss": 2.0557169914245605, "Pretrain/Loss (Raw)": 2.153886556625366, "Pretrain/Step": 2615, "Pretrain/Step Time": 8.429967166855931} +{"Pretrain/Learning Rate": 4.85092086188285e-05, "Pretrain/Loss": 2.0547029972076416, "Pretrain/Loss (Raw)": 2.0152053833007812, "Pretrain/Step": 2616, "Pretrain/Step Time": 8.424162490293384} +{"Pretrain/Learning Rate": 4.8507764253274254e-05, "Pretrain/Loss": 2.055079936981201, "Pretrain/Loss (Raw)": 2.0462019443511963, "Pretrain/Step": 2617, "Pretrain/Step Time": 8.425241135060787} +{"Pretrain/Learning Rate": 4.85063192098902e-05, "Pretrain/Loss": 2.054640054702759, "Pretrain/Loss (Raw)": 2.023324966430664, "Pretrain/Step": 2618, "Pretrain/Step Time": 8.422758642584085} +{"Pretrain/Learning Rate": 4.850487348871802e-05, "Pretrain/Loss": 2.0532355308532715, "Pretrain/Loss (Raw)": 1.73252534866333, "Pretrain/Step": 2619, "Pretrain/Step Time": 8.427391301840544} +{"Pretrain/Learning Rate": 4.850342708979937e-05, "Pretrain/Loss": 2.0542335510253906, "Pretrain/Loss (Raw)": 2.1664481163024902, "Pretrain/Step": 2620, "Pretrain/Step Time": 8.42947960831225} +{"Pretrain/Learning Rate": 4.850198001317596e-05, "Pretrain/Loss": 2.0520217418670654, "Pretrain/Loss (Raw)": 1.9306049346923828, "Pretrain/Step": 2621, "Pretrain/Step Time": 8.427511239424348} +{"Pretrain/Learning Rate": 4.850053225888954e-05, "Pretrain/Loss": 2.052100658416748, "Pretrain/Loss (Raw)": 1.9299837350845337, "Pretrain/Step": 2622, "Pretrain/Step Time": 8.428409880027175} +{"Pretrain/Learning Rate": 4.8499083826981825e-05, "Pretrain/Loss": 2.0504114627838135, "Pretrain/Loss (Raw)": 1.87472665309906, "Pretrain/Step": 2623, "Pretrain/Step Time": 8.426290053874254} +{"Pretrain/Learning Rate": 4.84976347174946e-05, "Pretrain/Loss": 2.0514354705810547, "Pretrain/Loss (Raw)": 2.0376088619232178, "Pretrain/Step": 2624, "Pretrain/Step Time": 8.426895359531045} +{"Pretrain/Learning Rate": 4.8496184930469644e-05, "Pretrain/Loss": 2.0523910522460938, "Pretrain/Loss (Raw)": 2.3659346103668213, "Pretrain/Step": 2625, "Pretrain/Step Time": 8.428784171119332} +{"Pretrain/Learning Rate": 4.849473446594876e-05, "Pretrain/Loss": 2.053429365158081, "Pretrain/Loss (Raw)": 2.130859851837158, "Pretrain/Step": 2626, "Pretrain/Step Time": 8.430512093007565} +{"Pretrain/Learning Rate": 4.849328332397377e-05, "Pretrain/Loss": 2.055072069168091, "Pretrain/Loss (Raw)": 2.1383001804351807, "Pretrain/Step": 2627, "Pretrain/Step Time": 8.427456570789218} +{"Pretrain/Learning Rate": 4.849183150458652e-05, "Pretrain/Loss": 2.0593600273132324, "Pretrain/Loss (Raw)": 2.0709738731384277, "Pretrain/Step": 2628, "Pretrain/Step Time": 8.42540624924004} +{"Pretrain/Learning Rate": 4.8490379007828856e-05, "Pretrain/Loss": 2.059964895248413, "Pretrain/Loss (Raw)": 2.1509735584259033, "Pretrain/Step": 2629, "Pretrain/Step Time": 8.429117776453495} +{"Pretrain/Learning Rate": 4.848892583374268e-05, "Pretrain/Loss": 2.0600504875183105, "Pretrain/Loss (Raw)": 2.223353862762451, "Pretrain/Step": 2630, "Pretrain/Step Time": 8.43110666424036} +{"Pretrain/Learning Rate": 4.848747198236989e-05, "Pretrain/Loss": 2.060227394104004, "Pretrain/Loss (Raw)": 2.045379400253296, "Pretrain/Step": 2631, "Pretrain/Step Time": 8.430998526513577} +{"Pretrain/Learning Rate": 4.848601745375241e-05, "Pretrain/Loss": 2.0615551471710205, "Pretrain/Loss (Raw)": 2.2075035572052, "Pretrain/Step": 2632, "Pretrain/Step Time": 8.431266840547323} +{"Pretrain/Learning Rate": 4.848456224793216e-05, "Pretrain/Loss": 2.0624523162841797, "Pretrain/Loss (Raw)": 2.165356159210205, "Pretrain/Step": 2633, "Pretrain/Step Time": 8.430316967889667} +{"Pretrain/Learning Rate": 4.848310636495111e-05, "Pretrain/Loss": 2.0604982376098633, "Pretrain/Loss (Raw)": 1.9364022016525269, "Pretrain/Step": 2634, "Pretrain/Step Time": 8.427761686965823} +{"Pretrain/Learning Rate": 4.8481649804851256e-05, "Pretrain/Loss": 2.060541868209839, "Pretrain/Loss (Raw)": 2.083772659301758, "Pretrain/Step": 2635, "Pretrain/Step Time": 8.429520167410374} +{"Pretrain/Learning Rate": 4.848019256767458e-05, "Pretrain/Loss": 2.057826042175293, "Pretrain/Loss (Raw)": 1.915616750717163, "Pretrain/Step": 2636, "Pretrain/Step Time": 8.426025921478868} +{"Pretrain/Learning Rate": 4.8478734653463097e-05, "Pretrain/Loss": 2.055983543395996, "Pretrain/Loss (Raw)": 1.9938554763793945, "Pretrain/Step": 2637, "Pretrain/Step Time": 8.428725825622678} +{"Pretrain/Learning Rate": 4.847727606225886e-05, "Pretrain/Loss": 2.0565757751464844, "Pretrain/Loss (Raw)": 2.0036492347717285, "Pretrain/Step": 2638, "Pretrain/Step Time": 8.426742609590292} +{"Pretrain/Learning Rate": 4.847581679410391e-05, "Pretrain/Loss": 2.056792974472046, "Pretrain/Loss (Raw)": 2.1508138179779053, "Pretrain/Step": 2639, "Pretrain/Step Time": 8.424481850117445} +{"Pretrain/Learning Rate": 4.847435684904034e-05, "Pretrain/Loss": 2.0574278831481934, "Pretrain/Loss (Raw)": 2.1145529747009277, "Pretrain/Step": 2640, "Pretrain/Step Time": 8.421468310058117} +{"Pretrain/Learning Rate": 4.847289622711023e-05, "Pretrain/Loss": 2.05737042427063, "Pretrain/Loss (Raw)": 1.8777035474777222, "Pretrain/Step": 2641, "Pretrain/Step Time": 8.424659710377455} +{"Pretrain/Learning Rate": 4.847143492835571e-05, "Pretrain/Loss": 2.0573348999023438, "Pretrain/Loss (Raw)": 1.919433832168579, "Pretrain/Step": 2642, "Pretrain/Step Time": 8.426207875832915} +{"Pretrain/Learning Rate": 4.846997295281891e-05, "Pretrain/Loss": 2.057504653930664, "Pretrain/Loss (Raw)": 1.924521565437317, "Pretrain/Step": 2643, "Pretrain/Step Time": 8.42370212264359} +{"Pretrain/Learning Rate": 4.846851030054198e-05, "Pretrain/Loss": 2.056941509246826, "Pretrain/Loss (Raw)": 2.0824031829833984, "Pretrain/Step": 2644, "Pretrain/Step Time": 8.423624379560351} +{"Pretrain/Learning Rate": 4.846704697156711e-05, "Pretrain/Loss": 2.0559535026550293, "Pretrain/Loss (Raw)": 1.812760353088379, "Pretrain/Step": 2645, "Pretrain/Step Time": 8.424510091543198} +{"Pretrain/Learning Rate": 4.8465582965936474e-05, "Pretrain/Loss": 2.055821418762207, "Pretrain/Loss (Raw)": 2.0134012699127197, "Pretrain/Step": 2646, "Pretrain/Step Time": 8.420859549194574} +{"Pretrain/Learning Rate": 4.84641182836923e-05, "Pretrain/Loss": 2.0566673278808594, "Pretrain/Loss (Raw)": 2.1186492443084717, "Pretrain/Step": 2647, "Pretrain/Step Time": 8.4211295414716} +{"Pretrain/Learning Rate": 4.8462652924876815e-05, "Pretrain/Loss": 2.056706190109253, "Pretrain/Loss (Raw)": 2.0943374633789062, "Pretrain/Step": 2648, "Pretrain/Step Time": 8.423907304182649} +{"Pretrain/Learning Rate": 4.8461186889532274e-05, "Pretrain/Loss": 2.0538249015808105, "Pretrain/Loss (Raw)": 2.050471305847168, "Pretrain/Step": 2649, "Pretrain/Step Time": 8.41853503882885} +{"Pretrain/Learning Rate": 4.845972017770095e-05, "Pretrain/Loss": 2.0520360469818115, "Pretrain/Loss (Raw)": 1.8453519344329834, "Pretrain/Step": 2650, "Pretrain/Step Time": 8.419286562129855} +{"Pretrain/Learning Rate": 4.845825278942513e-05, "Pretrain/Loss": 2.051643133163452, "Pretrain/Loss (Raw)": 1.9651631116867065, "Pretrain/Step": 2651, "Pretrain/Step Time": 8.419197719544172} +{"Pretrain/Learning Rate": 4.845678472474713e-05, "Pretrain/Loss": 2.051274538040161, "Pretrain/Loss (Raw)": 1.935479760169983, "Pretrain/Step": 2652, "Pretrain/Step Time": 8.414081575348973} +{"Pretrain/Learning Rate": 4.845531598370927e-05, "Pretrain/Loss": 2.0519611835479736, "Pretrain/Loss (Raw)": 2.079820394515991, "Pretrain/Step": 2653, "Pretrain/Step Time": 8.420685755088925} +{"Pretrain/Learning Rate": 4.8453846566353916e-05, "Pretrain/Loss": 2.0487377643585205, "Pretrain/Loss (Raw)": 1.933009147644043, "Pretrain/Step": 2654, "Pretrain/Step Time": 8.413499128073454} +{"Pretrain/Learning Rate": 4.845237647272343e-05, "Pretrain/Loss": 2.0483129024505615, "Pretrain/Loss (Raw)": 2.1668996810913086, "Pretrain/Step": 2655, "Pretrain/Step Time": 8.415150942280889} +{"Pretrain/Learning Rate": 4.84509057028602e-05, "Pretrain/Loss": 2.0473499298095703, "Pretrain/Loss (Raw)": 1.9296603202819824, "Pretrain/Step": 2656, "Pretrain/Step Time": 8.417157504707575} +{"Pretrain/Learning Rate": 4.844943425680664e-05, "Pretrain/Loss": 2.0469436645507812, "Pretrain/Loss (Raw)": 1.9518414735794067, "Pretrain/Step": 2657, "Pretrain/Step Time": 8.421537540853024} +{"Pretrain/Learning Rate": 4.844796213460516e-05, "Pretrain/Loss": 2.044801712036133, "Pretrain/Loss (Raw)": 1.882124423980713, "Pretrain/Step": 2658, "Pretrain/Step Time": 8.422044947743416} +{"Pretrain/Learning Rate": 4.844648933629824e-05, "Pretrain/Loss": 2.045742988586426, "Pretrain/Loss (Raw)": 2.065484046936035, "Pretrain/Step": 2659, "Pretrain/Step Time": 8.422903364524245} +{"Pretrain/Learning Rate": 4.8445015861928315e-05, "Pretrain/Loss": 2.047633171081543, "Pretrain/Loss (Raw)": 2.2523303031921387, "Pretrain/Step": 2660, "Pretrain/Step Time": 8.422223819419742} +{"Pretrain/Learning Rate": 4.8443541711537895e-05, "Pretrain/Loss": 2.0441126823425293, "Pretrain/Loss (Raw)": 1.710253119468689, "Pretrain/Step": 2661, "Pretrain/Step Time": 8.421979753300548} +{"Pretrain/Learning Rate": 4.844206688516947e-05, "Pretrain/Loss": 2.046309471130371, "Pretrain/Loss (Raw)": 2.2619545459747314, "Pretrain/Step": 2662, "Pretrain/Step Time": 8.420119216665626} +{"Pretrain/Learning Rate": 4.8440591382865574e-05, "Pretrain/Loss": 2.0485317707061768, "Pretrain/Loss (Raw)": 2.0963571071624756, "Pretrain/Step": 2663, "Pretrain/Step Time": 8.421893294900656} +{"Pretrain/Learning Rate": 4.843911520466875e-05, "Pretrain/Loss": 2.049100160598755, "Pretrain/Loss (Raw)": 2.0419089794158936, "Pretrain/Step": 2664, "Pretrain/Step Time": 8.424103232100606} +{"Pretrain/Learning Rate": 4.843763835062156e-05, "Pretrain/Loss": 2.0526576042175293, "Pretrain/Loss (Raw)": 2.312654495239258, "Pretrain/Step": 2665, "Pretrain/Step Time": 8.422985235229135} +{"Pretrain/Learning Rate": 4.84361608207666e-05, "Pretrain/Loss": 2.0524141788482666, "Pretrain/Loss (Raw)": 2.0694780349731445, "Pretrain/Step": 2666, "Pretrain/Step Time": 8.423243725672364} +{"Pretrain/Learning Rate": 4.843468261514645e-05, "Pretrain/Loss": 2.050910234451294, "Pretrain/Loss (Raw)": 2.071335554122925, "Pretrain/Step": 2667, "Pretrain/Step Time": 8.423200864344835} +{"Pretrain/Learning Rate": 4.8433203733803755e-05, "Pretrain/Loss": 2.0519633293151855, "Pretrain/Loss (Raw)": 2.171680450439453, "Pretrain/Step": 2668, "Pretrain/Step Time": 8.423431258648634} +{"Pretrain/Learning Rate": 4.8431724176781155e-05, "Pretrain/Loss": 2.0523264408111572, "Pretrain/Loss (Raw)": 2.118610143661499, "Pretrain/Step": 2669, "Pretrain/Step Time": 8.42178657092154} +{"Pretrain/Learning Rate": 4.84302439441213e-05, "Pretrain/Loss": 2.0553371906280518, "Pretrain/Loss (Raw)": 2.116542339324951, "Pretrain/Step": 2670, "Pretrain/Step Time": 8.421964837238193} +{"Pretrain/Learning Rate": 4.842876303586688e-05, "Pretrain/Loss": 2.05737042427063, "Pretrain/Loss (Raw)": 2.245011568069458, "Pretrain/Step": 2671, "Pretrain/Step Time": 8.42726867645979} +{"Pretrain/Learning Rate": 4.8427281452060594e-05, "Pretrain/Loss": 2.0589871406555176, "Pretrain/Loss (Raw)": 2.2112960815429688, "Pretrain/Step": 2672, "Pretrain/Step Time": 8.426294591277838} +{"Pretrain/Learning Rate": 4.8425799192745156e-05, "Pretrain/Loss": 2.0573532581329346, "Pretrain/Loss (Raw)": 2.0799977779388428, "Pretrain/Step": 2673, "Pretrain/Step Time": 8.426307428628206} +{"Pretrain/Learning Rate": 4.842431625796332e-05, "Pretrain/Loss": 2.058497905731201, "Pretrain/Loss (Raw)": 2.1463892459869385, "Pretrain/Step": 2674, "Pretrain/Step Time": 8.428914280608296} +{"Pretrain/Learning Rate": 4.842283264775783e-05, "Pretrain/Loss": 2.057960271835327, "Pretrain/Loss (Raw)": 2.0674145221710205, "Pretrain/Step": 2675, "Pretrain/Step Time": 8.426908317953348} +{"Pretrain/Learning Rate": 4.842134836217148e-05, "Pretrain/Loss": 2.059037208557129, "Pretrain/Loss (Raw)": 2.07403302192688, "Pretrain/Step": 2676, "Pretrain/Step Time": 8.425206959247589} +{"Pretrain/Learning Rate": 4.841986340124706e-05, "Pretrain/Loss": 2.0597715377807617, "Pretrain/Loss (Raw)": 2.165915012359619, "Pretrain/Step": 2677, "Pretrain/Step Time": 8.427325632423162} +{"Pretrain/Learning Rate": 4.841837776502739e-05, "Pretrain/Loss": 2.0628561973571777, "Pretrain/Loss (Raw)": 2.3956902027130127, "Pretrain/Step": 2678, "Pretrain/Step Time": 8.427681980654597} +{"Pretrain/Learning Rate": 4.84168914535553e-05, "Pretrain/Loss": 2.0622220039367676, "Pretrain/Loss (Raw)": 2.1220314502716064, "Pretrain/Step": 2679, "Pretrain/Step Time": 8.42669558338821} +{"Pretrain/Learning Rate": 4.841540446687366e-05, "Pretrain/Loss": 2.066819667816162, "Pretrain/Loss (Raw)": 2.107174873352051, "Pretrain/Step": 2680, "Pretrain/Step Time": 8.42234468832612} +{"Pretrain/Learning Rate": 4.841391680502534e-05, "Pretrain/Loss": 2.0688531398773193, "Pretrain/Loss (Raw)": 2.1763663291931152, "Pretrain/Step": 2681, "Pretrain/Step Time": 8.42577140033245} +{"Pretrain/Learning Rate": 4.841242846805323e-05, "Pretrain/Loss": 2.0670275688171387, "Pretrain/Loss (Raw)": 2.249052047729492, "Pretrain/Step": 2682, "Pretrain/Step Time": 8.421389576047659} +{"Pretrain/Learning Rate": 4.841093945600025e-05, "Pretrain/Loss": 2.0670547485351562, "Pretrain/Loss (Raw)": 2.044313669204712, "Pretrain/Step": 2683, "Pretrain/Step Time": 8.422365805134177} +{"Pretrain/Learning Rate": 4.8409449768909335e-05, "Pretrain/Loss": 2.066585063934326, "Pretrain/Loss (Raw)": 2.0223793983459473, "Pretrain/Step": 2684, "Pretrain/Step Time": 8.425432657822967} +{"Pretrain/Learning Rate": 4.8407959406823435e-05, "Pretrain/Loss": 2.0685112476348877, "Pretrain/Loss (Raw)": 2.13273286819458, "Pretrain/Step": 2685, "Pretrain/Step Time": 8.417497538030148} +{"Pretrain/Learning Rate": 4.840646836978553e-05, "Pretrain/Loss": 2.0687203407287598, "Pretrain/Loss (Raw)": 2.010262966156006, "Pretrain/Step": 2686, "Pretrain/Step Time": 8.421711960807443} +{"Pretrain/Learning Rate": 4.840497665783861e-05, "Pretrain/Loss": 2.070669651031494, "Pretrain/Loss (Raw)": 2.172179937362671, "Pretrain/Step": 2687, "Pretrain/Step Time": 8.421424986794591} +{"Pretrain/Learning Rate": 4.840348427102568e-05, "Pretrain/Loss": 2.0697317123413086, "Pretrain/Loss (Raw)": 1.9371274709701538, "Pretrain/Step": 2688, "Pretrain/Step Time": 8.422724138945341} +{"Pretrain/Learning Rate": 4.8401991209389794e-05, "Pretrain/Loss": 2.0694198608398438, "Pretrain/Loss (Raw)": 1.9310294389724731, "Pretrain/Step": 2689, "Pretrain/Step Time": 8.422233128920197} +{"Pretrain/Learning Rate": 4.8400497472973986e-05, "Pretrain/Loss": 2.0700290203094482, "Pretrain/Loss (Raw)": 2.0519907474517822, "Pretrain/Step": 2690, "Pretrain/Step Time": 8.423065843060613} +{"Pretrain/Learning Rate": 4.839900306182132e-05, "Pretrain/Loss": 2.0700185298919678, "Pretrain/Loss (Raw)": 1.9795721769332886, "Pretrain/Step": 2691, "Pretrain/Step Time": 8.421474903821945} +{"Pretrain/Learning Rate": 4.83975079759749e-05, "Pretrain/Loss": 2.0712976455688477, "Pretrain/Loss (Raw)": 2.197275400161743, "Pretrain/Step": 2692, "Pretrain/Step Time": 8.420465487986803} +{"Pretrain/Learning Rate": 4.839601221547783e-05, "Pretrain/Loss": 2.071181535720825, "Pretrain/Loss (Raw)": 2.0564417839050293, "Pretrain/Step": 2693, "Pretrain/Step Time": 8.419274941086769} +{"Pretrain/Learning Rate": 4.839451578037324e-05, "Pretrain/Loss": 2.0709238052368164, "Pretrain/Loss (Raw)": 2.043161153793335, "Pretrain/Step": 2694, "Pretrain/Step Time": 8.419723063707352} +{"Pretrain/Learning Rate": 4.8393018670704294e-05, "Pretrain/Loss": 2.0680060386657715, "Pretrain/Loss (Raw)": 1.8169087171554565, "Pretrain/Step": 2695, "Pretrain/Step Time": 8.417898379266262} +{"Pretrain/Learning Rate": 4.839152088651413e-05, "Pretrain/Loss": 2.069175958633423, "Pretrain/Loss (Raw)": 2.172804117202759, "Pretrain/Step": 2696, "Pretrain/Step Time": 8.416278200224042} +{"Pretrain/Learning Rate": 4.839002242784596e-05, "Pretrain/Loss": 2.0701870918273926, "Pretrain/Loss (Raw)": 2.0564141273498535, "Pretrain/Step": 2697, "Pretrain/Step Time": 8.416151780635118} +{"Pretrain/Learning Rate": 4.838852329474297e-05, "Pretrain/Loss": 2.0722665786743164, "Pretrain/Loss (Raw)": 2.3487842082977295, "Pretrain/Step": 2698, "Pretrain/Step Time": 8.411538077518344} +{"Pretrain/Learning Rate": 4.838702348724841e-05, "Pretrain/Loss": 2.074349880218506, "Pretrain/Loss (Raw)": 2.1558902263641357, "Pretrain/Step": 2699, "Pretrain/Step Time": 8.41549651697278} +{"Pretrain/Learning Rate": 4.8385523005405516e-05, "Pretrain/Loss": 2.074894666671753, "Pretrain/Loss (Raw)": 1.9003108739852905, "Pretrain/Step": 2700, "Pretrain/Step Time": 8.419628100469708} +{"Pretrain/Learning Rate": 4.838402184925754e-05, "Pretrain/Loss": 2.07491135597229, "Pretrain/Loss (Raw)": 2.1837825775146484, "Pretrain/Step": 2701, "Pretrain/Step Time": 8.414193328469992} +{"Pretrain/Learning Rate": 4.8382520018847785e-05, "Pretrain/Loss": 2.0761523246765137, "Pretrain/Loss (Raw)": 2.297456979751587, "Pretrain/Step": 2702, "Pretrain/Step Time": 8.422382026910782} +{"Pretrain/Learning Rate": 4.838101751421955e-05, "Pretrain/Loss": 2.0731141567230225, "Pretrain/Loss (Raw)": 1.8275368213653564, "Pretrain/Step": 2703, "Pretrain/Step Time": 8.421382494270802} +{"Pretrain/Learning Rate": 4.837951433541617e-05, "Pretrain/Loss": 2.074923515319824, "Pretrain/Loss (Raw)": 2.2373008728027344, "Pretrain/Step": 2704, "Pretrain/Step Time": 8.426294034346938} +{"Pretrain/Learning Rate": 4.837801048248095e-05, "Pretrain/Loss": 2.0723235607147217, "Pretrain/Loss (Raw)": 1.953465223312378, "Pretrain/Step": 2705, "Pretrain/Step Time": 8.423864427953959} +{"Pretrain/Learning Rate": 4.83765059554573e-05, "Pretrain/Loss": 2.072242259979248, "Pretrain/Loss (Raw)": 1.9908812046051025, "Pretrain/Step": 2706, "Pretrain/Step Time": 8.422444205731153} +{"Pretrain/Learning Rate": 4.8375000754388566e-05, "Pretrain/Loss": 2.07300066947937, "Pretrain/Loss (Raw)": 2.1036274433135986, "Pretrain/Step": 2707, "Pretrain/Step Time": 8.42208594456315} +{"Pretrain/Learning Rate": 4.837349487931817e-05, "Pretrain/Loss": 2.0708184242248535, "Pretrain/Loss (Raw)": 1.9113996028900146, "Pretrain/Step": 2708, "Pretrain/Step Time": 8.424206905066967} +{"Pretrain/Learning Rate": 4.8371988330289525e-05, "Pretrain/Loss": 2.0733747482299805, "Pretrain/Loss (Raw)": 2.2000579833984375, "Pretrain/Step": 2709, "Pretrain/Step Time": 8.425137462094426} +{"Pretrain/Learning Rate": 4.837048110734607e-05, "Pretrain/Loss": 2.0783302783966064, "Pretrain/Loss (Raw)": 2.3275153636932373, "Pretrain/Step": 2710, "Pretrain/Step Time": 8.426673108711839} +{"Pretrain/Learning Rate": 4.836897321053127e-05, "Pretrain/Loss": 2.0782089233398438, "Pretrain/Loss (Raw)": 2.0655038356781006, "Pretrain/Step": 2711, "Pretrain/Step Time": 8.423488236963749} +{"Pretrain/Learning Rate": 4.83674646398886e-05, "Pretrain/Loss": 2.0774264335632324, "Pretrain/Loss (Raw)": 1.9143261909484863, "Pretrain/Step": 2712, "Pretrain/Step Time": 8.42476830072701} +{"Pretrain/Learning Rate": 4.8365955395461564e-05, "Pretrain/Loss": 2.077800750732422, "Pretrain/Loss (Raw)": 2.1272237300872803, "Pretrain/Step": 2713, "Pretrain/Step Time": 8.422979850322008} +{"Pretrain/Learning Rate": 4.836444547729367e-05, "Pretrain/Loss": 2.0780529975891113, "Pretrain/Loss (Raw)": 2.2446906566619873, "Pretrain/Step": 2714, "Pretrain/Step Time": 8.417379321530461} +{"Pretrain/Learning Rate": 4.836293488542847e-05, "Pretrain/Loss": 2.079011917114258, "Pretrain/Loss (Raw)": 2.0949137210845947, "Pretrain/Step": 2715, "Pretrain/Step Time": 8.416232185438275} +{"Pretrain/Learning Rate": 4.836142361990951e-05, "Pretrain/Loss": 2.0775439739227295, "Pretrain/Loss (Raw)": 2.0851409435272217, "Pretrain/Step": 2716, "Pretrain/Step Time": 8.414978699758649} +{"Pretrain/Learning Rate": 4.835991168078037e-05, "Pretrain/Loss": 2.0760018825531006, "Pretrain/Loss (Raw)": 1.9292547702789307, "Pretrain/Step": 2717, "Pretrain/Step Time": 8.419508332386613} +{"Pretrain/Learning Rate": 4.8358399068084635e-05, "Pretrain/Loss": 2.0745553970336914, "Pretrain/Loss (Raw)": 1.9930787086486816, "Pretrain/Step": 2718, "Pretrain/Step Time": 8.41619686037302} +{"Pretrain/Learning Rate": 4.8356885781865936e-05, "Pretrain/Loss": 2.075488567352295, "Pretrain/Loss (Raw)": 2.41530442237854, "Pretrain/Step": 2719, "Pretrain/Step Time": 8.422362629324198} +{"Pretrain/Learning Rate": 4.83553718221679e-05, "Pretrain/Loss": 2.0760016441345215, "Pretrain/Loss (Raw)": 2.1539881229400635, "Pretrain/Step": 2720, "Pretrain/Step Time": 8.422872569411993} +{"Pretrain/Learning Rate": 4.835385718903418e-05, "Pretrain/Loss": 2.074716091156006, "Pretrain/Loss (Raw)": 2.0787458419799805, "Pretrain/Step": 2721, "Pretrain/Step Time": 8.420982148498297} +{"Pretrain/Learning Rate": 4.8352341882508456e-05, "Pretrain/Loss": 2.074134349822998, "Pretrain/Loss (Raw)": 2.1551995277404785, "Pretrain/Step": 2722, "Pretrain/Step Time": 8.42334240861237} +{"Pretrain/Learning Rate": 4.835082590263441e-05, "Pretrain/Loss": 2.0724730491638184, "Pretrain/Loss (Raw)": 1.934937834739685, "Pretrain/Step": 2723, "Pretrain/Step Time": 8.422103701159358} +{"Pretrain/Learning Rate": 4.834930924945576e-05, "Pretrain/Loss": 2.0710947513580322, "Pretrain/Loss (Raw)": 2.38285493850708, "Pretrain/Step": 2724, "Pretrain/Step Time": 8.421428812667727} +{"Pretrain/Learning Rate": 4.834779192301625e-05, "Pretrain/Loss": 2.0686140060424805, "Pretrain/Loss (Raw)": 1.8972667455673218, "Pretrain/Step": 2725, "Pretrain/Step Time": 8.424280798062682} +{"Pretrain/Learning Rate": 4.834627392335961e-05, "Pretrain/Loss": 2.068131446838379, "Pretrain/Loss (Raw)": 1.949763298034668, "Pretrain/Step": 2726, "Pretrain/Step Time": 8.421514123678207} +{"Pretrain/Learning Rate": 4.834475525052961e-05, "Pretrain/Loss": 2.068103790283203, "Pretrain/Loss (Raw)": 1.9903839826583862, "Pretrain/Step": 2727, "Pretrain/Step Time": 8.420371999964118} +{"Pretrain/Learning Rate": 4.834323590457007e-05, "Pretrain/Loss": 2.067045211791992, "Pretrain/Loss (Raw)": 1.835047721862793, "Pretrain/Step": 2728, "Pretrain/Step Time": 8.419374112039804} +{"Pretrain/Learning Rate": 4.8341715885524766e-05, "Pretrain/Loss": 2.066263437271118, "Pretrain/Loss (Raw)": 2.061640501022339, "Pretrain/Step": 2729, "Pretrain/Step Time": 8.416086584329605} +{"Pretrain/Learning Rate": 4.8340195193437546e-05, "Pretrain/Loss": 2.0638558864593506, "Pretrain/Loss (Raw)": 1.7625162601470947, "Pretrain/Step": 2730, "Pretrain/Step Time": 8.41896446608007} +{"Pretrain/Learning Rate": 4.8338673828352243e-05, "Pretrain/Loss": 2.0635809898376465, "Pretrain/Loss (Raw)": 2.037938117980957, "Pretrain/Step": 2731, "Pretrain/Step Time": 8.418223826214671} +{"Pretrain/Learning Rate": 4.833715179031274e-05, "Pretrain/Loss": 2.0648677349090576, "Pretrain/Loss (Raw)": 2.2859814167022705, "Pretrain/Step": 2732, "Pretrain/Step Time": 8.419943807646632} +{"Pretrain/Learning Rate": 4.833562907936291e-05, "Pretrain/Loss": 2.065342903137207, "Pretrain/Loss (Raw)": 2.0833630561828613, "Pretrain/Step": 2733, "Pretrain/Step Time": 8.41935557872057} +{"Pretrain/Learning Rate": 4.833410569554667e-05, "Pretrain/Loss": 2.066521167755127, "Pretrain/Loss (Raw)": 2.0546274185180664, "Pretrain/Step": 2734, "Pretrain/Step Time": 8.42093999311328} +{"Pretrain/Learning Rate": 4.833258163890794e-05, "Pretrain/Loss": 2.0655903816223145, "Pretrain/Loss (Raw)": 1.9048963785171509, "Pretrain/Step": 2735, "Pretrain/Step Time": 8.422457775101066} +{"Pretrain/Learning Rate": 4.833105690949067e-05, "Pretrain/Loss": 2.064451217651367, "Pretrain/Loss (Raw)": 2.0347888469696045, "Pretrain/Step": 2736, "Pretrain/Step Time": 8.42105002142489} +{"Pretrain/Learning Rate": 4.8329531507338824e-05, "Pretrain/Loss": 2.0642006397247314, "Pretrain/Loss (Raw)": 1.916946530342102, "Pretrain/Step": 2737, "Pretrain/Step Time": 8.41804701462388} +{"Pretrain/Learning Rate": 4.8328005432496374e-05, "Pretrain/Loss": 2.0665974617004395, "Pretrain/Loss (Raw)": 2.399137020111084, "Pretrain/Step": 2738, "Pretrain/Step Time": 8.42120879329741} +{"Pretrain/Learning Rate": 4.8326478685007334e-05, "Pretrain/Loss": 2.0663633346557617, "Pretrain/Loss (Raw)": 1.9997901916503906, "Pretrain/Step": 2739, "Pretrain/Step Time": 8.417738607153296} +{"Pretrain/Learning Rate": 4.832495126491573e-05, "Pretrain/Loss": 2.066053628921509, "Pretrain/Loss (Raw)": 2.1685261726379395, "Pretrain/Step": 2740, "Pretrain/Step Time": 8.415881602093577} +{"Pretrain/Learning Rate": 4.83234231722656e-05, "Pretrain/Loss": 2.066901683807373, "Pretrain/Loss (Raw)": 2.01062273979187, "Pretrain/Step": 2741, "Pretrain/Step Time": 8.415905328467488} +{"Pretrain/Learning Rate": 4.8321894407101e-05, "Pretrain/Loss": 2.0665245056152344, "Pretrain/Loss (Raw)": 1.964324712753296, "Pretrain/Step": 2742, "Pretrain/Step Time": 8.414121059700847} +{"Pretrain/Learning Rate": 4.832036496946602e-05, "Pretrain/Loss": 2.066591501235962, "Pretrain/Loss (Raw)": 2.1624581813812256, "Pretrain/Step": 2743, "Pretrain/Step Time": 8.411611888557673} +{"Pretrain/Learning Rate": 4.8318834859404746e-05, "Pretrain/Loss": 2.0668673515319824, "Pretrain/Loss (Raw)": 2.050516128540039, "Pretrain/Step": 2744, "Pretrain/Step Time": 8.40681585855782} +{"Pretrain/Learning Rate": 4.831730407696132e-05, "Pretrain/Loss": 2.066537618637085, "Pretrain/Loss (Raw)": 2.0039873123168945, "Pretrain/Step": 2745, "Pretrain/Step Time": 8.41094284132123} +{"Pretrain/Learning Rate": 4.8315772622179865e-05, "Pretrain/Loss": 2.0663161277770996, "Pretrain/Loss (Raw)": 1.995003581047058, "Pretrain/Step": 2746, "Pretrain/Step Time": 8.416393831372261} +{"Pretrain/Learning Rate": 4.831424049510454e-05, "Pretrain/Loss": 2.068648099899292, "Pretrain/Loss (Raw)": 2.0310070514678955, "Pretrain/Step": 2747, "Pretrain/Step Time": 8.41044807061553} +{"Pretrain/Learning Rate": 4.831270769577953e-05, "Pretrain/Loss": 2.0685646533966064, "Pretrain/Loss (Raw)": 2.155778646469116, "Pretrain/Step": 2748, "Pretrain/Step Time": 8.408070588484406} +{"Pretrain/Learning Rate": 4.831117422424902e-05, "Pretrain/Loss": 2.0714917182922363, "Pretrain/Loss (Raw)": 2.305280923843384, "Pretrain/Step": 2749, "Pretrain/Step Time": 8.412070905789733} +{"Pretrain/Learning Rate": 4.830964008055724e-05, "Pretrain/Loss": 2.074481964111328, "Pretrain/Loss (Raw)": 2.3127145767211914, "Pretrain/Step": 2750, "Pretrain/Step Time": 8.41031058691442} +{"Pretrain/Learning Rate": 4.830810526474843e-05, "Pretrain/Loss": 2.0765035152435303, "Pretrain/Loss (Raw)": 2.133484363555908, "Pretrain/Step": 2751, "Pretrain/Step Time": 8.413495877757668} +{"Pretrain/Learning Rate": 4.830656977686682e-05, "Pretrain/Loss": 2.0765469074249268, "Pretrain/Loss (Raw)": 2.043170928955078, "Pretrain/Step": 2752, "Pretrain/Step Time": 8.414549952372909} +{"Pretrain/Learning Rate": 4.8305033616956704e-05, "Pretrain/Loss": 2.074615955352783, "Pretrain/Loss (Raw)": 2.11875057220459, "Pretrain/Step": 2753, "Pretrain/Step Time": 8.413683811202645} +{"Pretrain/Learning Rate": 4.830349678506238e-05, "Pretrain/Loss": 2.07452654838562, "Pretrain/Loss (Raw)": 2.1194231510162354, "Pretrain/Step": 2754, "Pretrain/Step Time": 8.414947468787432} +{"Pretrain/Learning Rate": 4.8301959281228146e-05, "Pretrain/Loss": 2.074312448501587, "Pretrain/Loss (Raw)": 2.1108994483947754, "Pretrain/Step": 2755, "Pretrain/Step Time": 8.415201757103205} +{"Pretrain/Learning Rate": 4.8300421105498353e-05, "Pretrain/Loss": 2.0734267234802246, "Pretrain/Loss (Raw)": 1.9575817584991455, "Pretrain/Step": 2756, "Pretrain/Step Time": 8.415320608764887} +{"Pretrain/Learning Rate": 4.8298882257917335e-05, "Pretrain/Loss": 2.073273181915283, "Pretrain/Loss (Raw)": 2.131338357925415, "Pretrain/Step": 2757, "Pretrain/Step Time": 8.414121832698584} +{"Pretrain/Learning Rate": 4.8297342738529474e-05, "Pretrain/Loss": 2.0721912384033203, "Pretrain/Loss (Raw)": 2.0848476886749268, "Pretrain/Step": 2758, "Pretrain/Step Time": 8.415478091686964} +{"Pretrain/Learning Rate": 4.829580254737916e-05, "Pretrain/Loss": 2.0738368034362793, "Pretrain/Loss (Raw)": 2.2560391426086426, "Pretrain/Step": 2759, "Pretrain/Step Time": 8.412863548845053} +{"Pretrain/Learning Rate": 4.82942616845108e-05, "Pretrain/Loss": 2.0731148719787598, "Pretrain/Loss (Raw)": 2.115093231201172, "Pretrain/Step": 2760, "Pretrain/Step Time": 8.411474151536822} +{"Pretrain/Learning Rate": 4.8292720149968824e-05, "Pretrain/Loss": 2.071524143218994, "Pretrain/Loss (Raw)": 1.9617459774017334, "Pretrain/Step": 2761, "Pretrain/Step Time": 8.410720417276025} +{"Pretrain/Learning Rate": 4.8291177943797686e-05, "Pretrain/Loss": 2.0720062255859375, "Pretrain/Loss (Raw)": 1.998104453086853, "Pretrain/Step": 2762, "Pretrain/Step Time": 8.414846736937761} +{"Pretrain/Learning Rate": 4.828963506604185e-05, "Pretrain/Loss": 2.072244644165039, "Pretrain/Loss (Raw)": 2.1142737865448, "Pretrain/Step": 2763, "Pretrain/Step Time": 8.414689904078841} +{"Pretrain/Learning Rate": 4.8288091516745804e-05, "Pretrain/Loss": 2.072208881378174, "Pretrain/Loss (Raw)": 1.9110264778137207, "Pretrain/Step": 2764, "Pretrain/Step Time": 8.41582670621574} +{"Pretrain/Learning Rate": 4.828654729595405e-05, "Pretrain/Loss": 2.075941324234009, "Pretrain/Loss (Raw)": 2.471628189086914, "Pretrain/Step": 2765, "Pretrain/Step Time": 8.416711641475558} +{"Pretrain/Learning Rate": 4.828500240371113e-05, "Pretrain/Loss": 2.0767109394073486, "Pretrain/Loss (Raw)": 2.1021554470062256, "Pretrain/Step": 2766, "Pretrain/Step Time": 8.41790571436286} +{"Pretrain/Learning Rate": 4.828345684006158e-05, "Pretrain/Loss": 2.074833631515503, "Pretrain/Loss (Raw)": 1.9105286598205566, "Pretrain/Step": 2767, "Pretrain/Step Time": 8.422696970403194} +{"Pretrain/Learning Rate": 4.828191060504997e-05, "Pretrain/Loss": 2.0777947902679443, "Pretrain/Loss (Raw)": 2.4935696125030518, "Pretrain/Step": 2768, "Pretrain/Step Time": 8.425881756469607} +{"Pretrain/Learning Rate": 4.828036369872087e-05, "Pretrain/Loss": 2.0790860652923584, "Pretrain/Loss (Raw)": 2.042991876602173, "Pretrain/Step": 2769, "Pretrain/Step Time": 8.419585414230824} +{"Pretrain/Learning Rate": 4.8278816121118894e-05, "Pretrain/Loss": 2.082242012023926, "Pretrain/Loss (Raw)": 2.323392152786255, "Pretrain/Step": 2770, "Pretrain/Step Time": 8.422327294945717} +{"Pretrain/Learning Rate": 4.827726787228868e-05, "Pretrain/Loss": 2.0837032794952393, "Pretrain/Loss (Raw)": 2.111569404602051, "Pretrain/Step": 2771, "Pretrain/Step Time": 8.422728514298797} +{"Pretrain/Learning Rate": 4.827571895227484e-05, "Pretrain/Loss": 2.086639881134033, "Pretrain/Loss (Raw)": 2.458298683166504, "Pretrain/Step": 2772, "Pretrain/Step Time": 8.422989498823881} +{"Pretrain/Learning Rate": 4.827416936112206e-05, "Pretrain/Loss": 2.0881426334381104, "Pretrain/Loss (Raw)": 2.0051114559173584, "Pretrain/Step": 2773, "Pretrain/Step Time": 8.424114223569632} +{"Pretrain/Learning Rate": 4.827261909887502e-05, "Pretrain/Loss": 2.0880727767944336, "Pretrain/Loss (Raw)": 2.0044078826904297, "Pretrain/Step": 2774, "Pretrain/Step Time": 8.419462643563747} +{"Pretrain/Learning Rate": 4.8271068165578406e-05, "Pretrain/Loss": 2.086982250213623, "Pretrain/Loss (Raw)": 1.9791146516799927, "Pretrain/Step": 2775, "Pretrain/Step Time": 8.417909298092127} +{"Pretrain/Learning Rate": 4.826951656127694e-05, "Pretrain/Loss": 2.087353229522705, "Pretrain/Loss (Raw)": 2.1418261528015137, "Pretrain/Step": 2776, "Pretrain/Step Time": 8.414959931746125} +{"Pretrain/Learning Rate": 4.826796428601538e-05, "Pretrain/Loss": 2.0880422592163086, "Pretrain/Loss (Raw)": 2.1386406421661377, "Pretrain/Step": 2777, "Pretrain/Step Time": 8.411875328049064} +{"Pretrain/Learning Rate": 4.826641133983847e-05, "Pretrain/Loss": 2.090085744857788, "Pretrain/Loss (Raw)": 2.106917142868042, "Pretrain/Step": 2778, "Pretrain/Step Time": 8.41408327780664} +{"Pretrain/Learning Rate": 4.826485772279098e-05, "Pretrain/Loss": 2.090580940246582, "Pretrain/Loss (Raw)": 2.028573751449585, "Pretrain/Step": 2779, "Pretrain/Step Time": 8.41398367099464} +{"Pretrain/Learning Rate": 4.826330343491773e-05, "Pretrain/Loss": 2.0912914276123047, "Pretrain/Loss (Raw)": 2.0263845920562744, "Pretrain/Step": 2780, "Pretrain/Step Time": 8.414869744330645} +{"Pretrain/Learning Rate": 4.826174847626352e-05, "Pretrain/Loss": 2.091989517211914, "Pretrain/Loss (Raw)": 2.1691887378692627, "Pretrain/Step": 2781, "Pretrain/Step Time": 8.410714650526643} +{"Pretrain/Learning Rate": 4.82601928468732e-05, "Pretrain/Loss": 2.093047618865967, "Pretrain/Loss (Raw)": 2.0684354305267334, "Pretrain/Step": 2782, "Pretrain/Step Time": 8.417177250608802} +{"Pretrain/Learning Rate": 4.82586365467916e-05, "Pretrain/Loss": 2.092144012451172, "Pretrain/Loss (Raw)": 2.051286220550537, "Pretrain/Step": 2783, "Pretrain/Step Time": 8.412814490497112} +{"Pretrain/Learning Rate": 4.825707957606362e-05, "Pretrain/Loss": 2.092846632003784, "Pretrain/Loss (Raw)": 2.019562244415283, "Pretrain/Step": 2784, "Pretrain/Step Time": 8.411249950528145} +{"Pretrain/Learning Rate": 4.825552193473415e-05, "Pretrain/Loss": 2.095130681991577, "Pretrain/Loss (Raw)": 2.244201898574829, "Pretrain/Step": 2785, "Pretrain/Step Time": 8.403668992221355} +{"Pretrain/Learning Rate": 4.8253963622848095e-05, "Pretrain/Loss": 2.0993356704711914, "Pretrain/Loss (Raw)": 2.420366048812866, "Pretrain/Step": 2786, "Pretrain/Step Time": 8.411496991291642} +{"Pretrain/Learning Rate": 4.82524046404504e-05, "Pretrain/Loss": 2.101191520690918, "Pretrain/Loss (Raw)": 2.303009510040283, "Pretrain/Step": 2787, "Pretrain/Step Time": 8.40871232189238} +{"Pretrain/Learning Rate": 4.8250844987586e-05, "Pretrain/Loss": 2.1008687019348145, "Pretrain/Loss (Raw)": 2.211005210876465, "Pretrain/Step": 2788, "Pretrain/Step Time": 8.406670263037086} +{"Pretrain/Learning Rate": 4.8249284664299875e-05, "Pretrain/Loss": 2.103893518447876, "Pretrain/Loss (Raw)": 2.0974671840667725, "Pretrain/Step": 2789, "Pretrain/Step Time": 8.408617217093706} +{"Pretrain/Learning Rate": 4.8247723670637027e-05, "Pretrain/Loss": 2.103254556655884, "Pretrain/Loss (Raw)": 2.180147886276245, "Pretrain/Step": 2790, "Pretrain/Step Time": 8.409339310601354} +{"Pretrain/Learning Rate": 4.8246162006642434e-05, "Pretrain/Loss": 2.1040775775909424, "Pretrain/Loss (Raw)": 2.2017111778259277, "Pretrain/Step": 2791, "Pretrain/Step Time": 8.408848168328404} +{"Pretrain/Learning Rate": 4.8244599672361167e-05, "Pretrain/Loss": 2.104292631149292, "Pretrain/Loss (Raw)": 2.0694358348846436, "Pretrain/Step": 2792, "Pretrain/Step Time": 8.405728280544281} +{"Pretrain/Learning Rate": 4.8243036667838246e-05, "Pretrain/Loss": 2.1034843921661377, "Pretrain/Loss (Raw)": 2.2092034816741943, "Pretrain/Step": 2793, "Pretrain/Step Time": 8.40309638902545} +{"Pretrain/Learning Rate": 4.8241472993118753e-05, "Pretrain/Loss": 2.1048362255096436, "Pretrain/Loss (Raw)": 2.242515802383423, "Pretrain/Step": 2794, "Pretrain/Step Time": 8.403299827128649} +{"Pretrain/Learning Rate": 4.8239908648247766e-05, "Pretrain/Loss": 2.1027963161468506, "Pretrain/Loss (Raw)": 1.8102343082427979, "Pretrain/Step": 2795, "Pretrain/Step Time": 8.403875498101115} +{"Pretrain/Learning Rate": 4.82383436332704e-05, "Pretrain/Loss": 2.1008942127227783, "Pretrain/Loss (Raw)": 1.9281885623931885, "Pretrain/Step": 2796, "Pretrain/Step Time": 8.401757100597024} +{"Pretrain/Learning Rate": 4.823677794823177e-05, "Pretrain/Loss": 2.1018688678741455, "Pretrain/Loss (Raw)": 2.243365526199341, "Pretrain/Step": 2797, "Pretrain/Step Time": 8.400854639708996} +{"Pretrain/Learning Rate": 4.8235211593177036e-05, "Pretrain/Loss": 2.1012473106384277, "Pretrain/Loss (Raw)": 2.036968231201172, "Pretrain/Step": 2798, "Pretrain/Step Time": 8.403185399249196} +{"Pretrain/Learning Rate": 4.823364456815135e-05, "Pretrain/Loss": 2.1010901927948, "Pretrain/Loss (Raw)": 2.22493052482605, "Pretrain/Step": 2799, "Pretrain/Step Time": 8.401900447905064} +{"Pretrain/Learning Rate": 4.8232076873199905e-05, "Pretrain/Loss": 2.1031951904296875, "Pretrain/Loss (Raw)": 2.4807403087615967, "Pretrain/Step": 2800, "Pretrain/Step Time": 8.402849983423948} +{"Pretrain/Learning Rate": 4.82305085083679e-05, "Pretrain/Loss": 2.104382038116455, "Pretrain/Loss (Raw)": 2.2319023609161377, "Pretrain/Step": 2801, "Pretrain/Step Time": 8.405520297586918} +{"Pretrain/Learning Rate": 4.822893947370056e-05, "Pretrain/Loss": 2.102107524871826, "Pretrain/Loss (Raw)": 1.8552473783493042, "Pretrain/Step": 2802, "Pretrain/Step Time": 8.403750084340572} +{"Pretrain/Learning Rate": 4.822736976924312e-05, "Pretrain/Loss": 2.102889060974121, "Pretrain/Loss (Raw)": 2.167466878890991, "Pretrain/Step": 2803, "Pretrain/Step Time": 8.401970433071256} +{"Pretrain/Learning Rate": 4.822579939504086e-05, "Pretrain/Loss": 2.104160785675049, "Pretrain/Loss (Raw)": 2.2367913722991943, "Pretrain/Step": 2804, "Pretrain/Step Time": 8.402641436085105} +{"Pretrain/Learning Rate": 4.8224228351139034e-05, "Pretrain/Loss": 2.102874279022217, "Pretrain/Loss (Raw)": 2.0012781620025635, "Pretrain/Step": 2805, "Pretrain/Step Time": 8.404002234339714} +{"Pretrain/Learning Rate": 4.8222656637582965e-05, "Pretrain/Loss": 2.10132098197937, "Pretrain/Loss (Raw)": 2.196840524673462, "Pretrain/Step": 2806, "Pretrain/Step Time": 8.402545502409339} +{"Pretrain/Learning Rate": 4.822108425441796e-05, "Pretrain/Loss": 2.099949359893799, "Pretrain/Loss (Raw)": 1.946465015411377, "Pretrain/Step": 2807, "Pretrain/Step Time": 8.401659658178687} +{"Pretrain/Learning Rate": 4.821951120168936e-05, "Pretrain/Loss": 2.09995698928833, "Pretrain/Loss (Raw)": 2.1081748008728027, "Pretrain/Step": 2808, "Pretrain/Step Time": 8.403696222230792} +{"Pretrain/Learning Rate": 4.821793747944252e-05, "Pretrain/Loss": 2.10046124458313, "Pretrain/Loss (Raw)": 2.2408933639526367, "Pretrain/Step": 2809, "Pretrain/Step Time": 8.401643382385373} +{"Pretrain/Learning Rate": 4.821636308772282e-05, "Pretrain/Loss": 2.099611282348633, "Pretrain/Loss (Raw)": 2.140260934829712, "Pretrain/Step": 2810, "Pretrain/Step Time": 8.398906217887998} +{"Pretrain/Learning Rate": 4.8214788026575664e-05, "Pretrain/Loss": 2.0995705127716064, "Pretrain/Loss (Raw)": 2.039085626602173, "Pretrain/Step": 2811, "Pretrain/Step Time": 8.398163152858615} +{"Pretrain/Learning Rate": 4.821321229604645e-05, "Pretrain/Loss": 2.099775552749634, "Pretrain/Loss (Raw)": 2.04862117767334, "Pretrain/Step": 2812, "Pretrain/Step Time": 8.397064873948693} +{"Pretrain/Learning Rate": 4.821163589618063e-05, "Pretrain/Loss": 2.098386287689209, "Pretrain/Loss (Raw)": 1.954924464225769, "Pretrain/Step": 2813, "Pretrain/Step Time": 8.403226604685187} +{"Pretrain/Learning Rate": 4.821005882702365e-05, "Pretrain/Loss": 2.097561836242676, "Pretrain/Loss (Raw)": 1.9047062397003174, "Pretrain/Step": 2814, "Pretrain/Step Time": 8.401397921144962} +{"Pretrain/Learning Rate": 4.820848108862099e-05, "Pretrain/Loss": 2.0967912673950195, "Pretrain/Loss (Raw)": 2.073563575744629, "Pretrain/Step": 2815, "Pretrain/Step Time": 8.39985877647996} +{"Pretrain/Learning Rate": 4.8206902681018135e-05, "Pretrain/Loss": 2.098971366882324, "Pretrain/Loss (Raw)": 2.2161967754364014, "Pretrain/Step": 2816, "Pretrain/Step Time": 8.399839343503118} +{"Pretrain/Learning Rate": 4.82053236042606e-05, "Pretrain/Loss": 2.1012423038482666, "Pretrain/Loss (Raw)": 2.221708059310913, "Pretrain/Step": 2817, "Pretrain/Step Time": 8.399726148694754} +{"Pretrain/Learning Rate": 4.820374385839392e-05, "Pretrain/Loss": 2.102966785430908, "Pretrain/Loss (Raw)": 2.272726058959961, "Pretrain/Step": 2818, "Pretrain/Step Time": 8.408169075846672} +{"Pretrain/Learning Rate": 4.820216344346364e-05, "Pretrain/Loss": 2.104146957397461, "Pretrain/Loss (Raw)": 2.1305975914001465, "Pretrain/Step": 2819, "Pretrain/Step Time": 8.405535468831658} +{"Pretrain/Learning Rate": 4.820058235951534e-05, "Pretrain/Loss": 2.1034092903137207, "Pretrain/Loss (Raw)": 2.102902889251709, "Pretrain/Step": 2820, "Pretrain/Step Time": 8.403438713401556} +{"Pretrain/Learning Rate": 4.81990006065946e-05, "Pretrain/Loss": 2.1024789810180664, "Pretrain/Loss (Raw)": 1.9373388290405273, "Pretrain/Step": 2821, "Pretrain/Step Time": 8.405204696580768} +{"Pretrain/Learning Rate": 4.819741818474704e-05, "Pretrain/Loss": 2.101673126220703, "Pretrain/Loss (Raw)": 1.9399919509887695, "Pretrain/Step": 2822, "Pretrain/Step Time": 8.40968194231391} +{"Pretrain/Learning Rate": 4.819583509401826e-05, "Pretrain/Loss": 2.1044602394104004, "Pretrain/Loss (Raw)": 2.1736671924591064, "Pretrain/Step": 2823, "Pretrain/Step Time": 8.407069489359856} +{"Pretrain/Learning Rate": 4.819425133445394e-05, "Pretrain/Loss": 2.101815938949585, "Pretrain/Loss (Raw)": 1.8343281745910645, "Pretrain/Step": 2824, "Pretrain/Step Time": 8.408580090850592} +{"Pretrain/Learning Rate": 4.819266690609973e-05, "Pretrain/Loss": 2.1007936000823975, "Pretrain/Loss (Raw)": 1.925582766532898, "Pretrain/Step": 2825, "Pretrain/Step Time": 8.404344204813242} +{"Pretrain/Learning Rate": 4.819108180900132e-05, "Pretrain/Loss": 2.099576950073242, "Pretrain/Loss (Raw)": 2.1930227279663086, "Pretrain/Step": 2826, "Pretrain/Step Time": 8.408778408542275} +{"Pretrain/Learning Rate": 4.818949604320442e-05, "Pretrain/Loss": 2.0977566242218018, "Pretrain/Loss (Raw)": 1.9228802919387817, "Pretrain/Step": 2827, "Pretrain/Step Time": 8.4052658341825} +{"Pretrain/Learning Rate": 4.8187909608754744e-05, "Pretrain/Loss": 2.1007285118103027, "Pretrain/Loss (Raw)": 2.2807531356811523, "Pretrain/Step": 2828, "Pretrain/Step Time": 8.402468418702483} +{"Pretrain/Learning Rate": 4.818632250569804e-05, "Pretrain/Loss": 2.100376605987549, "Pretrain/Loss (Raw)": 2.1387500762939453, "Pretrain/Step": 2829, "Pretrain/Step Time": 8.402730792760849} +{"Pretrain/Learning Rate": 4.818473473408007e-05, "Pretrain/Loss": 2.0979981422424316, "Pretrain/Loss (Raw)": 1.9929795265197754, "Pretrain/Step": 2830, "Pretrain/Step Time": 8.404825111851096} +{"Pretrain/Learning Rate": 4.8183146293946625e-05, "Pretrain/Loss": 2.0972070693969727, "Pretrain/Loss (Raw)": 1.7262787818908691, "Pretrain/Step": 2831, "Pretrain/Step Time": 8.404190255329013} +{"Pretrain/Learning Rate": 4.8181557185343496e-05, "Pretrain/Loss": 2.0949978828430176, "Pretrain/Loss (Raw)": 1.9545459747314453, "Pretrain/Step": 2832, "Pretrain/Step Time": 8.401547566056252} +{"Pretrain/Learning Rate": 4.817996740831651e-05, "Pretrain/Loss": 2.0965638160705566, "Pretrain/Loss (Raw)": 2.15389347076416, "Pretrain/Step": 2833, "Pretrain/Step Time": 8.405622113496065} +{"Pretrain/Learning Rate": 4.81783769629115e-05, "Pretrain/Loss": 2.0961251258850098, "Pretrain/Loss (Raw)": 1.9347137212753296, "Pretrain/Step": 2834, "Pretrain/Step Time": 8.405063834041357} +{"Pretrain/Learning Rate": 4.8176785849174336e-05, "Pretrain/Loss": 2.0964646339416504, "Pretrain/Loss (Raw)": 2.147104501724243, "Pretrain/Step": 2835, "Pretrain/Step Time": 8.402422308921814} +{"Pretrain/Learning Rate": 4.8175194067150884e-05, "Pretrain/Loss": 2.0988998413085938, "Pretrain/Loss (Raw)": 2.223083257675171, "Pretrain/Step": 2836, "Pretrain/Step Time": 8.3979572057724} +{"Pretrain/Learning Rate": 4.817360161688705e-05, "Pretrain/Loss": 2.098452568054199, "Pretrain/Loss (Raw)": 2.1428425312042236, "Pretrain/Step": 2837, "Pretrain/Step Time": 8.39864906668663} +{"Pretrain/Learning Rate": 4.817200849842875e-05, "Pretrain/Loss": 2.09780216217041, "Pretrain/Loss (Raw)": 2.244241237640381, "Pretrain/Step": 2838, "Pretrain/Step Time": 8.39839437045157} +{"Pretrain/Learning Rate": 4.817041471182192e-05, "Pretrain/Loss": 2.098503828048706, "Pretrain/Loss (Raw)": 2.1553120613098145, "Pretrain/Step": 2839, "Pretrain/Step Time": 8.399472389370203} +{"Pretrain/Learning Rate": 4.816882025711252e-05, "Pretrain/Loss": 2.097325563430786, "Pretrain/Loss (Raw)": 1.763502836227417, "Pretrain/Step": 2840, "Pretrain/Step Time": 8.396744202822447} +{"Pretrain/Learning Rate": 4.816722513434652e-05, "Pretrain/Loss": 2.0969181060791016, "Pretrain/Loss (Raw)": 2.075108528137207, "Pretrain/Step": 2841, "Pretrain/Step Time": 8.398335579782724} +{"Pretrain/Learning Rate": 4.8165629343569904e-05, "Pretrain/Loss": 2.095250129699707, "Pretrain/Loss (Raw)": 2.031167984008789, "Pretrain/Step": 2842, "Pretrain/Step Time": 8.399517562240362} +{"Pretrain/Learning Rate": 4.816403288482871e-05, "Pretrain/Loss": 2.0942163467407227, "Pretrain/Loss (Raw)": 1.9625681638717651, "Pretrain/Step": 2843, "Pretrain/Step Time": 8.40218649059534} +{"Pretrain/Learning Rate": 4.816243575816895e-05, "Pretrain/Loss": 2.0944132804870605, "Pretrain/Loss (Raw)": 2.1103579998016357, "Pretrain/Step": 2844, "Pretrain/Step Time": 8.403382997959852} +{"Pretrain/Learning Rate": 4.816083796363669e-05, "Pretrain/Loss": 2.09515643119812, "Pretrain/Loss (Raw)": 2.024416923522949, "Pretrain/Step": 2845, "Pretrain/Step Time": 8.400426361709833} +{"Pretrain/Learning Rate": 4.815923950127799e-05, "Pretrain/Loss": 2.095161199569702, "Pretrain/Loss (Raw)": 1.9936684370040894, "Pretrain/Step": 2846, "Pretrain/Step Time": 8.401960281655192} +{"Pretrain/Learning Rate": 4.815764037113895e-05, "Pretrain/Loss": 2.092597007751465, "Pretrain/Loss (Raw)": 2.0870895385742188, "Pretrain/Step": 2847, "Pretrain/Step Time": 8.401704812422395} +{"Pretrain/Learning Rate": 4.815604057326567e-05, "Pretrain/Loss": 2.093487501144409, "Pretrain/Loss (Raw)": 2.2679603099823, "Pretrain/Step": 2848, "Pretrain/Step Time": 8.401255369186401} +{"Pretrain/Learning Rate": 4.815444010770429e-05, "Pretrain/Loss": 2.092895984649658, "Pretrain/Loss (Raw)": 2.0030250549316406, "Pretrain/Step": 2849, "Pretrain/Step Time": 8.405411900952458} +{"Pretrain/Learning Rate": 4.815283897450094e-05, "Pretrain/Loss": 2.0916967391967773, "Pretrain/Loss (Raw)": 2.001723527908325, "Pretrain/Step": 2850, "Pretrain/Step Time": 8.401722298935056} +{"Pretrain/Learning Rate": 4.815123717370181e-05, "Pretrain/Loss": 2.091379165649414, "Pretrain/Loss (Raw)": 1.8942673206329346, "Pretrain/Step": 2851, "Pretrain/Step Time": 8.40698079019785} +{"Pretrain/Learning Rate": 4.814963470535308e-05, "Pretrain/Loss": 2.0892043113708496, "Pretrain/Loss (Raw)": 2.104473829269409, "Pretrain/Step": 2852, "Pretrain/Step Time": 8.404840156435966} +{"Pretrain/Learning Rate": 4.814803156950094e-05, "Pretrain/Loss": 2.0904202461242676, "Pretrain/Loss (Raw)": 2.05293345451355, "Pretrain/Step": 2853, "Pretrain/Step Time": 8.404592171311378} +{"Pretrain/Learning Rate": 4.814642776619163e-05, "Pretrain/Loss": 2.0912721157073975, "Pretrain/Loss (Raw)": 2.058763265609741, "Pretrain/Step": 2854, "Pretrain/Step Time": 8.404874397441745} +{"Pretrain/Learning Rate": 4.81448232954714e-05, "Pretrain/Loss": 2.091172695159912, "Pretrain/Loss (Raw)": 1.9776676893234253, "Pretrain/Step": 2855, "Pretrain/Step Time": 8.406675750389695} +{"Pretrain/Learning Rate": 4.814321815738651e-05, "Pretrain/Loss": 2.094123363494873, "Pretrain/Loss (Raw)": 2.2127058506011963, "Pretrain/Step": 2856, "Pretrain/Step Time": 8.40781675465405} +{"Pretrain/Learning Rate": 4.8141612351983226e-05, "Pretrain/Loss": 2.093093156814575, "Pretrain/Loss (Raw)": 1.929821491241455, "Pretrain/Step": 2857, "Pretrain/Step Time": 8.408452974632382} +{"Pretrain/Learning Rate": 4.814000587930787e-05, "Pretrain/Loss": 2.0962045192718506, "Pretrain/Loss (Raw)": 2.1607534885406494, "Pretrain/Step": 2858, "Pretrain/Step Time": 8.402600588276982} +{"Pretrain/Learning Rate": 4.813839873940675e-05, "Pretrain/Loss": 2.0974228382110596, "Pretrain/Loss (Raw)": 2.1938726902008057, "Pretrain/Step": 2859, "Pretrain/Step Time": 8.404183538630605} +{"Pretrain/Learning Rate": 4.8136790932326226e-05, "Pretrain/Loss": 2.0955092906951904, "Pretrain/Loss (Raw)": 2.04105544090271, "Pretrain/Step": 2860, "Pretrain/Step Time": 8.403217934072018} +{"Pretrain/Learning Rate": 4.8135182458112644e-05, "Pretrain/Loss": 2.097195863723755, "Pretrain/Loss (Raw)": 2.2992725372314453, "Pretrain/Step": 2861, "Pretrain/Step Time": 8.406034141778946} +{"Pretrain/Learning Rate": 4.813357331681238e-05, "Pretrain/Loss": 2.096461772918701, "Pretrain/Loss (Raw)": 1.960631012916565, "Pretrain/Step": 2862, "Pretrain/Step Time": 8.405131278559566} +{"Pretrain/Learning Rate": 4.8131963508471843e-05, "Pretrain/Loss": 2.0968573093414307, "Pretrain/Loss (Raw)": 1.9555226564407349, "Pretrain/Step": 2863, "Pretrain/Step Time": 8.3996812235564} +{"Pretrain/Learning Rate": 4.813035303313744e-05, "Pretrain/Loss": 2.097245216369629, "Pretrain/Loss (Raw)": 2.084425449371338, "Pretrain/Step": 2864, "Pretrain/Step Time": 8.399577159434557} +{"Pretrain/Learning Rate": 4.812874189085561e-05, "Pretrain/Loss": 2.0992002487182617, "Pretrain/Loss (Raw)": 2.167210102081299, "Pretrain/Step": 2865, "Pretrain/Step Time": 8.404246389865875} +{"Pretrain/Learning Rate": 4.8127130081672825e-05, "Pretrain/Loss": 2.0954437255859375, "Pretrain/Loss (Raw)": 1.9183132648468018, "Pretrain/Step": 2866, "Pretrain/Step Time": 8.399447431787848} +{"Pretrain/Learning Rate": 4.812551760563554e-05, "Pretrain/Loss": 2.095512866973877, "Pretrain/Loss (Raw)": 2.008613109588623, "Pretrain/Step": 2867, "Pretrain/Step Time": 8.403639368712902} +{"Pretrain/Learning Rate": 4.8123904462790253e-05, "Pretrain/Loss": 2.093256950378418, "Pretrain/Loss (Raw)": 1.879759669303894, "Pretrain/Step": 2868, "Pretrain/Step Time": 8.40576084703207} +{"Pretrain/Learning Rate": 4.8122290653183485e-05, "Pretrain/Loss": 2.092371940612793, "Pretrain/Loss (Raw)": 1.8973745107650757, "Pretrain/Step": 2869, "Pretrain/Step Time": 8.403389152139425} +{"Pretrain/Learning Rate": 4.812067617686177e-05, "Pretrain/Loss": 2.0912561416625977, "Pretrain/Loss (Raw)": 1.8214689493179321, "Pretrain/Step": 2870, "Pretrain/Step Time": 8.404832985252142} +{"Pretrain/Learning Rate": 4.8119061033871646e-05, "Pretrain/Loss": 2.0921759605407715, "Pretrain/Loss (Raw)": 2.2802278995513916, "Pretrain/Step": 2871, "Pretrain/Step Time": 8.40602246671915} +{"Pretrain/Learning Rate": 4.81174452242597e-05, "Pretrain/Loss": 2.0927324295043945, "Pretrain/Loss (Raw)": 2.121727466583252, "Pretrain/Step": 2872, "Pretrain/Step Time": 8.408599196001887} +{"Pretrain/Learning Rate": 4.811582874807253e-05, "Pretrain/Loss": 2.0937085151672363, "Pretrain/Loss (Raw)": 2.128960371017456, "Pretrain/Step": 2873, "Pretrain/Step Time": 8.401851788163185} +{"Pretrain/Learning Rate": 4.8114211605356725e-05, "Pretrain/Loss": 2.0946526527404785, "Pretrain/Loss (Raw)": 2.115837335586548, "Pretrain/Step": 2874, "Pretrain/Step Time": 8.397465804591775} +{"Pretrain/Learning Rate": 4.811259379615892e-05, "Pretrain/Loss": 2.0954554080963135, "Pretrain/Loss (Raw)": 2.133741617202759, "Pretrain/Step": 2875, "Pretrain/Step Time": 8.39742648229003} +{"Pretrain/Learning Rate": 4.8110975320525764e-05, "Pretrain/Loss": 2.095257043838501, "Pretrain/Loss (Raw)": 2.130397081375122, "Pretrain/Step": 2876, "Pretrain/Step Time": 8.396520910784602} +{"Pretrain/Learning Rate": 4.810935617850394e-05, "Pretrain/Loss": 2.0944082736968994, "Pretrain/Loss (Raw)": 2.1966567039489746, "Pretrain/Step": 2877, "Pretrain/Step Time": 8.395276250317693} +{"Pretrain/Learning Rate": 4.810773637014011e-05, "Pretrain/Loss": 2.093012809753418, "Pretrain/Loss (Raw)": 2.134068250656128, "Pretrain/Step": 2878, "Pretrain/Step Time": 8.393596265465021} +{"Pretrain/Learning Rate": 4.8106115895480993e-05, "Pretrain/Loss": 2.093071937561035, "Pretrain/Loss (Raw)": 2.1410634517669678, "Pretrain/Step": 2879, "Pretrain/Step Time": 8.399610102176666} +{"Pretrain/Learning Rate": 4.8104494754573314e-05, "Pretrain/Loss": 2.0927228927612305, "Pretrain/Loss (Raw)": 1.9984838962554932, "Pretrain/Step": 2880, "Pretrain/Step Time": 8.396534621715546} +{"Pretrain/Learning Rate": 4.8102872947463814e-05, "Pretrain/Loss": 2.0924737453460693, "Pretrain/Loss (Raw)": 2.086862325668335, "Pretrain/Step": 2881, "Pretrain/Step Time": 8.396176112815738} +{"Pretrain/Learning Rate": 4.810125047419926e-05, "Pretrain/Loss": 2.0906667709350586, "Pretrain/Loss (Raw)": 1.8881169557571411, "Pretrain/Step": 2882, "Pretrain/Step Time": 8.396886818110943} +{"Pretrain/Learning Rate": 4.8099627334826435e-05, "Pretrain/Loss": 2.090599536895752, "Pretrain/Loss (Raw)": 2.1023266315460205, "Pretrain/Step": 2883, "Pretrain/Step Time": 8.404577404260635} +{"Pretrain/Learning Rate": 4.8098003529392144e-05, "Pretrain/Loss": 2.091668128967285, "Pretrain/Loss (Raw)": 2.0943593978881836, "Pretrain/Step": 2884, "Pretrain/Step Time": 8.404113613069057} +{"Pretrain/Learning Rate": 4.80963790579432e-05, "Pretrain/Loss": 2.0903990268707275, "Pretrain/Loss (Raw)": 1.9688920974731445, "Pretrain/Step": 2885, "Pretrain/Step Time": 8.4028140027076} +{"Pretrain/Learning Rate": 4.809475392052645e-05, "Pretrain/Loss": 2.0895965099334717, "Pretrain/Loss (Raw)": 1.9821176528930664, "Pretrain/Step": 2886, "Pretrain/Step Time": 8.402264021337032} +{"Pretrain/Learning Rate": 4.809312811718875e-05, "Pretrain/Loss": 2.0891823768615723, "Pretrain/Loss (Raw)": 2.20302677154541, "Pretrain/Step": 2887, "Pretrain/Step Time": 8.40276644937694} +{"Pretrain/Learning Rate": 4.809150164797698e-05, "Pretrain/Loss": 2.0891947746276855, "Pretrain/Loss (Raw)": 2.116677761077881, "Pretrain/Step": 2888, "Pretrain/Step Time": 8.40469764918089} +{"Pretrain/Learning Rate": 4.808987451293804e-05, "Pretrain/Loss": 2.0917863845825195, "Pretrain/Loss (Raw)": 2.2935030460357666, "Pretrain/Step": 2889, "Pretrain/Step Time": 8.404506612569094} +{"Pretrain/Learning Rate": 4.808824671211884e-05, "Pretrain/Loss": 2.0919010639190674, "Pretrain/Loss (Raw)": 2.012753486633301, "Pretrain/Step": 2890, "Pretrain/Step Time": 8.401769353076816} +{"Pretrain/Learning Rate": 4.808661824556633e-05, "Pretrain/Loss": 2.0912513732910156, "Pretrain/Loss (Raw)": 2.031094551086426, "Pretrain/Step": 2891, "Pretrain/Step Time": 8.398822529241443} +{"Pretrain/Learning Rate": 4.808498911332745e-05, "Pretrain/Loss": 2.091465711593628, "Pretrain/Loss (Raw)": 1.9384870529174805, "Pretrain/Step": 2892, "Pretrain/Step Time": 8.397808399051428} +{"Pretrain/Learning Rate": 4.808335931544919e-05, "Pretrain/Loss": 2.0880208015441895, "Pretrain/Loss (Raw)": 2.030701160430908, "Pretrain/Step": 2893, "Pretrain/Step Time": 8.396390959620476} +{"Pretrain/Learning Rate": 4.808172885197853e-05, "Pretrain/Loss": 2.087130546569824, "Pretrain/Loss (Raw)": 1.988195538520813, "Pretrain/Step": 2894, "Pretrain/Step Time": 8.394770946353674} +{"Pretrain/Learning Rate": 4.8080097722962494e-05, "Pretrain/Loss": 2.088853597640991, "Pretrain/Loss (Raw)": 2.1310744285583496, "Pretrain/Step": 2895, "Pretrain/Step Time": 8.393158573657274} +{"Pretrain/Learning Rate": 4.8078465928448116e-05, "Pretrain/Loss": 2.084907293319702, "Pretrain/Loss (Raw)": 1.9884247779846191, "Pretrain/Step": 2896, "Pretrain/Step Time": 8.397666152566671} +{"Pretrain/Learning Rate": 4.807683346848243e-05, "Pretrain/Loss": 2.085446834564209, "Pretrain/Loss (Raw)": 2.1120572090148926, "Pretrain/Step": 2897, "Pretrain/Step Time": 8.397959291934967} +{"Pretrain/Learning Rate": 4.8075200343112525e-05, "Pretrain/Loss": 2.078838348388672, "Pretrain/Loss (Raw)": 1.477507472038269, "Pretrain/Step": 2898, "Pretrain/Step Time": 8.397937471047044} +{"Pretrain/Learning Rate": 4.807356655238548e-05, "Pretrain/Loss": 2.0770130157470703, "Pretrain/Loss (Raw)": 1.8779548406600952, "Pretrain/Step": 2899, "Pretrain/Step Time": 8.399872113019228} +{"Pretrain/Learning Rate": 4.807193209634842e-05, "Pretrain/Loss": 2.074662208557129, "Pretrain/Loss (Raw)": 2.157400608062744, "Pretrain/Step": 2900, "Pretrain/Step Time": 8.399964399635792} +{"Pretrain/Learning Rate": 4.8070296975048454e-05, "Pretrain/Loss": 2.0745513439178467, "Pretrain/Loss (Raw)": 1.9908950328826904, "Pretrain/Step": 2901, "Pretrain/Step Time": 8.396346367895603} +{"Pretrain/Learning Rate": 4.806866118853275e-05, "Pretrain/Loss": 2.0757017135620117, "Pretrain/Loss (Raw)": 2.151623010635376, "Pretrain/Step": 2902, "Pretrain/Step Time": 8.400517197325826} +{"Pretrain/Learning Rate": 4.806702473684845e-05, "Pretrain/Loss": 2.0763535499572754, "Pretrain/Loss (Raw)": 2.062574625015259, "Pretrain/Step": 2903, "Pretrain/Step Time": 8.401465566828847} +{"Pretrain/Learning Rate": 4.8065387620042754e-05, "Pretrain/Loss": 2.0756373405456543, "Pretrain/Loss (Raw)": 2.050166130065918, "Pretrain/Step": 2904, "Pretrain/Step Time": 8.407520554959774} +{"Pretrain/Learning Rate": 4.806374983816287e-05, "Pretrain/Loss": 2.0742900371551514, "Pretrain/Loss (Raw)": 1.9661891460418701, "Pretrain/Step": 2905, "Pretrain/Step Time": 8.405304282903671} +{"Pretrain/Learning Rate": 4.806211139125602e-05, "Pretrain/Loss": 2.074842929840088, "Pretrain/Loss (Raw)": 2.177664279937744, "Pretrain/Step": 2906, "Pretrain/Step Time": 8.404027316719294} +{"Pretrain/Learning Rate": 4.8060472279369445e-05, "Pretrain/Loss": 2.0757546424865723, "Pretrain/Loss (Raw)": 2.145275831222534, "Pretrain/Step": 2907, "Pretrain/Step Time": 8.403346288949251} +{"Pretrain/Learning Rate": 4.805883250255041e-05, "Pretrain/Loss": 2.0758867263793945, "Pretrain/Loss (Raw)": 2.0432703495025635, "Pretrain/Step": 2908, "Pretrain/Step Time": 8.403096605092287} +{"Pretrain/Learning Rate": 4.805719206084619e-05, "Pretrain/Loss": 2.0733189582824707, "Pretrain/Loss (Raw)": 1.8405622243881226, "Pretrain/Step": 2909, "Pretrain/Step Time": 8.405694490298629} +{"Pretrain/Learning Rate": 4.80555509543041e-05, "Pretrain/Loss": 2.0721778869628906, "Pretrain/Loss (Raw)": 1.9223287105560303, "Pretrain/Step": 2910, "Pretrain/Step Time": 8.401796787977219} +{"Pretrain/Learning Rate": 4.805390918297144e-05, "Pretrain/Loss": 2.072094440460205, "Pretrain/Loss (Raw)": 2.0406525135040283, "Pretrain/Step": 2911, "Pretrain/Step Time": 8.406369365751743} +{"Pretrain/Learning Rate": 4.805226674689556e-05, "Pretrain/Loss": 2.0714197158813477, "Pretrain/Loss (Raw)": 1.9331614971160889, "Pretrain/Step": 2912, "Pretrain/Step Time": 8.404943574219942} +{"Pretrain/Learning Rate": 4.805062364612383e-05, "Pretrain/Loss": 2.0706090927124023, "Pretrain/Loss (Raw)": 2.140446424484253, "Pretrain/Step": 2913, "Pretrain/Step Time": 8.40892825089395} +{"Pretrain/Learning Rate": 4.804897988070361e-05, "Pretrain/Loss": 2.0678281784057617, "Pretrain/Loss (Raw)": 2.064424991607666, "Pretrain/Step": 2914, "Pretrain/Step Time": 8.403608871623874} +{"Pretrain/Learning Rate": 4.804733545068231e-05, "Pretrain/Loss": 2.063157558441162, "Pretrain/Loss (Raw)": 1.7051717042922974, "Pretrain/Step": 2915, "Pretrain/Step Time": 8.403918540105224} +{"Pretrain/Learning Rate": 4.8045690356107334e-05, "Pretrain/Loss": 2.0625624656677246, "Pretrain/Loss (Raw)": 2.134819984436035, "Pretrain/Step": 2916, "Pretrain/Step Time": 8.41018738783896} +{"Pretrain/Learning Rate": 4.8044044597026114e-05, "Pretrain/Loss": 2.062156915664673, "Pretrain/Loss (Raw)": 2.045562982559204, "Pretrain/Step": 2917, "Pretrain/Step Time": 8.405736463144422} +{"Pretrain/Learning Rate": 4.8042398173486124e-05, "Pretrain/Loss": 2.061774730682373, "Pretrain/Loss (Raw)": 2.131226062774658, "Pretrain/Step": 2918, "Pretrain/Step Time": 8.412628894671798} +{"Pretrain/Learning Rate": 4.804075108553483e-05, "Pretrain/Loss": 2.059420585632324, "Pretrain/Loss (Raw)": 1.9003831148147583, "Pretrain/Step": 2919, "Pretrain/Step Time": 8.414614195004106} +{"Pretrain/Learning Rate": 4.803910333321971e-05, "Pretrain/Loss": 2.0595932006835938, "Pretrain/Loss (Raw)": 2.091546058654785, "Pretrain/Step": 2920, "Pretrain/Step Time": 8.414214285090566} +{"Pretrain/Learning Rate": 4.80374549165883e-05, "Pretrain/Loss": 2.055703639984131, "Pretrain/Loss (Raw)": 1.711315631866455, "Pretrain/Step": 2921, "Pretrain/Step Time": 8.41791714541614} +{"Pretrain/Learning Rate": 4.8035805835688105e-05, "Pretrain/Loss": 2.0556042194366455, "Pretrain/Loss (Raw)": 2.2297985553741455, "Pretrain/Step": 2922, "Pretrain/Step Time": 8.417550655081868} +{"Pretrain/Learning Rate": 4.8034156090566695e-05, "Pretrain/Loss": 2.0556185245513916, "Pretrain/Loss (Raw)": 1.8120733499526978, "Pretrain/Step": 2923, "Pretrain/Step Time": 8.416359340772033} +{"Pretrain/Learning Rate": 4.8032505681271634e-05, "Pretrain/Loss": 2.057522773742676, "Pretrain/Loss (Raw)": 2.171924591064453, "Pretrain/Step": 2924, "Pretrain/Step Time": 8.416446600109339} +{"Pretrain/Learning Rate": 4.80308546078505e-05, "Pretrain/Loss": 2.0565409660339355, "Pretrain/Loss (Raw)": 2.1176788806915283, "Pretrain/Step": 2925, "Pretrain/Step Time": 8.419800600036979} +{"Pretrain/Learning Rate": 4.802920287035092e-05, "Pretrain/Loss": 2.055680513381958, "Pretrain/Loss (Raw)": 1.9268494844436646, "Pretrain/Step": 2926, "Pretrain/Step Time": 8.415921533480287} +{"Pretrain/Learning Rate": 4.80275504688205e-05, "Pretrain/Loss": 2.0531420707702637, "Pretrain/Loss (Raw)": 1.9000169038772583, "Pretrain/Step": 2927, "Pretrain/Step Time": 8.420259514823556} +{"Pretrain/Learning Rate": 4.802589740330689e-05, "Pretrain/Loss": 2.0491342544555664, "Pretrain/Loss (Raw)": 1.9677283763885498, "Pretrain/Step": 2928, "Pretrain/Step Time": 8.420300526544452} +{"Pretrain/Learning Rate": 4.8024243673857784e-05, "Pretrain/Loss": 2.0500216484069824, "Pretrain/Loss (Raw)": 2.345461130142212, "Pretrain/Step": 2929, "Pretrain/Step Time": 8.414973106235266} +{"Pretrain/Learning Rate": 4.8022589280520825e-05, "Pretrain/Loss": 2.051520347595215, "Pretrain/Loss (Raw)": 2.047118902206421, "Pretrain/Step": 2930, "Pretrain/Step Time": 8.419457944110036} +{"Pretrain/Learning Rate": 4.8020934223343736e-05, "Pretrain/Loss": 2.0519518852233887, "Pretrain/Loss (Raw)": 2.222698926925659, "Pretrain/Step": 2931, "Pretrain/Step Time": 8.41911007463932} +{"Pretrain/Learning Rate": 4.801927850237424e-05, "Pretrain/Loss": 2.0513100624084473, "Pretrain/Loss (Raw)": 2.1546361446380615, "Pretrain/Step": 2932, "Pretrain/Step Time": 8.42400573566556} +{"Pretrain/Learning Rate": 4.801762211766008e-05, "Pretrain/Loss": 2.051067590713501, "Pretrain/Loss (Raw)": 1.9702439308166504, "Pretrain/Step": 2933, "Pretrain/Step Time": 8.422221688553691} +{"Pretrain/Learning Rate": 4.8015965069249e-05, "Pretrain/Loss": 2.053853988647461, "Pretrain/Loss (Raw)": 2.55352520942688, "Pretrain/Step": 2934, "Pretrain/Step Time": 8.424348758533597} +{"Pretrain/Learning Rate": 4.8014307357188804e-05, "Pretrain/Loss": 2.054788589477539, "Pretrain/Loss (Raw)": 2.066049337387085, "Pretrain/Step": 2935, "Pretrain/Step Time": 8.425889614969492} +{"Pretrain/Learning Rate": 4.801264898152728e-05, "Pretrain/Loss": 2.05513334274292, "Pretrain/Loss (Raw)": 2.152333974838257, "Pretrain/Step": 2936, "Pretrain/Step Time": 8.425918009132147} +{"Pretrain/Learning Rate": 4.8010989942312236e-05, "Pretrain/Loss": 2.054335355758667, "Pretrain/Loss (Raw)": 2.1387181282043457, "Pretrain/Step": 2937, "Pretrain/Step Time": 8.425452722236514} +{"Pretrain/Learning Rate": 4.800933023959152e-05, "Pretrain/Loss": 2.0529303550720215, "Pretrain/Loss (Raw)": 1.9604285955429077, "Pretrain/Step": 2938, "Pretrain/Step Time": 8.426675220951438} +{"Pretrain/Learning Rate": 4.8007669873412995e-05, "Pretrain/Loss": 2.0521175861358643, "Pretrain/Loss (Raw)": 1.9350666999816895, "Pretrain/Step": 2939, "Pretrain/Step Time": 8.428330209106207} +{"Pretrain/Learning Rate": 4.8006008843824525e-05, "Pretrain/Loss": 2.0517985820770264, "Pretrain/Loss (Raw)": 2.007767915725708, "Pretrain/Step": 2940, "Pretrain/Step Time": 8.424887491390109} +{"Pretrain/Learning Rate": 4.800434715087401e-05, "Pretrain/Loss": 2.051578998565674, "Pretrain/Loss (Raw)": 1.926854133605957, "Pretrain/Step": 2941, "Pretrain/Step Time": 8.420195506885648} +{"Pretrain/Learning Rate": 4.8002684794609356e-05, "Pretrain/Loss": 2.052549362182617, "Pretrain/Loss (Raw)": 2.028900146484375, "Pretrain/Step": 2942, "Pretrain/Step Time": 8.41959180124104} +{"Pretrain/Learning Rate": 4.80010217750785e-05, "Pretrain/Loss": 2.0522208213806152, "Pretrain/Loss (Raw)": 2.0314903259277344, "Pretrain/Step": 2943, "Pretrain/Step Time": 8.423649882897735} +{"Pretrain/Learning Rate": 4.79993580923294e-05, "Pretrain/Loss": 2.051567554473877, "Pretrain/Loss (Raw)": 2.1325957775115967, "Pretrain/Step": 2944, "Pretrain/Step Time": 8.42808454297483} +{"Pretrain/Learning Rate": 4.7997693746410024e-05, "Pretrain/Loss": 2.0492911338806152, "Pretrain/Loss (Raw)": 1.9303243160247803, "Pretrain/Step": 2945, "Pretrain/Step Time": 8.426502346992493} +{"Pretrain/Learning Rate": 4.7996028737368367e-05, "Pretrain/Loss": 2.048092842102051, "Pretrain/Loss (Raw)": 2.1193437576293945, "Pretrain/Step": 2946, "Pretrain/Step Time": 8.418381011113524} +{"Pretrain/Learning Rate": 4.7994363065252424e-05, "Pretrain/Loss": 2.0481133460998535, "Pretrain/Loss (Raw)": 2.133227825164795, "Pretrain/Step": 2947, "Pretrain/Step Time": 8.42402721568942} +{"Pretrain/Learning Rate": 4.7992696730110235e-05, "Pretrain/Loss": 2.0491621494293213, "Pretrain/Loss (Raw)": 2.2371349334716797, "Pretrain/Step": 2948, "Pretrain/Step Time": 8.424762105569243} +{"Pretrain/Learning Rate": 4.799102973198985e-05, "Pretrain/Loss": 2.048510789871216, "Pretrain/Loss (Raw)": 1.8539776802062988, "Pretrain/Step": 2949, "Pretrain/Step Time": 8.427263213321567} +{"Pretrain/Learning Rate": 4.7989362070939315e-05, "Pretrain/Loss": 2.0492076873779297, "Pretrain/Loss (Raw)": 2.0291860103607178, "Pretrain/Step": 2950, "Pretrain/Step Time": 8.42520777322352} +{"Pretrain/Learning Rate": 4.798769374700675e-05, "Pretrain/Loss": 2.047236442565918, "Pretrain/Loss (Raw)": 1.921370029449463, "Pretrain/Step": 2951, "Pretrain/Step Time": 8.42596629820764} +{"Pretrain/Learning Rate": 4.798602476024022e-05, "Pretrain/Loss": 2.049800395965576, "Pretrain/Loss (Raw)": 2.1625070571899414, "Pretrain/Step": 2952, "Pretrain/Step Time": 8.433694513514638} +{"Pretrain/Learning Rate": 4.7984355110687885e-05, "Pretrain/Loss": 2.051647424697876, "Pretrain/Loss (Raw)": 2.161991596221924, "Pretrain/Step": 2953, "Pretrain/Step Time": 8.433648154139519} +{"Pretrain/Learning Rate": 4.798268479839787e-05, "Pretrain/Loss": 2.0500543117523193, "Pretrain/Loss (Raw)": 1.9891012907028198, "Pretrain/Step": 2954, "Pretrain/Step Time": 8.431369710713625} +{"Pretrain/Learning Rate": 4.798101382341834e-05, "Pretrain/Loss": 2.050947666168213, "Pretrain/Loss (Raw)": 2.0372321605682373, "Pretrain/Step": 2955, "Pretrain/Step Time": 8.430372092872858} +{"Pretrain/Learning Rate": 4.7979342185797475e-05, "Pretrain/Loss": 2.0492959022521973, "Pretrain/Loss (Raw)": 2.0693085193634033, "Pretrain/Step": 2956, "Pretrain/Step Time": 8.431198416277766} +{"Pretrain/Learning Rate": 4.797766988558348e-05, "Pretrain/Loss": 2.052631378173828, "Pretrain/Loss (Raw)": 2.5657060146331787, "Pretrain/Step": 2957, "Pretrain/Step Time": 8.432595815509558} +{"Pretrain/Learning Rate": 4.797599692282457e-05, "Pretrain/Loss": 2.0550999641418457, "Pretrain/Loss (Raw)": 2.3089702129364014, "Pretrain/Step": 2958, "Pretrain/Step Time": 8.426194226369262} +{"Pretrain/Learning Rate": 4.797432329756899e-05, "Pretrain/Loss": 2.05885648727417, "Pretrain/Loss (Raw)": 2.207097053527832, "Pretrain/Step": 2959, "Pretrain/Step Time": 8.427712090313435} +{"Pretrain/Learning Rate": 4.797264900986499e-05, "Pretrain/Loss": 2.0592260360717773, "Pretrain/Loss (Raw)": 2.001847743988037, "Pretrain/Step": 2960, "Pretrain/Step Time": 8.428595006465912} +{"Pretrain/Learning Rate": 4.797097405976085e-05, "Pretrain/Loss": 2.0590662956237793, "Pretrain/Loss (Raw)": 2.1334874629974365, "Pretrain/Step": 2961, "Pretrain/Step Time": 8.427101353183389} +{"Pretrain/Learning Rate": 4.7969298447304875e-05, "Pretrain/Loss": 2.05977463722229, "Pretrain/Loss (Raw)": 2.0253424644470215, "Pretrain/Step": 2962, "Pretrain/Step Time": 8.425366252660751} +{"Pretrain/Learning Rate": 4.796762217254536e-05, "Pretrain/Loss": 2.0587663650512695, "Pretrain/Loss (Raw)": 2.0180764198303223, "Pretrain/Step": 2963, "Pretrain/Step Time": 8.428582595661283} +{"Pretrain/Learning Rate": 4.7965945235530654e-05, "Pretrain/Loss": 2.0577709674835205, "Pretrain/Loss (Raw)": 2.095644474029541, "Pretrain/Step": 2964, "Pretrain/Step Time": 8.431305151432753} +{"Pretrain/Learning Rate": 4.7964267636309114e-05, "Pretrain/Loss": 2.0590505599975586, "Pretrain/Loss (Raw)": 2.3066325187683105, "Pretrain/Step": 2965, "Pretrain/Step Time": 8.435151435434818} +{"Pretrain/Learning Rate": 4.7962589374929095e-05, "Pretrain/Loss": 2.059779644012451, "Pretrain/Loss (Raw)": 2.337536573410034, "Pretrain/Step": 2966, "Pretrain/Step Time": 8.434011816978455} +{"Pretrain/Learning Rate": 4.796091045143901e-05, "Pretrain/Loss": 2.0594303607940674, "Pretrain/Loss (Raw)": 2.110619306564331, "Pretrain/Step": 2967, "Pretrain/Step Time": 8.438052399083972} +{"Pretrain/Learning Rate": 4.795923086588725e-05, "Pretrain/Loss": 2.0627965927124023, "Pretrain/Loss (Raw)": 2.1944029331207275, "Pretrain/Step": 2968, "Pretrain/Step Time": 8.43975330144167} +{"Pretrain/Learning Rate": 4.7957550618322254e-05, "Pretrain/Loss": 2.0623867511749268, "Pretrain/Loss (Raw)": 2.0226449966430664, "Pretrain/Step": 2969, "Pretrain/Step Time": 8.438834259286523} +{"Pretrain/Learning Rate": 4.795586970879247e-05, "Pretrain/Loss": 2.0596797466278076, "Pretrain/Loss (Raw)": 1.6846587657928467, "Pretrain/Step": 2970, "Pretrain/Step Time": 8.434467375278473} +{"Pretrain/Learning Rate": 4.795418813734637e-05, "Pretrain/Loss": 2.0612497329711914, "Pretrain/Loss (Raw)": 2.1635162830352783, "Pretrain/Step": 2971, "Pretrain/Step Time": 8.43077034689486} +{"Pretrain/Learning Rate": 4.795250590403243e-05, "Pretrain/Loss": 2.0593035221099854, "Pretrain/Loss (Raw)": 1.8612356185913086, "Pretrain/Step": 2972, "Pretrain/Step Time": 8.430458758026361} +{"Pretrain/Learning Rate": 4.795082300889917e-05, "Pretrain/Loss": 2.0598106384277344, "Pretrain/Loss (Raw)": 2.089359760284424, "Pretrain/Step": 2973, "Pretrain/Step Time": 8.428451435640454} +{"Pretrain/Learning Rate": 4.79491394519951e-05, "Pretrain/Loss": 2.058091163635254, "Pretrain/Loss (Raw)": 1.7735697031021118, "Pretrain/Step": 2974, "Pretrain/Step Time": 8.432106940075755} +{"Pretrain/Learning Rate": 4.7947455233368776e-05, "Pretrain/Loss": 2.058925151824951, "Pretrain/Loss (Raw)": 2.1938352584838867, "Pretrain/Step": 2975, "Pretrain/Step Time": 8.433633666485548} +{"Pretrain/Learning Rate": 4.794577035306876e-05, "Pretrain/Loss": 2.0576980113983154, "Pretrain/Loss (Raw)": 2.1108767986297607, "Pretrain/Step": 2976, "Pretrain/Step Time": 8.433212168514729} +{"Pretrain/Learning Rate": 4.794408481114363e-05, "Pretrain/Loss": 2.059023380279541, "Pretrain/Loss (Raw)": 2.1727075576782227, "Pretrain/Step": 2977, "Pretrain/Step Time": 8.431072784587741} +{"Pretrain/Learning Rate": 4.7942398607641987e-05, "Pretrain/Loss": 2.0578811168670654, "Pretrain/Loss (Raw)": 1.8554812669754028, "Pretrain/Step": 2978, "Pretrain/Step Time": 8.433778302744031} +{"Pretrain/Learning Rate": 4.794071174261246e-05, "Pretrain/Loss": 2.0599589347839355, "Pretrain/Loss (Raw)": 2.1602373123168945, "Pretrain/Step": 2979, "Pretrain/Step Time": 8.431530429050326} +{"Pretrain/Learning Rate": 4.793902421610367e-05, "Pretrain/Loss": 2.0635664463043213, "Pretrain/Loss (Raw)": 2.5662379264831543, "Pretrain/Step": 2980, "Pretrain/Step Time": 8.432342115789652} +{"Pretrain/Learning Rate": 4.793733602816429e-05, "Pretrain/Loss": 2.0620718002319336, "Pretrain/Loss (Raw)": 1.8616297245025635, "Pretrain/Step": 2981, "Pretrain/Step Time": 8.437189707532525} +{"Pretrain/Learning Rate": 4.7935647178843e-05, "Pretrain/Loss": 2.0625998973846436, "Pretrain/Loss (Raw)": 2.1263327598571777, "Pretrain/Step": 2982, "Pretrain/Step Time": 8.440319137647748} +{"Pretrain/Learning Rate": 4.7933957668188494e-05, "Pretrain/Loss": 2.0630626678466797, "Pretrain/Loss (Raw)": 2.0369133949279785, "Pretrain/Step": 2983, "Pretrain/Step Time": 8.439502881839871} +{"Pretrain/Learning Rate": 4.793226749624948e-05, "Pretrain/Loss": 2.0632357597351074, "Pretrain/Loss (Raw)": 2.2348668575286865, "Pretrain/Step": 2984, "Pretrain/Step Time": 8.438056351616979} +{"Pretrain/Learning Rate": 4.793057666307471e-05, "Pretrain/Loss": 2.0639519691467285, "Pretrain/Loss (Raw)": 2.0214738845825195, "Pretrain/Step": 2985, "Pretrain/Step Time": 8.440789042040706} +{"Pretrain/Learning Rate": 4.792888516871292e-05, "Pretrain/Loss": 2.062443494796753, "Pretrain/Loss (Raw)": 1.967676043510437, "Pretrain/Step": 2986, "Pretrain/Step Time": 8.444479763507843} +{"Pretrain/Learning Rate": 4.792719301321289e-05, "Pretrain/Loss": 2.060685157775879, "Pretrain/Loss (Raw)": 1.9688091278076172, "Pretrain/Step": 2987, "Pretrain/Step Time": 8.444470033049583} +{"Pretrain/Learning Rate": 4.7925500196623405e-05, "Pretrain/Loss": 2.0585319995880127, "Pretrain/Loss (Raw)": 1.765438199043274, "Pretrain/Step": 2988, "Pretrain/Step Time": 8.44519317522645} +{"Pretrain/Learning Rate": 4.792380671899329e-05, "Pretrain/Loss": 2.0563888549804688, "Pretrain/Loss (Raw)": 2.024947166442871, "Pretrain/Step": 2989, "Pretrain/Step Time": 8.446532832458615} +{"Pretrain/Learning Rate": 4.792211258037137e-05, "Pretrain/Loss": 2.0575718879699707, "Pretrain/Loss (Raw)": 2.1120622158050537, "Pretrain/Step": 2990, "Pretrain/Step Time": 8.448083126917481} +{"Pretrain/Learning Rate": 4.792041778080649e-05, "Pretrain/Loss": 2.0580198764801025, "Pretrain/Loss (Raw)": 2.012881278991699, "Pretrain/Step": 2991, "Pretrain/Step Time": 8.446420148015022} +{"Pretrain/Learning Rate": 4.791872232034753e-05, "Pretrain/Loss": 2.0573410987854004, "Pretrain/Loss (Raw)": 1.9975506067276, "Pretrain/Step": 2992, "Pretrain/Step Time": 8.449166465550661} +{"Pretrain/Learning Rate": 4.791702619904336e-05, "Pretrain/Loss": 2.055593729019165, "Pretrain/Loss (Raw)": 1.94354248046875, "Pretrain/Step": 2993, "Pretrain/Step Time": 8.443728549405932} +{"Pretrain/Learning Rate": 4.7915329416942886e-05, "Pretrain/Loss": 2.055219888687134, "Pretrain/Loss (Raw)": 1.8704620599746704, "Pretrain/Step": 2994, "Pretrain/Step Time": 8.44746951945126} +{"Pretrain/Learning Rate": 4.791363197409506e-05, "Pretrain/Loss": 2.0547823905944824, "Pretrain/Loss (Raw)": 1.9526033401489258, "Pretrain/Step": 2995, "Pretrain/Step Time": 8.443959385156631} +{"Pretrain/Learning Rate": 4.79119338705488e-05, "Pretrain/Loss": 2.0566816329956055, "Pretrain/Loss (Raw)": 2.12288498878479, "Pretrain/Step": 2996, "Pretrain/Step Time": 8.439727738499641} +{"Pretrain/Learning Rate": 4.791023510635308e-05, "Pretrain/Loss": 2.057344436645508, "Pretrain/Loss (Raw)": 1.9821746349334717, "Pretrain/Step": 2997, "Pretrain/Step Time": 8.446391087025404} +{"Pretrain/Learning Rate": 4.790853568155688e-05, "Pretrain/Loss": 2.0576534271240234, "Pretrain/Loss (Raw)": 1.8610481023788452, "Pretrain/Step": 2998, "Pretrain/Step Time": 8.448434330523014} +{"Pretrain/Learning Rate": 4.790683559620921e-05, "Pretrain/Loss": 2.0561485290527344, "Pretrain/Loss (Raw)": 2.0875868797302246, "Pretrain/Step": 2999, "Pretrain/Step Time": 8.448806904256344} +{"Pretrain/Learning Rate": 4.790513485035907e-05, "Pretrain/Loss": 2.0556468963623047, "Pretrain/Loss (Raw)": 2.0575339794158936, "Pretrain/Step": 3000, "Pretrain/Step Time": 8.449947806075215} +{"Pretrain/Learning Rate": 4.790343344405552e-05, "Pretrain/Loss": 2.053832530975342, "Pretrain/Loss (Raw)": 1.8967186212539673, "Pretrain/Step": 3001, "Pretrain/Step Time": 8.453829186037183} +{"Pretrain/Learning Rate": 4.790173137734762e-05, "Pretrain/Loss": 2.05267333984375, "Pretrain/Loss (Raw)": 1.967487096786499, "Pretrain/Step": 3002, "Pretrain/Step Time": 8.454519225284457} +{"Pretrain/Learning Rate": 4.7900028650284435e-05, "Pretrain/Loss": 2.050126552581787, "Pretrain/Loss (Raw)": 1.8077107667922974, "Pretrain/Step": 3003, "Pretrain/Step Time": 8.456998916342854} +{"Pretrain/Learning Rate": 4.7898325262915066e-05, "Pretrain/Loss": 2.0507397651672363, "Pretrain/Loss (Raw)": 2.208918809890747, "Pretrain/Step": 3004, "Pretrain/Step Time": 8.457342401146889} +{"Pretrain/Learning Rate": 4.789662121528863e-05, "Pretrain/Loss": 2.0502419471740723, "Pretrain/Loss (Raw)": 2.1329410076141357, "Pretrain/Step": 3005, "Pretrain/Step Time": 8.457230098545551} +{"Pretrain/Learning Rate": 4.7894916507454266e-05, "Pretrain/Loss": 2.050504207611084, "Pretrain/Loss (Raw)": 2.1676406860351562, "Pretrain/Step": 3006, "Pretrain/Step Time": 8.45989365130663} +{"Pretrain/Learning Rate": 4.789321113946112e-05, "Pretrain/Loss": 2.0489726066589355, "Pretrain/Loss (Raw)": 1.9449737071990967, "Pretrain/Step": 3007, "Pretrain/Step Time": 8.450333992019296} +{"Pretrain/Learning Rate": 4.789150511135838e-05, "Pretrain/Loss": 2.047668218612671, "Pretrain/Loss (Raw)": 1.831551432609558, "Pretrain/Step": 3008, "Pretrain/Step Time": 8.4549909401685} +{"Pretrain/Learning Rate": 4.7889798423195216e-05, "Pretrain/Loss": 2.046847343444824, "Pretrain/Loss (Raw)": 1.9817683696746826, "Pretrain/Step": 3009, "Pretrain/Step Time": 8.456790052354336} +{"Pretrain/Learning Rate": 4.788809107502085e-05, "Pretrain/Loss": 2.0476930141448975, "Pretrain/Loss (Raw)": 1.9963982105255127, "Pretrain/Step": 3010, "Pretrain/Step Time": 8.452872386202216} +{"Pretrain/Learning Rate": 4.788638306688452e-05, "Pretrain/Loss": 2.046304702758789, "Pretrain/Loss (Raw)": 1.9246011972427368, "Pretrain/Step": 3011, "Pretrain/Step Time": 8.447577638551593} +{"Pretrain/Learning Rate": 4.788467439883546e-05, "Pretrain/Loss": 2.0459556579589844, "Pretrain/Loss (Raw)": 2.049715042114258, "Pretrain/Step": 3012, "Pretrain/Step Time": 8.446386637166142} +{"Pretrain/Learning Rate": 4.7882965070922956e-05, "Pretrain/Loss": 2.0482428073883057, "Pretrain/Loss (Raw)": 2.2616066932678223, "Pretrain/Step": 3013, "Pretrain/Step Time": 8.45177011564374} +{"Pretrain/Learning Rate": 4.788125508319628e-05, "Pretrain/Loss": 2.0478007793426514, "Pretrain/Loss (Raw)": 1.9255588054656982, "Pretrain/Step": 3014, "Pretrain/Step Time": 8.45146412216127} +{"Pretrain/Learning Rate": 4.787954443570475e-05, "Pretrain/Loss": 2.045596122741699, "Pretrain/Loss (Raw)": 1.920827031135559, "Pretrain/Step": 3015, "Pretrain/Step Time": 8.454514365643263} +{"Pretrain/Learning Rate": 4.787783312849767e-05, "Pretrain/Loss": 2.046213150024414, "Pretrain/Loss (Raw)": 2.1956419944763184, "Pretrain/Step": 3016, "Pretrain/Step Time": 8.45265875943005} +{"Pretrain/Learning Rate": 4.7876121161624415e-05, "Pretrain/Loss": 2.0451443195343018, "Pretrain/Loss (Raw)": 2.1566951274871826, "Pretrain/Step": 3017, "Pretrain/Step Time": 8.452883645892143} +{"Pretrain/Learning Rate": 4.787440853513433e-05, "Pretrain/Loss": 2.0452349185943604, "Pretrain/Loss (Raw)": 2.0243608951568604, "Pretrain/Step": 3018, "Pretrain/Step Time": 8.454596810042858} +{"Pretrain/Learning Rate": 4.7872695249076794e-05, "Pretrain/Loss": 2.0465188026428223, "Pretrain/Loss (Raw)": 2.1954267024993896, "Pretrain/Step": 3019, "Pretrain/Step Time": 8.453120386227965} +{"Pretrain/Learning Rate": 4.787098130350122e-05, "Pretrain/Loss": 2.0472917556762695, "Pretrain/Loss (Raw)": 2.037412166595459, "Pretrain/Step": 3020, "Pretrain/Step Time": 8.452582431957126} +{"Pretrain/Learning Rate": 4.786926669845702e-05, "Pretrain/Loss": 2.0478334426879883, "Pretrain/Loss (Raw)": 2.1000633239746094, "Pretrain/Step": 3021, "Pretrain/Step Time": 8.453954631462693} +{"Pretrain/Learning Rate": 4.786755143399364e-05, "Pretrain/Loss": 2.0479416847229004, "Pretrain/Loss (Raw)": 2.002047538757324, "Pretrain/Step": 3022, "Pretrain/Step Time": 8.456385347992182} +{"Pretrain/Learning Rate": 4.786583551016053e-05, "Pretrain/Loss": 2.0455212593078613, "Pretrain/Loss (Raw)": 1.8212581872940063, "Pretrain/Step": 3023, "Pretrain/Step Time": 8.45561096817255} +{"Pretrain/Learning Rate": 4.786411892700718e-05, "Pretrain/Loss": 2.04681658744812, "Pretrain/Loss (Raw)": 2.1542251110076904, "Pretrain/Step": 3024, "Pretrain/Step Time": 8.447142884135246} +{"Pretrain/Learning Rate": 4.786240168458307e-05, "Pretrain/Loss": 2.0449740886688232, "Pretrain/Loss (Raw)": 1.8762180805206299, "Pretrain/Step": 3025, "Pretrain/Step Time": 8.452314347028732} +{"Pretrain/Learning Rate": 4.7860683782937735e-05, "Pretrain/Loss": 2.051079034805298, "Pretrain/Loss (Raw)": 2.2589309215545654, "Pretrain/Step": 3026, "Pretrain/Step Time": 8.448557924479246} +{"Pretrain/Learning Rate": 4.785896522212069e-05, "Pretrain/Loss": 2.053196668624878, "Pretrain/Loss (Raw)": 2.1490166187286377, "Pretrain/Step": 3027, "Pretrain/Step Time": 8.45126460492611} +{"Pretrain/Learning Rate": 4.78572460021815e-05, "Pretrain/Loss": 2.052800178527832, "Pretrain/Loss (Raw)": 2.1066510677337646, "Pretrain/Step": 3028, "Pretrain/Step Time": 8.45280011370778} +{"Pretrain/Learning Rate": 4.785552612316974e-05, "Pretrain/Loss": 2.055222749710083, "Pretrain/Loss (Raw)": 2.300964593887329, "Pretrain/Step": 3029, "Pretrain/Step Time": 8.462932327762246} +{"Pretrain/Learning Rate": 4.785380558513498e-05, "Pretrain/Loss": 2.0570931434631348, "Pretrain/Loss (Raw)": 2.3910434246063232, "Pretrain/Step": 3030, "Pretrain/Step Time": 8.461683912202716} +{"Pretrain/Learning Rate": 4.785208438812686e-05, "Pretrain/Loss": 2.0574920177459717, "Pretrain/Loss (Raw)": 2.1136412620544434, "Pretrain/Step": 3031, "Pretrain/Step Time": 8.463430564850569} +{"Pretrain/Learning Rate": 4.785036253219499e-05, "Pretrain/Loss": 2.0584187507629395, "Pretrain/Loss (Raw)": 2.1688010692596436, "Pretrain/Step": 3032, "Pretrain/Step Time": 8.459868492558599} +{"Pretrain/Learning Rate": 4.7848640017389035e-05, "Pretrain/Loss": 2.060657501220703, "Pretrain/Loss (Raw)": 2.252746820449829, "Pretrain/Step": 3033, "Pretrain/Step Time": 8.461583591997623} +{"Pretrain/Learning Rate": 4.784691684375865e-05, "Pretrain/Loss": 2.0595924854278564, "Pretrain/Loss (Raw)": 2.041306495666504, "Pretrain/Step": 3034, "Pretrain/Step Time": 8.461118929088116} +{"Pretrain/Learning Rate": 4.7845193011353516e-05, "Pretrain/Loss": 2.0586249828338623, "Pretrain/Loss (Raw)": 2.021451234817505, "Pretrain/Step": 3035, "Pretrain/Step Time": 8.462679831311107} +{"Pretrain/Learning Rate": 4.784346852022335e-05, "Pretrain/Loss": 2.060270309448242, "Pretrain/Loss (Raw)": 2.2538821697235107, "Pretrain/Step": 3036, "Pretrain/Step Time": 8.462507294490933} +{"Pretrain/Learning Rate": 4.784174337041787e-05, "Pretrain/Loss": 2.062112808227539, "Pretrain/Loss (Raw)": 2.0764081478118896, "Pretrain/Step": 3037, "Pretrain/Step Time": 8.459645140916109} +{"Pretrain/Learning Rate": 4.784001756198683e-05, "Pretrain/Loss": 2.0638413429260254, "Pretrain/Loss (Raw)": 2.143531560897827, "Pretrain/Step": 3038, "Pretrain/Step Time": 8.46069653891027} +{"Pretrain/Learning Rate": 4.783829109497998e-05, "Pretrain/Loss": 2.064426898956299, "Pretrain/Loss (Raw)": 2.1156368255615234, "Pretrain/Step": 3039, "Pretrain/Step Time": 8.456192050129175} +{"Pretrain/Learning Rate": 4.7836563969447105e-05, "Pretrain/Loss": 2.0661747455596924, "Pretrain/Loss (Raw)": 2.1568820476531982, "Pretrain/Step": 3040, "Pretrain/Step Time": 8.458459589630365} +{"Pretrain/Learning Rate": 4.7834836185438006e-05, "Pretrain/Loss": 2.066011428833008, "Pretrain/Loss (Raw)": 2.119562864303589, "Pretrain/Step": 3041, "Pretrain/Step Time": 8.454686248674989} +{"Pretrain/Learning Rate": 4.783310774300251e-05, "Pretrain/Loss": 2.0649147033691406, "Pretrain/Loss (Raw)": 1.924007534980774, "Pretrain/Step": 3042, "Pretrain/Step Time": 8.451481921598315} +{"Pretrain/Learning Rate": 4.783137864219044e-05, "Pretrain/Loss": 2.069267749786377, "Pretrain/Loss (Raw)": 2.2623703479766846, "Pretrain/Step": 3043, "Pretrain/Step Time": 8.452637130394578} +{"Pretrain/Learning Rate": 4.782964888305167e-05, "Pretrain/Loss": 2.069155693054199, "Pretrain/Loss (Raw)": 2.1204886436462402, "Pretrain/Step": 3044, "Pretrain/Step Time": 8.452806303277612} +{"Pretrain/Learning Rate": 4.782791846563606e-05, "Pretrain/Loss": 2.0668869018554688, "Pretrain/Loss (Raw)": 1.755140781402588, "Pretrain/Step": 3045, "Pretrain/Step Time": 8.455816054716706} +{"Pretrain/Learning Rate": 4.782618738999352e-05, "Pretrain/Loss": 2.0661940574645996, "Pretrain/Loss (Raw)": 2.0425586700439453, "Pretrain/Step": 3046, "Pretrain/Step Time": 8.45377629995346} +{"Pretrain/Learning Rate": 4.7824455656173954e-05, "Pretrain/Loss": 2.068284511566162, "Pretrain/Loss (Raw)": 2.167973279953003, "Pretrain/Step": 3047, "Pretrain/Step Time": 8.455766011029482} +{"Pretrain/Learning Rate": 4.78227232642273e-05, "Pretrain/Loss": 2.069185733795166, "Pretrain/Loss (Raw)": 2.206890821456909, "Pretrain/Step": 3048, "Pretrain/Step Time": 8.456701673567295} +{"Pretrain/Learning Rate": 4.782099021420351e-05, "Pretrain/Loss": 2.0719223022460938, "Pretrain/Loss (Raw)": 2.061601161956787, "Pretrain/Step": 3049, "Pretrain/Step Time": 8.45244106464088} +{"Pretrain/Learning Rate": 4.781925650615256e-05, "Pretrain/Loss": 2.07010817527771, "Pretrain/Loss (Raw)": 1.9975804090499878, "Pretrain/Step": 3050, "Pretrain/Step Time": 8.456250376999378} +{"Pretrain/Learning Rate": 4.7817522140124424e-05, "Pretrain/Loss": 2.072157859802246, "Pretrain/Loss (Raw)": 2.0744545459747314, "Pretrain/Step": 3051, "Pretrain/Step Time": 8.458978187292814} +{"Pretrain/Learning Rate": 4.7815787116169134e-05, "Pretrain/Loss": 2.0709359645843506, "Pretrain/Loss (Raw)": 2.015491485595703, "Pretrain/Step": 3052, "Pretrain/Step Time": 8.458906503394246} +{"Pretrain/Learning Rate": 4.78140514343367e-05, "Pretrain/Loss": 2.0693166255950928, "Pretrain/Loss (Raw)": 1.9104238748550415, "Pretrain/Step": 3053, "Pretrain/Step Time": 8.456600362434983} +{"Pretrain/Learning Rate": 4.781231509467718e-05, "Pretrain/Loss": 2.0719988346099854, "Pretrain/Loss (Raw)": 2.2701399326324463, "Pretrain/Step": 3054, "Pretrain/Step Time": 8.458704624325037} +{"Pretrain/Learning Rate": 4.7810578097240635e-05, "Pretrain/Loss": 2.071986675262451, "Pretrain/Loss (Raw)": 1.8985106945037842, "Pretrain/Step": 3055, "Pretrain/Step Time": 8.452264994382858} +{"Pretrain/Learning Rate": 4.7808840442077146e-05, "Pretrain/Loss": 2.0718631744384766, "Pretrain/Loss (Raw)": 1.9518964290618896, "Pretrain/Step": 3056, "Pretrain/Step Time": 8.451861754059792} +{"Pretrain/Learning Rate": 4.780710212923682e-05, "Pretrain/Loss": 2.070685863494873, "Pretrain/Loss (Raw)": 2.194776773452759, "Pretrain/Step": 3057, "Pretrain/Step Time": 8.45652617327869} +{"Pretrain/Learning Rate": 4.7805363158769794e-05, "Pretrain/Loss": 2.0721073150634766, "Pretrain/Loss (Raw)": 2.2290396690368652, "Pretrain/Step": 3058, "Pretrain/Step Time": 8.449446639046073} +{"Pretrain/Learning Rate": 4.780362353072619e-05, "Pretrain/Loss": 2.0704102516174316, "Pretrain/Loss (Raw)": 2.0055031776428223, "Pretrain/Step": 3059, "Pretrain/Step Time": 8.451643904671073} +{"Pretrain/Learning Rate": 4.780188324515618e-05, "Pretrain/Loss": 2.0690410137176514, "Pretrain/Loss (Raw)": 1.9793429374694824, "Pretrain/Step": 3060, "Pretrain/Step Time": 8.448417512699962} +{"Pretrain/Learning Rate": 4.780014230210994e-05, "Pretrain/Loss": 2.0691399574279785, "Pretrain/Loss (Raw)": 1.9829180240631104, "Pretrain/Step": 3061, "Pretrain/Step Time": 8.446467265486717} +{"Pretrain/Learning Rate": 4.779840070163767e-05, "Pretrain/Loss": 2.0641653537750244, "Pretrain/Loss (Raw)": 1.9167736768722534, "Pretrain/Step": 3062, "Pretrain/Step Time": 8.449868939816952} +{"Pretrain/Learning Rate": 4.7796658443789585e-05, "Pretrain/Loss": 2.0632121562957764, "Pretrain/Loss (Raw)": 1.944063663482666, "Pretrain/Step": 3063, "Pretrain/Step Time": 8.45408270508051} +{"Pretrain/Learning Rate": 4.779491552861592e-05, "Pretrain/Loss": 2.062758445739746, "Pretrain/Loss (Raw)": 2.0942533016204834, "Pretrain/Step": 3064, "Pretrain/Step Time": 8.450520845130086} +{"Pretrain/Learning Rate": 4.779317195616695e-05, "Pretrain/Loss": 2.0618698596954346, "Pretrain/Loss (Raw)": 2.024956464767456, "Pretrain/Step": 3065, "Pretrain/Step Time": 8.45424934104085} +{"Pretrain/Learning Rate": 4.779142772649292e-05, "Pretrain/Loss": 2.0620875358581543, "Pretrain/Loss (Raw)": 1.9882922172546387, "Pretrain/Step": 3066, "Pretrain/Step Time": 8.45364249125123} +{"Pretrain/Learning Rate": 4.778968283964415e-05, "Pretrain/Loss": 2.0630288124084473, "Pretrain/Loss (Raw)": 2.055577278137207, "Pretrain/Step": 3067, "Pretrain/Step Time": 8.45395035110414} +{"Pretrain/Learning Rate": 4.778793729567093e-05, "Pretrain/Loss": 2.0628392696380615, "Pretrain/Loss (Raw)": 1.9834736585617065, "Pretrain/Step": 3068, "Pretrain/Step Time": 8.453244367614388} +{"Pretrain/Learning Rate": 4.778619109462361e-05, "Pretrain/Loss": 2.063258171081543, "Pretrain/Loss (Raw)": 1.9804917573928833, "Pretrain/Step": 3069, "Pretrain/Step Time": 8.455278174951673} +{"Pretrain/Learning Rate": 4.778444423655253e-05, "Pretrain/Loss": 2.064645290374756, "Pretrain/Loss (Raw)": 2.206454038619995, "Pretrain/Step": 3070, "Pretrain/Step Time": 8.454974927008152} +{"Pretrain/Learning Rate": 4.778269672150807e-05, "Pretrain/Loss": 2.064761161804199, "Pretrain/Loss (Raw)": 2.0463271141052246, "Pretrain/Step": 3071, "Pretrain/Step Time": 8.449544794857502} +{"Pretrain/Learning Rate": 4.77809485495406e-05, "Pretrain/Loss": 2.0660481452941895, "Pretrain/Loss (Raw)": 2.2973244190216064, "Pretrain/Step": 3072, "Pretrain/Step Time": 8.444852691143751} +{"Pretrain/Learning Rate": 4.777919972070054e-05, "Pretrain/Loss": 2.067779541015625, "Pretrain/Loss (Raw)": 2.151958465576172, "Pretrain/Step": 3073, "Pretrain/Step Time": 8.44737546890974} +{"Pretrain/Learning Rate": 4.777745023503831e-05, "Pretrain/Loss": 2.067838191986084, "Pretrain/Loss (Raw)": 2.126814842224121, "Pretrain/Step": 3074, "Pretrain/Step Time": 8.449104180559516} +{"Pretrain/Learning Rate": 4.777570009260437e-05, "Pretrain/Loss": 2.067629098892212, "Pretrain/Loss (Raw)": 2.1064724922180176, "Pretrain/Step": 3075, "Pretrain/Step Time": 8.444416511803865} +{"Pretrain/Learning Rate": 4.777394929344917e-05, "Pretrain/Loss": 2.066652774810791, "Pretrain/Loss (Raw)": 2.1121718883514404, "Pretrain/Step": 3076, "Pretrain/Step Time": 8.447119753807783} +{"Pretrain/Learning Rate": 4.77721978376232e-05, "Pretrain/Loss": 2.0693390369415283, "Pretrain/Loss (Raw)": 2.1978094577789307, "Pretrain/Step": 3077, "Pretrain/Step Time": 8.444664413109422} +{"Pretrain/Learning Rate": 4.777044572517695e-05, "Pretrain/Loss": 2.0692877769470215, "Pretrain/Loss (Raw)": 2.0226330757141113, "Pretrain/Step": 3078, "Pretrain/Step Time": 8.444895783439279} +{"Pretrain/Learning Rate": 4.776869295616095e-05, "Pretrain/Loss": 2.068936347961426, "Pretrain/Loss (Raw)": 1.8763976097106934, "Pretrain/Step": 3079, "Pretrain/Step Time": 8.44750295765698} +{"Pretrain/Learning Rate": 4.776693953062575e-05, "Pretrain/Loss": 2.0687270164489746, "Pretrain/Loss (Raw)": 2.1356801986694336, "Pretrain/Step": 3080, "Pretrain/Step Time": 8.443759799003601} +{"Pretrain/Learning Rate": 4.7765185448621894e-05, "Pretrain/Loss": 2.0676910877227783, "Pretrain/Loss (Raw)": 2.029418706893921, "Pretrain/Step": 3081, "Pretrain/Step Time": 8.44535536505282} +{"Pretrain/Learning Rate": 4.7763430710199965e-05, "Pretrain/Loss": 2.0691134929656982, "Pretrain/Loss (Raw)": 2.1711437702178955, "Pretrain/Step": 3082, "Pretrain/Step Time": 8.4426677711308} +{"Pretrain/Learning Rate": 4.7761675315410545e-05, "Pretrain/Loss": 2.0691792964935303, "Pretrain/Loss (Raw)": 2.0456666946411133, "Pretrain/Step": 3083, "Pretrain/Step Time": 8.449687264859676} +{"Pretrain/Learning Rate": 4.775991926430428e-05, "Pretrain/Loss": 2.0703868865966797, "Pretrain/Loss (Raw)": 2.2238805294036865, "Pretrain/Step": 3084, "Pretrain/Step Time": 8.446444872766733} +{"Pretrain/Learning Rate": 4.775816255693178e-05, "Pretrain/Loss": 2.0676980018615723, "Pretrain/Loss (Raw)": 2.2215216159820557, "Pretrain/Step": 3085, "Pretrain/Step Time": 8.447259170934558} +{"Pretrain/Learning Rate": 4.775640519334371e-05, "Pretrain/Loss": 2.064450740814209, "Pretrain/Loss (Raw)": 1.8933405876159668, "Pretrain/Step": 3086, "Pretrain/Step Time": 8.445333067327738} +{"Pretrain/Learning Rate": 4.7754647173590736e-05, "Pretrain/Loss": 2.0613625049591064, "Pretrain/Loss (Raw)": 1.8117799758911133, "Pretrain/Step": 3087, "Pretrain/Step Time": 8.445949211716652} +{"Pretrain/Learning Rate": 4.7752888497723555e-05, "Pretrain/Loss": 2.0621066093444824, "Pretrain/Loss (Raw)": 2.097090244293213, "Pretrain/Step": 3088, "Pretrain/Step Time": 8.443153524771333} +{"Pretrain/Learning Rate": 4.7751129165792866e-05, "Pretrain/Loss": 2.0627646446228027, "Pretrain/Loss (Raw)": 2.2177441120147705, "Pretrain/Step": 3089, "Pretrain/Step Time": 8.440924923866987} +{"Pretrain/Learning Rate": 4.774936917784941e-05, "Pretrain/Loss": 2.0625462532043457, "Pretrain/Loss (Raw)": 1.997359037399292, "Pretrain/Step": 3090, "Pretrain/Step Time": 8.445128349587321} +{"Pretrain/Learning Rate": 4.7747608533943934e-05, "Pretrain/Loss": 2.0617170333862305, "Pretrain/Loss (Raw)": 1.9119656085968018, "Pretrain/Step": 3091, "Pretrain/Step Time": 8.44171891361475} +{"Pretrain/Learning Rate": 4.7745847234127206e-05, "Pretrain/Loss": 2.0616841316223145, "Pretrain/Loss (Raw)": 2.0914204120635986, "Pretrain/Step": 3092, "Pretrain/Step Time": 8.443620912730694} +{"Pretrain/Learning Rate": 4.774408527845e-05, "Pretrain/Loss": 2.05985164642334, "Pretrain/Loss (Raw)": 2.0720667839050293, "Pretrain/Step": 3093, "Pretrain/Step Time": 8.437338463962078} +{"Pretrain/Learning Rate": 4.7742322666963127e-05, "Pretrain/Loss": 2.0582480430603027, "Pretrain/Loss (Raw)": 2.132276773452759, "Pretrain/Step": 3094, "Pretrain/Step Time": 8.437313685193658} +{"Pretrain/Learning Rate": 4.774055939971742e-05, "Pretrain/Loss": 2.05763578414917, "Pretrain/Loss (Raw)": 2.032254695892334, "Pretrain/Step": 3095, "Pretrain/Step Time": 8.438393438234925} +{"Pretrain/Learning Rate": 4.7738795476763706e-05, "Pretrain/Loss": 2.05554461479187, "Pretrain/Loss (Raw)": 1.9267290830612183, "Pretrain/Step": 3096, "Pretrain/Step Time": 8.43936925008893} +{"Pretrain/Learning Rate": 4.773703089815286e-05, "Pretrain/Loss": 2.0566232204437256, "Pretrain/Loss (Raw)": 2.1607398986816406, "Pretrain/Step": 3097, "Pretrain/Step Time": 8.441031981259584} +{"Pretrain/Learning Rate": 4.773526566393575e-05, "Pretrain/Loss": 2.0582473278045654, "Pretrain/Loss (Raw)": 1.892519474029541, "Pretrain/Step": 3098, "Pretrain/Step Time": 8.443626079708338} +{"Pretrain/Learning Rate": 4.773349977416329e-05, "Pretrain/Loss": 2.055837631225586, "Pretrain/Loss (Raw)": 1.8550961017608643, "Pretrain/Step": 3099, "Pretrain/Step Time": 8.442853910848498} +{"Pretrain/Learning Rate": 4.773173322888638e-05, "Pretrain/Loss": 2.0572824478149414, "Pretrain/Loss (Raw)": 2.0461320877075195, "Pretrain/Step": 3100, "Pretrain/Step Time": 8.44459835998714} +{"Pretrain/Learning Rate": 4.772996602815598e-05, "Pretrain/Loss": 2.0585830211639404, "Pretrain/Loss (Raw)": 2.2558534145355225, "Pretrain/Step": 3101, "Pretrain/Step Time": 8.447589509189129} +{"Pretrain/Learning Rate": 4.772819817202302e-05, "Pretrain/Loss": 2.060992479324341, "Pretrain/Loss (Raw)": 2.0819754600524902, "Pretrain/Step": 3102, "Pretrain/Step Time": 8.443461054936051} +{"Pretrain/Learning Rate": 4.7726429660538495e-05, "Pretrain/Loss": 2.060964822769165, "Pretrain/Loss (Raw)": 2.1903092861175537, "Pretrain/Step": 3103, "Pretrain/Step Time": 8.440737823024392} +{"Pretrain/Learning Rate": 4.772466049375339e-05, "Pretrain/Loss": 2.0598273277282715, "Pretrain/Loss (Raw)": 1.9652854204177856, "Pretrain/Step": 3104, "Pretrain/Step Time": 8.443465434014797} +{"Pretrain/Learning Rate": 4.7722890671718726e-05, "Pretrain/Loss": 2.060438632965088, "Pretrain/Loss (Raw)": 2.250943183898926, "Pretrain/Step": 3105, "Pretrain/Step Time": 8.441459590569139} +{"Pretrain/Learning Rate": 4.772112019448552e-05, "Pretrain/Loss": 2.0626115798950195, "Pretrain/Loss (Raw)": 2.1335909366607666, "Pretrain/Step": 3106, "Pretrain/Step Time": 8.443182984367013} +{"Pretrain/Learning Rate": 4.771934906210483e-05, "Pretrain/Loss": 2.0626566410064697, "Pretrain/Loss (Raw)": 2.1660397052764893, "Pretrain/Step": 3107, "Pretrain/Step Time": 8.437387676909566} +{"Pretrain/Learning Rate": 4.7717577274627735e-05, "Pretrain/Loss": 2.057936429977417, "Pretrain/Loss (Raw)": 1.9620380401611328, "Pretrain/Step": 3108, "Pretrain/Step Time": 8.440664730966091} +{"Pretrain/Learning Rate": 4.7715804832105305e-05, "Pretrain/Loss": 2.059023857116699, "Pretrain/Loss (Raw)": 2.0008411407470703, "Pretrain/Step": 3109, "Pretrain/Step Time": 8.43608863465488} +{"Pretrain/Learning Rate": 4.771403173458866e-05, "Pretrain/Loss": 2.0594170093536377, "Pretrain/Loss (Raw)": 2.176636219024658, "Pretrain/Step": 3110, "Pretrain/Step Time": 8.433984132483602} +{"Pretrain/Learning Rate": 4.771225798212892e-05, "Pretrain/Loss": 2.060081958770752, "Pretrain/Loss (Raw)": 2.122037649154663, "Pretrain/Step": 3111, "Pretrain/Step Time": 8.434288371354342} +{"Pretrain/Learning Rate": 4.7710483574777236e-05, "Pretrain/Loss": 2.0576210021972656, "Pretrain/Loss (Raw)": 1.9198393821716309, "Pretrain/Step": 3112, "Pretrain/Step Time": 8.435198593884706} +{"Pretrain/Learning Rate": 4.770870851258477e-05, "Pretrain/Loss": 2.056166648864746, "Pretrain/Loss (Raw)": 1.835335373878479, "Pretrain/Step": 3113, "Pretrain/Step Time": 8.435643576085567} +{"Pretrain/Learning Rate": 4.7706932795602696e-05, "Pretrain/Loss": 2.0556201934814453, "Pretrain/Loss (Raw)": 1.8977314233779907, "Pretrain/Step": 3114, "Pretrain/Step Time": 8.431250106543303} +{"Pretrain/Learning Rate": 4.770515642388223e-05, "Pretrain/Loss": 2.0536394119262695, "Pretrain/Loss (Raw)": 1.7152832746505737, "Pretrain/Step": 3115, "Pretrain/Step Time": 8.430989615619183} +{"Pretrain/Learning Rate": 4.770337939747457e-05, "Pretrain/Loss": 2.053321123123169, "Pretrain/Loss (Raw)": 1.7246806621551514, "Pretrain/Step": 3116, "Pretrain/Step Time": 8.433802818879485} +{"Pretrain/Learning Rate": 4.770160171643098e-05, "Pretrain/Loss": 2.053760051727295, "Pretrain/Loss (Raw)": 2.0811586380004883, "Pretrain/Step": 3117, "Pretrain/Step Time": 8.430908039212227} +{"Pretrain/Learning Rate": 4.769982338080271e-05, "Pretrain/Loss": 2.053220748901367, "Pretrain/Loss (Raw)": 2.0430023670196533, "Pretrain/Step": 3118, "Pretrain/Step Time": 8.425982166081667} +{"Pretrain/Learning Rate": 4.769804439064103e-05, "Pretrain/Loss": 2.0535709857940674, "Pretrain/Loss (Raw)": 2.057734251022339, "Pretrain/Step": 3119, "Pretrain/Step Time": 8.427422760054469} +{"Pretrain/Learning Rate": 4.7696264745997245e-05, "Pretrain/Loss": 2.0558550357818604, "Pretrain/Loss (Raw)": 2.2898952960968018, "Pretrain/Step": 3120, "Pretrain/Step Time": 8.422557076439261} +{"Pretrain/Learning Rate": 4.769448444692266e-05, "Pretrain/Loss": 2.0578765869140625, "Pretrain/Loss (Raw)": 2.202310085296631, "Pretrain/Step": 3121, "Pretrain/Step Time": 8.424952717497945} +{"Pretrain/Learning Rate": 4.769270349346862e-05, "Pretrain/Loss": 2.0597081184387207, "Pretrain/Loss (Raw)": 2.104860305786133, "Pretrain/Step": 3122, "Pretrain/Step Time": 8.421080304309726} +{"Pretrain/Learning Rate": 4.7690921885686474e-05, "Pretrain/Loss": 2.061368465423584, "Pretrain/Loss (Raw)": 2.1651625633239746, "Pretrain/Step": 3123, "Pretrain/Step Time": 8.42618664726615} +{"Pretrain/Learning Rate": 4.7689139623627584e-05, "Pretrain/Loss": 2.0597243309020996, "Pretrain/Loss (Raw)": 1.9124146699905396, "Pretrain/Step": 3124, "Pretrain/Step Time": 8.427501525729895} +{"Pretrain/Learning Rate": 4.7687356707343357e-05, "Pretrain/Loss": 2.0604257583618164, "Pretrain/Loss (Raw)": 2.071949005126953, "Pretrain/Step": 3125, "Pretrain/Step Time": 8.422138137742877} +{"Pretrain/Learning Rate": 4.768557313688519e-05, "Pretrain/Loss": 2.0617167949676514, "Pretrain/Loss (Raw)": 2.0263149738311768, "Pretrain/Step": 3126, "Pretrain/Step Time": 8.41762418858707} +{"Pretrain/Learning Rate": 4.7683788912304506e-05, "Pretrain/Loss": 2.0615780353546143, "Pretrain/Loss (Raw)": 2.0698494911193848, "Pretrain/Step": 3127, "Pretrain/Step Time": 8.416597209870815} +{"Pretrain/Learning Rate": 4.7682004033652774e-05, "Pretrain/Loss": 2.0601794719696045, "Pretrain/Loss (Raw)": 1.8784819841384888, "Pretrain/Step": 3128, "Pretrain/Step Time": 8.42005867138505} +{"Pretrain/Learning Rate": 4.768021850098143e-05, "Pretrain/Loss": 2.060527801513672, "Pretrain/Loss (Raw)": 1.9413121938705444, "Pretrain/Step": 3129, "Pretrain/Step Time": 8.4181252643466} +{"Pretrain/Learning Rate": 4.767843231434198e-05, "Pretrain/Loss": 2.064876079559326, "Pretrain/Loss (Raw)": 2.5240774154663086, "Pretrain/Step": 3130, "Pretrain/Step Time": 8.416369529440999} +{"Pretrain/Learning Rate": 4.767664547378593e-05, "Pretrain/Loss": 2.066708564758301, "Pretrain/Loss (Raw)": 2.042285680770874, "Pretrain/Step": 3131, "Pretrain/Step Time": 8.419039536267519} +{"Pretrain/Learning Rate": 4.7674857979364785e-05, "Pretrain/Loss": 2.0665111541748047, "Pretrain/Loss (Raw)": 2.1836369037628174, "Pretrain/Step": 3132, "Pretrain/Step Time": 8.416177013888955} +{"Pretrain/Learning Rate": 4.767306983113009e-05, "Pretrain/Loss": 2.0639328956604004, "Pretrain/Loss (Raw)": 1.8029130697250366, "Pretrain/Step": 3133, "Pretrain/Step Time": 8.417671848088503} +{"Pretrain/Learning Rate": 4.767128102913342e-05, "Pretrain/Loss": 2.0632059574127197, "Pretrain/Loss (Raw)": 2.0745928287506104, "Pretrain/Step": 3134, "Pretrain/Step Time": 8.417163910344243} +{"Pretrain/Learning Rate": 4.766949157342634e-05, "Pretrain/Loss": 2.0650956630706787, "Pretrain/Loss (Raw)": 2.1868722438812256, "Pretrain/Step": 3135, "Pretrain/Step Time": 8.420085918158293} +{"Pretrain/Learning Rate": 4.766770146406045e-05, "Pretrain/Loss": 2.066939115524292, "Pretrain/Loss (Raw)": 2.067507028579712, "Pretrain/Step": 3136, "Pretrain/Step Time": 8.419185465201735} +{"Pretrain/Learning Rate": 4.766591070108737e-05, "Pretrain/Loss": 2.0682709217071533, "Pretrain/Loss (Raw)": 2.1522469520568848, "Pretrain/Step": 3137, "Pretrain/Step Time": 8.415656818076968} +{"Pretrain/Learning Rate": 4.766411928455873e-05, "Pretrain/Loss": 2.069105863571167, "Pretrain/Loss (Raw)": 2.10325288772583, "Pretrain/Step": 3138, "Pretrain/Step Time": 8.4194322116673} +{"Pretrain/Learning Rate": 4.766232721452619e-05, "Pretrain/Loss": 2.0706164836883545, "Pretrain/Loss (Raw)": 2.117954730987549, "Pretrain/Step": 3139, "Pretrain/Step Time": 8.414456279948354} +{"Pretrain/Learning Rate": 4.766053449104142e-05, "Pretrain/Loss": 2.0676679611206055, "Pretrain/Loss (Raw)": 1.6723334789276123, "Pretrain/Step": 3140, "Pretrain/Step Time": 8.417263137176633} +{"Pretrain/Learning Rate": 4.765874111415611e-05, "Pretrain/Loss": 2.064575672149658, "Pretrain/Loss (Raw)": 1.8657608032226562, "Pretrain/Step": 3141, "Pretrain/Step Time": 8.411569882184267} +{"Pretrain/Learning Rate": 4.765694708392198e-05, "Pretrain/Loss": 2.0645875930786133, "Pretrain/Loss (Raw)": 1.927088975906372, "Pretrain/Step": 3142, "Pretrain/Step Time": 8.408649375662208} +{"Pretrain/Learning Rate": 4.765515240039075e-05, "Pretrain/Loss": 2.0657973289489746, "Pretrain/Loss (Raw)": 2.075695753097534, "Pretrain/Step": 3143, "Pretrain/Step Time": 8.409491669386625} +{"Pretrain/Learning Rate": 4.7653357063614176e-05, "Pretrain/Loss": 2.0650343894958496, "Pretrain/Loss (Raw)": 2.097968816757202, "Pretrain/Step": 3144, "Pretrain/Step Time": 8.414353815838695} +{"Pretrain/Learning Rate": 4.7651561073644015e-05, "Pretrain/Loss": 2.0631117820739746, "Pretrain/Loss (Raw)": 1.9105896949768066, "Pretrain/Step": 3145, "Pretrain/Step Time": 8.419765712693334} +{"Pretrain/Learning Rate": 4.7649764430532055e-05, "Pretrain/Loss": 2.0632834434509277, "Pretrain/Loss (Raw)": 2.0463428497314453, "Pretrain/Step": 3146, "Pretrain/Step Time": 8.418006986379623} +{"Pretrain/Learning Rate": 4.7647967134330106e-05, "Pretrain/Loss": 2.0622448921203613, "Pretrain/Loss (Raw)": 2.062471628189087, "Pretrain/Step": 3147, "Pretrain/Step Time": 8.422730084508657} +{"Pretrain/Learning Rate": 4.764616918509e-05, "Pretrain/Loss": 2.0631933212280273, "Pretrain/Loss (Raw)": 2.1588592529296875, "Pretrain/Step": 3148, "Pretrain/Step Time": 8.423440182581544} +{"Pretrain/Learning Rate": 4.764437058286356e-05, "Pretrain/Loss": 2.0626049041748047, "Pretrain/Loss (Raw)": 2.024717330932617, "Pretrain/Step": 3149, "Pretrain/Step Time": 8.420630795881152} +{"Pretrain/Learning Rate": 4.7642571327702666e-05, "Pretrain/Loss": 2.0622315406799316, "Pretrain/Loss (Raw)": 1.9542486667633057, "Pretrain/Step": 3150, "Pretrain/Step Time": 8.418019536882639} +{"Pretrain/Learning Rate": 4.764077141965918e-05, "Pretrain/Loss": 2.065265655517578, "Pretrain/Loss (Raw)": 2.209646224975586, "Pretrain/Step": 3151, "Pretrain/Step Time": 8.41845971904695} +{"Pretrain/Learning Rate": 4.7638970858785015e-05, "Pretrain/Loss": 2.064802646636963, "Pretrain/Loss (Raw)": 2.094956874847412, "Pretrain/Step": 3152, "Pretrain/Step Time": 8.423592634499073} +{"Pretrain/Learning Rate": 4.763716964513209e-05, "Pretrain/Loss": 2.066694498062134, "Pretrain/Loss (Raw)": 2.118382692337036, "Pretrain/Step": 3153, "Pretrain/Step Time": 8.417600637301803} +{"Pretrain/Learning Rate": 4.7635367778752325e-05, "Pretrain/Loss": 2.0645689964294434, "Pretrain/Loss (Raw)": 1.98685884475708, "Pretrain/Step": 3154, "Pretrain/Step Time": 8.421037327498198} +{"Pretrain/Learning Rate": 4.76335652596977e-05, "Pretrain/Loss": 2.0638604164123535, "Pretrain/Loss (Raw)": 2.0583014488220215, "Pretrain/Step": 3155, "Pretrain/Step Time": 8.41413482837379} +{"Pretrain/Learning Rate": 4.763176208802017e-05, "Pretrain/Loss": 2.0644421577453613, "Pretrain/Loss (Raw)": 2.1811435222625732, "Pretrain/Step": 3156, "Pretrain/Step Time": 8.412093583494425} +{"Pretrain/Learning Rate": 4.762995826377173e-05, "Pretrain/Loss": 2.0635037422180176, "Pretrain/Loss (Raw)": 2.1808371543884277, "Pretrain/Step": 3157, "Pretrain/Step Time": 8.406376872211695} +{"Pretrain/Learning Rate": 4.7628153787004404e-05, "Pretrain/Loss": 2.0620970726013184, "Pretrain/Loss (Raw)": 2.2109813690185547, "Pretrain/Step": 3158, "Pretrain/Step Time": 8.406807394698262} +{"Pretrain/Learning Rate": 4.762634865777021e-05, "Pretrain/Loss": 2.062384605407715, "Pretrain/Loss (Raw)": 2.150463342666626, "Pretrain/Step": 3159, "Pretrain/Step Time": 8.404981270432472} +{"Pretrain/Learning Rate": 4.762454287612121e-05, "Pretrain/Loss": 2.0615005493164062, "Pretrain/Loss (Raw)": 2.0556325912475586, "Pretrain/Step": 3160, "Pretrain/Step Time": 8.406561404466629} +{"Pretrain/Learning Rate": 4.762273644210946e-05, "Pretrain/Loss": 2.0610790252685547, "Pretrain/Loss (Raw)": 2.198763132095337, "Pretrain/Step": 3161, "Pretrain/Step Time": 8.409147569909692} +{"Pretrain/Learning Rate": 4.762092935578705e-05, "Pretrain/Loss": 2.0622568130493164, "Pretrain/Loss (Raw)": 2.1920738220214844, "Pretrain/Step": 3162, "Pretrain/Step Time": 8.408741276711226} +{"Pretrain/Learning Rate": 4.76191216172061e-05, "Pretrain/Loss": 2.0619211196899414, "Pretrain/Loss (Raw)": 1.9784984588623047, "Pretrain/Step": 3163, "Pretrain/Step Time": 8.412039330229163} +{"Pretrain/Learning Rate": 4.7617313226418715e-05, "Pretrain/Loss": 2.0580191612243652, "Pretrain/Loss (Raw)": 1.7544069290161133, "Pretrain/Step": 3164, "Pretrain/Step Time": 8.412517864257097} +{"Pretrain/Learning Rate": 4.761550418347704e-05, "Pretrain/Loss": 2.059286594390869, "Pretrain/Loss (Raw)": 2.238675355911255, "Pretrain/Step": 3165, "Pretrain/Step Time": 8.41230689175427} +{"Pretrain/Learning Rate": 4.761369448843326e-05, "Pretrain/Loss": 2.0575923919677734, "Pretrain/Loss (Raw)": 1.926639437675476, "Pretrain/Step": 3166, "Pretrain/Step Time": 8.413244044408202} +{"Pretrain/Learning Rate": 4.761188414133953e-05, "Pretrain/Loss": 2.0575554370880127, "Pretrain/Loss (Raw)": 2.1109299659729004, "Pretrain/Step": 3167, "Pretrain/Step Time": 8.413618009537458} +{"Pretrain/Learning Rate": 4.761007314224807e-05, "Pretrain/Loss": 2.057363510131836, "Pretrain/Loss (Raw)": 2.1323108673095703, "Pretrain/Step": 3168, "Pretrain/Step Time": 8.413169417530298} +{"Pretrain/Learning Rate": 4.760826149121108e-05, "Pretrain/Loss": 2.057199716567993, "Pretrain/Loss (Raw)": 2.0985960960388184, "Pretrain/Step": 3169, "Pretrain/Step Time": 8.41418600641191} +{"Pretrain/Learning Rate": 4.760644918828081e-05, "Pretrain/Loss": 2.0598626136779785, "Pretrain/Loss (Raw)": 2.26485013961792, "Pretrain/Step": 3170, "Pretrain/Step Time": 8.417035980150104} +{"Pretrain/Learning Rate": 4.760463623350952e-05, "Pretrain/Loss": 2.0599405765533447, "Pretrain/Loss (Raw)": 2.2723615169525146, "Pretrain/Step": 3171, "Pretrain/Step Time": 8.413905050605536} +{"Pretrain/Learning Rate": 4.760282262694947e-05, "Pretrain/Loss": 2.0591609477996826, "Pretrain/Loss (Raw)": 2.0206985473632812, "Pretrain/Step": 3172, "Pretrain/Step Time": 8.41274556145072} +{"Pretrain/Learning Rate": 4.760100836865298e-05, "Pretrain/Loss": 2.0614547729492188, "Pretrain/Loss (Raw)": 2.0487236976623535, "Pretrain/Step": 3173, "Pretrain/Step Time": 8.41230683401227} +{"Pretrain/Learning Rate": 4.759919345867233e-05, "Pretrain/Loss": 2.062404155731201, "Pretrain/Loss (Raw)": 2.164116859436035, "Pretrain/Step": 3174, "Pretrain/Step Time": 8.409888826310635} +{"Pretrain/Learning Rate": 4.7597377897059875e-05, "Pretrain/Loss": 2.062544345855713, "Pretrain/Loss (Raw)": 2.1859071254730225, "Pretrain/Step": 3175, "Pretrain/Step Time": 8.409178426489234} +{"Pretrain/Learning Rate": 4.759556168386796e-05, "Pretrain/Loss": 2.0602171421051025, "Pretrain/Loss (Raw)": 1.9090110063552856, "Pretrain/Step": 3176, "Pretrain/Step Time": 8.41063922829926} +{"Pretrain/Learning Rate": 4.759374481914895e-05, "Pretrain/Loss": 2.060361862182617, "Pretrain/Loss (Raw)": 2.0801126956939697, "Pretrain/Step": 3177, "Pretrain/Step Time": 8.414464097470045} +{"Pretrain/Learning Rate": 4.759192730295523e-05, "Pretrain/Loss": 2.0621273517608643, "Pretrain/Loss (Raw)": 2.2235610485076904, "Pretrain/Step": 3178, "Pretrain/Step Time": 8.41141496784985} +{"Pretrain/Learning Rate": 4.7590109135339224e-05, "Pretrain/Loss": 2.0609912872314453, "Pretrain/Loss (Raw)": 1.9290271997451782, "Pretrain/Step": 3179, "Pretrain/Step Time": 8.40654394775629} +{"Pretrain/Learning Rate": 4.758829031635334e-05, "Pretrain/Loss": 2.0616390705108643, "Pretrain/Loss (Raw)": 2.098414659500122, "Pretrain/Step": 3180, "Pretrain/Step Time": 8.412226032465696} +{"Pretrain/Learning Rate": 4.758647084605003e-05, "Pretrain/Loss": 2.062260150909424, "Pretrain/Loss (Raw)": 1.9899271726608276, "Pretrain/Step": 3181, "Pretrain/Step Time": 8.410920817404985} +{"Pretrain/Learning Rate": 4.758465072448175e-05, "Pretrain/Loss": 2.0610148906707764, "Pretrain/Loss (Raw)": 2.1107470989227295, "Pretrain/Step": 3182, "Pretrain/Step Time": 8.415695263072848} +{"Pretrain/Learning Rate": 4.758282995170099e-05, "Pretrain/Loss": 2.064018726348877, "Pretrain/Loss (Raw)": 2.283017635345459, "Pretrain/Step": 3183, "Pretrain/Step Time": 8.416087910532951} +{"Pretrain/Learning Rate": 4.758100852776025e-05, "Pretrain/Loss": 2.0650267601013184, "Pretrain/Loss (Raw)": 2.0809154510498047, "Pretrain/Step": 3184, "Pretrain/Step Time": 8.415463216602802} +{"Pretrain/Learning Rate": 4.7579186452712055e-05, "Pretrain/Loss": 2.0645041465759277, "Pretrain/Loss (Raw)": 2.127864122390747, "Pretrain/Step": 3185, "Pretrain/Step Time": 8.412871656939387} +{"Pretrain/Learning Rate": 4.7577363726608926e-05, "Pretrain/Loss": 2.0614964962005615, "Pretrain/Loss (Raw)": 1.8440842628479004, "Pretrain/Step": 3186, "Pretrain/Step Time": 8.414084857329726} +{"Pretrain/Learning Rate": 4.7575540349503434e-05, "Pretrain/Loss": 2.0634493827819824, "Pretrain/Loss (Raw)": 2.2554638385772705, "Pretrain/Step": 3187, "Pretrain/Step Time": 8.413207862526178} +{"Pretrain/Learning Rate": 4.757371632144815e-05, "Pretrain/Loss": 2.0649285316467285, "Pretrain/Loss (Raw)": 2.1686630249023438, "Pretrain/Step": 3188, "Pretrain/Step Time": 8.410471582785249} +{"Pretrain/Learning Rate": 4.757189164249567e-05, "Pretrain/Loss": 2.067244052886963, "Pretrain/Loss (Raw)": 2.279296636581421, "Pretrain/Step": 3189, "Pretrain/Step Time": 8.413837745785713} +{"Pretrain/Learning Rate": 4.7570066312698605e-05, "Pretrain/Loss": 2.0688376426696777, "Pretrain/Loss (Raw)": 2.1207895278930664, "Pretrain/Step": 3190, "Pretrain/Step Time": 8.411354126408696} +{"Pretrain/Learning Rate": 4.756824033210959e-05, "Pretrain/Loss": 2.068258285522461, "Pretrain/Loss (Raw)": 1.869881510734558, "Pretrain/Step": 3191, "Pretrain/Step Time": 8.409603288397193} +{"Pretrain/Learning Rate": 4.756641370078127e-05, "Pretrain/Loss": 2.0670433044433594, "Pretrain/Loss (Raw)": 1.9387390613555908, "Pretrain/Step": 3192, "Pretrain/Step Time": 8.412526033818722} +{"Pretrain/Learning Rate": 4.756458641876632e-05, "Pretrain/Loss": 2.0677051544189453, "Pretrain/Loss (Raw)": 2.1096646785736084, "Pretrain/Step": 3193, "Pretrain/Step Time": 8.413107343018055} +{"Pretrain/Learning Rate": 4.756275848611743e-05, "Pretrain/Loss": 2.068143129348755, "Pretrain/Loss (Raw)": 2.0443599224090576, "Pretrain/Step": 3194, "Pretrain/Step Time": 8.414444612339139} +{"Pretrain/Learning Rate": 4.756092990288731e-05, "Pretrain/Loss": 2.0680623054504395, "Pretrain/Loss (Raw)": 2.0452539920806885, "Pretrain/Step": 3195, "Pretrain/Step Time": 8.412428475916386} +{"Pretrain/Learning Rate": 4.7559100669128676e-05, "Pretrain/Loss": 2.069281816482544, "Pretrain/Loss (Raw)": 2.139554500579834, "Pretrain/Step": 3196, "Pretrain/Step Time": 8.416185451671481} +{"Pretrain/Learning Rate": 4.7557270784894276e-05, "Pretrain/Loss": 2.070305824279785, "Pretrain/Loss (Raw)": 2.1115705966949463, "Pretrain/Step": 3197, "Pretrain/Step Time": 8.41649815440178} +{"Pretrain/Learning Rate": 4.7555440250236875e-05, "Pretrain/Loss": 2.069878101348877, "Pretrain/Loss (Raw)": 2.151681900024414, "Pretrain/Step": 3198, "Pretrain/Step Time": 8.417166482657194} +{"Pretrain/Learning Rate": 4.755360906520926e-05, "Pretrain/Loss": 2.0683434009552, "Pretrain/Loss (Raw)": 1.8499271869659424, "Pretrain/Step": 3199, "Pretrain/Step Time": 8.424956047907472} +{"Pretrain/Learning Rate": 4.755177722986422e-05, "Pretrain/Loss": 2.0665996074676514, "Pretrain/Loss (Raw)": 2.0740935802459717, "Pretrain/Step": 3200, "Pretrain/Step Time": 8.421608848497272} +{"Pretrain/Learning Rate": 4.754994474425458e-05, "Pretrain/Loss": 2.0680036544799805, "Pretrain/Loss (Raw)": 2.3316845893859863, "Pretrain/Step": 3201, "Pretrain/Step Time": 8.419013479724526} +{"Pretrain/Learning Rate": 4.754811160843319e-05, "Pretrain/Loss": 2.0671937465667725, "Pretrain/Loss (Raw)": 2.0231356620788574, "Pretrain/Step": 3202, "Pretrain/Step Time": 8.417905950918794} +{"Pretrain/Learning Rate": 4.754627782245289e-05, "Pretrain/Loss": 2.071535587310791, "Pretrain/Loss (Raw)": 2.6622061729431152, "Pretrain/Step": 3203, "Pretrain/Step Time": 8.415693150833249} +{"Pretrain/Learning Rate": 4.754444338636657e-05, "Pretrain/Loss": 2.0720713138580322, "Pretrain/Loss (Raw)": 2.1807594299316406, "Pretrain/Step": 3204, "Pretrain/Step Time": 8.412859225645661} +{"Pretrain/Learning Rate": 4.754260830022711e-05, "Pretrain/Loss": 2.072002410888672, "Pretrain/Loss (Raw)": 2.1889965534210205, "Pretrain/Step": 3205, "Pretrain/Step Time": 8.413517620414495} +{"Pretrain/Learning Rate": 4.754077256408743e-05, "Pretrain/Loss": 2.0705108642578125, "Pretrain/Loss (Raw)": 1.831710696220398, "Pretrain/Step": 3206, "Pretrain/Step Time": 8.41141059435904} +{"Pretrain/Learning Rate": 4.753893617800046e-05, "Pretrain/Loss": 2.072720527648926, "Pretrain/Loss (Raw)": 2.159256935119629, "Pretrain/Step": 3207, "Pretrain/Step Time": 8.41706290282309} +{"Pretrain/Learning Rate": 4.753709914201916e-05, "Pretrain/Loss": 2.0714001655578613, "Pretrain/Loss (Raw)": 1.9666506052017212, "Pretrain/Step": 3208, "Pretrain/Step Time": 8.415983010083437} +{"Pretrain/Learning Rate": 4.75352614561965e-05, "Pretrain/Loss": 2.0704727172851562, "Pretrain/Loss (Raw)": 1.910714030265808, "Pretrain/Step": 3209, "Pretrain/Step Time": 8.418101239949465} +{"Pretrain/Learning Rate": 4.753342312058546e-05, "Pretrain/Loss": 2.071340799331665, "Pretrain/Loss (Raw)": 2.28227162361145, "Pretrain/Step": 3210, "Pretrain/Step Time": 8.424796760082245} +{"Pretrain/Learning Rate": 4.753158413523904e-05, "Pretrain/Loss": 2.071662187576294, "Pretrain/Loss (Raw)": 2.0867857933044434, "Pretrain/Step": 3211, "Pretrain/Step Time": 8.419612068682909} +{"Pretrain/Learning Rate": 4.752974450021028e-05, "Pretrain/Loss": 2.0713210105895996, "Pretrain/Loss (Raw)": 2.1802303791046143, "Pretrain/Step": 3212, "Pretrain/Step Time": 8.420753497630358} +{"Pretrain/Learning Rate": 4.7527904215552227e-05, "Pretrain/Loss": 2.070770740509033, "Pretrain/Loss (Raw)": 2.151085138320923, "Pretrain/Step": 3213, "Pretrain/Step Time": 8.42017170228064} +{"Pretrain/Learning Rate": 4.7526063281317935e-05, "Pretrain/Loss": 2.071978807449341, "Pretrain/Loss (Raw)": 2.0479612350463867, "Pretrain/Step": 3214, "Pretrain/Step Time": 8.421941805630922} +{"Pretrain/Learning Rate": 4.752422169756048e-05, "Pretrain/Loss": 2.073167085647583, "Pretrain/Loss (Raw)": 1.9638960361480713, "Pretrain/Step": 3215, "Pretrain/Step Time": 8.421139743179083} +{"Pretrain/Learning Rate": 4.752237946433298e-05, "Pretrain/Loss": 2.07381534576416, "Pretrain/Loss (Raw)": 2.1800575256347656, "Pretrain/Step": 3216, "Pretrain/Step Time": 8.419444920495152} +{"Pretrain/Learning Rate": 4.752053658168854e-05, "Pretrain/Loss": 2.0747809410095215, "Pretrain/Loss (Raw)": 2.3413236141204834, "Pretrain/Step": 3217, "Pretrain/Step Time": 8.420699540525675} +{"Pretrain/Learning Rate": 4.75186930496803e-05, "Pretrain/Loss": 2.0757482051849365, "Pretrain/Loss (Raw)": 2.121185064315796, "Pretrain/Step": 3218, "Pretrain/Step Time": 8.420639274641871} +{"Pretrain/Learning Rate": 4.751684886836143e-05, "Pretrain/Loss": 2.0771427154541016, "Pretrain/Loss (Raw)": 2.0904593467712402, "Pretrain/Step": 3219, "Pretrain/Step Time": 8.42318120598793} +{"Pretrain/Learning Rate": 4.751500403778508e-05, "Pretrain/Loss": 2.0771069526672363, "Pretrain/Loss (Raw)": 2.0868396759033203, "Pretrain/Step": 3220, "Pretrain/Step Time": 8.418995566666126} +{"Pretrain/Learning Rate": 4.751315855800448e-05, "Pretrain/Loss": 2.081660747528076, "Pretrain/Loss (Raw)": 2.6549742221832275, "Pretrain/Step": 3221, "Pretrain/Step Time": 8.422838643193245} +{"Pretrain/Learning Rate": 4.751131242907281e-05, "Pretrain/Loss": 2.082007884979248, "Pretrain/Loss (Raw)": 2.1766958236694336, "Pretrain/Step": 3222, "Pretrain/Step Time": 8.423960648477077} +{"Pretrain/Learning Rate": 4.750946565104333e-05, "Pretrain/Loss": 2.0831971168518066, "Pretrain/Loss (Raw)": 2.184460163116455, "Pretrain/Step": 3223, "Pretrain/Step Time": 8.420814372599125} +{"Pretrain/Learning Rate": 4.750761822396926e-05, "Pretrain/Loss": 2.0848422050476074, "Pretrain/Loss (Raw)": 2.1373114585876465, "Pretrain/Step": 3224, "Pretrain/Step Time": 8.420239234343171} +{"Pretrain/Learning Rate": 4.750577014790389e-05, "Pretrain/Loss": 2.0833864212036133, "Pretrain/Loss (Raw)": 1.974401593208313, "Pretrain/Step": 3225, "Pretrain/Step Time": 8.417376464232802} +{"Pretrain/Learning Rate": 4.750392142290051e-05, "Pretrain/Loss": 2.0838050842285156, "Pretrain/Loss (Raw)": 1.9461358785629272, "Pretrain/Step": 3226, "Pretrain/Step Time": 8.418757492676377} +{"Pretrain/Learning Rate": 4.7502072049012413e-05, "Pretrain/Loss": 2.0853967666625977, "Pretrain/Loss (Raw)": 2.0588042736053467, "Pretrain/Step": 3227, "Pretrain/Step Time": 8.420800160616636} +{"Pretrain/Learning Rate": 4.7500222026292936e-05, "Pretrain/Loss": 2.0850186347961426, "Pretrain/Loss (Raw)": 1.9977442026138306, "Pretrain/Step": 3228, "Pretrain/Step Time": 8.420956598594785} +{"Pretrain/Learning Rate": 4.749837135479541e-05, "Pretrain/Loss": 2.0838472843170166, "Pretrain/Loss (Raw)": 2.1059072017669678, "Pretrain/Step": 3229, "Pretrain/Step Time": 8.425058275461197} +{"Pretrain/Learning Rate": 4.7496520034573225e-05, "Pretrain/Loss": 2.0835204124450684, "Pretrain/Loss (Raw)": 2.040147542953491, "Pretrain/Step": 3230, "Pretrain/Step Time": 8.423037169501185} +{"Pretrain/Learning Rate": 4.7494668065679724e-05, "Pretrain/Loss": 2.081331729888916, "Pretrain/Loss (Raw)": 1.910133719444275, "Pretrain/Step": 3231, "Pretrain/Step Time": 8.420972907915711} +{"Pretrain/Learning Rate": 4.749281544816834e-05, "Pretrain/Loss": 2.07938289642334, "Pretrain/Loss (Raw)": 1.7158490419387817, "Pretrain/Step": 3232, "Pretrain/Step Time": 8.421844366937876} +{"Pretrain/Learning Rate": 4.7490962182092466e-05, "Pretrain/Loss": 2.0783419609069824, "Pretrain/Loss (Raw)": 2.1176810264587402, "Pretrain/Step": 3233, "Pretrain/Step Time": 8.422517331317067} +{"Pretrain/Learning Rate": 4.748910826750557e-05, "Pretrain/Loss": 2.0774948596954346, "Pretrain/Loss (Raw)": 2.0251870155334473, "Pretrain/Step": 3234, "Pretrain/Step Time": 8.418616184964776} +{"Pretrain/Learning Rate": 4.748725370446108e-05, "Pretrain/Loss": 2.076565742492676, "Pretrain/Loss (Raw)": 2.0470924377441406, "Pretrain/Step": 3235, "Pretrain/Step Time": 8.422048099339008} +{"Pretrain/Learning Rate": 4.7485398493012477e-05, "Pretrain/Loss": 2.07832932472229, "Pretrain/Loss (Raw)": 2.187803268432617, "Pretrain/Step": 3236, "Pretrain/Step Time": 8.417968327179551} +{"Pretrain/Learning Rate": 4.7483542633213265e-05, "Pretrain/Loss": 2.0794639587402344, "Pretrain/Loss (Raw)": 2.146070957183838, "Pretrain/Step": 3237, "Pretrain/Step Time": 8.417246671393514} +{"Pretrain/Learning Rate": 4.7481686125116956e-05, "Pretrain/Loss": 2.0778777599334717, "Pretrain/Loss (Raw)": 1.973595142364502, "Pretrain/Step": 3238, "Pretrain/Step Time": 8.416930204257369} +{"Pretrain/Learning Rate": 4.747982896877707e-05, "Pretrain/Loss": 2.0778791904449463, "Pretrain/Loss (Raw)": 2.1222164630889893, "Pretrain/Step": 3239, "Pretrain/Step Time": 8.414528463035822} +{"Pretrain/Learning Rate": 4.747797116424716e-05, "Pretrain/Loss": 2.0789637565612793, "Pretrain/Loss (Raw)": 2.0586655139923096, "Pretrain/Step": 3240, "Pretrain/Step Time": 8.418142043054104} +{"Pretrain/Learning Rate": 4.74761127115808e-05, "Pretrain/Loss": 2.0811502933502197, "Pretrain/Loss (Raw)": 2.115192174911499, "Pretrain/Step": 3241, "Pretrain/Step Time": 8.414343426004052} +{"Pretrain/Learning Rate": 4.747425361083158e-05, "Pretrain/Loss": 2.08400559425354, "Pretrain/Loss (Raw)": 2.2632334232330322, "Pretrain/Step": 3242, "Pretrain/Step Time": 8.41736463084817} +{"Pretrain/Learning Rate": 4.74723938620531e-05, "Pretrain/Loss": 2.087186813354492, "Pretrain/Loss (Raw)": 2.122506856918335, "Pretrain/Step": 3243, "Pretrain/Step Time": 8.418761676177382} +{"Pretrain/Learning Rate": 4.7470533465298985e-05, "Pretrain/Loss": 2.0909783840179443, "Pretrain/Loss (Raw)": 2.2099783420562744, "Pretrain/Step": 3244, "Pretrain/Step Time": 8.412462232634425} +{"Pretrain/Learning Rate": 4.746867242062287e-05, "Pretrain/Loss": 2.090876340866089, "Pretrain/Loss (Raw)": 2.0680930614471436, "Pretrain/Step": 3245, "Pretrain/Step Time": 8.41295268945396} +{"Pretrain/Learning Rate": 4.746681072807843e-05, "Pretrain/Loss": 2.089693546295166, "Pretrain/Loss (Raw)": 1.8915908336639404, "Pretrain/Step": 3246, "Pretrain/Step Time": 8.420519638806581} +{"Pretrain/Learning Rate": 4.746494838771934e-05, "Pretrain/Loss": 2.0882034301757812, "Pretrain/Loss (Raw)": 1.866988182067871, "Pretrain/Step": 3247, "Pretrain/Step Time": 8.423106651753187} +{"Pretrain/Learning Rate": 4.746308539959931e-05, "Pretrain/Loss": 2.085401773452759, "Pretrain/Loss (Raw)": 1.9312899112701416, "Pretrain/Step": 3248, "Pretrain/Step Time": 8.423945810645819} +{"Pretrain/Learning Rate": 4.746122176377204e-05, "Pretrain/Loss": 2.085841178894043, "Pretrain/Loss (Raw)": 2.2585859298706055, "Pretrain/Step": 3249, "Pretrain/Step Time": 8.422972820699215} +{"Pretrain/Learning Rate": 4.7459357480291267e-05, "Pretrain/Loss": 2.0871028900146484, "Pretrain/Loss (Raw)": 2.266357421875, "Pretrain/Step": 3250, "Pretrain/Step Time": 8.425775902345777} +{"Pretrain/Learning Rate": 4.745749254921076e-05, "Pretrain/Loss": 2.0861282348632812, "Pretrain/Loss (Raw)": 2.040386438369751, "Pretrain/Step": 3251, "Pretrain/Step Time": 8.421320339664817} +{"Pretrain/Learning Rate": 4.745562697058429e-05, "Pretrain/Loss": 2.08693265914917, "Pretrain/Loss (Raw)": 2.0153963565826416, "Pretrain/Step": 3252, "Pretrain/Step Time": 8.421840818598866} +{"Pretrain/Learning Rate": 4.745376074446563e-05, "Pretrain/Loss": 2.0871646404266357, "Pretrain/Loss (Raw)": 2.101639986038208, "Pretrain/Step": 3253, "Pretrain/Step Time": 8.423526840284467} +{"Pretrain/Learning Rate": 4.745189387090863e-05, "Pretrain/Loss": 2.087097406387329, "Pretrain/Loss (Raw)": 2.0177223682403564, "Pretrain/Step": 3254, "Pretrain/Step Time": 8.420182283967733} +{"Pretrain/Learning Rate": 4.745002634996709e-05, "Pretrain/Loss": 2.0866360664367676, "Pretrain/Loss (Raw)": 2.0107662677764893, "Pretrain/Step": 3255, "Pretrain/Step Time": 8.42450887337327} +{"Pretrain/Learning Rate": 4.744815818169487e-05, "Pretrain/Loss": 2.088090658187866, "Pretrain/Loss (Raw)": 2.0646755695343018, "Pretrain/Step": 3256, "Pretrain/Step Time": 8.423310754820704} +{"Pretrain/Learning Rate": 4.7446289366145824e-05, "Pretrain/Loss": 2.0890791416168213, "Pretrain/Loss (Raw)": 2.0678298473358154, "Pretrain/Step": 3257, "Pretrain/Step Time": 8.427706278860569} +{"Pretrain/Learning Rate": 4.744441990337385e-05, "Pretrain/Loss": 2.0873749256134033, "Pretrain/Loss (Raw)": 2.3059568405151367, "Pretrain/Step": 3258, "Pretrain/Step Time": 8.425201583653688} +{"Pretrain/Learning Rate": 4.744254979343286e-05, "Pretrain/Loss": 2.0868914127349854, "Pretrain/Loss (Raw)": 1.9804123640060425, "Pretrain/Step": 3259, "Pretrain/Step Time": 8.426487805321813} +{"Pretrain/Learning Rate": 4.7440679036376755e-05, "Pretrain/Loss": 2.08590030670166, "Pretrain/Loss (Raw)": 2.0567643642425537, "Pretrain/Step": 3260, "Pretrain/Step Time": 8.429330799728632} +{"Pretrain/Learning Rate": 4.74388076322595e-05, "Pretrain/Loss": 2.0883851051330566, "Pretrain/Loss (Raw)": 2.120952606201172, "Pretrain/Step": 3261, "Pretrain/Step Time": 8.429139863699675} +{"Pretrain/Learning Rate": 4.7436935581135037e-05, "Pretrain/Loss": 2.090707778930664, "Pretrain/Loss (Raw)": 2.3719377517700195, "Pretrain/Step": 3262, "Pretrain/Step Time": 8.431468287482858} +{"Pretrain/Learning Rate": 4.743506288305736e-05, "Pretrain/Loss": 2.090315341949463, "Pretrain/Loss (Raw)": 2.13663387298584, "Pretrain/Step": 3263, "Pretrain/Step Time": 8.428577626124024} +{"Pretrain/Learning Rate": 4.743318953808046e-05, "Pretrain/Loss": 2.090392589569092, "Pretrain/Loss (Raw)": 2.0773653984069824, "Pretrain/Step": 3264, "Pretrain/Step Time": 8.42617809586227} +{"Pretrain/Learning Rate": 4.7431315546258346e-05, "Pretrain/Loss": 2.089878797531128, "Pretrain/Loss (Raw)": 2.086482286453247, "Pretrain/Step": 3265, "Pretrain/Step Time": 8.425563568249345} +{"Pretrain/Learning Rate": 4.742944090764507e-05, "Pretrain/Loss": 2.0904693603515625, "Pretrain/Loss (Raw)": 2.178834915161133, "Pretrain/Step": 3266, "Pretrain/Step Time": 8.424013426527381} +{"Pretrain/Learning Rate": 4.742756562229468e-05, "Pretrain/Loss": 2.090301275253296, "Pretrain/Loss (Raw)": 2.096444606781006, "Pretrain/Step": 3267, "Pretrain/Step Time": 8.424093725159764} +{"Pretrain/Learning Rate": 4.7425689690261235e-05, "Pretrain/Loss": 2.0932512283325195, "Pretrain/Loss (Raw)": 2.0499205589294434, "Pretrain/Step": 3268, "Pretrain/Step Time": 8.424013182520866} +{"Pretrain/Learning Rate": 4.742381311159885e-05, "Pretrain/Loss": 2.0954792499542236, "Pretrain/Loss (Raw)": 2.1509687900543213, "Pretrain/Step": 3269, "Pretrain/Step Time": 8.421402735635638} +{"Pretrain/Learning Rate": 4.7421935886361605e-05, "Pretrain/Loss": 2.0969653129577637, "Pretrain/Loss (Raw)": 2.1173195838928223, "Pretrain/Step": 3270, "Pretrain/Step Time": 8.424128327518702} +{"Pretrain/Learning Rate": 4.742005801460365e-05, "Pretrain/Loss": 2.097360610961914, "Pretrain/Loss (Raw)": 2.1262547969818115, "Pretrain/Step": 3271, "Pretrain/Step Time": 8.420564057305455} +{"Pretrain/Learning Rate": 4.741817949637913e-05, "Pretrain/Loss": 2.0976061820983887, "Pretrain/Loss (Raw)": 2.1293933391571045, "Pretrain/Step": 3272, "Pretrain/Step Time": 8.418133769184351} +{"Pretrain/Learning Rate": 4.741630033174221e-05, "Pretrain/Loss": 2.097381830215454, "Pretrain/Loss (Raw)": 1.8818968534469604, "Pretrain/Step": 3273, "Pretrain/Step Time": 8.417116232216358} +{"Pretrain/Learning Rate": 4.741442052074708e-05, "Pretrain/Loss": 2.0969693660736084, "Pretrain/Loss (Raw)": 1.9935503005981445, "Pretrain/Step": 3274, "Pretrain/Step Time": 8.41803539171815} +{"Pretrain/Learning Rate": 4.741254006344793e-05, "Pretrain/Loss": 2.0966758728027344, "Pretrain/Loss (Raw)": 2.0249037742614746, "Pretrain/Step": 3275, "Pretrain/Step Time": 8.4123689327389} +{"Pretrain/Learning Rate": 4.741065895989898e-05, "Pretrain/Loss": 2.095529079437256, "Pretrain/Loss (Raw)": 2.012071132659912, "Pretrain/Step": 3276, "Pretrain/Step Time": 8.41545706987381} +{"Pretrain/Learning Rate": 4.7408777210154474e-05, "Pretrain/Loss": 2.0961966514587402, "Pretrain/Loss (Raw)": 2.1101601123809814, "Pretrain/Step": 3277, "Pretrain/Step Time": 8.421975087374449} +{"Pretrain/Learning Rate": 4.740689481426869e-05, "Pretrain/Loss": 2.095237970352173, "Pretrain/Loss (Raw)": 1.8315485715866089, "Pretrain/Step": 3278, "Pretrain/Step Time": 8.42189073562622} +{"Pretrain/Learning Rate": 4.7405011772295884e-05, "Pretrain/Loss": 2.0919651985168457, "Pretrain/Loss (Raw)": 1.790732502937317, "Pretrain/Step": 3279, "Pretrain/Step Time": 8.42461558431387} +{"Pretrain/Learning Rate": 4.7403128084290346e-05, "Pretrain/Loss": 2.0938901901245117, "Pretrain/Loss (Raw)": 2.341346025466919, "Pretrain/Step": 3280, "Pretrain/Step Time": 8.421531988307834} +{"Pretrain/Learning Rate": 4.740124375030641e-05, "Pretrain/Loss": 2.092625379562378, "Pretrain/Loss (Raw)": 1.9564868211746216, "Pretrain/Step": 3281, "Pretrain/Step Time": 8.422135839238763} +{"Pretrain/Learning Rate": 4.739935877039841e-05, "Pretrain/Loss": 2.093438148498535, "Pretrain/Loss (Raw)": 2.0909171104431152, "Pretrain/Step": 3282, "Pretrain/Step Time": 8.420094206929207} +{"Pretrain/Learning Rate": 4.7397473144620685e-05, "Pretrain/Loss": 2.0945374965667725, "Pretrain/Loss (Raw)": 2.199002742767334, "Pretrain/Step": 3283, "Pretrain/Step Time": 8.424008090049028} +{"Pretrain/Learning Rate": 4.739558687302761e-05, "Pretrain/Loss": 2.092740297317505, "Pretrain/Loss (Raw)": 1.9510611295700073, "Pretrain/Step": 3284, "Pretrain/Step Time": 8.424708550795913} +{"Pretrain/Learning Rate": 4.739369995567357e-05, "Pretrain/Loss": 2.0894827842712402, "Pretrain/Loss (Raw)": 1.7639130353927612, "Pretrain/Step": 3285, "Pretrain/Step Time": 8.424886580556631} +{"Pretrain/Learning Rate": 4.739181239261299e-05, "Pretrain/Loss": 2.0890374183654785, "Pretrain/Loss (Raw)": 2.1539852619171143, "Pretrain/Step": 3286, "Pretrain/Step Time": 8.420700639486313} +{"Pretrain/Learning Rate": 4.738992418390028e-05, "Pretrain/Loss": 2.0884437561035156, "Pretrain/Loss (Raw)": 2.0744705200195312, "Pretrain/Step": 3287, "Pretrain/Step Time": 8.426949514076114} +{"Pretrain/Learning Rate": 4.7388035329589895e-05, "Pretrain/Loss": 2.088534355163574, "Pretrain/Loss (Raw)": 2.0672061443328857, "Pretrain/Step": 3288, "Pretrain/Step Time": 8.428899431601167} +{"Pretrain/Learning Rate": 4.7386145829736284e-05, "Pretrain/Loss": 2.08618426322937, "Pretrain/Loss (Raw)": 1.8979780673980713, "Pretrain/Step": 3289, "Pretrain/Step Time": 8.430995410308242} +{"Pretrain/Learning Rate": 4.7384255684393944e-05, "Pretrain/Loss": 2.08575439453125, "Pretrain/Loss (Raw)": 2.137068271636963, "Pretrain/Step": 3290, "Pretrain/Step Time": 8.431700309738517} +{"Pretrain/Learning Rate": 4.738236489361737e-05, "Pretrain/Loss": 2.0885491371154785, "Pretrain/Loss (Raw)": 2.3361799716949463, "Pretrain/Step": 3291, "Pretrain/Step Time": 8.42845182493329} +{"Pretrain/Learning Rate": 4.7380473457461086e-05, "Pretrain/Loss": 2.0909435749053955, "Pretrain/Loss (Raw)": 2.060914993286133, "Pretrain/Step": 3292, "Pretrain/Step Time": 8.42657987587154} +{"Pretrain/Learning Rate": 4.7378581375979625e-05, "Pretrain/Loss": 2.089529037475586, "Pretrain/Loss (Raw)": 2.057593584060669, "Pretrain/Step": 3293, "Pretrain/Step Time": 8.429915565997362} +{"Pretrain/Learning Rate": 4.737668864922754e-05, "Pretrain/Loss": 2.091176986694336, "Pretrain/Loss (Raw)": 2.137601613998413, "Pretrain/Step": 3294, "Pretrain/Step Time": 8.42829298041761} +{"Pretrain/Learning Rate": 4.737479527725942e-05, "Pretrain/Loss": 2.091846227645874, "Pretrain/Loss (Raw)": 2.196586847305298, "Pretrain/Step": 3295, "Pretrain/Step Time": 8.427826594561338} +{"Pretrain/Learning Rate": 4.7372901260129854e-05, "Pretrain/Loss": 2.090496063232422, "Pretrain/Loss (Raw)": 1.959457516670227, "Pretrain/Step": 3296, "Pretrain/Step Time": 8.429304407909513} +{"Pretrain/Learning Rate": 4.737100659789344e-05, "Pretrain/Loss": 2.0931568145751953, "Pretrain/Loss (Raw)": 2.4392144680023193, "Pretrain/Step": 3297, "Pretrain/Step Time": 8.429538099095225} +{"Pretrain/Learning Rate": 4.736911129060483e-05, "Pretrain/Loss": 2.0918989181518555, "Pretrain/Loss (Raw)": 2.103839159011841, "Pretrain/Step": 3298, "Pretrain/Step Time": 8.429574023932219} +{"Pretrain/Learning Rate": 4.7367215338318665e-05, "Pretrain/Loss": 2.0911054611206055, "Pretrain/Loss (Raw)": 2.1707851886749268, "Pretrain/Step": 3299, "Pretrain/Step Time": 8.432421965524554} +{"Pretrain/Learning Rate": 4.736531874108962e-05, "Pretrain/Loss": 2.091836452484131, "Pretrain/Loss (Raw)": 2.1142427921295166, "Pretrain/Step": 3300, "Pretrain/Step Time": 8.431646520271897} +{"Pretrain/Learning Rate": 4.736342149897236e-05, "Pretrain/Loss": 2.092836380004883, "Pretrain/Loss (Raw)": 2.1767492294311523, "Pretrain/Step": 3301, "Pretrain/Step Time": 8.429139306768775} +{"Pretrain/Learning Rate": 4.7361523612021616e-05, "Pretrain/Loss": 2.092998504638672, "Pretrain/Loss (Raw)": 2.1848466396331787, "Pretrain/Step": 3302, "Pretrain/Step Time": 8.428154854103923} +{"Pretrain/Learning Rate": 4.7359625080292104e-05, "Pretrain/Loss": 2.091811180114746, "Pretrain/Loss (Raw)": 2.033937454223633, "Pretrain/Step": 3303, "Pretrain/Step Time": 8.422841973602772} +{"Pretrain/Learning Rate": 4.735772590383856e-05, "Pretrain/Loss": 2.0907351970672607, "Pretrain/Loss (Raw)": 1.7712838649749756, "Pretrain/Step": 3304, "Pretrain/Step Time": 8.424895457923412} +{"Pretrain/Learning Rate": 4.735582608271575e-05, "Pretrain/Loss": 2.0903468132019043, "Pretrain/Loss (Raw)": 2.030400276184082, "Pretrain/Step": 3305, "Pretrain/Step Time": 8.428366355597973} +{"Pretrain/Learning Rate": 4.7353925616978456e-05, "Pretrain/Loss": 2.0905537605285645, "Pretrain/Loss (Raw)": 2.2500691413879395, "Pretrain/Step": 3306, "Pretrain/Step Time": 8.429531568661332} +{"Pretrain/Learning Rate": 4.735202450668148e-05, "Pretrain/Loss": 2.091001510620117, "Pretrain/Loss (Raw)": 1.9863160848617554, "Pretrain/Step": 3307, "Pretrain/Step Time": 8.42964468151331} +{"Pretrain/Learning Rate": 4.735012275187963e-05, "Pretrain/Loss": 2.0898547172546387, "Pretrain/Loss (Raw)": 1.9516199827194214, "Pretrain/Step": 3308, "Pretrain/Step Time": 8.42906623519957} +{"Pretrain/Learning Rate": 4.734822035262775e-05, "Pretrain/Loss": 2.0925722122192383, "Pretrain/Loss (Raw)": 2.3377861976623535, "Pretrain/Step": 3309, "Pretrain/Step Time": 8.430159006267786} +{"Pretrain/Learning Rate": 4.734631730898068e-05, "Pretrain/Loss": 2.091714859008789, "Pretrain/Loss (Raw)": 2.000983715057373, "Pretrain/Step": 3310, "Pretrain/Step Time": 8.427066143602133} +{"Pretrain/Learning Rate": 4.734441362099331e-05, "Pretrain/Loss": 2.0925989151000977, "Pretrain/Loss (Raw)": 2.396206855773926, "Pretrain/Step": 3311, "Pretrain/Step Time": 8.426198095083237} +{"Pretrain/Learning Rate": 4.734250928872053e-05, "Pretrain/Loss": 2.091435432434082, "Pretrain/Loss (Raw)": 1.9319735765457153, "Pretrain/Step": 3312, "Pretrain/Step Time": 8.42481416463852} +{"Pretrain/Learning Rate": 4.734060431221724e-05, "Pretrain/Loss": 2.0903053283691406, "Pretrain/Loss (Raw)": 1.9832266569137573, "Pretrain/Step": 3313, "Pretrain/Step Time": 8.427895596250892} +{"Pretrain/Learning Rate": 4.7338698691538375e-05, "Pretrain/Loss": 2.091660499572754, "Pretrain/Loss (Raw)": 2.017530918121338, "Pretrain/Step": 3314, "Pretrain/Step Time": 8.42886509373784} +{"Pretrain/Learning Rate": 4.733679242673889e-05, "Pretrain/Loss": 2.088925361633301, "Pretrain/Loss (Raw)": 1.9053421020507812, "Pretrain/Step": 3315, "Pretrain/Step Time": 8.42819525115192} +{"Pretrain/Learning Rate": 4.733488551787373e-05, "Pretrain/Loss": 2.086348056793213, "Pretrain/Loss (Raw)": 1.838797688484192, "Pretrain/Step": 3316, "Pretrain/Step Time": 8.433808043599129} +{"Pretrain/Learning Rate": 4.733297796499789e-05, "Pretrain/Loss": 2.0833444595336914, "Pretrain/Loss (Raw)": 1.8948205709457397, "Pretrain/Step": 3317, "Pretrain/Step Time": 8.4320650100708} +{"Pretrain/Learning Rate": 4.733106976816638e-05, "Pretrain/Loss": 2.0849852561950684, "Pretrain/Loss (Raw)": 2.3308122158050537, "Pretrain/Step": 3318, "Pretrain/Step Time": 8.428788542747498} +{"Pretrain/Learning Rate": 4.7329160927434214e-05, "Pretrain/Loss": 2.0874452590942383, "Pretrain/Loss (Raw)": 2.1847853660583496, "Pretrain/Step": 3319, "Pretrain/Step Time": 8.424719475209713} +{"Pretrain/Learning Rate": 4.7327251442856434e-05, "Pretrain/Loss": 2.0898563861846924, "Pretrain/Loss (Raw)": 2.2473390102386475, "Pretrain/Step": 3320, "Pretrain/Step Time": 8.423903247341514} +{"Pretrain/Learning Rate": 4.73253413144881e-05, "Pretrain/Loss": 2.0899531841278076, "Pretrain/Loss (Raw)": 2.1220643520355225, "Pretrain/Step": 3321, "Pretrain/Step Time": 8.427533956244588} +{"Pretrain/Learning Rate": 4.7323430542384284e-05, "Pretrain/Loss": 2.0892505645751953, "Pretrain/Loss (Raw)": 1.954443335533142, "Pretrain/Step": 3322, "Pretrain/Step Time": 8.426862025633454} +{"Pretrain/Learning Rate": 4.732151912660009e-05, "Pretrain/Loss": 2.0888736248016357, "Pretrain/Loss (Raw)": 1.9969946146011353, "Pretrain/Step": 3323, "Pretrain/Step Time": 8.427089482545853} +{"Pretrain/Learning Rate": 4.731960706719062e-05, "Pretrain/Loss": 2.0876898765563965, "Pretrain/Loss (Raw)": 1.987999677658081, "Pretrain/Step": 3324, "Pretrain/Step Time": 8.429265666753054} +{"Pretrain/Learning Rate": 4.731769436421102e-05, "Pretrain/Loss": 2.087613105773926, "Pretrain/Loss (Raw)": 2.1017487049102783, "Pretrain/Step": 3325, "Pretrain/Step Time": 8.426598912104964} +{"Pretrain/Learning Rate": 4.731578101771643e-05, "Pretrain/Loss": 2.0886290073394775, "Pretrain/Loss (Raw)": 2.281740427017212, "Pretrain/Step": 3326, "Pretrain/Step Time": 8.427305212244391} +{"Pretrain/Learning Rate": 4.731386702776204e-05, "Pretrain/Loss": 2.089832305908203, "Pretrain/Loss (Raw)": 2.003971815109253, "Pretrain/Step": 3327, "Pretrain/Step Time": 8.421817738562822} +{"Pretrain/Learning Rate": 4.731195239440301e-05, "Pretrain/Loss": 2.090413808822632, "Pretrain/Loss (Raw)": 2.148483991622925, "Pretrain/Step": 3328, "Pretrain/Step Time": 8.426973601803184} +{"Pretrain/Learning Rate": 4.7310037117694565e-05, "Pretrain/Loss": 2.0886144638061523, "Pretrain/Loss (Raw)": 2.1013829708099365, "Pretrain/Step": 3329, "Pretrain/Step Time": 8.430735541507602} +{"Pretrain/Learning Rate": 4.730812119769193e-05, "Pretrain/Loss": 2.089268684387207, "Pretrain/Loss (Raw)": 2.1068854331970215, "Pretrain/Step": 3330, "Pretrain/Step Time": 8.43176600523293} +{"Pretrain/Learning Rate": 4.7306204634450346e-05, "Pretrain/Loss": 2.0827531814575195, "Pretrain/Loss (Raw)": 1.8282452821731567, "Pretrain/Step": 3331, "Pretrain/Step Time": 8.43232150003314} +{"Pretrain/Learning Rate": 4.730428742802507e-05, "Pretrain/Loss": 2.0828583240509033, "Pretrain/Loss (Raw)": 2.194190740585327, "Pretrain/Step": 3332, "Pretrain/Step Time": 8.433566616848111} +{"Pretrain/Learning Rate": 4.73023695784714e-05, "Pretrain/Loss": 2.081751823425293, "Pretrain/Loss (Raw)": 2.0473849773406982, "Pretrain/Step": 3333, "Pretrain/Step Time": 8.43346451036632} +{"Pretrain/Learning Rate": 4.730045108584462e-05, "Pretrain/Loss": 2.0840201377868652, "Pretrain/Loss (Raw)": 2.1220450401306152, "Pretrain/Step": 3334, "Pretrain/Step Time": 8.433072885498405} +{"Pretrain/Learning Rate": 4.7298531950200055e-05, "Pretrain/Loss": 2.0841426849365234, "Pretrain/Loss (Raw)": 2.174922466278076, "Pretrain/Step": 3335, "Pretrain/Step Time": 8.42494279704988} +{"Pretrain/Learning Rate": 4.729661217159304e-05, "Pretrain/Loss": 2.082070827484131, "Pretrain/Loss (Raw)": 1.7014652490615845, "Pretrain/Step": 3336, "Pretrain/Step Time": 8.421155484393239} +{"Pretrain/Learning Rate": 4.7294691750078935e-05, "Pretrain/Loss": 2.084090232849121, "Pretrain/Loss (Raw)": 2.1691925525665283, "Pretrain/Step": 3337, "Pretrain/Step Time": 8.419582765549421} +{"Pretrain/Learning Rate": 4.7292770685713104e-05, "Pretrain/Loss": 2.0811567306518555, "Pretrain/Loss (Raw)": 1.9067994356155396, "Pretrain/Step": 3338, "Pretrain/Step Time": 8.424655811861157} +{"Pretrain/Learning Rate": 4.729084897855095e-05, "Pretrain/Loss": 2.081594705581665, "Pretrain/Loss (Raw)": 2.142853260040283, "Pretrain/Step": 3339, "Pretrain/Step Time": 8.42344917729497} +{"Pretrain/Learning Rate": 4.7288926628647875e-05, "Pretrain/Loss": 2.0805530548095703, "Pretrain/Loss (Raw)": 2.046888828277588, "Pretrain/Step": 3340, "Pretrain/Step Time": 8.42599369585514} +{"Pretrain/Learning Rate": 4.728700363605931e-05, "Pretrain/Loss": 2.079517364501953, "Pretrain/Loss (Raw)": 2.0184972286224365, "Pretrain/Step": 3341, "Pretrain/Step Time": 8.42515759728849} +{"Pretrain/Learning Rate": 4.728508000084072e-05, "Pretrain/Loss": 2.0797619819641113, "Pretrain/Loss (Raw)": 2.079285144805908, "Pretrain/Step": 3342, "Pretrain/Step Time": 8.422893831506371} +{"Pretrain/Learning Rate": 4.728315572304754e-05, "Pretrain/Loss": 2.081148147583008, "Pretrain/Loss (Raw)": 2.141313076019287, "Pretrain/Step": 3343, "Pretrain/Step Time": 8.421099646016955} +{"Pretrain/Learning Rate": 4.7281230802735285e-05, "Pretrain/Loss": 2.080855369567871, "Pretrain/Loss (Raw)": 2.1425909996032715, "Pretrain/Step": 3344, "Pretrain/Step Time": 8.426866345107555} +{"Pretrain/Learning Rate": 4.7279305239959454e-05, "Pretrain/Loss": 2.0793631076812744, "Pretrain/Loss (Raw)": 2.150310516357422, "Pretrain/Step": 3345, "Pretrain/Step Time": 8.429403726011515} +{"Pretrain/Learning Rate": 4.727737903477555e-05, "Pretrain/Loss": 2.079123020172119, "Pretrain/Loss (Raw)": 2.0904276371002197, "Pretrain/Step": 3346, "Pretrain/Step Time": 8.425227919593453} +{"Pretrain/Learning Rate": 4.7275452187239134e-05, "Pretrain/Loss": 2.076986789703369, "Pretrain/Loss (Raw)": 1.8170815706253052, "Pretrain/Step": 3347, "Pretrain/Step Time": 8.428328733891249} +{"Pretrain/Learning Rate": 4.727352469740575e-05, "Pretrain/Loss": 2.0765786170959473, "Pretrain/Loss (Raw)": 2.0345373153686523, "Pretrain/Step": 3348, "Pretrain/Step Time": 8.430707341060042} +{"Pretrain/Learning Rate": 4.727159656533099e-05, "Pretrain/Loss": 2.072364330291748, "Pretrain/Loss (Raw)": 2.115586519241333, "Pretrain/Step": 3349, "Pretrain/Step Time": 8.428613876923919} +{"Pretrain/Learning Rate": 4.726966779107044e-05, "Pretrain/Loss": 2.073014259338379, "Pretrain/Loss (Raw)": 2.2598791122436523, "Pretrain/Step": 3350, "Pretrain/Step Time": 8.429681846871972} +{"Pretrain/Learning Rate": 4.726773837467972e-05, "Pretrain/Loss": 2.071920394897461, "Pretrain/Loss (Raw)": 2.0444254875183105, "Pretrain/Step": 3351, "Pretrain/Step Time": 8.429482901468873} +{"Pretrain/Learning Rate": 4.7265808316214454e-05, "Pretrain/Loss": 2.070816993713379, "Pretrain/Loss (Raw)": 1.9961020946502686, "Pretrain/Step": 3352, "Pretrain/Step Time": 8.430815229192376} +{"Pretrain/Learning Rate": 4.726387761573031e-05, "Pretrain/Loss": 2.071756362915039, "Pretrain/Loss (Raw)": 2.094627857208252, "Pretrain/Step": 3353, "Pretrain/Step Time": 8.432366456836462} +{"Pretrain/Learning Rate": 4.726194627328295e-05, "Pretrain/Loss": 2.0731992721557617, "Pretrain/Loss (Raw)": 2.13082218170166, "Pretrain/Step": 3354, "Pretrain/Step Time": 8.437496814876795} +{"Pretrain/Learning Rate": 4.726001428892806e-05, "Pretrain/Loss": 2.073160171508789, "Pretrain/Loss (Raw)": 2.05379056930542, "Pretrain/Step": 3355, "Pretrain/Step Time": 8.435706609860063} +{"Pretrain/Learning Rate": 4.725808166272135e-05, "Pretrain/Loss": 2.073042869567871, "Pretrain/Loss (Raw)": 1.9827302694320679, "Pretrain/Step": 3356, "Pretrain/Step Time": 8.436526421457529} +{"Pretrain/Learning Rate": 4.725614839471855e-05, "Pretrain/Loss": 2.0725972652435303, "Pretrain/Loss (Raw)": 2.0488779544830322, "Pretrain/Step": 3357, "Pretrain/Step Time": 8.430759366601706} +{"Pretrain/Learning Rate": 4.725421448497539e-05, "Pretrain/Loss": 2.0738556385040283, "Pretrain/Loss (Raw)": 2.2012298107147217, "Pretrain/Step": 3358, "Pretrain/Step Time": 8.430240921676159} +{"Pretrain/Learning Rate": 4.7252279933547657e-05, "Pretrain/Loss": 2.0760974884033203, "Pretrain/Loss (Raw)": 2.1970882415771484, "Pretrain/Step": 3359, "Pretrain/Step Time": 8.430648151785135} +{"Pretrain/Learning Rate": 4.7250344740491115e-05, "Pretrain/Loss": 2.0793745517730713, "Pretrain/Loss (Raw)": 2.135326623916626, "Pretrain/Step": 3360, "Pretrain/Step Time": 8.429071195423603} +{"Pretrain/Learning Rate": 4.724840890586156e-05, "Pretrain/Loss": 2.0793304443359375, "Pretrain/Loss (Raw)": 2.112032175064087, "Pretrain/Step": 3361, "Pretrain/Step Time": 8.43119335360825} +{"Pretrain/Learning Rate": 4.724647242971483e-05, "Pretrain/Loss": 2.079157829284668, "Pretrain/Loss (Raw)": 2.0030603408813477, "Pretrain/Step": 3362, "Pretrain/Step Time": 8.432955717667937} +{"Pretrain/Learning Rate": 4.724453531210674e-05, "Pretrain/Loss": 2.0814924240112305, "Pretrain/Loss (Raw)": 2.3459537029266357, "Pretrain/Step": 3363, "Pretrain/Step Time": 8.433406880125403} +{"Pretrain/Learning Rate": 4.724259755309316e-05, "Pretrain/Loss": 2.0811429023742676, "Pretrain/Loss (Raw)": 2.1430675983428955, "Pretrain/Step": 3364, "Pretrain/Step Time": 8.434143321588635} +{"Pretrain/Learning Rate": 4.724065915272996e-05, "Pretrain/Loss": 2.0792555809020996, "Pretrain/Loss (Raw)": 1.9044735431671143, "Pretrain/Step": 3365, "Pretrain/Step Time": 8.435731079429388} +{"Pretrain/Learning Rate": 4.723872011107303e-05, "Pretrain/Loss": 2.0809988975524902, "Pretrain/Loss (Raw)": 2.1967556476593018, "Pretrain/Step": 3366, "Pretrain/Step Time": 8.433152858167887} +{"Pretrain/Learning Rate": 4.7236780428178286e-05, "Pretrain/Loss": 2.0830135345458984, "Pretrain/Loss (Raw)": 2.380084753036499, "Pretrain/Step": 3367, "Pretrain/Step Time": 8.43603466451168} +{"Pretrain/Learning Rate": 4.723484010410165e-05, "Pretrain/Loss": 2.084472417831421, "Pretrain/Loss (Raw)": 2.2454018592834473, "Pretrain/Step": 3368, "Pretrain/Step Time": 8.43245772831142} +{"Pretrain/Learning Rate": 4.7232899138899075e-05, "Pretrain/Loss": 2.084932327270508, "Pretrain/Loss (Raw)": 2.17405366897583, "Pretrain/Step": 3369, "Pretrain/Step Time": 8.432420659810305} +{"Pretrain/Learning Rate": 4.723095753262653e-05, "Pretrain/Loss": 2.083827257156372, "Pretrain/Loss (Raw)": 2.121790885925293, "Pretrain/Step": 3370, "Pretrain/Step Time": 8.436006922274828} +{"Pretrain/Learning Rate": 4.7229015285339995e-05, "Pretrain/Loss": 2.0805108547210693, "Pretrain/Loss (Raw)": 1.6979966163635254, "Pretrain/Step": 3371, "Pretrain/Step Time": 8.434265047311783} +{"Pretrain/Learning Rate": 4.7227072397095474e-05, "Pretrain/Loss": 2.079899311065674, "Pretrain/Loss (Raw)": 2.1316933631896973, "Pretrain/Step": 3372, "Pretrain/Step Time": 8.43928837403655} +{"Pretrain/Learning Rate": 4.7225128867948996e-05, "Pretrain/Loss": 2.0789294242858887, "Pretrain/Loss (Raw)": 1.9439284801483154, "Pretrain/Step": 3373, "Pretrain/Step Time": 8.441384034231305} +{"Pretrain/Learning Rate": 4.722318469795659e-05, "Pretrain/Loss": 2.0813660621643066, "Pretrain/Loss (Raw)": 2.203518867492676, "Pretrain/Step": 3374, "Pretrain/Step Time": 8.435999361798167} +{"Pretrain/Learning Rate": 4.7221239887174314e-05, "Pretrain/Loss": 2.083609104156494, "Pretrain/Loss (Raw)": 2.154093027114868, "Pretrain/Step": 3375, "Pretrain/Step Time": 8.432918399572372} +{"Pretrain/Learning Rate": 4.721929443565826e-05, "Pretrain/Loss": 2.083639144897461, "Pretrain/Loss (Raw)": 1.9351495504379272, "Pretrain/Step": 3376, "Pretrain/Step Time": 8.436948029324412} +{"Pretrain/Learning Rate": 4.72173483434645e-05, "Pretrain/Loss": 2.0820302963256836, "Pretrain/Loss (Raw)": 2.0526175498962402, "Pretrain/Step": 3377, "Pretrain/Step Time": 8.436479426920414} +{"Pretrain/Learning Rate": 4.721540161064918e-05, "Pretrain/Loss": 2.078037738800049, "Pretrain/Loss (Raw)": 1.755318284034729, "Pretrain/Step": 3378, "Pretrain/Step Time": 8.435978580266237} +{"Pretrain/Learning Rate": 4.721345423726841e-05, "Pretrain/Loss": 2.079073905944824, "Pretrain/Loss (Raw)": 2.173015832901001, "Pretrain/Step": 3379, "Pretrain/Step Time": 8.440272681415081} +{"Pretrain/Learning Rate": 4.721150622337834e-05, "Pretrain/Loss": 2.0793519020080566, "Pretrain/Loss (Raw)": 2.0510051250457764, "Pretrain/Step": 3380, "Pretrain/Step Time": 8.43953938409686} +{"Pretrain/Learning Rate": 4.720955756903515e-05, "Pretrain/Loss": 2.079139232635498, "Pretrain/Loss (Raw)": 2.0744032859802246, "Pretrain/Step": 3381, "Pretrain/Step Time": 8.439849203452468} +{"Pretrain/Learning Rate": 4.7207608274295025e-05, "Pretrain/Loss": 2.080326557159424, "Pretrain/Loss (Raw)": 2.1697189807891846, "Pretrain/Step": 3382, "Pretrain/Step Time": 8.442524271085858} +{"Pretrain/Learning Rate": 4.7205658339214164e-05, "Pretrain/Loss": 2.0819642543792725, "Pretrain/Loss (Raw)": 2.2203681468963623, "Pretrain/Step": 3383, "Pretrain/Step Time": 8.437947856262326} +{"Pretrain/Learning Rate": 4.7203707763848805e-05, "Pretrain/Loss": 2.080486297607422, "Pretrain/Loss (Raw)": 1.8755152225494385, "Pretrain/Step": 3384, "Pretrain/Step Time": 8.436333741992712} +{"Pretrain/Learning Rate": 4.7201756548255186e-05, "Pretrain/Loss": 2.079643726348877, "Pretrain/Loss (Raw)": 1.9599510431289673, "Pretrain/Step": 3385, "Pretrain/Step Time": 8.430808505043387} +{"Pretrain/Learning Rate": 4.719980469248957e-05, "Pretrain/Loss": 2.0789928436279297, "Pretrain/Loss (Raw)": 2.222651958465576, "Pretrain/Step": 3386, "Pretrain/Step Time": 8.43737375177443} +{"Pretrain/Learning Rate": 4.7197852196608225e-05, "Pretrain/Loss": 2.080136299133301, "Pretrain/Loss (Raw)": 2.1267642974853516, "Pretrain/Step": 3387, "Pretrain/Step Time": 8.430984104052186} +{"Pretrain/Learning Rate": 4.719589906066747e-05, "Pretrain/Loss": 2.0789318084716797, "Pretrain/Loss (Raw)": 1.9025946855545044, "Pretrain/Step": 3388, "Pretrain/Step Time": 8.439020847901702} +{"Pretrain/Learning Rate": 4.719394528472362e-05, "Pretrain/Loss": 2.0775115489959717, "Pretrain/Loss (Raw)": 1.939154028892517, "Pretrain/Step": 3389, "Pretrain/Step Time": 8.437158962711692} +{"Pretrain/Learning Rate": 4.719199086883299e-05, "Pretrain/Loss": 2.0760111808776855, "Pretrain/Loss (Raw)": 2.179903030395508, "Pretrain/Step": 3390, "Pretrain/Step Time": 8.435055058449507} +{"Pretrain/Learning Rate": 4.719003581305195e-05, "Pretrain/Loss": 2.0747733116149902, "Pretrain/Loss (Raw)": 1.9781980514526367, "Pretrain/Step": 3391, "Pretrain/Step Time": 8.43501047231257} +{"Pretrain/Learning Rate": 4.718808011743687e-05, "Pretrain/Loss": 2.0749011039733887, "Pretrain/Loss (Raw)": 2.093689203262329, "Pretrain/Step": 3392, "Pretrain/Step Time": 8.436546605080366} +{"Pretrain/Learning Rate": 4.718612378204414e-05, "Pretrain/Loss": 2.074385643005371, "Pretrain/Loss (Raw)": 2.0205092430114746, "Pretrain/Step": 3393, "Pretrain/Step Time": 8.438452672213316} +{"Pretrain/Learning Rate": 4.718416680693018e-05, "Pretrain/Loss": 2.0733988285064697, "Pretrain/Loss (Raw)": 2.0525271892547607, "Pretrain/Step": 3394, "Pretrain/Step Time": 8.437462504953146} +{"Pretrain/Learning Rate": 4.7182209192151404e-05, "Pretrain/Loss": 2.0729331970214844, "Pretrain/Loss (Raw)": 2.0368735790252686, "Pretrain/Step": 3395, "Pretrain/Step Time": 8.44099435210228} +{"Pretrain/Learning Rate": 4.718025093776426e-05, "Pretrain/Loss": 2.073093891143799, "Pretrain/Loss (Raw)": 2.0704703330993652, "Pretrain/Step": 3396, "Pretrain/Step Time": 8.43919487670064} +{"Pretrain/Learning Rate": 4.717829204382522e-05, "Pretrain/Loss": 2.071624279022217, "Pretrain/Loss (Raw)": 1.9628552198410034, "Pretrain/Step": 3397, "Pretrain/Step Time": 8.44044241309166} +{"Pretrain/Learning Rate": 4.7176332510390766e-05, "Pretrain/Loss": 2.0700178146362305, "Pretrain/Loss (Raw)": 1.911688208580017, "Pretrain/Step": 3398, "Pretrain/Step Time": 8.44616361707449} +{"Pretrain/Learning Rate": 4.717437233751739e-05, "Pretrain/Loss": 2.0682873725891113, "Pretrain/Loss (Raw)": 1.9047716856002808, "Pretrain/Step": 3399, "Pretrain/Step Time": 8.44671344384551} +{"Pretrain/Learning Rate": 4.717241152526163e-05, "Pretrain/Loss": 2.069795608520508, "Pretrain/Loss (Raw)": 2.3224382400512695, "Pretrain/Step": 3400, "Pretrain/Step Time": 8.442175548523664} +{"Pretrain/Learning Rate": 4.717045007368e-05, "Pretrain/Loss": 2.0707337856292725, "Pretrain/Loss (Raw)": 2.0019991397857666, "Pretrain/Step": 3401, "Pretrain/Step Time": 8.43489894270897} +{"Pretrain/Learning Rate": 4.716848798282908e-05, "Pretrain/Loss": 2.070772647857666, "Pretrain/Loss (Raw)": 1.998508334159851, "Pretrain/Step": 3402, "Pretrain/Step Time": 8.443633116781712} +{"Pretrain/Learning Rate": 4.716652525276544e-05, "Pretrain/Loss": 2.0680136680603027, "Pretrain/Loss (Raw)": 1.6717661619186401, "Pretrain/Step": 3403, "Pretrain/Step Time": 8.44337534531951} +{"Pretrain/Learning Rate": 4.7164561883545663e-05, "Pretrain/Loss": 2.0685858726501465, "Pretrain/Loss (Raw)": 2.085317850112915, "Pretrain/Step": 3404, "Pretrain/Step Time": 8.441534986719489} +{"Pretrain/Learning Rate": 4.716259787522637e-05, "Pretrain/Loss": 2.0688934326171875, "Pretrain/Loss (Raw)": 2.149510145187378, "Pretrain/Step": 3405, "Pretrain/Step Time": 8.43981178291142} +{"Pretrain/Learning Rate": 4.716063322786419e-05, "Pretrain/Loss": 2.07159686088562, "Pretrain/Loss (Raw)": 2.177582263946533, "Pretrain/Step": 3406, "Pretrain/Step Time": 8.440596621483564} +{"Pretrain/Learning Rate": 4.715866794151578e-05, "Pretrain/Loss": 2.071890354156494, "Pretrain/Loss (Raw)": 1.8282976150512695, "Pretrain/Step": 3407, "Pretrain/Step Time": 8.44098879955709} +{"Pretrain/Learning Rate": 4.71567020162378e-05, "Pretrain/Loss": 2.0695183277130127, "Pretrain/Loss (Raw)": 2.037740707397461, "Pretrain/Step": 3408, "Pretrain/Step Time": 8.440647806972265} +{"Pretrain/Learning Rate": 4.7154735452086936e-05, "Pretrain/Loss": 2.070230722427368, "Pretrain/Loss (Raw)": 2.0476794242858887, "Pretrain/Step": 3409, "Pretrain/Step Time": 8.441052520647645} +{"Pretrain/Learning Rate": 4.715276824911989e-05, "Pretrain/Loss": 2.068779468536377, "Pretrain/Loss (Raw)": 1.9051342010498047, "Pretrain/Step": 3410, "Pretrain/Step Time": 8.442206628620625} +{"Pretrain/Learning Rate": 4.7150800407393394e-05, "Pretrain/Loss": 2.0662641525268555, "Pretrain/Loss (Raw)": 1.8770512342453003, "Pretrain/Step": 3411, "Pretrain/Step Time": 8.442524638026953} +{"Pretrain/Learning Rate": 4.714883192696418e-05, "Pretrain/Loss": 2.06762433052063, "Pretrain/Loss (Raw)": 2.125182867050171, "Pretrain/Step": 3412, "Pretrain/Step Time": 8.442392822355032} +{"Pretrain/Learning Rate": 4.7146862807889004e-05, "Pretrain/Loss": 2.069427967071533, "Pretrain/Loss (Raw)": 1.9947620630264282, "Pretrain/Step": 3413, "Pretrain/Step Time": 8.440009275451303} +{"Pretrain/Learning Rate": 4.714489305022466e-05, "Pretrain/Loss": 2.0676674842834473, "Pretrain/Loss (Raw)": 1.9286351203918457, "Pretrain/Step": 3414, "Pretrain/Step Time": 8.442983485758305} +{"Pretrain/Learning Rate": 4.714292265402793e-05, "Pretrain/Loss": 2.068162441253662, "Pretrain/Loss (Raw)": 2.1378657817840576, "Pretrain/Step": 3415, "Pretrain/Step Time": 8.436245800927281} +{"Pretrain/Learning Rate": 4.714095161935564e-05, "Pretrain/Loss": 2.068228244781494, "Pretrain/Loss (Raw)": 2.0756278038024902, "Pretrain/Step": 3416, "Pretrain/Step Time": 8.433143325150013} +{"Pretrain/Learning Rate": 4.713897994626462e-05, "Pretrain/Loss": 2.066272258758545, "Pretrain/Loss (Raw)": 1.647597074508667, "Pretrain/Step": 3417, "Pretrain/Step Time": 8.433515317738056} +{"Pretrain/Learning Rate": 4.7137007634811714e-05, "Pretrain/Loss": 2.0662732124328613, "Pretrain/Loss (Raw)": 2.1371641159057617, "Pretrain/Step": 3418, "Pretrain/Step Time": 8.431808289140463} +{"Pretrain/Learning Rate": 4.71350346850538e-05, "Pretrain/Loss": 2.0627150535583496, "Pretrain/Loss (Raw)": 1.8807713985443115, "Pretrain/Step": 3419, "Pretrain/Step Time": 8.436992151662707} +{"Pretrain/Learning Rate": 4.713306109704777e-05, "Pretrain/Loss": 2.0626864433288574, "Pretrain/Loss (Raw)": 2.0572428703308105, "Pretrain/Step": 3420, "Pretrain/Step Time": 8.434702906757593} +{"Pretrain/Learning Rate": 4.713108687085052e-05, "Pretrain/Loss": 2.064378023147583, "Pretrain/Loss (Raw)": 2.2740955352783203, "Pretrain/Step": 3421, "Pretrain/Step Time": 8.439623450860381} +{"Pretrain/Learning Rate": 4.7129112006518984e-05, "Pretrain/Loss": 2.063244104385376, "Pretrain/Loss (Raw)": 1.992457628250122, "Pretrain/Step": 3422, "Pretrain/Step Time": 8.440469313412905} +{"Pretrain/Learning Rate": 4.71271365041101e-05, "Pretrain/Loss": 2.0635714530944824, "Pretrain/Loss (Raw)": 2.238483428955078, "Pretrain/Step": 3423, "Pretrain/Step Time": 8.440576501190662} +{"Pretrain/Learning Rate": 4.7125160363680844e-05, "Pretrain/Loss": 2.0644967555999756, "Pretrain/Loss (Raw)": 2.077918291091919, "Pretrain/Step": 3424, "Pretrain/Step Time": 8.442693036049604} +{"Pretrain/Learning Rate": 4.7123183585288176e-05, "Pretrain/Loss": 2.059253692626953, "Pretrain/Loss (Raw)": 1.768085241317749, "Pretrain/Step": 3425, "Pretrain/Step Time": 8.442003617063165} +{"Pretrain/Learning Rate": 4.7121206168989106e-05, "Pretrain/Loss": 2.0592761039733887, "Pretrain/Loss (Raw)": 2.1066994667053223, "Pretrain/Step": 3426, "Pretrain/Step Time": 8.438719118013978} +{"Pretrain/Learning Rate": 4.711922811484066e-05, "Pretrain/Loss": 2.059009075164795, "Pretrain/Loss (Raw)": 2.136625051498413, "Pretrain/Step": 3427, "Pretrain/Step Time": 8.443752245977521} +{"Pretrain/Learning Rate": 4.711724942289986e-05, "Pretrain/Loss": 2.058361530303955, "Pretrain/Loss (Raw)": 2.0313491821289062, "Pretrain/Step": 3428, "Pretrain/Step Time": 8.442037681117654} +{"Pretrain/Learning Rate": 4.711527009322376e-05, "Pretrain/Loss": 2.0538716316223145, "Pretrain/Loss (Raw)": 1.602059006690979, "Pretrain/Step": 3429, "Pretrain/Step Time": 8.44377864152193} +{"Pretrain/Learning Rate": 4.7113290125869436e-05, "Pretrain/Loss": 2.0510897636413574, "Pretrain/Loss (Raw)": 1.8287770748138428, "Pretrain/Step": 3430, "Pretrain/Step Time": 8.443671856075525} +{"Pretrain/Learning Rate": 4.711130952089398e-05, "Pretrain/Loss": 2.0530359745025635, "Pretrain/Loss (Raw)": 2.283045530319214, "Pretrain/Step": 3431, "Pretrain/Step Time": 8.446255818009377} +{"Pretrain/Learning Rate": 4.7109328278354504e-05, "Pretrain/Loss": 2.055349349975586, "Pretrain/Loss (Raw)": 2.0674080848693848, "Pretrain/Step": 3432, "Pretrain/Step Time": 8.440940702334046} +{"Pretrain/Learning Rate": 4.710734639830814e-05, "Pretrain/Loss": 2.055210590362549, "Pretrain/Loss (Raw)": 2.012610912322998, "Pretrain/Step": 3433, "Pretrain/Step Time": 8.434492761269212} +{"Pretrain/Learning Rate": 4.7105363880812015e-05, "Pretrain/Loss": 2.0536396503448486, "Pretrain/Loss (Raw)": 2.0489871501922607, "Pretrain/Step": 3434, "Pretrain/Step Time": 8.433954888954759} +{"Pretrain/Learning Rate": 4.7103380725923315e-05, "Pretrain/Loss": 2.0539937019348145, "Pretrain/Loss (Raw)": 2.0316414833068848, "Pretrain/Step": 3435, "Pretrain/Step Time": 8.44075134024024} +{"Pretrain/Learning Rate": 4.71013969336992e-05, "Pretrain/Loss": 2.0551891326904297, "Pretrain/Loss (Raw)": 2.1046502590179443, "Pretrain/Step": 3436, "Pretrain/Step Time": 8.438453508540988} +{"Pretrain/Learning Rate": 4.70994125041969e-05, "Pretrain/Loss": 2.0527491569519043, "Pretrain/Loss (Raw)": 2.0254619121551514, "Pretrain/Step": 3437, "Pretrain/Step Time": 8.437253786250949} +{"Pretrain/Learning Rate": 4.709742743747362e-05, "Pretrain/Loss": 2.053457736968994, "Pretrain/Loss (Raw)": 2.0916640758514404, "Pretrain/Step": 3438, "Pretrain/Step Time": 8.441865466535091} +{"Pretrain/Learning Rate": 4.709544173358659e-05, "Pretrain/Loss": 2.0518531799316406, "Pretrain/Loss (Raw)": 2.1908152103424072, "Pretrain/Step": 3439, "Pretrain/Step Time": 8.440789632499218} +{"Pretrain/Learning Rate": 4.709345539259308e-05, "Pretrain/Loss": 2.0516586303710938, "Pretrain/Loss (Raw)": 1.9070961475372314, "Pretrain/Step": 3440, "Pretrain/Step Time": 8.447835724800825} +{"Pretrain/Learning Rate": 4.709146841455035e-05, "Pretrain/Loss": 2.0517046451568604, "Pretrain/Loss (Raw)": 1.9890882968902588, "Pretrain/Step": 3441, "Pretrain/Step Time": 8.444553177803755} +{"Pretrain/Learning Rate": 4.708948079951571e-05, "Pretrain/Loss": 2.0523266792297363, "Pretrain/Loss (Raw)": 2.0971617698669434, "Pretrain/Step": 3442, "Pretrain/Step Time": 8.441680613905191} +{"Pretrain/Learning Rate": 4.7087492547546455e-05, "Pretrain/Loss": 2.0540032386779785, "Pretrain/Loss (Raw)": 2.1199569702148438, "Pretrain/Step": 3443, "Pretrain/Step Time": 8.445556653663516} +{"Pretrain/Learning Rate": 4.7085503658699925e-05, "Pretrain/Loss": 2.057750701904297, "Pretrain/Loss (Raw)": 2.3184776306152344, "Pretrain/Step": 3444, "Pretrain/Step Time": 8.440811794251204} +{"Pretrain/Learning Rate": 4.708351413303347e-05, "Pretrain/Loss": 2.0590109825134277, "Pretrain/Loss (Raw)": 2.056126356124878, "Pretrain/Step": 3445, "Pretrain/Step Time": 8.443822521716356} +{"Pretrain/Learning Rate": 4.708152397060446e-05, "Pretrain/Loss": 2.0584964752197266, "Pretrain/Loss (Raw)": 2.264939308166504, "Pretrain/Step": 3446, "Pretrain/Step Time": 8.444120055064559} +{"Pretrain/Learning Rate": 4.707953317147026e-05, "Pretrain/Loss": 2.0575904846191406, "Pretrain/Loss (Raw)": 2.0688464641571045, "Pretrain/Step": 3447, "Pretrain/Step Time": 8.448290005326271} +{"Pretrain/Learning Rate": 4.707754173568829e-05, "Pretrain/Loss": 2.0549416542053223, "Pretrain/Loss (Raw)": 1.9082919359207153, "Pretrain/Step": 3448, "Pretrain/Step Time": 8.447831770405173} +{"Pretrain/Learning Rate": 4.707554966331597e-05, "Pretrain/Loss": 2.05424427986145, "Pretrain/Loss (Raw)": 2.0327858924865723, "Pretrain/Step": 3449, "Pretrain/Step Time": 8.43946073204279} +{"Pretrain/Learning Rate": 4.7073556954410734e-05, "Pretrain/Loss": 2.053341865539551, "Pretrain/Loss (Raw)": 1.8389538526535034, "Pretrain/Step": 3450, "Pretrain/Step Time": 8.439603917300701} +{"Pretrain/Learning Rate": 4.707156360903004e-05, "Pretrain/Loss": 2.0539422035217285, "Pretrain/Loss (Raw)": 2.0738072395324707, "Pretrain/Step": 3451, "Pretrain/Step Time": 8.440765691921115} +{"Pretrain/Learning Rate": 4.706956962723138e-05, "Pretrain/Loss": 2.0549745559692383, "Pretrain/Loss (Raw)": 2.120124340057373, "Pretrain/Step": 3452, "Pretrain/Step Time": 8.435064196586609} +{"Pretrain/Learning Rate": 4.7067575009072226e-05, "Pretrain/Loss": 2.0542986392974854, "Pretrain/Loss (Raw)": 2.0152742862701416, "Pretrain/Step": 3453, "Pretrain/Step Time": 8.440897637978196} +{"Pretrain/Learning Rate": 4.7065579754610114e-05, "Pretrain/Loss": 2.0531158447265625, "Pretrain/Loss (Raw)": 2.1303369998931885, "Pretrain/Step": 3454, "Pretrain/Step Time": 8.43701133877039} +{"Pretrain/Learning Rate": 4.706358386390256e-05, "Pretrain/Loss": 2.052642822265625, "Pretrain/Loss (Raw)": 1.9434142112731934, "Pretrain/Step": 3455, "Pretrain/Step Time": 8.438891248777509} +{"Pretrain/Learning Rate": 4.7061587337007116e-05, "Pretrain/Loss": 2.051492214202881, "Pretrain/Loss (Raw)": 2.001223564147949, "Pretrain/Step": 3456, "Pretrain/Step Time": 8.439607696607709} +{"Pretrain/Learning Rate": 4.705959017398136e-05, "Pretrain/Loss": 2.0522866249084473, "Pretrain/Loss (Raw)": 2.2030458450317383, "Pretrain/Step": 3457, "Pretrain/Step Time": 8.433970507234335} +{"Pretrain/Learning Rate": 4.705759237488288e-05, "Pretrain/Loss": 2.0525312423706055, "Pretrain/Loss (Raw)": 2.138216257095337, "Pretrain/Step": 3458, "Pretrain/Step Time": 8.43725960701704} +{"Pretrain/Learning Rate": 4.7055593939769257e-05, "Pretrain/Loss": 2.0539207458496094, "Pretrain/Loss (Raw)": 2.006085157394409, "Pretrain/Step": 3459, "Pretrain/Step Time": 8.436752535402775} +{"Pretrain/Learning Rate": 4.7053594868698136e-05, "Pretrain/Loss": 2.051760196685791, "Pretrain/Loss (Raw)": 1.9176158905029297, "Pretrain/Step": 3460, "Pretrain/Step Time": 8.436920205131173} +{"Pretrain/Learning Rate": 4.705159516172716e-05, "Pretrain/Loss": 2.0518994331359863, "Pretrain/Loss (Raw)": 2.0652577877044678, "Pretrain/Step": 3461, "Pretrain/Step Time": 8.438253065571189} +{"Pretrain/Learning Rate": 4.7049594818913975e-05, "Pretrain/Loss": 2.049886465072632, "Pretrain/Loss (Raw)": 1.8643547296524048, "Pretrain/Step": 3462, "Pretrain/Step Time": 8.438682520762086} +{"Pretrain/Learning Rate": 4.704759384031627e-05, "Pretrain/Loss": 2.0491080284118652, "Pretrain/Loss (Raw)": 2.0753087997436523, "Pretrain/Step": 3463, "Pretrain/Step Time": 8.44444240629673} +{"Pretrain/Learning Rate": 4.704559222599174e-05, "Pretrain/Loss": 2.0504705905914307, "Pretrain/Loss (Raw)": 1.8758699893951416, "Pretrain/Step": 3464, "Pretrain/Step Time": 8.445965828374028} +{"Pretrain/Learning Rate": 4.704358997599809e-05, "Pretrain/Loss": 2.048340082168579, "Pretrain/Loss (Raw)": 1.896479606628418, "Pretrain/Step": 3465, "Pretrain/Step Time": 8.449808280915022} +{"Pretrain/Learning Rate": 4.704158709039308e-05, "Pretrain/Loss": 2.048318386077881, "Pretrain/Loss (Raw)": 1.90400230884552, "Pretrain/Step": 3466, "Pretrain/Step Time": 8.439988728612661} +{"Pretrain/Learning Rate": 4.703958356923443e-05, "Pretrain/Loss": 2.0480732917785645, "Pretrain/Loss (Raw)": 2.1115150451660156, "Pretrain/Step": 3467, "Pretrain/Step Time": 8.44029999524355} +{"Pretrain/Learning Rate": 4.703757941257993e-05, "Pretrain/Loss": 2.04803729057312, "Pretrain/Loss (Raw)": 2.0422446727752686, "Pretrain/Step": 3468, "Pretrain/Step Time": 8.440297381952405} +{"Pretrain/Learning Rate": 4.703557462048737e-05, "Pretrain/Loss": 2.0499980449676514, "Pretrain/Loss (Raw)": 2.2695109844207764, "Pretrain/Step": 3469, "Pretrain/Step Time": 8.441149678081274} +{"Pretrain/Learning Rate": 4.7033569193014534e-05, "Pretrain/Loss": 2.050597667694092, "Pretrain/Loss (Raw)": 2.156022310256958, "Pretrain/Step": 3470, "Pretrain/Step Time": 8.445615444332361} +{"Pretrain/Learning Rate": 4.703156313021927e-05, "Pretrain/Loss": 2.0497045516967773, "Pretrain/Loss (Raw)": 2.0269999504089355, "Pretrain/Step": 3471, "Pretrain/Step Time": 8.450873328372836} +{"Pretrain/Learning Rate": 4.702955643215942e-05, "Pretrain/Loss": 2.0487101078033447, "Pretrain/Loss (Raw)": 2.015300750732422, "Pretrain/Step": 3472, "Pretrain/Step Time": 8.446004875004292} +{"Pretrain/Learning Rate": 4.702754909889284e-05, "Pretrain/Loss": 2.046780824661255, "Pretrain/Loss (Raw)": 1.9033461809158325, "Pretrain/Step": 3473, "Pretrain/Step Time": 8.447190131992102} +{"Pretrain/Learning Rate": 4.70255411304774e-05, "Pretrain/Loss": 2.047025680541992, "Pretrain/Loss (Raw)": 2.1217877864837646, "Pretrain/Step": 3474, "Pretrain/Step Time": 8.454004537314177} +{"Pretrain/Learning Rate": 4.702353252697102e-05, "Pretrain/Loss": 2.048649787902832, "Pretrain/Loss (Raw)": 2.0249743461608887, "Pretrain/Step": 3475, "Pretrain/Step Time": 8.452279303222895} +{"Pretrain/Learning Rate": 4.70215232884316e-05, "Pretrain/Loss": 2.0478644371032715, "Pretrain/Loss (Raw)": 1.9340020418167114, "Pretrain/Step": 3476, "Pretrain/Step Time": 8.450868841260672} +{"Pretrain/Learning Rate": 4.7019513414917085e-05, "Pretrain/Loss": 2.049056053161621, "Pretrain/Loss (Raw)": 2.268127679824829, "Pretrain/Step": 3477, "Pretrain/Step Time": 8.451846700161695} +{"Pretrain/Learning Rate": 4.701750290648542e-05, "Pretrain/Loss": 2.047095775604248, "Pretrain/Loss (Raw)": 2.008929491043091, "Pretrain/Step": 3478, "Pretrain/Step Time": 8.453886028379202} +{"Pretrain/Learning Rate": 4.7015491763194574e-05, "Pretrain/Loss": 2.047858715057373, "Pretrain/Loss (Raw)": 2.1421053409576416, "Pretrain/Step": 3479, "Pretrain/Step Time": 8.454907955601811} +{"Pretrain/Learning Rate": 4.7013479985102545e-05, "Pretrain/Loss": 2.0484585762023926, "Pretrain/Loss (Raw)": 2.0728821754455566, "Pretrain/Step": 3480, "Pretrain/Step Time": 8.449469877406955} +{"Pretrain/Learning Rate": 4.701146757226734e-05, "Pretrain/Loss": 2.050729274749756, "Pretrain/Loss (Raw)": 2.385265827178955, "Pretrain/Step": 3481, "Pretrain/Step Time": 8.452628819271922} +{"Pretrain/Learning Rate": 4.700945452474699e-05, "Pretrain/Loss": 2.0499396324157715, "Pretrain/Loss (Raw)": 2.0297610759735107, "Pretrain/Step": 3482, "Pretrain/Step Time": 8.442343203350902} +{"Pretrain/Learning Rate": 4.700744084259954e-05, "Pretrain/Loss": 2.0552759170532227, "Pretrain/Loss (Raw)": 2.736844301223755, "Pretrain/Step": 3483, "Pretrain/Step Time": 8.445346683263779} +{"Pretrain/Learning Rate": 4.7005426525883035e-05, "Pretrain/Loss": 2.057136058807373, "Pretrain/Loss (Raw)": 2.2208216190338135, "Pretrain/Step": 3484, "Pretrain/Step Time": 8.43987405858934} +{"Pretrain/Learning Rate": 4.700341157465557e-05, "Pretrain/Loss": 2.0577049255371094, "Pretrain/Loss (Raw)": 2.1216869354248047, "Pretrain/Step": 3485, "Pretrain/Step Time": 8.44417985714972} +{"Pretrain/Learning Rate": 4.700139598897525e-05, "Pretrain/Loss": 2.0558676719665527, "Pretrain/Loss (Raw)": 1.966037392616272, "Pretrain/Step": 3486, "Pretrain/Step Time": 8.449795607477427} +{"Pretrain/Learning Rate": 4.6999379768900174e-05, "Pretrain/Loss": 2.056049108505249, "Pretrain/Loss (Raw)": 2.2203335762023926, "Pretrain/Step": 3487, "Pretrain/Step Time": 8.447406720370054} +{"Pretrain/Learning Rate": 4.6997362914488504e-05, "Pretrain/Loss": 2.056788444519043, "Pretrain/Loss (Raw)": 2.229950189590454, "Pretrain/Step": 3488, "Pretrain/Step Time": 8.44954190403223} +{"Pretrain/Learning Rate": 4.699534542579838e-05, "Pretrain/Loss": 2.055812358856201, "Pretrain/Loss (Raw)": 1.9870809316635132, "Pretrain/Step": 3489, "Pretrain/Step Time": 8.450290327891707} +{"Pretrain/Learning Rate": 4.699332730288797e-05, "Pretrain/Loss": 2.0580055713653564, "Pretrain/Loss (Raw)": 2.283813238143921, "Pretrain/Step": 3490, "Pretrain/Step Time": 8.449425430968404} +{"Pretrain/Learning Rate": 4.6991308545815475e-05, "Pretrain/Loss": 2.054126739501953, "Pretrain/Loss (Raw)": 1.8494791984558105, "Pretrain/Step": 3491, "Pretrain/Step Time": 8.451597521081567} +{"Pretrain/Learning Rate": 4.69892891546391e-05, "Pretrain/Loss": 2.051807403564453, "Pretrain/Loss (Raw)": 1.8461955785751343, "Pretrain/Step": 3492, "Pretrain/Step Time": 8.450709963217378} +{"Pretrain/Learning Rate": 4.698726912941708e-05, "Pretrain/Loss": 2.05659818649292, "Pretrain/Loss (Raw)": 2.5176925659179688, "Pretrain/Step": 3493, "Pretrain/Step Time": 8.445696979761124} +{"Pretrain/Learning Rate": 4.6985248470207644e-05, "Pretrain/Loss": 2.055318593978882, "Pretrain/Loss (Raw)": 2.0329573154449463, "Pretrain/Step": 3494, "Pretrain/Step Time": 8.454987058416009} +{"Pretrain/Learning Rate": 4.6983227177069075e-05, "Pretrain/Loss": 2.0513172149658203, "Pretrain/Loss (Raw)": 1.8678900003433228, "Pretrain/Step": 3495, "Pretrain/Step Time": 8.453845907002687} +{"Pretrain/Learning Rate": 4.698120525005965e-05, "Pretrain/Loss": 2.050936222076416, "Pretrain/Loss (Raw)": 2.196648597717285, "Pretrain/Step": 3496, "Pretrain/Step Time": 8.456423508003354} +{"Pretrain/Learning Rate": 4.697918268923766e-05, "Pretrain/Loss": 2.050388813018799, "Pretrain/Loss (Raw)": 2.1039602756500244, "Pretrain/Step": 3497, "Pretrain/Step Time": 8.454507062211633} +{"Pretrain/Learning Rate": 4.697715949466143e-05, "Pretrain/Loss": 2.0464956760406494, "Pretrain/Loss (Raw)": 1.6234952211380005, "Pretrain/Step": 3498, "Pretrain/Step Time": 8.4539755564183} +{"Pretrain/Learning Rate": 4.69751356663893e-05, "Pretrain/Loss": 2.049431800842285, "Pretrain/Loss (Raw)": 2.073802947998047, "Pretrain/Step": 3499, "Pretrain/Step Time": 8.448188479989767} +{"Pretrain/Learning Rate": 4.6973111204479624e-05, "Pretrain/Loss": 2.049874782562256, "Pretrain/Loss (Raw)": 2.1884000301361084, "Pretrain/Step": 3500, "Pretrain/Step Time": 8.447474846616387} +{"Pretrain/Learning Rate": 4.697108610899078e-05, "Pretrain/Loss": 2.0502328872680664, "Pretrain/Loss (Raw)": 1.989801049232483, "Pretrain/Step": 3501, "Pretrain/Step Time": 8.44535550661385} +{"Pretrain/Learning Rate": 4.6969060379981157e-05, "Pretrain/Loss": 2.0484185218811035, "Pretrain/Loss (Raw)": 1.9712786674499512, "Pretrain/Step": 3502, "Pretrain/Step Time": 8.44467924721539} +{"Pretrain/Learning Rate": 4.6967034017509166e-05, "Pretrain/Loss": 2.0468783378601074, "Pretrain/Loss (Raw)": 1.956917405128479, "Pretrain/Step": 3503, "Pretrain/Step Time": 8.450296562165022} +{"Pretrain/Learning Rate": 4.6965007021633236e-05, "Pretrain/Loss": 2.0481505393981934, "Pretrain/Loss (Raw)": 2.0980019569396973, "Pretrain/Step": 3504, "Pretrain/Step Time": 8.446229105815291} +{"Pretrain/Learning Rate": 4.696297939241181e-05, "Pretrain/Loss": 2.048351526260376, "Pretrain/Loss (Raw)": 2.078335762023926, "Pretrain/Step": 3505, "Pretrain/Step Time": 8.449474217370152} +{"Pretrain/Learning Rate": 4.696095112990335e-05, "Pretrain/Loss": 2.0495223999023438, "Pretrain/Loss (Raw)": 1.9051729440689087, "Pretrain/Step": 3506, "Pretrain/Step Time": 8.449107617139816} +{"Pretrain/Learning Rate": 4.695892223416636e-05, "Pretrain/Loss": 2.0499162673950195, "Pretrain/Loss (Raw)": 2.223454713821411, "Pretrain/Step": 3507, "Pretrain/Step Time": 8.445805795490742} +{"Pretrain/Learning Rate": 4.695689270525931e-05, "Pretrain/Loss": 2.0501787662506104, "Pretrain/Loss (Raw)": 2.0846054553985596, "Pretrain/Step": 3508, "Pretrain/Step Time": 8.445712581276894} +{"Pretrain/Learning Rate": 4.6954862543240755e-05, "Pretrain/Loss": 2.049546718597412, "Pretrain/Loss (Raw)": 1.99349844455719, "Pretrain/Step": 3509, "Pretrain/Step Time": 8.44607382081449} +{"Pretrain/Learning Rate": 4.69528317481692e-05, "Pretrain/Loss": 2.048006296157837, "Pretrain/Loss (Raw)": 1.9725490808486938, "Pretrain/Step": 3510, "Pretrain/Step Time": 8.446518490090966} +{"Pretrain/Learning Rate": 4.695080032010323e-05, "Pretrain/Loss": 2.0458121299743652, "Pretrain/Loss (Raw)": 1.9394947290420532, "Pretrain/Step": 3511, "Pretrain/Step Time": 8.451561311259866} +{"Pretrain/Learning Rate": 4.6948768259101394e-05, "Pretrain/Loss": 2.04644775390625, "Pretrain/Loss (Raw)": 1.9568952322006226, "Pretrain/Step": 3512, "Pretrain/Step Time": 8.453235194087029} +{"Pretrain/Learning Rate": 4.694673556522231e-05, "Pretrain/Loss": 2.0466127395629883, "Pretrain/Loss (Raw)": 1.9810758829116821, "Pretrain/Step": 3513, "Pretrain/Step Time": 8.454784570261836} +{"Pretrain/Learning Rate": 4.6944702238524576e-05, "Pretrain/Loss": 2.044421911239624, "Pretrain/Loss (Raw)": 1.94222092628479, "Pretrain/Step": 3514, "Pretrain/Step Time": 8.452213693410158} +{"Pretrain/Learning Rate": 4.6942668279066815e-05, "Pretrain/Loss": 2.0469255447387695, "Pretrain/Loss (Raw)": 2.447195291519165, "Pretrain/Step": 3515, "Pretrain/Step Time": 8.452506303787231} +{"Pretrain/Learning Rate": 4.6940633686907683e-05, "Pretrain/Loss": 2.0479960441589355, "Pretrain/Loss (Raw)": 2.039651870727539, "Pretrain/Step": 3516, "Pretrain/Step Time": 8.443877849727869} +{"Pretrain/Learning Rate": 4.693859846210585e-05, "Pretrain/Loss": 2.0478601455688477, "Pretrain/Loss (Raw)": 1.9217356443405151, "Pretrain/Step": 3517, "Pretrain/Step Time": 8.445611948147416} +{"Pretrain/Learning Rate": 4.693656260472e-05, "Pretrain/Loss": 2.0468907356262207, "Pretrain/Loss (Raw)": 2.055844783782959, "Pretrain/Step": 3518, "Pretrain/Step Time": 8.44722380489111} +{"Pretrain/Learning Rate": 4.693452611480883e-05, "Pretrain/Loss": 2.050321102142334, "Pretrain/Loss (Raw)": 2.4172751903533936, "Pretrain/Step": 3519, "Pretrain/Step Time": 8.447658503428102} +{"Pretrain/Learning Rate": 4.693248899243106e-05, "Pretrain/Loss": 2.050548553466797, "Pretrain/Loss (Raw)": 2.122802257537842, "Pretrain/Step": 3520, "Pretrain/Step Time": 8.451510433107615} +{"Pretrain/Learning Rate": 4.6930451237645434e-05, "Pretrain/Loss": 2.049811363220215, "Pretrain/Loss (Raw)": 1.9261218309402466, "Pretrain/Step": 3521, "Pretrain/Step Time": 8.456163505092263} +{"Pretrain/Learning Rate": 4.6928412850510704e-05, "Pretrain/Loss": 2.0493640899658203, "Pretrain/Loss (Raw)": 1.99529230594635, "Pretrain/Step": 3522, "Pretrain/Step Time": 8.458661749958992} +{"Pretrain/Learning Rate": 4.6926373831085646e-05, "Pretrain/Loss": 2.0483717918395996, "Pretrain/Loss (Raw)": 1.9098669290542603, "Pretrain/Step": 3523, "Pretrain/Step Time": 8.45818448625505} +{"Pretrain/Learning Rate": 4.692433417942905e-05, "Pretrain/Loss": 2.047539472579956, "Pretrain/Loss (Raw)": 1.9639365673065186, "Pretrain/Step": 3524, "Pretrain/Step Time": 8.458707250654697} +{"Pretrain/Learning Rate": 4.692229389559975e-05, "Pretrain/Loss": 2.047539472579956, "Pretrain/Loss (Raw)": 1.9628503322601318, "Pretrain/Step": 3525, "Pretrain/Step Time": 8.458726400509477} +{"Pretrain/Learning Rate": 4.6920252979656556e-05, "Pretrain/Loss": 2.048532724380493, "Pretrain/Loss (Raw)": 2.0388145446777344, "Pretrain/Step": 3526, "Pretrain/Step Time": 8.451204348355532} +{"Pretrain/Learning Rate": 4.691821143165831e-05, "Pretrain/Loss": 2.0506606101989746, "Pretrain/Loss (Raw)": 2.1771440505981445, "Pretrain/Step": 3527, "Pretrain/Step Time": 8.45612358674407} +{"Pretrain/Learning Rate": 4.6916169251663895e-05, "Pretrain/Loss": 2.048002243041992, "Pretrain/Loss (Raw)": 1.9821749925613403, "Pretrain/Step": 3528, "Pretrain/Step Time": 8.462053775787354} +{"Pretrain/Learning Rate": 4.6914126439732184e-05, "Pretrain/Loss": 2.047353982925415, "Pretrain/Loss (Raw)": 1.9190199375152588, "Pretrain/Step": 3529, "Pretrain/Step Time": 8.46568594686687} +{"Pretrain/Learning Rate": 4.691208299592209e-05, "Pretrain/Loss": 2.0455288887023926, "Pretrain/Loss (Raw)": 1.7648857831954956, "Pretrain/Step": 3530, "Pretrain/Step Time": 8.459648689255118} +{"Pretrain/Learning Rate": 4.691003892029253e-05, "Pretrain/Loss": 2.048351764678955, "Pretrain/Loss (Raw)": 2.0330798625946045, "Pretrain/Step": 3531, "Pretrain/Step Time": 8.462678484618664} +{"Pretrain/Learning Rate": 4.6907994212902445e-05, "Pretrain/Loss": 2.0479416847229004, "Pretrain/Loss (Raw)": 2.032838821411133, "Pretrain/Step": 3532, "Pretrain/Step Time": 8.459283774718642} +{"Pretrain/Learning Rate": 4.690594887381079e-05, "Pretrain/Loss": 2.0483245849609375, "Pretrain/Loss (Raw)": 2.1985087394714355, "Pretrain/Step": 3533, "Pretrain/Step Time": 8.454129248857498} +{"Pretrain/Learning Rate": 4.690390290307653e-05, "Pretrain/Loss": 2.0470499992370605, "Pretrain/Loss (Raw)": 2.0144448280334473, "Pretrain/Step": 3534, "Pretrain/Step Time": 8.458095731213689} +{"Pretrain/Learning Rate": 4.690185630075869e-05, "Pretrain/Loss": 2.0468344688415527, "Pretrain/Loss (Raw)": 1.8007158041000366, "Pretrain/Step": 3535, "Pretrain/Step Time": 8.452484995126724} +{"Pretrain/Learning Rate": 4.689980906691626e-05, "Pretrain/Loss": 2.047971725463867, "Pretrain/Loss (Raw)": 2.1833205223083496, "Pretrain/Step": 3536, "Pretrain/Step Time": 8.455448249354959} +{"Pretrain/Learning Rate": 4.6897761201608265e-05, "Pretrain/Loss": 2.047211170196533, "Pretrain/Loss (Raw)": 1.9503313302993774, "Pretrain/Step": 3537, "Pretrain/Step Time": 8.464978199452162} +{"Pretrain/Learning Rate": 4.689571270489377e-05, "Pretrain/Loss": 2.047971248626709, "Pretrain/Loss (Raw)": 2.002408981323242, "Pretrain/Step": 3538, "Pretrain/Step Time": 8.462794402614236} +{"Pretrain/Learning Rate": 4.689366357683182e-05, "Pretrain/Loss": 2.047175168991089, "Pretrain/Loss (Raw)": 1.7751487493515015, "Pretrain/Step": 3539, "Pretrain/Step Time": 8.461798060685396} +{"Pretrain/Learning Rate": 4.689161381748153e-05, "Pretrain/Loss": 2.0466365814208984, "Pretrain/Loss (Raw)": 2.056253671646118, "Pretrain/Step": 3540, "Pretrain/Step Time": 8.46166636608541} +{"Pretrain/Learning Rate": 4.688956342690199e-05, "Pretrain/Loss": 2.0497658252716064, "Pretrain/Loss (Raw)": 2.3952975273132324, "Pretrain/Step": 3541, "Pretrain/Step Time": 8.459178678691387} +{"Pretrain/Learning Rate": 4.688751240515231e-05, "Pretrain/Loss": 2.0502357482910156, "Pretrain/Loss (Raw)": 1.9887791872024536, "Pretrain/Step": 3542, "Pretrain/Step Time": 8.457418404519558} +{"Pretrain/Learning Rate": 4.688546075229164e-05, "Pretrain/Loss": 2.050513982772827, "Pretrain/Loss (Raw)": 2.17350172996521, "Pretrain/Step": 3543, "Pretrain/Step Time": 8.459811029955745} +{"Pretrain/Learning Rate": 4.688340846837915e-05, "Pretrain/Loss": 2.0502400398254395, "Pretrain/Loss (Raw)": 2.0405547618865967, "Pretrain/Step": 3544, "Pretrain/Step Time": 8.460010673850775} +{"Pretrain/Learning Rate": 4.688135555347399e-05, "Pretrain/Loss": 2.053508758544922, "Pretrain/Loss (Raw)": 2.066009283065796, "Pretrain/Step": 3545, "Pretrain/Step Time": 8.453738322481513} +{"Pretrain/Learning Rate": 4.6879302007635374e-05, "Pretrain/Loss": 2.0526561737060547, "Pretrain/Loss (Raw)": 2.028024435043335, "Pretrain/Step": 3546, "Pretrain/Step Time": 8.451701505109668} +{"Pretrain/Learning Rate": 4.687724783092251e-05, "Pretrain/Loss": 2.0511927604675293, "Pretrain/Loss (Raw)": 1.6934630870819092, "Pretrain/Step": 3547, "Pretrain/Step Time": 8.452243592590094} +{"Pretrain/Learning Rate": 4.687519302339462e-05, "Pretrain/Loss": 2.052224636077881, "Pretrain/Loss (Raw)": 2.189302921295166, "Pretrain/Step": 3548, "Pretrain/Step Time": 8.45315952040255} +{"Pretrain/Learning Rate": 4.6873137585110964e-05, "Pretrain/Loss": 2.053694248199463, "Pretrain/Loss (Raw)": 2.462202310562134, "Pretrain/Step": 3549, "Pretrain/Step Time": 8.444181324914098} +{"Pretrain/Learning Rate": 4.687108151613081e-05, "Pretrain/Loss": 2.053968906402588, "Pretrain/Loss (Raw)": 2.0276224613189697, "Pretrain/Step": 3550, "Pretrain/Step Time": 8.44386793486774} +{"Pretrain/Learning Rate": 4.686902481651343e-05, "Pretrain/Loss": 2.0529112815856934, "Pretrain/Loss (Raw)": 2.1031076908111572, "Pretrain/Step": 3551, "Pretrain/Step Time": 8.442238273099065} +{"Pretrain/Learning Rate": 4.686696748631814e-05, "Pretrain/Loss": 2.0537900924682617, "Pretrain/Loss (Raw)": 2.190422534942627, "Pretrain/Step": 3552, "Pretrain/Step Time": 8.440362045541406} +{"Pretrain/Learning Rate": 4.686490952560426e-05, "Pretrain/Loss": 2.055642604827881, "Pretrain/Loss (Raw)": 2.0052037239074707, "Pretrain/Step": 3553, "Pretrain/Step Time": 8.443488072603941} +{"Pretrain/Learning Rate": 4.6862850934431126e-05, "Pretrain/Loss": 2.0549123287200928, "Pretrain/Loss (Raw)": 2.0132293701171875, "Pretrain/Step": 3554, "Pretrain/Step Time": 8.452260067686439} +{"Pretrain/Learning Rate": 4.6860791712858096e-05, "Pretrain/Loss": 2.0543644428253174, "Pretrain/Loss (Raw)": 2.066476583480835, "Pretrain/Step": 3555, "Pretrain/Step Time": 8.444061659276485} +{"Pretrain/Learning Rate": 4.6858731860944546e-05, "Pretrain/Loss": 2.0545339584350586, "Pretrain/Loss (Raw)": 2.053032875061035, "Pretrain/Step": 3556, "Pretrain/Step Time": 8.449868304654956} +{"Pretrain/Learning Rate": 4.685667137874988e-05, "Pretrain/Loss": 2.0591652393341064, "Pretrain/Loss (Raw)": 2.194885730743408, "Pretrain/Step": 3557, "Pretrain/Step Time": 8.451109295710921} +{"Pretrain/Learning Rate": 4.6854610266333496e-05, "Pretrain/Loss": 2.0600194931030273, "Pretrain/Loss (Raw)": 1.9381083250045776, "Pretrain/Step": 3558, "Pretrain/Step Time": 8.450137229636312} +{"Pretrain/Learning Rate": 4.685254852375484e-05, "Pretrain/Loss": 2.0571041107177734, "Pretrain/Loss (Raw)": 1.9098984003067017, "Pretrain/Step": 3559, "Pretrain/Step Time": 8.45146418735385} +{"Pretrain/Learning Rate": 4.685048615107334e-05, "Pretrain/Loss": 2.05865478515625, "Pretrain/Loss (Raw)": 2.2658793926239014, "Pretrain/Step": 3560, "Pretrain/Step Time": 8.4553431738168} +{"Pretrain/Learning Rate": 4.684842314834848e-05, "Pretrain/Loss": 2.0604844093322754, "Pretrain/Loss (Raw)": 2.2468185424804688, "Pretrain/Step": 3561, "Pretrain/Step Time": 8.457339556887746} +{"Pretrain/Learning Rate": 4.6846359515639744e-05, "Pretrain/Loss": 2.06014347076416, "Pretrain/Loss (Raw)": 2.0053064823150635, "Pretrain/Step": 3562, "Pretrain/Step Time": 8.455342000350356} +{"Pretrain/Learning Rate": 4.684429525300663e-05, "Pretrain/Loss": 2.0610241889953613, "Pretrain/Loss (Raw)": 2.144408702850342, "Pretrain/Step": 3563, "Pretrain/Step Time": 8.454445701092482} +{"Pretrain/Learning Rate": 4.684223036050866e-05, "Pretrain/Loss": 2.05991792678833, "Pretrain/Loss (Raw)": 1.963031530380249, "Pretrain/Step": 3564, "Pretrain/Step Time": 8.454406756907701} +{"Pretrain/Learning Rate": 4.684016483820538e-05, "Pretrain/Loss": 2.0592570304870605, "Pretrain/Loss (Raw)": 1.9408600330352783, "Pretrain/Step": 3565, "Pretrain/Step Time": 8.457962211221457} +{"Pretrain/Learning Rate": 4.683809868615634e-05, "Pretrain/Loss": 2.0573134422302246, "Pretrain/Loss (Raw)": 1.8428822755813599, "Pretrain/Step": 3566, "Pretrain/Step Time": 8.449347823858261} +{"Pretrain/Learning Rate": 4.683603190442112e-05, "Pretrain/Loss": 2.056917905807495, "Pretrain/Loss (Raw)": 2.140204429626465, "Pretrain/Step": 3567, "Pretrain/Step Time": 8.452302956953645} +{"Pretrain/Learning Rate": 4.683396449305931e-05, "Pretrain/Loss": 2.0581142902374268, "Pretrain/Loss (Raw)": 2.060239791870117, "Pretrain/Step": 3568, "Pretrain/Step Time": 8.446489792317152} +{"Pretrain/Learning Rate": 4.683189645213053e-05, "Pretrain/Loss": 2.058364152908325, "Pretrain/Loss (Raw)": 2.0210671424865723, "Pretrain/Step": 3569, "Pretrain/Step Time": 8.448002314195037} +{"Pretrain/Learning Rate": 4.68298277816944e-05, "Pretrain/Loss": 2.058600425720215, "Pretrain/Loss (Raw)": 2.127394676208496, "Pretrain/Step": 3570, "Pretrain/Step Time": 8.45361396484077} +{"Pretrain/Learning Rate": 4.682775848181058e-05, "Pretrain/Loss": 2.0579025745391846, "Pretrain/Loss (Raw)": 2.030649423599243, "Pretrain/Step": 3571, "Pretrain/Step Time": 8.453458586707711} +{"Pretrain/Learning Rate": 4.682568855253873e-05, "Pretrain/Loss": 2.05521297454834, "Pretrain/Loss (Raw)": 1.9742099046707153, "Pretrain/Step": 3572, "Pretrain/Step Time": 8.454845143482089} +{"Pretrain/Learning Rate": 4.682361799393854e-05, "Pretrain/Loss": 2.055223226547241, "Pretrain/Loss (Raw)": 2.057436943054199, "Pretrain/Step": 3573, "Pretrain/Step Time": 8.45148515701294} +{"Pretrain/Learning Rate": 4.682154680606971e-05, "Pretrain/Loss": 2.054863452911377, "Pretrain/Loss (Raw)": 2.2188880443573, "Pretrain/Step": 3574, "Pretrain/Step Time": 8.455404257401824} +{"Pretrain/Learning Rate": 4.681947498899196e-05, "Pretrain/Loss": 2.0515499114990234, "Pretrain/Loss (Raw)": 1.6447209119796753, "Pretrain/Step": 3575, "Pretrain/Step Time": 8.451144494116306} +{"Pretrain/Learning Rate": 4.681740254276503e-05, "Pretrain/Loss": 2.0522451400756836, "Pretrain/Loss (Raw)": 1.9972690343856812, "Pretrain/Step": 3576, "Pretrain/Step Time": 8.456728272140026} +{"Pretrain/Learning Rate": 4.6815329467448676e-05, "Pretrain/Loss": 2.053252935409546, "Pretrain/Loss (Raw)": 2.1617794036865234, "Pretrain/Step": 3577, "Pretrain/Step Time": 8.45894968509674} +{"Pretrain/Learning Rate": 4.681325576310267e-05, "Pretrain/Loss": 2.0559113025665283, "Pretrain/Loss (Raw)": 2.179206132888794, "Pretrain/Step": 3578, "Pretrain/Step Time": 8.45793491601944} +{"Pretrain/Learning Rate": 4.681118142978682e-05, "Pretrain/Loss": 2.0570030212402344, "Pretrain/Loss (Raw)": 2.213573932647705, "Pretrain/Step": 3579, "Pretrain/Step Time": 8.457897935062647} +{"Pretrain/Learning Rate": 4.680910646756093e-05, "Pretrain/Loss": 2.0580365657806396, "Pretrain/Loss (Raw)": 2.2524073123931885, "Pretrain/Step": 3580, "Pretrain/Step Time": 8.458688270300627} +{"Pretrain/Learning Rate": 4.680703087648483e-05, "Pretrain/Loss": 2.0593247413635254, "Pretrain/Loss (Raw)": 2.180189847946167, "Pretrain/Step": 3581, "Pretrain/Step Time": 8.458758410066366} +{"Pretrain/Learning Rate": 4.680495465661836e-05, "Pretrain/Loss": 2.0576632022857666, "Pretrain/Loss (Raw)": 1.9176234006881714, "Pretrain/Step": 3582, "Pretrain/Step Time": 8.458576751872897} +{"Pretrain/Learning Rate": 4.68028778080214e-05, "Pretrain/Loss": 2.0597283840179443, "Pretrain/Loss (Raw)": 2.2077715396881104, "Pretrain/Step": 3583, "Pretrain/Step Time": 8.456846920773387} +{"Pretrain/Learning Rate": 4.6800800330753824e-05, "Pretrain/Loss": 2.060551166534424, "Pretrain/Loss (Raw)": 2.106541872024536, "Pretrain/Step": 3584, "Pretrain/Step Time": 8.456011861562729} +{"Pretrain/Learning Rate": 4.679872222487555e-05, "Pretrain/Loss": 2.0607268810272217, "Pretrain/Loss (Raw)": 2.225518226623535, "Pretrain/Step": 3585, "Pretrain/Step Time": 8.461999511346221} +{"Pretrain/Learning Rate": 4.679664349044648e-05, "Pretrain/Loss": 2.0606954097747803, "Pretrain/Loss (Raw)": 2.1341991424560547, "Pretrain/Step": 3586, "Pretrain/Step Time": 8.4593726079911} +{"Pretrain/Learning Rate": 4.679456412752655e-05, "Pretrain/Loss": 2.0627307891845703, "Pretrain/Loss (Raw)": 2.266646385192871, "Pretrain/Step": 3587, "Pretrain/Step Time": 8.464205069467425} +{"Pretrain/Learning Rate": 4.679248413617574e-05, "Pretrain/Loss": 2.063664197921753, "Pretrain/Loss (Raw)": 2.037045955657959, "Pretrain/Step": 3588, "Pretrain/Step Time": 8.464000834152102} +{"Pretrain/Learning Rate": 4.679040351645402e-05, "Pretrain/Loss": 2.0625975131988525, "Pretrain/Loss (Raw)": 1.9287333488464355, "Pretrain/Step": 3589, "Pretrain/Step Time": 8.46380839496851} +{"Pretrain/Learning Rate": 4.678832226842136e-05, "Pretrain/Loss": 2.0652410984039307, "Pretrain/Loss (Raw)": 2.202744483947754, "Pretrain/Step": 3590, "Pretrain/Step Time": 8.460599461570382} +{"Pretrain/Learning Rate": 4.678624039213779e-05, "Pretrain/Loss": 2.0644664764404297, "Pretrain/Loss (Raw)": 1.9761571884155273, "Pretrain/Step": 3591, "Pretrain/Step Time": 8.45712647587061} +{"Pretrain/Learning Rate": 4.678415788766334e-05, "Pretrain/Loss": 2.06502628326416, "Pretrain/Loss (Raw)": 1.9475423097610474, "Pretrain/Step": 3592, "Pretrain/Step Time": 8.460134478285909} +{"Pretrain/Learning Rate": 4.678207475505806e-05, "Pretrain/Loss": 2.0671403408050537, "Pretrain/Loss (Raw)": 2.167050838470459, "Pretrain/Step": 3593, "Pretrain/Step Time": 8.457534635439515} +{"Pretrain/Learning Rate": 4.677999099438201e-05, "Pretrain/Loss": 2.0676262378692627, "Pretrain/Loss (Raw)": 1.9662035703659058, "Pretrain/Step": 3594, "Pretrain/Step Time": 8.456251740455627} +{"Pretrain/Learning Rate": 4.677790660569526e-05, "Pretrain/Loss": 2.0679564476013184, "Pretrain/Loss (Raw)": 2.153778076171875, "Pretrain/Step": 3595, "Pretrain/Step Time": 8.456962011754513} +{"Pretrain/Learning Rate": 4.6775821589057934e-05, "Pretrain/Loss": 2.067655563354492, "Pretrain/Loss (Raw)": 2.0037312507629395, "Pretrain/Step": 3596, "Pretrain/Step Time": 8.454300610348582} +{"Pretrain/Learning Rate": 4.677373594453014e-05, "Pretrain/Loss": 2.066605806350708, "Pretrain/Loss (Raw)": 2.135145902633667, "Pretrain/Step": 3597, "Pretrain/Step Time": 8.456012830138206} +{"Pretrain/Learning Rate": 4.677164967217203e-05, "Pretrain/Loss": 2.066837787628174, "Pretrain/Loss (Raw)": 2.185709238052368, "Pretrain/Step": 3598, "Pretrain/Step Time": 8.452242992818356} +{"Pretrain/Learning Rate": 4.6769562772043734e-05, "Pretrain/Loss": 2.0691945552825928, "Pretrain/Loss (Raw)": 2.328681707382202, "Pretrain/Step": 3599, "Pretrain/Step Time": 8.448769366368651} +{"Pretrain/Learning Rate": 4.676747524420545e-05, "Pretrain/Loss": 2.0685486793518066, "Pretrain/Loss (Raw)": 1.932633638381958, "Pretrain/Step": 3600, "Pretrain/Step Time": 8.44972742907703} +{"Pretrain/Learning Rate": 4.676538708871736e-05, "Pretrain/Loss": 2.068783760070801, "Pretrain/Loss (Raw)": 1.933415412902832, "Pretrain/Step": 3601, "Pretrain/Step Time": 8.448939876630902} +{"Pretrain/Learning Rate": 4.676329830563968e-05, "Pretrain/Loss": 2.0646767616271973, "Pretrain/Loss (Raw)": 1.5961211919784546, "Pretrain/Step": 3602, "Pretrain/Step Time": 8.442341910675168} +{"Pretrain/Learning Rate": 4.6761208895032635e-05, "Pretrain/Loss": 2.0650594234466553, "Pretrain/Loss (Raw)": 2.07393217086792, "Pretrain/Step": 3603, "Pretrain/Step Time": 8.448781311511993} +{"Pretrain/Learning Rate": 4.6759118856956474e-05, "Pretrain/Loss": 2.0636048316955566, "Pretrain/Loss (Raw)": 1.7478004693984985, "Pretrain/Step": 3604, "Pretrain/Step Time": 8.452101167291403} +{"Pretrain/Learning Rate": 4.6757028191471455e-05, "Pretrain/Loss": 2.0611581802368164, "Pretrain/Loss (Raw)": 1.95497727394104, "Pretrain/Step": 3605, "Pretrain/Step Time": 8.450369538739324} +{"Pretrain/Learning Rate": 4.675493689863787e-05, "Pretrain/Loss": 2.0610880851745605, "Pretrain/Loss (Raw)": 1.9999735355377197, "Pretrain/Step": 3606, "Pretrain/Step Time": 8.446762567386031} +{"Pretrain/Learning Rate": 4.6752844978516006e-05, "Pretrain/Loss": 2.0599470138549805, "Pretrain/Loss (Raw)": 1.9960488080978394, "Pretrain/Step": 3607, "Pretrain/Step Time": 8.447646979242563} +{"Pretrain/Learning Rate": 4.67507524311662e-05, "Pretrain/Loss": 2.0596675872802734, "Pretrain/Loss (Raw)": 2.037095308303833, "Pretrain/Step": 3608, "Pretrain/Step Time": 8.449899531900883} +{"Pretrain/Learning Rate": 4.6748659256648784e-05, "Pretrain/Loss": 2.0576207637786865, "Pretrain/Loss (Raw)": 2.123267412185669, "Pretrain/Step": 3609, "Pretrain/Step Time": 8.452172994613647} +{"Pretrain/Learning Rate": 4.674656545502411e-05, "Pretrain/Loss": 2.0577449798583984, "Pretrain/Loss (Raw)": 2.045667886734009, "Pretrain/Step": 3610, "Pretrain/Step Time": 8.45265018939972} +{"Pretrain/Learning Rate": 4.6744471026352544e-05, "Pretrain/Loss": 2.051668405532837, "Pretrain/Loss (Raw)": 1.9590320587158203, "Pretrain/Step": 3611, "Pretrain/Step Time": 8.451951777562499} +{"Pretrain/Learning Rate": 4.674237597069449e-05, "Pretrain/Loss": 2.0538392066955566, "Pretrain/Loss (Raw)": 2.498697280883789, "Pretrain/Step": 3612, "Pretrain/Step Time": 8.453700518235564} +{"Pretrain/Learning Rate": 4.674028028811035e-05, "Pretrain/Loss": 2.052704095840454, "Pretrain/Loss (Raw)": 1.9763708114624023, "Pretrain/Step": 3613, "Pretrain/Step Time": 8.450809987261891} +{"Pretrain/Learning Rate": 4.673818397866055e-05, "Pretrain/Loss": 2.054616689682007, "Pretrain/Loss (Raw)": 2.2108633518218994, "Pretrain/Step": 3614, "Pretrain/Step Time": 8.44906011596322} +{"Pretrain/Learning Rate": 4.673608704240555e-05, "Pretrain/Loss": 2.0527355670928955, "Pretrain/Loss (Raw)": 1.979570984840393, "Pretrain/Step": 3615, "Pretrain/Step Time": 8.44697150401771} +{"Pretrain/Learning Rate": 4.67339894794058e-05, "Pretrain/Loss": 2.0522851943969727, "Pretrain/Loss (Raw)": 2.1722891330718994, "Pretrain/Step": 3616, "Pretrain/Step Time": 8.446803012862802} +{"Pretrain/Learning Rate": 4.6731891289721786e-05, "Pretrain/Loss": 2.052797317504883, "Pretrain/Loss (Raw)": 2.0526113510131836, "Pretrain/Step": 3617, "Pretrain/Step Time": 8.44331387616694} +{"Pretrain/Learning Rate": 4.6729792473414005e-05, "Pretrain/Loss": 2.0507283210754395, "Pretrain/Loss (Raw)": 2.0190017223358154, "Pretrain/Step": 3618, "Pretrain/Step Time": 8.446396213024855} +{"Pretrain/Learning Rate": 4.672769303054297e-05, "Pretrain/Loss": 2.0538201332092285, "Pretrain/Loss (Raw)": 2.245234727859497, "Pretrain/Step": 3619, "Pretrain/Step Time": 8.446760158985853} +{"Pretrain/Learning Rate": 4.672559296116923e-05, "Pretrain/Loss": 2.056809425354004, "Pretrain/Loss (Raw)": 2.2288014888763428, "Pretrain/Step": 3620, "Pretrain/Step Time": 8.449959754943848} +{"Pretrain/Learning Rate": 4.672349226535333e-05, "Pretrain/Loss": 2.052520275115967, "Pretrain/Loss (Raw)": 1.968675971031189, "Pretrain/Step": 3621, "Pretrain/Step Time": 8.450590258464217} +{"Pretrain/Learning Rate": 4.672139094315584e-05, "Pretrain/Loss": 2.052298069000244, "Pretrain/Loss (Raw)": 2.00455904006958, "Pretrain/Step": 3622, "Pretrain/Step Time": 8.44405546784401} +{"Pretrain/Learning Rate": 4.671928899463736e-05, "Pretrain/Loss": 2.0534520149230957, "Pretrain/Loss (Raw)": 2.01556658744812, "Pretrain/Step": 3623, "Pretrain/Step Time": 8.448749333620071} +{"Pretrain/Learning Rate": 4.671718641985849e-05, "Pretrain/Loss": 2.0535058975219727, "Pretrain/Loss (Raw)": 2.203523635864258, "Pretrain/Step": 3624, "Pretrain/Step Time": 8.447676591575146} +{"Pretrain/Learning Rate": 4.671508321887986e-05, "Pretrain/Loss": 2.0530636310577393, "Pretrain/Loss (Raw)": 2.047370433807373, "Pretrain/Step": 3625, "Pretrain/Step Time": 8.456223784014583} +{"Pretrain/Learning Rate": 4.6712979391762124e-05, "Pretrain/Loss": 2.0576322078704834, "Pretrain/Loss (Raw)": 2.2082772254943848, "Pretrain/Step": 3626, "Pretrain/Step Time": 8.451573930680752} +{"Pretrain/Learning Rate": 4.671087493856592e-05, "Pretrain/Loss": 2.056891679763794, "Pretrain/Loss (Raw)": 1.9790085554122925, "Pretrain/Step": 3627, "Pretrain/Step Time": 8.456289729103446} +{"Pretrain/Learning Rate": 4.6708769859351955e-05, "Pretrain/Loss": 2.0557122230529785, "Pretrain/Loss (Raw)": 2.0374438762664795, "Pretrain/Step": 3628, "Pretrain/Step Time": 8.455357072874904} +{"Pretrain/Learning Rate": 4.67066641541809e-05, "Pretrain/Loss": 2.0549213886260986, "Pretrain/Loss (Raw)": 1.8885602951049805, "Pretrain/Step": 3629, "Pretrain/Step Time": 8.453283745795488} +{"Pretrain/Learning Rate": 4.670455782311349e-05, "Pretrain/Loss": 2.0554378032684326, "Pretrain/Loss (Raw)": 2.037393093109131, "Pretrain/Step": 3630, "Pretrain/Step Time": 8.454765915870667} +{"Pretrain/Learning Rate": 4.670245086621047e-05, "Pretrain/Loss": 2.0548722743988037, "Pretrain/Loss (Raw)": 1.884520411491394, "Pretrain/Step": 3631, "Pretrain/Step Time": 8.447990940883756} +{"Pretrain/Learning Rate": 4.6700343283532565e-05, "Pretrain/Loss": 2.0549557209014893, "Pretrain/Loss (Raw)": 2.108670234680176, "Pretrain/Step": 3632, "Pretrain/Step Time": 8.450782360509038} +{"Pretrain/Learning Rate": 4.669823507514056e-05, "Pretrain/Loss": 2.0552220344543457, "Pretrain/Loss (Raw)": 2.112459421157837, "Pretrain/Step": 3633, "Pretrain/Step Time": 8.447743471711874} +{"Pretrain/Learning Rate": 4.669612624109525e-05, "Pretrain/Loss": 2.0564801692962646, "Pretrain/Loss (Raw)": 2.0661985874176025, "Pretrain/Step": 3634, "Pretrain/Step Time": 8.449528137221932} +{"Pretrain/Learning Rate": 4.6694016781457426e-05, "Pretrain/Loss": 2.055790424346924, "Pretrain/Loss (Raw)": 2.135158061981201, "Pretrain/Step": 3635, "Pretrain/Step Time": 8.454950731247663} +{"Pretrain/Learning Rate": 4.6691906696287926e-05, "Pretrain/Loss": 2.055751085281372, "Pretrain/Loss (Raw)": 2.079571008682251, "Pretrain/Step": 3636, "Pretrain/Step Time": 8.454148340970278} +{"Pretrain/Learning Rate": 4.6689795985647586e-05, "Pretrain/Loss": 2.0564675331115723, "Pretrain/Loss (Raw)": 2.0852062702178955, "Pretrain/Step": 3637, "Pretrain/Step Time": 8.453949311748147} +{"Pretrain/Learning Rate": 4.668768464959727e-05, "Pretrain/Loss": 2.0568156242370605, "Pretrain/Loss (Raw)": 2.0171101093292236, "Pretrain/Step": 3638, "Pretrain/Step Time": 8.453421844169497} +{"Pretrain/Learning Rate": 4.668557268819785e-05, "Pretrain/Loss": 2.0566675662994385, "Pretrain/Loss (Raw)": 1.9205290079116821, "Pretrain/Step": 3639, "Pretrain/Step Time": 8.454565711319447} +{"Pretrain/Learning Rate": 4.668346010151024e-05, "Pretrain/Loss": 2.0580062866210938, "Pretrain/Loss (Raw)": 2.1282460689544678, "Pretrain/Step": 3640, "Pretrain/Step Time": 8.447562709450722} +{"Pretrain/Learning Rate": 4.668134688959534e-05, "Pretrain/Loss": 2.0587148666381836, "Pretrain/Loss (Raw)": 2.0717599391937256, "Pretrain/Step": 3641, "Pretrain/Step Time": 8.452399972826242} +{"Pretrain/Learning Rate": 4.6679233052514087e-05, "Pretrain/Loss": 2.059727430343628, "Pretrain/Loss (Raw)": 2.071876049041748, "Pretrain/Step": 3642, "Pretrain/Step Time": 8.454600494354963} +{"Pretrain/Learning Rate": 4.667711859032743e-05, "Pretrain/Loss": 2.0551695823669434, "Pretrain/Loss (Raw)": 1.8637776374816895, "Pretrain/Step": 3643, "Pretrain/Step Time": 8.453367536887527} +{"Pretrain/Learning Rate": 4.6675003503096335e-05, "Pretrain/Loss": 2.056265354156494, "Pretrain/Loss (Raw)": 2.1799137592315674, "Pretrain/Step": 3644, "Pretrain/Step Time": 8.45582172833383} +{"Pretrain/Learning Rate": 4.66728877908818e-05, "Pretrain/Loss": 2.0565905570983887, "Pretrain/Loss (Raw)": 1.9633536338806152, "Pretrain/Step": 3645, "Pretrain/Step Time": 8.452489087358117} +{"Pretrain/Learning Rate": 4.6670771453744824e-05, "Pretrain/Loss": 2.057143449783325, "Pretrain/Loss (Raw)": 2.1266367435455322, "Pretrain/Step": 3646, "Pretrain/Step Time": 8.450825940817595} +{"Pretrain/Learning Rate": 4.666865449174643e-05, "Pretrain/Loss": 2.0545156002044678, "Pretrain/Loss (Raw)": 2.0808775424957275, "Pretrain/Step": 3647, "Pretrain/Step Time": 8.452498145401478} +{"Pretrain/Learning Rate": 4.666653690494766e-05, "Pretrain/Loss": 2.0509395599365234, "Pretrain/Loss (Raw)": 1.6650598049163818, "Pretrain/Step": 3648, "Pretrain/Step Time": 8.446387279778719} +{"Pretrain/Learning Rate": 4.666441869340957e-05, "Pretrain/Loss": 2.051166534423828, "Pretrain/Loss (Raw)": 1.9551907777786255, "Pretrain/Step": 3649, "Pretrain/Step Time": 8.443144999444485} +{"Pretrain/Learning Rate": 4.6662299857193236e-05, "Pretrain/Loss": 2.0526795387268066, "Pretrain/Loss (Raw)": 2.1889865398406982, "Pretrain/Step": 3650, "Pretrain/Step Time": 8.439405309036374} +{"Pretrain/Learning Rate": 4.666018039635977e-05, "Pretrain/Loss": 2.0525431632995605, "Pretrain/Loss (Raw)": 1.8924016952514648, "Pretrain/Step": 3651, "Pretrain/Step Time": 8.443099670112133} +{"Pretrain/Learning Rate": 4.665806031097026e-05, "Pretrain/Loss": 2.0530717372894287, "Pretrain/Loss (Raw)": 2.031590461730957, "Pretrain/Step": 3652, "Pretrain/Step Time": 8.443344853818417} +{"Pretrain/Learning Rate": 4.6655939601085854e-05, "Pretrain/Loss": 2.052690029144287, "Pretrain/Loss (Raw)": 1.9139715433120728, "Pretrain/Step": 3653, "Pretrain/Step Time": 8.44335563853383} +{"Pretrain/Learning Rate": 4.6653818266767693e-05, "Pretrain/Loss": 2.052553176879883, "Pretrain/Loss (Raw)": 2.0212955474853516, "Pretrain/Step": 3654, "Pretrain/Step Time": 8.447733609005809} +{"Pretrain/Learning Rate": 4.6651696308076943e-05, "Pretrain/Loss": 2.051208734512329, "Pretrain/Loss (Raw)": 2.005072832107544, "Pretrain/Step": 3655, "Pretrain/Step Time": 8.444383962079883} +{"Pretrain/Learning Rate": 4.66495737250748e-05, "Pretrain/Loss": 2.050962209701538, "Pretrain/Loss (Raw)": 1.9506007432937622, "Pretrain/Step": 3656, "Pretrain/Step Time": 8.440074587240815} +{"Pretrain/Learning Rate": 4.664745051782245e-05, "Pretrain/Loss": 2.052915573120117, "Pretrain/Loss (Raw)": 2.1690616607666016, "Pretrain/Step": 3657, "Pretrain/Step Time": 8.446131356060505} +{"Pretrain/Learning Rate": 4.664532668638114e-05, "Pretrain/Loss": 2.054745674133301, "Pretrain/Loss (Raw)": 1.9991768598556519, "Pretrain/Step": 3658, "Pretrain/Step Time": 8.443827094510198} +{"Pretrain/Learning Rate": 4.664320223081208e-05, "Pretrain/Loss": 2.055549383163452, "Pretrain/Loss (Raw)": 2.135915756225586, "Pretrain/Step": 3659, "Pretrain/Step Time": 8.44465029425919} +{"Pretrain/Learning Rate": 4.664107715117655e-05, "Pretrain/Loss": 2.0546536445617676, "Pretrain/Loss (Raw)": 1.918192744255066, "Pretrain/Step": 3660, "Pretrain/Step Time": 8.446054939180613} +{"Pretrain/Learning Rate": 4.663895144753582e-05, "Pretrain/Loss": 2.0533740520477295, "Pretrain/Loss (Raw)": 2.034712553024292, "Pretrain/Step": 3661, "Pretrain/Step Time": 8.447885066270828} +{"Pretrain/Learning Rate": 4.6636825119951164e-05, "Pretrain/Loss": 2.0529348850250244, "Pretrain/Loss (Raw)": 1.9582544565200806, "Pretrain/Step": 3662, "Pretrain/Step Time": 8.443901615217328} +{"Pretrain/Learning Rate": 4.6634698168483924e-05, "Pretrain/Loss": 2.055729866027832, "Pretrain/Loss (Raw)": 2.158433198928833, "Pretrain/Step": 3663, "Pretrain/Step Time": 8.444243222475052} +{"Pretrain/Learning Rate": 4.6632570593195404e-05, "Pretrain/Loss": 2.05311918258667, "Pretrain/Loss (Raw)": 1.8491854667663574, "Pretrain/Step": 3664, "Pretrain/Step Time": 8.445318212732673} +{"Pretrain/Learning Rate": 4.663044239414697e-05, "Pretrain/Loss": 2.0554723739624023, "Pretrain/Loss (Raw)": 2.251533269882202, "Pretrain/Step": 3665, "Pretrain/Step Time": 8.43453260883689} +{"Pretrain/Learning Rate": 4.6628313571399974e-05, "Pretrain/Loss": 2.056980848312378, "Pretrain/Loss (Raw)": 2.195502519607544, "Pretrain/Step": 3666, "Pretrain/Step Time": 8.435687277466059} +{"Pretrain/Learning Rate": 4.66261841250158e-05, "Pretrain/Loss": 2.0584163665771484, "Pretrain/Loss (Raw)": 1.9589030742645264, "Pretrain/Step": 3667, "Pretrain/Step Time": 8.438808215782046} +{"Pretrain/Learning Rate": 4.6624054055055855e-05, "Pretrain/Loss": 2.0567634105682373, "Pretrain/Loss (Raw)": 1.8446581363677979, "Pretrain/Step": 3668, "Pretrain/Step Time": 8.43546056188643} +{"Pretrain/Learning Rate": 4.662192336158155e-05, "Pretrain/Loss": 2.0530149936676025, "Pretrain/Loss (Raw)": 1.9154928922653198, "Pretrain/Step": 3669, "Pretrain/Step Time": 8.442754989489913} +{"Pretrain/Learning Rate": 4.661979204465434e-05, "Pretrain/Loss": 2.0543301105499268, "Pretrain/Loss (Raw)": 2.1571195125579834, "Pretrain/Step": 3670, "Pretrain/Step Time": 8.447508003562689} +{"Pretrain/Learning Rate": 4.661766010433566e-05, "Pretrain/Loss": 2.0520572662353516, "Pretrain/Loss (Raw)": 1.88258695602417, "Pretrain/Step": 3671, "Pretrain/Step Time": 8.448233613744378} +{"Pretrain/Learning Rate": 4.661552754068699e-05, "Pretrain/Loss": 2.0521483421325684, "Pretrain/Loss (Raw)": 2.0522069931030273, "Pretrain/Step": 3672, "Pretrain/Step Time": 8.44902109913528} +{"Pretrain/Learning Rate": 4.6613394353769816e-05, "Pretrain/Loss": 2.051403522491455, "Pretrain/Loss (Raw)": 1.9706594944000244, "Pretrain/Step": 3673, "Pretrain/Step Time": 8.453662868589163} +{"Pretrain/Learning Rate": 4.6611260543645664e-05, "Pretrain/Loss": 2.0540452003479004, "Pretrain/Loss (Raw)": 2.3661720752716064, "Pretrain/Step": 3674, "Pretrain/Step Time": 8.455572336912155} +{"Pretrain/Learning Rate": 4.6609126110376035e-05, "Pretrain/Loss": 2.0572874546051025, "Pretrain/Loss (Raw)": 2.1084704399108887, "Pretrain/Step": 3675, "Pretrain/Step Time": 8.450745528563857} +{"Pretrain/Learning Rate": 4.66069910540225e-05, "Pretrain/Loss": 2.0576605796813965, "Pretrain/Loss (Raw)": 2.237070083618164, "Pretrain/Step": 3676, "Pretrain/Step Time": 8.451609157025814} +{"Pretrain/Learning Rate": 4.6604855374646605e-05, "Pretrain/Loss": 2.0545361042022705, "Pretrain/Loss (Raw)": 2.062253713607788, "Pretrain/Step": 3677, "Pretrain/Step Time": 8.452849738299847} +{"Pretrain/Learning Rate": 4.660271907230993e-05, "Pretrain/Loss": 2.054673671722412, "Pretrain/Loss (Raw)": 2.045224905014038, "Pretrain/Step": 3678, "Pretrain/Step Time": 8.452064774930477} +{"Pretrain/Learning Rate": 4.660058214707409e-05, "Pretrain/Loss": 2.053816318511963, "Pretrain/Loss (Raw)": 1.9933979511260986, "Pretrain/Step": 3679, "Pretrain/Step Time": 8.45476146414876} +{"Pretrain/Learning Rate": 4.6598444599000685e-05, "Pretrain/Loss": 2.052809953689575, "Pretrain/Loss (Raw)": 2.061575412750244, "Pretrain/Step": 3680, "Pretrain/Step Time": 8.449443651363254} +{"Pretrain/Learning Rate": 4.659630642815136e-05, "Pretrain/Loss": 2.052889108657837, "Pretrain/Loss (Raw)": 2.0153372287750244, "Pretrain/Step": 3681, "Pretrain/Step Time": 8.44652502797544} +{"Pretrain/Learning Rate": 4.659416763458776e-05, "Pretrain/Loss": 2.0537590980529785, "Pretrain/Loss (Raw)": 2.124601125717163, "Pretrain/Step": 3682, "Pretrain/Step Time": 8.443164806813002} +{"Pretrain/Learning Rate": 4.659202821837156e-05, "Pretrain/Loss": 2.0539989471435547, "Pretrain/Loss (Raw)": 2.097172498703003, "Pretrain/Step": 3683, "Pretrain/Step Time": 8.446816658601165} +{"Pretrain/Learning Rate": 4.6589888179564445e-05, "Pretrain/Loss": 2.0527334213256836, "Pretrain/Loss (Raw)": 1.8910417556762695, "Pretrain/Step": 3684, "Pretrain/Step Time": 8.441825304180384} +{"Pretrain/Learning Rate": 4.658774751822813e-05, "Pretrain/Loss": 2.051644802093506, "Pretrain/Loss (Raw)": 2.0555551052093506, "Pretrain/Step": 3685, "Pretrain/Step Time": 8.441715333610773} +{"Pretrain/Learning Rate": 4.658560623442433e-05, "Pretrain/Loss": 2.055117130279541, "Pretrain/Loss (Raw)": 2.3825697898864746, "Pretrain/Step": 3686, "Pretrain/Step Time": 8.445060458034277} +{"Pretrain/Learning Rate": 4.658346432821479e-05, "Pretrain/Loss": 2.0523102283477783, "Pretrain/Loss (Raw)": 1.5506129264831543, "Pretrain/Step": 3687, "Pretrain/Step Time": 8.443989733234048} +{"Pretrain/Learning Rate": 4.658132179966128e-05, "Pretrain/Loss": 2.051680088043213, "Pretrain/Loss (Raw)": 2.1851909160614014, "Pretrain/Step": 3688, "Pretrain/Step Time": 8.44445133395493} +{"Pretrain/Learning Rate": 4.657917864882556e-05, "Pretrain/Loss": 2.0486080646514893, "Pretrain/Loss (Raw)": 1.85361909866333, "Pretrain/Step": 3689, "Pretrain/Step Time": 8.441496841609478} +{"Pretrain/Learning Rate": 4.657703487576944e-05, "Pretrain/Loss": 2.049699306488037, "Pretrain/Loss (Raw)": 2.145008087158203, "Pretrain/Step": 3690, "Pretrain/Step Time": 8.442053562030196} +{"Pretrain/Learning Rate": 4.657489048055473e-05, "Pretrain/Loss": 2.0496468544006348, "Pretrain/Loss (Raw)": 2.1376848220825195, "Pretrain/Step": 3691, "Pretrain/Step Time": 8.44107998907566} +{"Pretrain/Learning Rate": 4.657274546324326e-05, "Pretrain/Loss": 2.048285961151123, "Pretrain/Loss (Raw)": 1.788823127746582, "Pretrain/Step": 3692, "Pretrain/Step Time": 8.444037791341543} +{"Pretrain/Learning Rate": 4.657059982389688e-05, "Pretrain/Loss": 2.0504672527313232, "Pretrain/Loss (Raw)": 2.2200686931610107, "Pretrain/Step": 3693, "Pretrain/Step Time": 8.442405328154564} +{"Pretrain/Learning Rate": 4.656845356257747e-05, "Pretrain/Loss": 2.0520403385162354, "Pretrain/Loss (Raw)": 2.0442416667938232, "Pretrain/Step": 3694, "Pretrain/Step Time": 8.440986385568976} +{"Pretrain/Learning Rate": 4.65663066793469e-05, "Pretrain/Loss": 2.0510993003845215, "Pretrain/Loss (Raw)": 2.0197396278381348, "Pretrain/Step": 3695, "Pretrain/Step Time": 8.442043939605355} +{"Pretrain/Learning Rate": 4.656415917426708e-05, "Pretrain/Loss": 2.0510430335998535, "Pretrain/Loss (Raw)": 2.053058385848999, "Pretrain/Step": 3696, "Pretrain/Step Time": 8.44266433082521} +{"Pretrain/Learning Rate": 4.656201104739993e-05, "Pretrain/Loss": 2.052238702774048, "Pretrain/Loss (Raw)": 2.1740915775299072, "Pretrain/Step": 3697, "Pretrain/Step Time": 8.441084422171116} +{"Pretrain/Learning Rate": 4.65598622988074e-05, "Pretrain/Loss": 2.0522613525390625, "Pretrain/Loss (Raw)": 2.130296230316162, "Pretrain/Step": 3698, "Pretrain/Step Time": 8.436464289203286} +{"Pretrain/Learning Rate": 4.655771292855143e-05, "Pretrain/Loss": 2.0528616905212402, "Pretrain/Loss (Raw)": 2.1074962615966797, "Pretrain/Step": 3699, "Pretrain/Step Time": 8.434473166242242} +{"Pretrain/Learning Rate": 4.655556293669401e-05, "Pretrain/Loss": 2.0537924766540527, "Pretrain/Loss (Raw)": 2.09336519241333, "Pretrain/Step": 3700, "Pretrain/Step Time": 8.439943322911859} +{"Pretrain/Learning Rate": 4.655341232329712e-05, "Pretrain/Loss": 2.0530099868774414, "Pretrain/Loss (Raw)": 1.9572479724884033, "Pretrain/Step": 3701, "Pretrain/Step Time": 8.441504241898656} +{"Pretrain/Learning Rate": 4.6551261088422795e-05, "Pretrain/Loss": 2.0512373447418213, "Pretrain/Loss (Raw)": 1.9920101165771484, "Pretrain/Step": 3702, "Pretrain/Step Time": 8.43802366219461} +{"Pretrain/Learning Rate": 4.6549109232133034e-05, "Pretrain/Loss": 2.053863286972046, "Pretrain/Loss (Raw)": 1.9808344841003418, "Pretrain/Step": 3703, "Pretrain/Step Time": 8.43986515328288} +{"Pretrain/Learning Rate": 4.6546956754489915e-05, "Pretrain/Loss": 2.0541574954986572, "Pretrain/Loss (Raw)": 2.0349204540252686, "Pretrain/Step": 3704, "Pretrain/Step Time": 8.438803967088461} +{"Pretrain/Learning Rate": 4.6544803655555475e-05, "Pretrain/Loss": 2.0512022972106934, "Pretrain/Loss (Raw)": 1.7835321426391602, "Pretrain/Step": 3705, "Pretrain/Step Time": 8.438586490228772} +{"Pretrain/Learning Rate": 4.654264993539181e-05, "Pretrain/Loss": 2.0509860515594482, "Pretrain/Loss (Raw)": 2.1515204906463623, "Pretrain/Step": 3706, "Pretrain/Step Time": 8.436647752299905} +{"Pretrain/Learning Rate": 4.654049559406103e-05, "Pretrain/Loss": 2.04864764213562, "Pretrain/Loss (Raw)": 1.9142440557479858, "Pretrain/Step": 3707, "Pretrain/Step Time": 8.440849276259542} +{"Pretrain/Learning Rate": 4.653834063162523e-05, "Pretrain/Loss": 2.0460479259490967, "Pretrain/Loss (Raw)": 1.9196490049362183, "Pretrain/Step": 3708, "Pretrain/Step Time": 8.438596922904253} +{"Pretrain/Learning Rate": 4.6536185048146575e-05, "Pretrain/Loss": 2.0448555946350098, "Pretrain/Loss (Raw)": 2.027564764022827, "Pretrain/Step": 3709, "Pretrain/Step Time": 8.436962617561221} +{"Pretrain/Learning Rate": 4.65340288436872e-05, "Pretrain/Loss": 2.045279026031494, "Pretrain/Loss (Raw)": 1.9718523025512695, "Pretrain/Step": 3710, "Pretrain/Step Time": 8.438361102715135} +{"Pretrain/Learning Rate": 4.6531872018309286e-05, "Pretrain/Loss": 2.0441246032714844, "Pretrain/Loss (Raw)": 2.0599803924560547, "Pretrain/Step": 3711, "Pretrain/Step Time": 8.437132567167282} +{"Pretrain/Learning Rate": 4.652971457207502e-05, "Pretrain/Loss": 2.0429301261901855, "Pretrain/Loss (Raw)": 1.9536635875701904, "Pretrain/Step": 3712, "Pretrain/Step Time": 8.435233946889639} +{"Pretrain/Learning Rate": 4.652755650504661e-05, "Pretrain/Loss": 2.0432944297790527, "Pretrain/Loss (Raw)": 2.272143840789795, "Pretrain/Step": 3713, "Pretrain/Step Time": 8.431826923042536} +{"Pretrain/Learning Rate": 4.652539781728629e-05, "Pretrain/Loss": 2.0442662239074707, "Pretrain/Loss (Raw)": 2.2586092948913574, "Pretrain/Step": 3714, "Pretrain/Step Time": 8.431955767795444} +{"Pretrain/Learning Rate": 4.6523238508856296e-05, "Pretrain/Loss": 2.0414223670959473, "Pretrain/Loss (Raw)": 1.9025771617889404, "Pretrain/Step": 3715, "Pretrain/Step Time": 8.428422702476382} +{"Pretrain/Learning Rate": 4.652107857981889e-05, "Pretrain/Loss": 2.0402355194091797, "Pretrain/Loss (Raw)": 1.885178565979004, "Pretrain/Step": 3716, "Pretrain/Step Time": 8.431781051680446} +{"Pretrain/Learning Rate": 4.651891803023636e-05, "Pretrain/Loss": 2.041482448577881, "Pretrain/Loss (Raw)": 2.0883352756500244, "Pretrain/Step": 3717, "Pretrain/Step Time": 8.432060148566961} +{"Pretrain/Learning Rate": 4.651675686017099e-05, "Pretrain/Loss": 2.03977370262146, "Pretrain/Loss (Raw)": 1.9840203523635864, "Pretrain/Step": 3718, "Pretrain/Step Time": 8.432388287037611} +{"Pretrain/Learning Rate": 4.6514595069685106e-05, "Pretrain/Loss": 2.0389699935913086, "Pretrain/Loss (Raw)": 1.8732593059539795, "Pretrain/Step": 3719, "Pretrain/Step Time": 8.432911163195968} +{"Pretrain/Learning Rate": 4.6512432658841044e-05, "Pretrain/Loss": 2.0387208461761475, "Pretrain/Loss (Raw)": 1.9156614542007446, "Pretrain/Step": 3720, "Pretrain/Step Time": 8.431658482179046} +{"Pretrain/Learning Rate": 4.6510269627701154e-05, "Pretrain/Loss": 2.036846160888672, "Pretrain/Loss (Raw)": 1.9270962476730347, "Pretrain/Step": 3721, "Pretrain/Step Time": 8.433229364454746} +{"Pretrain/Learning Rate": 4.65081059763278e-05, "Pretrain/Loss": 2.038800001144409, "Pretrain/Loss (Raw)": 2.216282606124878, "Pretrain/Step": 3722, "Pretrain/Step Time": 8.434898978099227} +{"Pretrain/Learning Rate": 4.650594170478337e-05, "Pretrain/Loss": 2.037076950073242, "Pretrain/Loss (Raw)": 1.9332202672958374, "Pretrain/Step": 3723, "Pretrain/Step Time": 8.437069995328784} +{"Pretrain/Learning Rate": 4.650377681313027e-05, "Pretrain/Loss": 2.0380191802978516, "Pretrain/Loss (Raw)": 2.1243722438812256, "Pretrain/Step": 3724, "Pretrain/Step Time": 8.437074348330498} +{"Pretrain/Learning Rate": 4.6501611301430924e-05, "Pretrain/Loss": 2.0380630493164062, "Pretrain/Loss (Raw)": 2.1407785415649414, "Pretrain/Step": 3725, "Pretrain/Step Time": 8.435210712254047} +{"Pretrain/Learning Rate": 4.649944516974778e-05, "Pretrain/Loss": 2.036424160003662, "Pretrain/Loss (Raw)": 1.9759101867675781, "Pretrain/Step": 3726, "Pretrain/Step Time": 8.433950578793883} +{"Pretrain/Learning Rate": 4.649727841814329e-05, "Pretrain/Loss": 2.034482479095459, "Pretrain/Loss (Raw)": 2.080141305923462, "Pretrain/Step": 3727, "Pretrain/Step Time": 8.435017948970199} +{"Pretrain/Learning Rate": 4.649511104667993e-05, "Pretrain/Loss": 2.036083698272705, "Pretrain/Loss (Raw)": 2.1375763416290283, "Pretrain/Step": 3728, "Pretrain/Step Time": 8.434490073472261} +{"Pretrain/Learning Rate": 4.6492943055420194e-05, "Pretrain/Loss": 2.0372631549835205, "Pretrain/Loss (Raw)": 2.084407329559326, "Pretrain/Step": 3729, "Pretrain/Step Time": 8.431360434740782} +{"Pretrain/Learning Rate": 4.64907744444266e-05, "Pretrain/Loss": 2.0419983863830566, "Pretrain/Loss (Raw)": 2.2021961212158203, "Pretrain/Step": 3730, "Pretrain/Step Time": 8.431419406086206} +{"Pretrain/Learning Rate": 4.6488605213761674e-05, "Pretrain/Loss": 2.0420544147491455, "Pretrain/Loss (Raw)": 2.0811269283294678, "Pretrain/Step": 3731, "Pretrain/Step Time": 8.422870572656393} +{"Pretrain/Learning Rate": 4.6486435363487965e-05, "Pretrain/Loss": 2.042837142944336, "Pretrain/Loss (Raw)": 1.8480002880096436, "Pretrain/Step": 3732, "Pretrain/Step Time": 8.42414323054254} +{"Pretrain/Learning Rate": 4.648426489366803e-05, "Pretrain/Loss": 2.0486271381378174, "Pretrain/Loss (Raw)": 2.696096658706665, "Pretrain/Step": 3733, "Pretrain/Step Time": 8.426117489114404} +{"Pretrain/Learning Rate": 4.6482093804364477e-05, "Pretrain/Loss": 2.0491983890533447, "Pretrain/Loss (Raw)": 2.0730738639831543, "Pretrain/Step": 3734, "Pretrain/Step Time": 8.42921213246882} +{"Pretrain/Learning Rate": 4.647992209563988e-05, "Pretrain/Loss": 2.048595428466797, "Pretrain/Loss (Raw)": 1.9188717603683472, "Pretrain/Step": 3735, "Pretrain/Step Time": 8.42851977236569} +{"Pretrain/Learning Rate": 4.647774976755688e-05, "Pretrain/Loss": 2.047560214996338, "Pretrain/Loss (Raw)": 1.9045823812484741, "Pretrain/Step": 3736, "Pretrain/Step Time": 8.434194380417466} +{"Pretrain/Learning Rate": 4.6475576820178114e-05, "Pretrain/Loss": 2.0471110343933105, "Pretrain/Loss (Raw)": 2.065793752670288, "Pretrain/Step": 3737, "Pretrain/Step Time": 8.428659783676267} +{"Pretrain/Learning Rate": 4.6473403253566214e-05, "Pretrain/Loss": 2.048185110092163, "Pretrain/Loss (Raw)": 2.1831185817718506, "Pretrain/Step": 3738, "Pretrain/Step Time": 8.430378487333655} +{"Pretrain/Learning Rate": 4.6471229067783875e-05, "Pretrain/Loss": 2.0466721057891846, "Pretrain/Loss (Raw)": 1.7653940916061401, "Pretrain/Step": 3739, "Pretrain/Step Time": 8.42904469370842} +{"Pretrain/Learning Rate": 4.6469054262893785e-05, "Pretrain/Loss": 2.0432281494140625, "Pretrain/Loss (Raw)": 2.057859420776367, "Pretrain/Step": 3740, "Pretrain/Step Time": 8.429648591205478} +{"Pretrain/Learning Rate": 4.646687883895864e-05, "Pretrain/Loss": 2.043311595916748, "Pretrain/Loss (Raw)": 1.9870821237564087, "Pretrain/Step": 3741, "Pretrain/Step Time": 8.428385065868497} +{"Pretrain/Learning Rate": 4.646470279604119e-05, "Pretrain/Loss": 2.0413084030151367, "Pretrain/Loss (Raw)": 1.9544459581375122, "Pretrain/Step": 3742, "Pretrain/Step Time": 8.426922585815191} +{"Pretrain/Learning Rate": 4.646252613420416e-05, "Pretrain/Loss": 2.0415987968444824, "Pretrain/Loss (Raw)": 2.0167229175567627, "Pretrain/Step": 3743, "Pretrain/Step Time": 8.432008365169168} +{"Pretrain/Learning Rate": 4.6460348853510314e-05, "Pretrain/Loss": 2.040867805480957, "Pretrain/Loss (Raw)": 2.0787241458892822, "Pretrain/Step": 3744, "Pretrain/Step Time": 8.428636094555259} +{"Pretrain/Learning Rate": 4.645817095402245e-05, "Pretrain/Loss": 2.040248155593872, "Pretrain/Loss (Raw)": 1.9733080863952637, "Pretrain/Step": 3745, "Pretrain/Step Time": 8.429820386692882} +{"Pretrain/Learning Rate": 4.645599243580334e-05, "Pretrain/Loss": 2.0410447120666504, "Pretrain/Loss (Raw)": 2.12095308303833, "Pretrain/Step": 3746, "Pretrain/Step Time": 8.426356298848987} +{"Pretrain/Learning Rate": 4.645381329891583e-05, "Pretrain/Loss": 2.04048490524292, "Pretrain/Loss (Raw)": 2.1735877990722656, "Pretrain/Step": 3747, "Pretrain/Step Time": 8.42395543679595} +{"Pretrain/Learning Rate": 4.6451633543422727e-05, "Pretrain/Loss": 2.038301467895508, "Pretrain/Loss (Raw)": 1.9492981433868408, "Pretrain/Step": 3748, "Pretrain/Step Time": 8.424988554790616} +{"Pretrain/Learning Rate": 4.644945316938689e-05, "Pretrain/Loss": 2.03773832321167, "Pretrain/Loss (Raw)": 1.8966336250305176, "Pretrain/Step": 3749, "Pretrain/Step Time": 8.426828105002642} +{"Pretrain/Learning Rate": 4.6447272176871194e-05, "Pretrain/Loss": 2.0382721424102783, "Pretrain/Loss (Raw)": 2.0728652477264404, "Pretrain/Step": 3750, "Pretrain/Step Time": 8.427503166720271} +{"Pretrain/Learning Rate": 4.6445090565938524e-05, "Pretrain/Loss": 2.0371599197387695, "Pretrain/Loss (Raw)": 1.8731995820999146, "Pretrain/Step": 3751, "Pretrain/Step Time": 8.42342745885253} +{"Pretrain/Learning Rate": 4.644290833665179e-05, "Pretrain/Loss": 2.036931276321411, "Pretrain/Loss (Raw)": 2.1742565631866455, "Pretrain/Step": 3752, "Pretrain/Step Time": 8.425621682778} +{"Pretrain/Learning Rate": 4.64407254890739e-05, "Pretrain/Loss": 2.036255359649658, "Pretrain/Loss (Raw)": 1.9608521461486816, "Pretrain/Step": 3753, "Pretrain/Step Time": 8.423396497964859} +{"Pretrain/Learning Rate": 4.643854202326782e-05, "Pretrain/Loss": 2.035121440887451, "Pretrain/Loss (Raw)": 2.0631227493286133, "Pretrain/Step": 3754, "Pretrain/Step Time": 8.421703990548849} +{"Pretrain/Learning Rate": 4.643635793929648e-05, "Pretrain/Loss": 2.034989356994629, "Pretrain/Loss (Raw)": 1.9621341228485107, "Pretrain/Step": 3755, "Pretrain/Step Time": 8.42449669726193} +{"Pretrain/Learning Rate": 4.6434173237222876e-05, "Pretrain/Loss": 2.035048007965088, "Pretrain/Loss (Raw)": 2.0449488162994385, "Pretrain/Step": 3756, "Pretrain/Step Time": 8.425718473270535} +{"Pretrain/Learning Rate": 4.6431987917110005e-05, "Pretrain/Loss": 2.0363497734069824, "Pretrain/Loss (Raw)": 2.0551862716674805, "Pretrain/Step": 3757, "Pretrain/Step Time": 8.42632564343512} +{"Pretrain/Learning Rate": 4.6429801979020863e-05, "Pretrain/Loss": 2.0372934341430664, "Pretrain/Loss (Raw)": 2.158154249191284, "Pretrain/Step": 3758, "Pretrain/Step Time": 8.423755628988147} +{"Pretrain/Learning Rate": 4.642761542301849e-05, "Pretrain/Loss": 2.038463592529297, "Pretrain/Loss (Raw)": 2.034303903579712, "Pretrain/Step": 3759, "Pretrain/Step Time": 8.42810402624309} +{"Pretrain/Learning Rate": 4.642542824916592e-05, "Pretrain/Loss": 2.038339138031006, "Pretrain/Loss (Raw)": 2.0927305221557617, "Pretrain/Step": 3760, "Pretrain/Step Time": 8.424816006794572} +{"Pretrain/Learning Rate": 4.642324045752625e-05, "Pretrain/Loss": 2.037372589111328, "Pretrain/Loss (Raw)": 1.988760232925415, "Pretrain/Step": 3761, "Pretrain/Step Time": 8.427627421915531} +{"Pretrain/Learning Rate": 4.6421052048162534e-05, "Pretrain/Loss": 2.0374183654785156, "Pretrain/Loss (Raw)": 2.0720574855804443, "Pretrain/Step": 3762, "Pretrain/Step Time": 8.424768377095461} +{"Pretrain/Learning Rate": 4.641886302113788e-05, "Pretrain/Loss": 2.0369009971618652, "Pretrain/Loss (Raw)": 2.0689218044281006, "Pretrain/Step": 3763, "Pretrain/Step Time": 8.417888771742582} +{"Pretrain/Learning Rate": 4.641667337651542e-05, "Pretrain/Loss": 2.0372681617736816, "Pretrain/Loss (Raw)": 2.12658953666687, "Pretrain/Step": 3764, "Pretrain/Step Time": 8.419417766854167} +{"Pretrain/Learning Rate": 4.641448311435828e-05, "Pretrain/Loss": 2.0355539321899414, "Pretrain/Loss (Raw)": 1.865779161453247, "Pretrain/Step": 3765, "Pretrain/Step Time": 8.422038238495588} +{"Pretrain/Learning Rate": 4.64122922347296e-05, "Pretrain/Loss": 2.03666353225708, "Pretrain/Loss (Raw)": 2.1591649055480957, "Pretrain/Step": 3766, "Pretrain/Step Time": 8.422270890325308} +{"Pretrain/Learning Rate": 4.641010073769258e-05, "Pretrain/Loss": 2.0389175415039062, "Pretrain/Loss (Raw)": 2.209005832672119, "Pretrain/Step": 3767, "Pretrain/Step Time": 8.419489372521639} +{"Pretrain/Learning Rate": 4.64079086233104e-05, "Pretrain/Loss": 2.0390267372131348, "Pretrain/Loss (Raw)": 2.1422274112701416, "Pretrain/Step": 3768, "Pretrain/Step Time": 8.423574956133962} +{"Pretrain/Learning Rate": 4.6405715891646264e-05, "Pretrain/Loss": 2.0397348403930664, "Pretrain/Loss (Raw)": 2.1623988151550293, "Pretrain/Step": 3769, "Pretrain/Step Time": 8.423982301726937} +{"Pretrain/Learning Rate": 4.6403522542763396e-05, "Pretrain/Loss": 2.0392813682556152, "Pretrain/Loss (Raw)": 2.01381778717041, "Pretrain/Step": 3770, "Pretrain/Step Time": 8.420505283400416} +{"Pretrain/Learning Rate": 4.6401328576725044e-05, "Pretrain/Loss": 2.0408267974853516, "Pretrain/Loss (Raw)": 2.061619281768799, "Pretrain/Step": 3771, "Pretrain/Step Time": 8.423946494236588} +{"Pretrain/Learning Rate": 4.639913399359448e-05, "Pretrain/Loss": 2.039102554321289, "Pretrain/Loss (Raw)": 1.959194302558899, "Pretrain/Step": 3772, "Pretrain/Step Time": 8.420776633545756} +{"Pretrain/Learning Rate": 4.6396938793434966e-05, "Pretrain/Loss": 2.0369250774383545, "Pretrain/Loss (Raw)": 1.6846541166305542, "Pretrain/Step": 3773, "Pretrain/Step Time": 8.422956200316548} +{"Pretrain/Learning Rate": 4.63947429763098e-05, "Pretrain/Loss": 2.035335063934326, "Pretrain/Loss (Raw)": 1.9231101274490356, "Pretrain/Step": 3774, "Pretrain/Step Time": 8.422399207949638} +{"Pretrain/Learning Rate": 4.639254654228231e-05, "Pretrain/Loss": 2.034891128540039, "Pretrain/Loss (Raw)": 2.024042844772339, "Pretrain/Step": 3775, "Pretrain/Step Time": 8.421413764357567} +{"Pretrain/Learning Rate": 4.6390349491415817e-05, "Pretrain/Loss": 2.037353038787842, "Pretrain/Loss (Raw)": 1.9802073240280151, "Pretrain/Step": 3776, "Pretrain/Step Time": 8.422011956572533} +{"Pretrain/Learning Rate": 4.638815182377368e-05, "Pretrain/Loss": 2.039752721786499, "Pretrain/Loss (Raw)": 2.2623281478881836, "Pretrain/Step": 3777, "Pretrain/Step Time": 8.421736041083932} +{"Pretrain/Learning Rate": 4.6385953539419255e-05, "Pretrain/Loss": 2.038587808609009, "Pretrain/Loss (Raw)": 2.0398950576782227, "Pretrain/Step": 3778, "Pretrain/Step Time": 8.423306940123439} +{"Pretrain/Learning Rate": 4.6383754638415944e-05, "Pretrain/Loss": 2.037912368774414, "Pretrain/Loss (Raw)": 1.8059124946594238, "Pretrain/Step": 3779, "Pretrain/Step Time": 8.416268318891525} +{"Pretrain/Learning Rate": 4.638155512082714e-05, "Pretrain/Loss": 2.040294647216797, "Pretrain/Loss (Raw)": 2.3365323543548584, "Pretrain/Step": 3780, "Pretrain/Step Time": 8.417240304872394} +{"Pretrain/Learning Rate": 4.637935498671627e-05, "Pretrain/Loss": 2.041874647140503, "Pretrain/Loss (Raw)": 2.1162102222442627, "Pretrain/Step": 3781, "Pretrain/Step Time": 8.418647453188896} +{"Pretrain/Learning Rate": 4.637715423614677e-05, "Pretrain/Loss": 2.0401511192321777, "Pretrain/Loss (Raw)": 1.8006879091262817, "Pretrain/Step": 3782, "Pretrain/Step Time": 8.420958586037159} +{"Pretrain/Learning Rate": 4.6374952869182084e-05, "Pretrain/Loss": 2.040792465209961, "Pretrain/Loss (Raw)": 2.087181329727173, "Pretrain/Step": 3783, "Pretrain/Step Time": 8.420010747388005} +{"Pretrain/Learning Rate": 4.637275088588572e-05, "Pretrain/Loss": 2.0421271324157715, "Pretrain/Loss (Raw)": 2.1214232444763184, "Pretrain/Step": 3784, "Pretrain/Step Time": 8.421283917501569} +{"Pretrain/Learning Rate": 4.6370548286321135e-05, "Pretrain/Loss": 2.041057586669922, "Pretrain/Loss (Raw)": 2.0321624279022217, "Pretrain/Step": 3785, "Pretrain/Step Time": 8.416345711797476} +{"Pretrain/Learning Rate": 4.6368345070551865e-05, "Pretrain/Loss": 2.0405328273773193, "Pretrain/Loss (Raw)": 1.9319896697998047, "Pretrain/Step": 3786, "Pretrain/Step Time": 8.41693951189518} +{"Pretrain/Learning Rate": 4.6366141238641425e-05, "Pretrain/Loss": 2.041491746902466, "Pretrain/Loss (Raw)": 2.2586655616760254, "Pretrain/Step": 3787, "Pretrain/Step Time": 8.416183970868587} +{"Pretrain/Learning Rate": 4.6363936790653374e-05, "Pretrain/Loss": 2.044480562210083, "Pretrain/Loss (Raw)": 2.3007757663726807, "Pretrain/Step": 3788, "Pretrain/Step Time": 8.419775698333979} +{"Pretrain/Learning Rate": 4.6361731726651254e-05, "Pretrain/Loss": 2.044410467147827, "Pretrain/Loss (Raw)": 2.025750160217285, "Pretrain/Step": 3789, "Pretrain/Step Time": 8.419830739498138} +{"Pretrain/Learning Rate": 4.635952604669867e-05, "Pretrain/Loss": 2.0453672409057617, "Pretrain/Loss (Raw)": 2.080711841583252, "Pretrain/Step": 3790, "Pretrain/Step Time": 8.418924460187554} +{"Pretrain/Learning Rate": 4.6357319750859196e-05, "Pretrain/Loss": 2.044508934020996, "Pretrain/Loss (Raw)": 2.048557758331299, "Pretrain/Step": 3791, "Pretrain/Step Time": 8.419252503663301} +{"Pretrain/Learning Rate": 4.635511283919647e-05, "Pretrain/Loss": 2.046806812286377, "Pretrain/Loss (Raw)": 2.1433298587799072, "Pretrain/Step": 3792, "Pretrain/Step Time": 8.418119311332703} +{"Pretrain/Learning Rate": 4.635290531177412e-05, "Pretrain/Loss": 2.043389081954956, "Pretrain/Loss (Raw)": 1.8140738010406494, "Pretrain/Step": 3793, "Pretrain/Step Time": 8.424520757049322} +{"Pretrain/Learning Rate": 4.6350697168655795e-05, "Pretrain/Loss": 2.041954517364502, "Pretrain/Loss (Raw)": 2.0118601322174072, "Pretrain/Step": 3794, "Pretrain/Step Time": 8.424419490620494} +{"Pretrain/Learning Rate": 4.634848840990517e-05, "Pretrain/Loss": 2.0443248748779297, "Pretrain/Loss (Raw)": 2.2623066902160645, "Pretrain/Step": 3795, "Pretrain/Step Time": 8.422958640381694} +{"Pretrain/Learning Rate": 4.634627903558593e-05, "Pretrain/Loss": 2.046196460723877, "Pretrain/Loss (Raw)": 2.084205150604248, "Pretrain/Step": 3796, "Pretrain/Step Time": 8.425041513517499} +{"Pretrain/Learning Rate": 4.6344069045761786e-05, "Pretrain/Loss": 2.048879623413086, "Pretrain/Loss (Raw)": 2.258944034576416, "Pretrain/Step": 3797, "Pretrain/Step Time": 8.41880152747035} +{"Pretrain/Learning Rate": 4.634185844049646e-05, "Pretrain/Loss": 2.0484185218811035, "Pretrain/Loss (Raw)": 2.098114490509033, "Pretrain/Step": 3798, "Pretrain/Step Time": 8.420264400541782} +{"Pretrain/Learning Rate": 4.6339647219853684e-05, "Pretrain/Loss": 2.050546169281006, "Pretrain/Loss (Raw)": 2.154937505722046, "Pretrain/Step": 3799, "Pretrain/Step Time": 8.419966731220484} +{"Pretrain/Learning Rate": 4.633743538389723e-05, "Pretrain/Loss": 2.0506839752197266, "Pretrain/Loss (Raw)": 2.069838523864746, "Pretrain/Step": 3800, "Pretrain/Step Time": 8.419495895504951} +{"Pretrain/Learning Rate": 4.633522293269086e-05, "Pretrain/Loss": 2.051945209503174, "Pretrain/Loss (Raw)": 2.1320881843566895, "Pretrain/Step": 3801, "Pretrain/Step Time": 8.417698020115495} +{"Pretrain/Learning Rate": 4.633300986629838e-05, "Pretrain/Loss": 2.049203395843506, "Pretrain/Loss (Raw)": 2.0152037143707275, "Pretrain/Step": 3802, "Pretrain/Step Time": 8.420073485001922} +{"Pretrain/Learning Rate": 4.633079618478361e-05, "Pretrain/Loss": 2.04925799369812, "Pretrain/Loss (Raw)": 2.115464448928833, "Pretrain/Step": 3803, "Pretrain/Step Time": 8.417928194627166} +{"Pretrain/Learning Rate": 4.632858188821035e-05, "Pretrain/Loss": 2.048746109008789, "Pretrain/Loss (Raw)": 2.171570062637329, "Pretrain/Step": 3804, "Pretrain/Step Time": 8.423756178468466} +{"Pretrain/Learning Rate": 4.632636697664249e-05, "Pretrain/Loss": 2.0492043495178223, "Pretrain/Loss (Raw)": 2.1209118366241455, "Pretrain/Step": 3805, "Pretrain/Step Time": 8.42330101504922} +{"Pretrain/Learning Rate": 4.6324151450143854e-05, "Pretrain/Loss": 2.0474390983581543, "Pretrain/Loss (Raw)": 1.8192733526229858, "Pretrain/Step": 3806, "Pretrain/Step Time": 8.426830191165209} +{"Pretrain/Learning Rate": 4.632193530877835e-05, "Pretrain/Loss": 2.0474910736083984, "Pretrain/Loss (Raw)": 2.0000522136688232, "Pretrain/Step": 3807, "Pretrain/Step Time": 8.425562115386128} +{"Pretrain/Learning Rate": 4.631971855260987e-05, "Pretrain/Loss": 2.047508716583252, "Pretrain/Loss (Raw)": 2.0638437271118164, "Pretrain/Step": 3808, "Pretrain/Step Time": 8.425739960744977} +{"Pretrain/Learning Rate": 4.631750118170234e-05, "Pretrain/Loss": 2.053117036819458, "Pretrain/Loss (Raw)": 2.733191728591919, "Pretrain/Step": 3809, "Pretrain/Step Time": 8.427043221890926} +{"Pretrain/Learning Rate": 4.6315283196119685e-05, "Pretrain/Loss": 2.054302453994751, "Pretrain/Loss (Raw)": 2.2763118743896484, "Pretrain/Step": 3810, "Pretrain/Step Time": 8.424194172024727} +{"Pretrain/Learning Rate": 4.631306459592587e-05, "Pretrain/Loss": 2.0537123680114746, "Pretrain/Loss (Raw)": 2.0216567516326904, "Pretrain/Step": 3811, "Pretrain/Step Time": 8.42511347308755} +{"Pretrain/Learning Rate": 4.631084538118486e-05, "Pretrain/Loss": 2.0552189350128174, "Pretrain/Loss (Raw)": 2.083881139755249, "Pretrain/Step": 3812, "Pretrain/Step Time": 8.426060281693935} +{"Pretrain/Learning Rate": 4.630862555196065e-05, "Pretrain/Loss": 2.058244466781616, "Pretrain/Loss (Raw)": 2.4428083896636963, "Pretrain/Step": 3813, "Pretrain/Step Time": 8.42207107692957} +{"Pretrain/Learning Rate": 4.630640510831724e-05, "Pretrain/Loss": 2.0549557209014893, "Pretrain/Loss (Raw)": 1.961626648902893, "Pretrain/Step": 3814, "Pretrain/Step Time": 8.42140262387693} +{"Pretrain/Learning Rate": 4.6304184050318655e-05, "Pretrain/Loss": 2.0585992336273193, "Pretrain/Loss (Raw)": 2.0169785022735596, "Pretrain/Step": 3815, "Pretrain/Step Time": 8.418591184541583} +{"Pretrain/Learning Rate": 4.630196237802895e-05, "Pretrain/Loss": 2.0580742359161377, "Pretrain/Loss (Raw)": 2.117992877960205, "Pretrain/Step": 3816, "Pretrain/Step Time": 8.4214221034199} +{"Pretrain/Learning Rate": 4.629974009151217e-05, "Pretrain/Loss": 2.059274911880493, "Pretrain/Loss (Raw)": 2.0073118209838867, "Pretrain/Step": 3817, "Pretrain/Step Time": 8.424818841740489} +{"Pretrain/Learning Rate": 4.6297517190832405e-05, "Pretrain/Loss": 2.059035539627075, "Pretrain/Loss (Raw)": 2.114335536956787, "Pretrain/Step": 3818, "Pretrain/Step Time": 8.424181433394551} +{"Pretrain/Learning Rate": 4.629529367605374e-05, "Pretrain/Loss": 2.0583274364471436, "Pretrain/Loss (Raw)": 2.0470635890960693, "Pretrain/Step": 3819, "Pretrain/Step Time": 8.422270901501179} +{"Pretrain/Learning Rate": 4.62930695472403e-05, "Pretrain/Loss": 2.059271812438965, "Pretrain/Loss (Raw)": 1.9097100496292114, "Pretrain/Step": 3820, "Pretrain/Step Time": 8.423124870285392} +{"Pretrain/Learning Rate": 4.629084480445621e-05, "Pretrain/Loss": 2.057816743850708, "Pretrain/Loss (Raw)": 2.0338263511657715, "Pretrain/Step": 3821, "Pretrain/Step Time": 8.424138110131025} +{"Pretrain/Learning Rate": 4.628861944776561e-05, "Pretrain/Loss": 2.057351589202881, "Pretrain/Loss (Raw)": 1.9846930503845215, "Pretrain/Step": 3822, "Pretrain/Step Time": 8.42794798873365} +{"Pretrain/Learning Rate": 4.628639347723268e-05, "Pretrain/Loss": 2.057899236679077, "Pretrain/Loss (Raw)": 2.089827299118042, "Pretrain/Step": 3823, "Pretrain/Step Time": 8.42566811479628} +{"Pretrain/Learning Rate": 4.628416689292161e-05, "Pretrain/Loss": 2.058103084564209, "Pretrain/Loss (Raw)": 2.0791633129119873, "Pretrain/Step": 3824, "Pretrain/Step Time": 8.4264330919832} +{"Pretrain/Learning Rate": 4.628193969489658e-05, "Pretrain/Loss": 2.056518793106079, "Pretrain/Loss (Raw)": 1.9712989330291748, "Pretrain/Step": 3825, "Pretrain/Step Time": 8.427052587270737} +{"Pretrain/Learning Rate": 4.627971188322183e-05, "Pretrain/Loss": 2.055227279663086, "Pretrain/Loss (Raw)": 1.9649767875671387, "Pretrain/Step": 3826, "Pretrain/Step Time": 8.431424679234624} +{"Pretrain/Learning Rate": 4.627748345796158e-05, "Pretrain/Loss": 2.0559661388397217, "Pretrain/Loss (Raw)": 2.2020981311798096, "Pretrain/Step": 3827, "Pretrain/Step Time": 8.434192165732384} +{"Pretrain/Learning Rate": 4.62752544191801e-05, "Pretrain/Loss": 2.056835174560547, "Pretrain/Loss (Raw)": 2.204564332962036, "Pretrain/Step": 3828, "Pretrain/Step Time": 8.426287397742271} +{"Pretrain/Learning Rate": 4.627302476694166e-05, "Pretrain/Loss": 2.0572597980499268, "Pretrain/Loss (Raw)": 2.011624336242676, "Pretrain/Step": 3829, "Pretrain/Step Time": 8.424817634746432} +{"Pretrain/Learning Rate": 4.627079450131054e-05, "Pretrain/Loss": 2.057041645050049, "Pretrain/Loss (Raw)": 1.964082956314087, "Pretrain/Step": 3830, "Pretrain/Step Time": 8.426327217370272} +{"Pretrain/Learning Rate": 4.626856362235106e-05, "Pretrain/Loss": 2.0565476417541504, "Pretrain/Loss (Raw)": 1.9175922870635986, "Pretrain/Step": 3831, "Pretrain/Step Time": 8.425141669809818} +{"Pretrain/Learning Rate": 4.6266332130127546e-05, "Pretrain/Loss": 2.054751396179199, "Pretrain/Loss (Raw)": 1.8049923181533813, "Pretrain/Step": 3832, "Pretrain/Step Time": 8.42230162769556} +{"Pretrain/Learning Rate": 4.626410002470433e-05, "Pretrain/Loss": 2.0556063652038574, "Pretrain/Loss (Raw)": 1.8929924964904785, "Pretrain/Step": 3833, "Pretrain/Step Time": 8.42410539649427} +{"Pretrain/Learning Rate": 4.6261867306145776e-05, "Pretrain/Loss": 2.0560364723205566, "Pretrain/Loss (Raw)": 2.2065682411193848, "Pretrain/Step": 3834, "Pretrain/Step Time": 8.426753424108028} +{"Pretrain/Learning Rate": 4.625963397451627e-05, "Pretrain/Loss": 2.058318853378296, "Pretrain/Loss (Raw)": 2.206392765045166, "Pretrain/Step": 3835, "Pretrain/Step Time": 8.422322357073426} +{"Pretrain/Learning Rate": 4.625740002988021e-05, "Pretrain/Loss": 2.0576343536376953, "Pretrain/Loss (Raw)": 1.8320200443267822, "Pretrain/Step": 3836, "Pretrain/Step Time": 8.426520267501473} +{"Pretrain/Learning Rate": 4.6255165472301995e-05, "Pretrain/Loss": 2.0578393936157227, "Pretrain/Loss (Raw)": 2.05381178855896, "Pretrain/Step": 3837, "Pretrain/Step Time": 8.421809079125524} +{"Pretrain/Learning Rate": 4.625293030184608e-05, "Pretrain/Loss": 2.0592949390411377, "Pretrain/Loss (Raw)": 2.158179521560669, "Pretrain/Step": 3838, "Pretrain/Step Time": 8.42450213059783} +{"Pretrain/Learning Rate": 4.62506945185769e-05, "Pretrain/Loss": 2.059800148010254, "Pretrain/Loss (Raw)": 2.1246297359466553, "Pretrain/Step": 3839, "Pretrain/Step Time": 8.427375866100192} +{"Pretrain/Learning Rate": 4.624845812255892e-05, "Pretrain/Loss": 2.0614876747131348, "Pretrain/Loss (Raw)": 2.169675350189209, "Pretrain/Step": 3840, "Pretrain/Step Time": 8.425659719854593} +{"Pretrain/Learning Rate": 4.624622111385663e-05, "Pretrain/Loss": 2.0606210231781006, "Pretrain/Loss (Raw)": 2.1611955165863037, "Pretrain/Step": 3841, "Pretrain/Step Time": 8.42929146438837} +{"Pretrain/Learning Rate": 4.6243983492534534e-05, "Pretrain/Loss": 2.0614819526672363, "Pretrain/Loss (Raw)": 2.3688242435455322, "Pretrain/Step": 3842, "Pretrain/Step Time": 8.426189914345741} +{"Pretrain/Learning Rate": 4.624174525865715e-05, "Pretrain/Loss": 2.0648930072784424, "Pretrain/Loss (Raw)": 2.3392133712768555, "Pretrain/Step": 3843, "Pretrain/Step Time": 8.428071470931172} +{"Pretrain/Learning Rate": 4.623950641228901e-05, "Pretrain/Loss": 2.0659358501434326, "Pretrain/Loss (Raw)": 2.0186314582824707, "Pretrain/Step": 3844, "Pretrain/Step Time": 8.424834802746773} +{"Pretrain/Learning Rate": 4.623726695349469e-05, "Pretrain/Loss": 2.06522798538208, "Pretrain/Loss (Raw)": 1.9977519512176514, "Pretrain/Step": 3845, "Pretrain/Step Time": 8.423399895429611} +{"Pretrain/Learning Rate": 4.623502688233873e-05, "Pretrain/Loss": 2.065857410430908, "Pretrain/Loss (Raw)": 2.0645711421966553, "Pretrain/Step": 3846, "Pretrain/Step Time": 8.42566642910242} +{"Pretrain/Learning Rate": 4.6232786198885746e-05, "Pretrain/Loss": 2.0667648315429688, "Pretrain/Loss (Raw)": 1.9893898963928223, "Pretrain/Step": 3847, "Pretrain/Step Time": 8.423285868018866} +{"Pretrain/Learning Rate": 4.623054490320034e-05, "Pretrain/Loss": 2.0658254623413086, "Pretrain/Loss (Raw)": 1.7954188585281372, "Pretrain/Step": 3848, "Pretrain/Step Time": 8.428270487114787} +{"Pretrain/Learning Rate": 4.622830299534715e-05, "Pretrain/Loss": 2.0669705867767334, "Pretrain/Loss (Raw)": 2.0736868381500244, "Pretrain/Step": 3849, "Pretrain/Step Time": 8.429305229336023} +{"Pretrain/Learning Rate": 4.6226060475390796e-05, "Pretrain/Loss": 2.066005229949951, "Pretrain/Loss (Raw)": 2.092693328857422, "Pretrain/Step": 3850, "Pretrain/Step Time": 8.430386373773217} +{"Pretrain/Learning Rate": 4.6223817343395955e-05, "Pretrain/Loss": 2.067767858505249, "Pretrain/Loss (Raw)": 2.1588799953460693, "Pretrain/Step": 3851, "Pretrain/Step Time": 8.42793128080666} +{"Pretrain/Learning Rate": 4.6221573599427305e-05, "Pretrain/Loss": 2.0684590339660645, "Pretrain/Loss (Raw)": 2.2128355503082275, "Pretrain/Step": 3852, "Pretrain/Step Time": 8.42926912382245} +{"Pretrain/Learning Rate": 4.621932924354954e-05, "Pretrain/Loss": 2.0684261322021484, "Pretrain/Loss (Raw)": 2.1365747451782227, "Pretrain/Step": 3853, "Pretrain/Step Time": 8.42649943754077} +{"Pretrain/Learning Rate": 4.6217084275827366e-05, "Pretrain/Loss": 2.070006847381592, "Pretrain/Loss (Raw)": 2.178239107131958, "Pretrain/Step": 3854, "Pretrain/Step Time": 8.429946707561612} +{"Pretrain/Learning Rate": 4.621483869632553e-05, "Pretrain/Loss": 2.0700278282165527, "Pretrain/Loss (Raw)": 2.0828237533569336, "Pretrain/Step": 3855, "Pretrain/Step Time": 8.433904148638248} +{"Pretrain/Learning Rate": 4.6212592505108776e-05, "Pretrain/Loss": 2.070054531097412, "Pretrain/Loss (Raw)": 2.1409847736358643, "Pretrain/Step": 3856, "Pretrain/Step Time": 8.432172551751137} +{"Pretrain/Learning Rate": 4.621034570224187e-05, "Pretrain/Loss": 2.0682590007781982, "Pretrain/Loss (Raw)": 1.8545695543289185, "Pretrain/Step": 3857, "Pretrain/Step Time": 8.433378482237458} +{"Pretrain/Learning Rate": 4.6208098287789605e-05, "Pretrain/Loss": 2.0675511360168457, "Pretrain/Loss (Raw)": 2.111605405807495, "Pretrain/Step": 3858, "Pretrain/Step Time": 8.438728362321854} +{"Pretrain/Learning Rate": 4.620585026181676e-05, "Pretrain/Loss": 2.067579984664917, "Pretrain/Loss (Raw)": 2.0848183631896973, "Pretrain/Step": 3859, "Pretrain/Step Time": 8.441639797762036} +{"Pretrain/Learning Rate": 4.6203601624388184e-05, "Pretrain/Loss": 2.065603733062744, "Pretrain/Loss (Raw)": 1.5950368642807007, "Pretrain/Step": 3860, "Pretrain/Step Time": 8.4346889462322} +{"Pretrain/Learning Rate": 4.6201352375568706e-05, "Pretrain/Loss": 2.061706066131592, "Pretrain/Loss (Raw)": 2.197225570678711, "Pretrain/Step": 3861, "Pretrain/Step Time": 8.431868178769946} +{"Pretrain/Learning Rate": 4.6199102515423175e-05, "Pretrain/Loss": 2.0622007846832275, "Pretrain/Loss (Raw)": 2.136376142501831, "Pretrain/Step": 3862, "Pretrain/Step Time": 8.430187055841088} +{"Pretrain/Learning Rate": 4.619685204401647e-05, "Pretrain/Loss": 2.0653748512268066, "Pretrain/Loss (Raw)": 2.325120210647583, "Pretrain/Step": 3863, "Pretrain/Step Time": 8.428481820970774} +{"Pretrain/Learning Rate": 4.619460096141347e-05, "Pretrain/Loss": 2.066559076309204, "Pretrain/Loss (Raw)": 2.056196689605713, "Pretrain/Step": 3864, "Pretrain/Step Time": 8.42705244384706} +{"Pretrain/Learning Rate": 4.61923492676791e-05, "Pretrain/Loss": 2.065545082092285, "Pretrain/Loss (Raw)": 1.9360029697418213, "Pretrain/Step": 3865, "Pretrain/Step Time": 8.429728012531996} +{"Pretrain/Learning Rate": 4.619009696287827e-05, "Pretrain/Loss": 2.0663888454437256, "Pretrain/Loss (Raw)": 2.2910966873168945, "Pretrain/Step": 3866, "Pretrain/Step Time": 8.43270787037909} +{"Pretrain/Learning Rate": 4.618784404707594e-05, "Pretrain/Loss": 2.069160223007202, "Pretrain/Loss (Raw)": 2.120124101638794, "Pretrain/Step": 3867, "Pretrain/Step Time": 8.431172993034124} +{"Pretrain/Learning Rate": 4.618559052033706e-05, "Pretrain/Loss": 2.0704853534698486, "Pretrain/Loss (Raw)": 2.227482795715332, "Pretrain/Step": 3868, "Pretrain/Step Time": 8.43699044175446} +{"Pretrain/Learning Rate": 4.618333638272661e-05, "Pretrain/Loss": 2.073996067047119, "Pretrain/Loss (Raw)": 2.436488389968872, "Pretrain/Step": 3869, "Pretrain/Step Time": 8.435925608500838} +{"Pretrain/Learning Rate": 4.61810816343096e-05, "Pretrain/Loss": 2.074413776397705, "Pretrain/Loss (Raw)": 2.007906913757324, "Pretrain/Step": 3870, "Pretrain/Step Time": 8.436227632686496} +{"Pretrain/Learning Rate": 4.617882627515102e-05, "Pretrain/Loss": 2.074193000793457, "Pretrain/Loss (Raw)": 1.9884364604949951, "Pretrain/Step": 3871, "Pretrain/Step Time": 8.436984710395336} +{"Pretrain/Learning Rate": 4.6176570305315925e-05, "Pretrain/Loss": 2.0732619762420654, "Pretrain/Loss (Raw)": 1.9595704078674316, "Pretrain/Step": 3872, "Pretrain/Step Time": 8.438512586057186} +{"Pretrain/Learning Rate": 4.617431372486935e-05, "Pretrain/Loss": 2.07468318939209, "Pretrain/Loss (Raw)": 2.1552000045776367, "Pretrain/Step": 3873, "Pretrain/Step Time": 8.439414558932185} +{"Pretrain/Learning Rate": 4.617205653387636e-05, "Pretrain/Loss": 2.074711561203003, "Pretrain/Loss (Raw)": 2.1245861053466797, "Pretrain/Step": 3874, "Pretrain/Step Time": 8.443566638976336} +{"Pretrain/Learning Rate": 4.616979873240205e-05, "Pretrain/Loss": 2.0736501216888428, "Pretrain/Loss (Raw)": 2.0377426147460938, "Pretrain/Step": 3875, "Pretrain/Step Time": 8.442254800349474} +{"Pretrain/Learning Rate": 4.616754032051152e-05, "Pretrain/Loss": 2.0739798545837402, "Pretrain/Loss (Raw)": 1.991495966911316, "Pretrain/Step": 3876, "Pretrain/Step Time": 8.438286025077105} +{"Pretrain/Learning Rate": 4.616528129826988e-05, "Pretrain/Loss": 2.0749354362487793, "Pretrain/Loss (Raw)": 2.0189387798309326, "Pretrain/Step": 3877, "Pretrain/Step Time": 8.436741527169943} +{"Pretrain/Learning Rate": 4.616302166574227e-05, "Pretrain/Loss": 2.0755951404571533, "Pretrain/Loss (Raw)": 2.1573126316070557, "Pretrain/Step": 3878, "Pretrain/Step Time": 8.436079576611519} +{"Pretrain/Learning Rate": 4.616076142299386e-05, "Pretrain/Loss": 2.075387477874756, "Pretrain/Loss (Raw)": 1.8466187715530396, "Pretrain/Step": 3879, "Pretrain/Step Time": 8.437230726704001} +{"Pretrain/Learning Rate": 4.615850057008981e-05, "Pretrain/Loss": 2.0730509757995605, "Pretrain/Loss (Raw)": 1.875208854675293, "Pretrain/Step": 3880, "Pretrain/Step Time": 8.434388417750597} +{"Pretrain/Learning Rate": 4.615623910709531e-05, "Pretrain/Loss": 2.0726728439331055, "Pretrain/Loss (Raw)": 1.9124464988708496, "Pretrain/Step": 3881, "Pretrain/Step Time": 8.431279946118593} +{"Pretrain/Learning Rate": 4.615397703407557e-05, "Pretrain/Loss": 2.0706324577331543, "Pretrain/Loss (Raw)": 1.801925539970398, "Pretrain/Step": 3882, "Pretrain/Step Time": 8.438331592828035} +{"Pretrain/Learning Rate": 4.6151714351095806e-05, "Pretrain/Loss": 2.0720760822296143, "Pretrain/Loss (Raw)": 2.1469171047210693, "Pretrain/Step": 3883, "Pretrain/Step Time": 8.43178203701973} +{"Pretrain/Learning Rate": 4.6149451058221286e-05, "Pretrain/Loss": 2.0731940269470215, "Pretrain/Loss (Raw)": 2.1880416870117188, "Pretrain/Step": 3884, "Pretrain/Step Time": 8.43041013367474} +{"Pretrain/Learning Rate": 4.6147187155517243e-05, "Pretrain/Loss": 2.0730674266815186, "Pretrain/Loss (Raw)": 2.0390005111694336, "Pretrain/Step": 3885, "Pretrain/Step Time": 8.431161250919104} +{"Pretrain/Learning Rate": 4.614492264304897e-05, "Pretrain/Loss": 2.0708465576171875, "Pretrain/Loss (Raw)": 1.87389075756073, "Pretrain/Step": 3886, "Pretrain/Step Time": 8.436577081680298} +{"Pretrain/Learning Rate": 4.614265752088176e-05, "Pretrain/Loss": 2.0711660385131836, "Pretrain/Loss (Raw)": 2.07519793510437, "Pretrain/Step": 3887, "Pretrain/Step Time": 8.432319279760122} +{"Pretrain/Learning Rate": 4.614039178908093e-05, "Pretrain/Loss": 2.0694544315338135, "Pretrain/Loss (Raw)": 1.8736423254013062, "Pretrain/Step": 3888, "Pretrain/Step Time": 8.437531765550375} +{"Pretrain/Learning Rate": 4.613812544771179e-05, "Pretrain/Loss": 2.069828748703003, "Pretrain/Loss (Raw)": 2.0366718769073486, "Pretrain/Step": 3889, "Pretrain/Step Time": 8.430581878870726} +{"Pretrain/Learning Rate": 4.6135858496839716e-05, "Pretrain/Loss": 2.068084239959717, "Pretrain/Loss (Raw)": 1.848743200302124, "Pretrain/Step": 3890, "Pretrain/Step Time": 8.434032153338194} +{"Pretrain/Learning Rate": 4.6133590936530056e-05, "Pretrain/Loss": 2.068010091781616, "Pretrain/Loss (Raw)": 2.059458017349243, "Pretrain/Step": 3891, "Pretrain/Step Time": 8.433388149365783} +{"Pretrain/Learning Rate": 4.6131322766848204e-05, "Pretrain/Loss": 2.0686376094818115, "Pretrain/Loss (Raw)": 2.2068898677825928, "Pretrain/Step": 3892, "Pretrain/Step Time": 8.434452729299664} +{"Pretrain/Learning Rate": 4.612905398785956e-05, "Pretrain/Loss": 2.0702381134033203, "Pretrain/Loss (Raw)": 2.0706586837768555, "Pretrain/Step": 3893, "Pretrain/Step Time": 8.428911108523607} +{"Pretrain/Learning Rate": 4.6126784599629534e-05, "Pretrain/Loss": 2.0717554092407227, "Pretrain/Loss (Raw)": 2.3533756732940674, "Pretrain/Step": 3894, "Pretrain/Step Time": 8.431337235495448} +{"Pretrain/Learning Rate": 4.6124514602223566e-05, "Pretrain/Loss": 2.06872820854187, "Pretrain/Loss (Raw)": 1.8215287923812866, "Pretrain/Step": 3895, "Pretrain/Step Time": 8.430480051785707} +{"Pretrain/Learning Rate": 4.612224399570711e-05, "Pretrain/Loss": 2.0692622661590576, "Pretrain/Loss (Raw)": 2.210594415664673, "Pretrain/Step": 3896, "Pretrain/Step Time": 8.428779128938913} +{"Pretrain/Learning Rate": 4.611997278014565e-05, "Pretrain/Loss": 2.0707218647003174, "Pretrain/Loss (Raw)": 2.349210262298584, "Pretrain/Step": 3897, "Pretrain/Step Time": 8.427352426573634} +{"Pretrain/Learning Rate": 4.6117700955604655e-05, "Pretrain/Loss": 2.071716785430908, "Pretrain/Loss (Raw)": 2.141148805618286, "Pretrain/Step": 3898, "Pretrain/Step Time": 8.433008212596178} +{"Pretrain/Learning Rate": 4.611542852214964e-05, "Pretrain/Loss": 2.0702803134918213, "Pretrain/Loss (Raw)": 1.8777694702148438, "Pretrain/Step": 3899, "Pretrain/Step Time": 8.430343188345432} +{"Pretrain/Learning Rate": 4.6113155479846124e-05, "Pretrain/Loss": 2.071009635925293, "Pretrain/Loss (Raw)": 2.0525524616241455, "Pretrain/Step": 3900, "Pretrain/Step Time": 8.434830309823155} +{"Pretrain/Learning Rate": 4.611088182875966e-05, "Pretrain/Loss": 2.073507785797119, "Pretrain/Loss (Raw)": 2.004410743713379, "Pretrain/Step": 3901, "Pretrain/Step Time": 8.43650384992361} +{"Pretrain/Learning Rate": 4.61086075689558e-05, "Pretrain/Loss": 2.0753719806671143, "Pretrain/Loss (Raw)": 2.161731481552124, "Pretrain/Step": 3902, "Pretrain/Step Time": 8.437110245227814} +{"Pretrain/Learning Rate": 4.610633270050012e-05, "Pretrain/Loss": 2.074195384979248, "Pretrain/Loss (Raw)": 1.8734519481658936, "Pretrain/Step": 3903, "Pretrain/Step Time": 8.436998223885894} +{"Pretrain/Learning Rate": 4.610405722345822e-05, "Pretrain/Loss": 2.0743472576141357, "Pretrain/Loss (Raw)": 1.9996395111083984, "Pretrain/Step": 3904, "Pretrain/Step Time": 8.438677510246634} +{"Pretrain/Learning Rate": 4.6101781137895704e-05, "Pretrain/Loss": 2.07375431060791, "Pretrain/Loss (Raw)": 2.1864571571350098, "Pretrain/Step": 3905, "Pretrain/Step Time": 8.440915308892727} +{"Pretrain/Learning Rate": 4.60995044438782e-05, "Pretrain/Loss": 2.073695659637451, "Pretrain/Loss (Raw)": 2.032355785369873, "Pretrain/Step": 3906, "Pretrain/Step Time": 8.439828034490347} +{"Pretrain/Learning Rate": 4.6097227141471365e-05, "Pretrain/Loss": 2.075216770172119, "Pretrain/Loss (Raw)": 2.0006110668182373, "Pretrain/Step": 3907, "Pretrain/Step Time": 8.445477528497577} +{"Pretrain/Learning Rate": 4.609494923074086e-05, "Pretrain/Loss": 2.072704792022705, "Pretrain/Loss (Raw)": 2.0149991512298584, "Pretrain/Step": 3908, "Pretrain/Step Time": 8.445877227932215} +{"Pretrain/Learning Rate": 4.6092670711752364e-05, "Pretrain/Loss": 2.071469783782959, "Pretrain/Loss (Raw)": 1.9581408500671387, "Pretrain/Step": 3909, "Pretrain/Step Time": 8.443657984957099} +{"Pretrain/Learning Rate": 4.6090391584571566e-05, "Pretrain/Loss": 2.072878837585449, "Pretrain/Loss (Raw)": 1.9810540676116943, "Pretrain/Step": 3910, "Pretrain/Step Time": 8.439701264724135} +{"Pretrain/Learning Rate": 4.608811184926421e-05, "Pretrain/Loss": 2.0740044116973877, "Pretrain/Loss (Raw)": 2.2312471866607666, "Pretrain/Step": 3911, "Pretrain/Step Time": 8.439728723838925} +{"Pretrain/Learning Rate": 4.6085831505896e-05, "Pretrain/Loss": 2.075471878051758, "Pretrain/Loss (Raw)": 2.309237241744995, "Pretrain/Step": 3912, "Pretrain/Step Time": 8.43700155057013} +{"Pretrain/Learning Rate": 4.6083550554532715e-05, "Pretrain/Loss": 2.074531316757202, "Pretrain/Loss (Raw)": 1.9117825031280518, "Pretrain/Step": 3913, "Pretrain/Step Time": 8.438929865136743} +{"Pretrain/Learning Rate": 4.608126899524011e-05, "Pretrain/Loss": 2.0754568576812744, "Pretrain/Loss (Raw)": 2.0504655838012695, "Pretrain/Step": 3914, "Pretrain/Step Time": 8.439615922048688} +{"Pretrain/Learning Rate": 4.607898682808398e-05, "Pretrain/Loss": 2.074795722961426, "Pretrain/Loss (Raw)": 2.174057960510254, "Pretrain/Step": 3915, "Pretrain/Step Time": 8.437490647658706} +{"Pretrain/Learning Rate": 4.607670405313012e-05, "Pretrain/Loss": 2.07356333732605, "Pretrain/Loss (Raw)": 2.1429951190948486, "Pretrain/Step": 3916, "Pretrain/Step Time": 8.435702968388796} +{"Pretrain/Learning Rate": 4.6074420670444354e-05, "Pretrain/Loss": 2.074523448944092, "Pretrain/Loss (Raw)": 2.148672342300415, "Pretrain/Step": 3917, "Pretrain/Step Time": 8.435768850147724} +{"Pretrain/Learning Rate": 4.6072136680092525e-05, "Pretrain/Loss": 2.073139190673828, "Pretrain/Loss (Raw)": 1.903516411781311, "Pretrain/Step": 3918, "Pretrain/Step Time": 8.437507756054401} +{"Pretrain/Learning Rate": 4.606985208214049e-05, "Pretrain/Loss": 2.073976516723633, "Pretrain/Loss (Raw)": 2.155736207962036, "Pretrain/Step": 3919, "Pretrain/Step Time": 8.438390219584107} +{"Pretrain/Learning Rate": 4.606756687665412e-05, "Pretrain/Loss": 2.072856903076172, "Pretrain/Loss (Raw)": 2.000033378601074, "Pretrain/Step": 3920, "Pretrain/Step Time": 8.4395234528929} +{"Pretrain/Learning Rate": 4.606528106369932e-05, "Pretrain/Loss": 2.0760154724121094, "Pretrain/Loss (Raw)": 2.218360424041748, "Pretrain/Step": 3921, "Pretrain/Step Time": 8.433726117014885} +{"Pretrain/Learning Rate": 4.606299464334198e-05, "Pretrain/Loss": 2.076859712600708, "Pretrain/Loss (Raw)": 2.119933843612671, "Pretrain/Step": 3922, "Pretrain/Step Time": 8.434432381764054} +{"Pretrain/Learning Rate": 4.6060707615648046e-05, "Pretrain/Loss": 2.075817823410034, "Pretrain/Loss (Raw)": 2.1289327144622803, "Pretrain/Step": 3923, "Pretrain/Step Time": 8.43553040921688} +{"Pretrain/Learning Rate": 4.6058419980683455e-05, "Pretrain/Loss": 2.0746142864227295, "Pretrain/Loss (Raw)": 1.9301505088806152, "Pretrain/Step": 3924, "Pretrain/Step Time": 8.433862341567874} +{"Pretrain/Learning Rate": 4.605613173851416e-05, "Pretrain/Loss": 2.0733978748321533, "Pretrain/Loss (Raw)": 2.1032299995422363, "Pretrain/Step": 3925, "Pretrain/Step Time": 8.438817916437984} +{"Pretrain/Learning Rate": 4.605384288920616e-05, "Pretrain/Loss": 2.073126792907715, "Pretrain/Loss (Raw)": 2.063429832458496, "Pretrain/Step": 3926, "Pretrain/Step Time": 8.435491656884551} +{"Pretrain/Learning Rate": 4.6051553432825436e-05, "Pretrain/Loss": 2.071983814239502, "Pretrain/Loss (Raw)": 2.0086381435394287, "Pretrain/Step": 3927, "Pretrain/Step Time": 8.432613363489509} +{"Pretrain/Learning Rate": 4.604926336943801e-05, "Pretrain/Loss": 2.0729563236236572, "Pretrain/Loss (Raw)": 2.194304943084717, "Pretrain/Step": 3928, "Pretrain/Step Time": 8.43531408160925} +{"Pretrain/Learning Rate": 4.604697269910992e-05, "Pretrain/Loss": 2.0736124515533447, "Pretrain/Loss (Raw)": 2.2160778045654297, "Pretrain/Step": 3929, "Pretrain/Step Time": 8.433359194546938} +{"Pretrain/Learning Rate": 4.6044681421907204e-05, "Pretrain/Loss": 2.07412052154541, "Pretrain/Loss (Raw)": 2.0802319049835205, "Pretrain/Step": 3930, "Pretrain/Step Time": 8.430688014253974} +{"Pretrain/Learning Rate": 4.6042389537895935e-05, "Pretrain/Loss": 2.0729799270629883, "Pretrain/Loss (Raw)": 1.969469666481018, "Pretrain/Step": 3931, "Pretrain/Step Time": 8.436214454472065} +{"Pretrain/Learning Rate": 4.604009704714219e-05, "Pretrain/Loss": 2.0726189613342285, "Pretrain/Loss (Raw)": 2.125385284423828, "Pretrain/Step": 3932, "Pretrain/Step Time": 8.430029978975654} +{"Pretrain/Learning Rate": 4.6037803949712094e-05, "Pretrain/Loss": 2.0724973678588867, "Pretrain/Loss (Raw)": 2.105360269546509, "Pretrain/Step": 3933, "Pretrain/Step Time": 8.431227277964354} +{"Pretrain/Learning Rate": 4.603551024567174e-05, "Pretrain/Loss": 2.0724852085113525, "Pretrain/Loss (Raw)": 1.8176943063735962, "Pretrain/Step": 3934, "Pretrain/Step Time": 8.425994958728552} +{"Pretrain/Learning Rate": 4.603321593508728e-05, "Pretrain/Loss": 2.072645425796509, "Pretrain/Loss (Raw)": 2.0205562114715576, "Pretrain/Step": 3935, "Pretrain/Step Time": 8.426888501271605} +{"Pretrain/Learning Rate": 4.603092101802487e-05, "Pretrain/Loss": 2.0708940029144287, "Pretrain/Loss (Raw)": 1.839666485786438, "Pretrain/Step": 3936, "Pretrain/Step Time": 8.433733014389873} +{"Pretrain/Learning Rate": 4.602862549455068e-05, "Pretrain/Loss": 2.0655741691589355, "Pretrain/Loss (Raw)": 2.0522587299346924, "Pretrain/Step": 3937, "Pretrain/Step Time": 8.432622533291578} +{"Pretrain/Learning Rate": 4.602632936473089e-05, "Pretrain/Loss": 2.0646209716796875, "Pretrain/Loss (Raw)": 2.1542892456054688, "Pretrain/Step": 3938, "Pretrain/Step Time": 8.4297648165375} +{"Pretrain/Learning Rate": 4.602403262863172e-05, "Pretrain/Loss": 2.0649118423461914, "Pretrain/Loss (Raw)": 2.058887004852295, "Pretrain/Step": 3939, "Pretrain/Step Time": 8.432538563385606} +{"Pretrain/Learning Rate": 4.602173528631939e-05, "Pretrain/Loss": 2.0641794204711914, "Pretrain/Loss (Raw)": 1.9901338815689087, "Pretrain/Step": 3940, "Pretrain/Step Time": 8.430841440334916} +{"Pretrain/Learning Rate": 4.601943733786014e-05, "Pretrain/Loss": 2.0609865188598633, "Pretrain/Loss (Raw)": 2.034090757369995, "Pretrain/Step": 3941, "Pretrain/Step Time": 8.434751193970442} +{"Pretrain/Learning Rate": 4.6017138783320234e-05, "Pretrain/Loss": 2.0613629817962646, "Pretrain/Loss (Raw)": 2.0098516941070557, "Pretrain/Step": 3942, "Pretrain/Step Time": 8.436848038807511} +{"Pretrain/Learning Rate": 4.601483962276595e-05, "Pretrain/Loss": 2.061501979827881, "Pretrain/Loss (Raw)": 2.034745931625366, "Pretrain/Step": 3943, "Pretrain/Step Time": 8.435468999668956} +{"Pretrain/Learning Rate": 4.6012539856263574e-05, "Pretrain/Loss": 2.0598387718200684, "Pretrain/Loss (Raw)": 1.905113697052002, "Pretrain/Step": 3944, "Pretrain/Step Time": 8.430348755791783} +{"Pretrain/Learning Rate": 4.6010239483879425e-05, "Pretrain/Loss": 2.060415744781494, "Pretrain/Loss (Raw)": 2.081167697906494, "Pretrain/Step": 3945, "Pretrain/Step Time": 8.430088808760047} +{"Pretrain/Learning Rate": 4.6007938505679836e-05, "Pretrain/Loss": 2.05830717086792, "Pretrain/Loss (Raw)": 1.8444256782531738, "Pretrain/Step": 3946, "Pretrain/Step Time": 8.429283332079649} +{"Pretrain/Learning Rate": 4.600563692173115e-05, "Pretrain/Loss": 2.055870532989502, "Pretrain/Loss (Raw)": 1.7351789474487305, "Pretrain/Step": 3947, "Pretrain/Step Time": 8.428183240815997} +{"Pretrain/Learning Rate": 4.600333473209973e-05, "Pretrain/Loss": 2.057276725769043, "Pretrain/Loss (Raw)": 2.0897066593170166, "Pretrain/Step": 3948, "Pretrain/Step Time": 8.426277004182339} +{"Pretrain/Learning Rate": 4.6001031936851955e-05, "Pretrain/Loss": 2.057187557220459, "Pretrain/Loss (Raw)": 2.022416353225708, "Pretrain/Step": 3949, "Pretrain/Step Time": 8.422772884368896} +{"Pretrain/Learning Rate": 4.5998728536054234e-05, "Pretrain/Loss": 2.058290481567383, "Pretrain/Loss (Raw)": 2.1258742809295654, "Pretrain/Step": 3950, "Pretrain/Step Time": 8.424700373783708} +{"Pretrain/Learning Rate": 4.5996424529772974e-05, "Pretrain/Loss": 2.057809829711914, "Pretrain/Loss (Raw)": 2.0282866954803467, "Pretrain/Step": 3951, "Pretrain/Step Time": 8.427328238263726} +{"Pretrain/Learning Rate": 4.5994119918074616e-05, "Pretrain/Loss": 2.0559604167938232, "Pretrain/Loss (Raw)": 1.8424500226974487, "Pretrain/Step": 3952, "Pretrain/Step Time": 8.42770953476429} +{"Pretrain/Learning Rate": 4.5991814701025617e-05, "Pretrain/Loss": 2.054098129272461, "Pretrain/Loss (Raw)": 1.7329092025756836, "Pretrain/Step": 3953, "Pretrain/Step Time": 8.427949979901314} +{"Pretrain/Learning Rate": 4.5989508878692436e-05, "Pretrain/Loss": 2.055175304412842, "Pretrain/Loss (Raw)": 2.1028475761413574, "Pretrain/Step": 3954, "Pretrain/Step Time": 8.424513194710016} +{"Pretrain/Learning Rate": 4.5987202451141557e-05, "Pretrain/Loss": 2.054582118988037, "Pretrain/Loss (Raw)": 2.126192569732666, "Pretrain/Step": 3955, "Pretrain/Step Time": 8.41724132373929} +{"Pretrain/Learning Rate": 4.5984895418439494e-05, "Pretrain/Loss": 2.0528340339660645, "Pretrain/Loss (Raw)": 1.9808027744293213, "Pretrain/Step": 3956, "Pretrain/Step Time": 8.421646509319544} +{"Pretrain/Learning Rate": 4.5982587780652764e-05, "Pretrain/Loss": 2.052680015563965, "Pretrain/Loss (Raw)": 1.991896629333496, "Pretrain/Step": 3957, "Pretrain/Step Time": 8.42521158605814} +{"Pretrain/Learning Rate": 4.5980279537847904e-05, "Pretrain/Loss": 2.0527360439300537, "Pretrain/Loss (Raw)": 1.9712984561920166, "Pretrain/Step": 3958, "Pretrain/Step Time": 8.425344793125987} +{"Pretrain/Learning Rate": 4.597797069009148e-05, "Pretrain/Loss": 2.0543839931488037, "Pretrain/Loss (Raw)": 2.1285061836242676, "Pretrain/Step": 3959, "Pretrain/Step Time": 8.423961218446493} +{"Pretrain/Learning Rate": 4.5975661237450055e-05, "Pretrain/Loss": 2.057068347930908, "Pretrain/Loss (Raw)": 2.148603916168213, "Pretrain/Step": 3960, "Pretrain/Step Time": 8.425311841070652} +{"Pretrain/Learning Rate": 4.5973351179990234e-05, "Pretrain/Loss": 2.0582478046417236, "Pretrain/Loss (Raw)": 2.0439603328704834, "Pretrain/Step": 3961, "Pretrain/Step Time": 8.424765519797802} +{"Pretrain/Learning Rate": 4.597104051777861e-05, "Pretrain/Loss": 2.058501720428467, "Pretrain/Loss (Raw)": 2.2390525341033936, "Pretrain/Step": 3962, "Pretrain/Step Time": 8.42343076877296} +{"Pretrain/Learning Rate": 4.596872925088181e-05, "Pretrain/Loss": 2.0587480068206787, "Pretrain/Loss (Raw)": 2.2379188537597656, "Pretrain/Step": 3963, "Pretrain/Step Time": 8.42472417652607} +{"Pretrain/Learning Rate": 4.5966417379366495e-05, "Pretrain/Loss": 2.0611486434936523, "Pretrain/Loss (Raw)": 2.1393375396728516, "Pretrain/Step": 3964, "Pretrain/Step Time": 8.422548163682222} +{"Pretrain/Learning Rate": 4.5964104903299306e-05, "Pretrain/Loss": 2.063598155975342, "Pretrain/Loss (Raw)": 2.3673157691955566, "Pretrain/Step": 3965, "Pretrain/Step Time": 8.42500433139503} +{"Pretrain/Learning Rate": 4.596179182274694e-05, "Pretrain/Loss": 2.063093662261963, "Pretrain/Loss (Raw)": 2.0936124324798584, "Pretrain/Step": 3966, "Pretrain/Step Time": 8.42436109110713} +{"Pretrain/Learning Rate": 4.595947813777608e-05, "Pretrain/Loss": 2.0603251457214355, "Pretrain/Loss (Raw)": 1.7702720165252686, "Pretrain/Step": 3967, "Pretrain/Step Time": 8.423769740387797} +{"Pretrain/Learning Rate": 4.595716384845344e-05, "Pretrain/Loss": 2.059438943862915, "Pretrain/Loss (Raw)": 2.056220054626465, "Pretrain/Step": 3968, "Pretrain/Step Time": 8.426502604037523} +{"Pretrain/Learning Rate": 4.595484895484576e-05, "Pretrain/Loss": 2.057663917541504, "Pretrain/Loss (Raw)": 1.934003233909607, "Pretrain/Step": 3969, "Pretrain/Step Time": 8.421751020476222} +{"Pretrain/Learning Rate": 4.595253345701978e-05, "Pretrain/Loss": 2.0575685501098633, "Pretrain/Loss (Raw)": 2.356590509414673, "Pretrain/Step": 3970, "Pretrain/Step Time": 8.427830457687378} +{"Pretrain/Learning Rate": 4.595021735504227e-05, "Pretrain/Loss": 2.0552759170532227, "Pretrain/Loss (Raw)": 2.0457863807678223, "Pretrain/Step": 3971, "Pretrain/Step Time": 8.42704414576292} +{"Pretrain/Learning Rate": 4.594790064898001e-05, "Pretrain/Loss": 2.055875778198242, "Pretrain/Loss (Raw)": 2.095404624938965, "Pretrain/Step": 3972, "Pretrain/Step Time": 8.42501114308834} +{"Pretrain/Learning Rate": 4.59455833388998e-05, "Pretrain/Loss": 2.057070016860962, "Pretrain/Loss (Raw)": 2.150596857070923, "Pretrain/Step": 3973, "Pretrain/Step Time": 8.425290562212467} +{"Pretrain/Learning Rate": 4.594326542486846e-05, "Pretrain/Loss": 2.0576136112213135, "Pretrain/Loss (Raw)": 2.134174108505249, "Pretrain/Step": 3974, "Pretrain/Step Time": 8.426331881433725} +{"Pretrain/Learning Rate": 4.594094690695283e-05, "Pretrain/Loss": 2.0580201148986816, "Pretrain/Loss (Raw)": 2.0414085388183594, "Pretrain/Step": 3975, "Pretrain/Step Time": 8.428847875446081} +{"Pretrain/Learning Rate": 4.593862778521976e-05, "Pretrain/Loss": 2.0596563816070557, "Pretrain/Loss (Raw)": 2.004862070083618, "Pretrain/Step": 3976, "Pretrain/Step Time": 8.424762666225433} +{"Pretrain/Learning Rate": 4.593630805973611e-05, "Pretrain/Loss": 2.0604302883148193, "Pretrain/Loss (Raw)": 2.1727569103240967, "Pretrain/Step": 3977, "Pretrain/Step Time": 8.420654388144612} +{"Pretrain/Learning Rate": 4.593398773056878e-05, "Pretrain/Loss": 2.059727907180786, "Pretrain/Loss (Raw)": 2.002761125564575, "Pretrain/Step": 3978, "Pretrain/Step Time": 8.42492507211864} +{"Pretrain/Learning Rate": 4.593166679778467e-05, "Pretrain/Loss": 2.0605039596557617, "Pretrain/Loss (Raw)": 2.2582333087921143, "Pretrain/Step": 3979, "Pretrain/Step Time": 8.423012578859925} +{"Pretrain/Learning Rate": 4.592934526145071e-05, "Pretrain/Loss": 2.0578298568725586, "Pretrain/Loss (Raw)": 1.8705339431762695, "Pretrain/Step": 3980, "Pretrain/Step Time": 8.423661043867469} +{"Pretrain/Learning Rate": 4.592702312163383e-05, "Pretrain/Loss": 2.0585734844207764, "Pretrain/Loss (Raw)": 2.231794595718384, "Pretrain/Step": 3981, "Pretrain/Step Time": 8.428389579057693} +{"Pretrain/Learning Rate": 4.592470037840099e-05, "Pretrain/Loss": 2.0583536624908447, "Pretrain/Loss (Raw)": 2.1500911712646484, "Pretrain/Step": 3982, "Pretrain/Step Time": 8.426855420693755} +{"Pretrain/Learning Rate": 4.592237703181916e-05, "Pretrain/Loss": 2.058544158935547, "Pretrain/Loss (Raw)": 2.1072027683258057, "Pretrain/Step": 3983, "Pretrain/Step Time": 8.423256825655699} +{"Pretrain/Learning Rate": 4.592005308195534e-05, "Pretrain/Loss": 2.0576930046081543, "Pretrain/Loss (Raw)": 2.0320236682891846, "Pretrain/Step": 3984, "Pretrain/Step Time": 8.427023874595761} +{"Pretrain/Learning Rate": 4.591772852887655e-05, "Pretrain/Loss": 2.0593512058258057, "Pretrain/Loss (Raw)": 2.0668485164642334, "Pretrain/Step": 3985, "Pretrain/Step Time": 8.427032293751836} +{"Pretrain/Learning Rate": 4.591540337264979e-05, "Pretrain/Loss": 2.058389663696289, "Pretrain/Loss (Raw)": 1.9885220527648926, "Pretrain/Step": 3986, "Pretrain/Step Time": 8.429409310221672} +{"Pretrain/Learning Rate": 4.5913077613342123e-05, "Pretrain/Loss": 2.0592079162597656, "Pretrain/Loss (Raw)": 2.1895525455474854, "Pretrain/Step": 3987, "Pretrain/Step Time": 8.429525651037693} +{"Pretrain/Learning Rate": 4.59107512510206e-05, "Pretrain/Loss": 2.062499761581421, "Pretrain/Loss (Raw)": 2.0163943767547607, "Pretrain/Step": 3988, "Pretrain/Step Time": 8.430310705676675} +{"Pretrain/Learning Rate": 4.590842428575232e-05, "Pretrain/Loss": 2.0610218048095703, "Pretrain/Loss (Raw)": 2.008042812347412, "Pretrain/Step": 3989, "Pretrain/Step Time": 8.436833845451474} +{"Pretrain/Learning Rate": 4.5906096717604354e-05, "Pretrain/Loss": 2.0599942207336426, "Pretrain/Loss (Raw)": 2.004856824874878, "Pretrain/Step": 3990, "Pretrain/Step Time": 8.432763453572989} +{"Pretrain/Learning Rate": 4.5903768546643824e-05, "Pretrain/Loss": 2.058548927307129, "Pretrain/Loss (Raw)": 2.140118360519409, "Pretrain/Step": 3991, "Pretrain/Step Time": 8.435926573351026} +{"Pretrain/Learning Rate": 4.5901439772937874e-05, "Pretrain/Loss": 2.0565192699432373, "Pretrain/Loss (Raw)": 1.7963796854019165, "Pretrain/Step": 3992, "Pretrain/Step Time": 8.430540677160025} +{"Pretrain/Learning Rate": 4.5899110396553636e-05, "Pretrain/Loss": 2.05777645111084, "Pretrain/Loss (Raw)": 2.0969319343566895, "Pretrain/Step": 3993, "Pretrain/Step Time": 8.43023626320064} +{"Pretrain/Learning Rate": 4.5896780417558284e-05, "Pretrain/Loss": 2.05671763420105, "Pretrain/Loss (Raw)": 2.1555593013763428, "Pretrain/Step": 3994, "Pretrain/Step Time": 8.425837526097894} +{"Pretrain/Learning Rate": 4.589444983601899e-05, "Pretrain/Loss": 2.055368423461914, "Pretrain/Loss (Raw)": 1.9474356174468994, "Pretrain/Step": 3995, "Pretrain/Step Time": 8.428424434736371} +{"Pretrain/Learning Rate": 4.589211865200298e-05, "Pretrain/Loss": 2.0525896549224854, "Pretrain/Loss (Raw)": 1.8717942237854004, "Pretrain/Step": 3996, "Pretrain/Step Time": 8.424334606155753} +{"Pretrain/Learning Rate": 4.588978686557746e-05, "Pretrain/Loss": 2.048715114593506, "Pretrain/Loss (Raw)": 1.940565586090088, "Pretrain/Step": 3997, "Pretrain/Step Time": 8.423894431442022} +{"Pretrain/Learning Rate": 4.588745447680965e-05, "Pretrain/Loss": 2.0471060276031494, "Pretrain/Loss (Raw)": 1.8019213676452637, "Pretrain/Step": 3998, "Pretrain/Step Time": 8.42686870507896} +{"Pretrain/Learning Rate": 4.588512148576681e-05, "Pretrain/Loss": 2.0492804050445557, "Pretrain/Loss (Raw)": 2.266763925552368, "Pretrain/Step": 3999, "Pretrain/Step Time": 8.422666635364294} +{"Pretrain/Learning Rate": 4.588278789251623e-05, "Pretrain/Loss": 2.05013370513916, "Pretrain/Loss (Raw)": 2.0688071250915527, "Pretrain/Step": 4000, "Pretrain/Step Time": 8.425605731084943} +{"Pretrain/Learning Rate": 4.588045369712518e-05, "Pretrain/Loss": 2.0499446392059326, "Pretrain/Loss (Raw)": 2.130990982055664, "Pretrain/Step": 4001, "Pretrain/Step Time": 8.424793727695942} +{"Pretrain/Learning Rate": 4.587811889966096e-05, "Pretrain/Loss": 2.049992561340332, "Pretrain/Loss (Raw)": 2.130739688873291, "Pretrain/Step": 4002, "Pretrain/Step Time": 8.424920722842216} +{"Pretrain/Learning Rate": 4.5875783500190905e-05, "Pretrain/Loss": 2.0503387451171875, "Pretrain/Loss (Raw)": 2.082038640975952, "Pretrain/Step": 4003, "Pretrain/Step Time": 8.426311323419213} +{"Pretrain/Learning Rate": 4.587344749878234e-05, "Pretrain/Loss": 2.04909610748291, "Pretrain/Loss (Raw)": 1.8324291706085205, "Pretrain/Step": 4004, "Pretrain/Step Time": 8.425749795511365} +{"Pretrain/Learning Rate": 4.587111089550264e-05, "Pretrain/Loss": 2.0497488975524902, "Pretrain/Loss (Raw)": 2.102525234222412, "Pretrain/Step": 4005, "Pretrain/Step Time": 8.427578007802367} +{"Pretrain/Learning Rate": 4.5868773690419174e-05, "Pretrain/Loss": 2.0492959022521973, "Pretrain/Loss (Raw)": 2.09932541847229, "Pretrain/Step": 4006, "Pretrain/Step Time": 8.424217011779547} +{"Pretrain/Learning Rate": 4.586643588359933e-05, "Pretrain/Loss": 2.051706314086914, "Pretrain/Loss (Raw)": 2.155133008956909, "Pretrain/Step": 4007, "Pretrain/Step Time": 8.425145644694567} +{"Pretrain/Learning Rate": 4.58640974751105e-05, "Pretrain/Loss": 2.052745819091797, "Pretrain/Loss (Raw)": 2.0082569122314453, "Pretrain/Step": 4008, "Pretrain/Step Time": 8.424169966951013} +{"Pretrain/Learning Rate": 4.5861758465020146e-05, "Pretrain/Loss": 2.0538315773010254, "Pretrain/Loss (Raw)": 2.051417112350464, "Pretrain/Step": 4009, "Pretrain/Step Time": 8.425780532881618} +{"Pretrain/Learning Rate": 4.585941885339569e-05, "Pretrain/Loss": 2.054266929626465, "Pretrain/Loss (Raw)": 1.857649564743042, "Pretrain/Step": 4010, "Pretrain/Step Time": 8.419980924576521} +{"Pretrain/Learning Rate": 4.585707864030459e-05, "Pretrain/Loss": 2.052239179611206, "Pretrain/Loss (Raw)": 1.8873769044876099, "Pretrain/Step": 4011, "Pretrain/Step Time": 8.425125181674957} +{"Pretrain/Learning Rate": 4.585473782581433e-05, "Pretrain/Loss": 2.0513741970062256, "Pretrain/Loss (Raw)": 2.0773303508758545, "Pretrain/Step": 4012, "Pretrain/Step Time": 8.423845171928406} +{"Pretrain/Learning Rate": 4.585239640999242e-05, "Pretrain/Loss": 2.0510692596435547, "Pretrain/Loss (Raw)": 1.999961256980896, "Pretrain/Step": 4013, "Pretrain/Step Time": 8.426010373979807} +{"Pretrain/Learning Rate": 4.585005439290635e-05, "Pretrain/Loss": 2.051982879638672, "Pretrain/Loss (Raw)": 1.9908207654953003, "Pretrain/Step": 4014, "Pretrain/Step Time": 8.423230404034257} +{"Pretrain/Learning Rate": 4.584771177462365e-05, "Pretrain/Loss": 2.0496225357055664, "Pretrain/Loss (Raw)": 1.7730929851531982, "Pretrain/Step": 4015, "Pretrain/Step Time": 8.425207629799843} +{"Pretrain/Learning Rate": 4.584536855521189e-05, "Pretrain/Loss": 2.053100109100342, "Pretrain/Loss (Raw)": 2.3187472820281982, "Pretrain/Step": 4016, "Pretrain/Step Time": 8.424693651497364} +{"Pretrain/Learning Rate": 4.584302473473862e-05, "Pretrain/Loss": 2.053077459335327, "Pretrain/Loss (Raw)": 2.0337886810302734, "Pretrain/Step": 4017, "Pretrain/Step Time": 8.429194800555706} +{"Pretrain/Learning Rate": 4.5840680313271424e-05, "Pretrain/Loss": 2.0552029609680176, "Pretrain/Loss (Raw)": 2.1208138465881348, "Pretrain/Step": 4018, "Pretrain/Step Time": 8.43365235067904} +{"Pretrain/Learning Rate": 4.583833529087791e-05, "Pretrain/Loss": 2.0558629035949707, "Pretrain/Loss (Raw)": 2.143921136856079, "Pretrain/Step": 4019, "Pretrain/Step Time": 8.437695564702153} +{"Pretrain/Learning Rate": 4.583598966762568e-05, "Pretrain/Loss": 2.0534913539886475, "Pretrain/Loss (Raw)": 1.9033328294754028, "Pretrain/Step": 4020, "Pretrain/Step Time": 8.437283182516694} +{"Pretrain/Learning Rate": 4.583364344358238e-05, "Pretrain/Loss": 2.053309440612793, "Pretrain/Loss (Raw)": 2.0473883152008057, "Pretrain/Step": 4021, "Pretrain/Step Time": 8.439782846719027} +{"Pretrain/Learning Rate": 4.583129661881565e-05, "Pretrain/Loss": 2.0527658462524414, "Pretrain/Loss (Raw)": 2.283780813217163, "Pretrain/Step": 4022, "Pretrain/Step Time": 8.436587642878294} +{"Pretrain/Learning Rate": 4.582894919339318e-05, "Pretrain/Loss": 2.05475115776062, "Pretrain/Loss (Raw)": 2.0756590366363525, "Pretrain/Step": 4023, "Pretrain/Step Time": 8.43393605016172} +{"Pretrain/Learning Rate": 4.582660116738263e-05, "Pretrain/Loss": 2.0545263290405273, "Pretrain/Loss (Raw)": 2.181813955307007, "Pretrain/Step": 4024, "Pretrain/Step Time": 8.436425881460309} +{"Pretrain/Learning Rate": 4.582425254085173e-05, "Pretrain/Loss": 2.0514986515045166, "Pretrain/Loss (Raw)": 1.9616535902023315, "Pretrain/Step": 4025, "Pretrain/Step Time": 8.437224173918366} +{"Pretrain/Learning Rate": 4.582190331386818e-05, "Pretrain/Loss": 2.0506067276000977, "Pretrain/Loss (Raw)": 2.026989221572876, "Pretrain/Step": 4026, "Pretrain/Step Time": 8.431228309869766} +{"Pretrain/Learning Rate": 4.5819553486499725e-05, "Pretrain/Loss": 2.052994728088379, "Pretrain/Loss (Raw)": 2.1834418773651123, "Pretrain/Step": 4027, "Pretrain/Step Time": 8.430022742599249} +{"Pretrain/Learning Rate": 4.5817203058814126e-05, "Pretrain/Loss": 2.0533111095428467, "Pretrain/Loss (Raw)": 2.0930514335632324, "Pretrain/Step": 4028, "Pretrain/Step Time": 8.429860657081008} +{"Pretrain/Learning Rate": 4.581485203087915e-05, "Pretrain/Loss": 2.0540034770965576, "Pretrain/Loss (Raw)": 2.093034267425537, "Pretrain/Step": 4029, "Pretrain/Step Time": 8.426173340529203} +{"Pretrain/Learning Rate": 4.581250040276259e-05, "Pretrain/Loss": 2.0529346466064453, "Pretrain/Loss (Raw)": 2.0249125957489014, "Pretrain/Step": 4030, "Pretrain/Step Time": 8.425580548122525} +{"Pretrain/Learning Rate": 4.5810148174532265e-05, "Pretrain/Loss": 2.0548410415649414, "Pretrain/Loss (Raw)": 2.1174774169921875, "Pretrain/Step": 4031, "Pretrain/Step Time": 8.429378164932132} +{"Pretrain/Learning Rate": 4.5807795346255974e-05, "Pretrain/Loss": 2.056042194366455, "Pretrain/Loss (Raw)": 2.153377056121826, "Pretrain/Step": 4032, "Pretrain/Step Time": 8.42793652229011} +{"Pretrain/Learning Rate": 4.5805441918001575e-05, "Pretrain/Loss": 2.055943250656128, "Pretrain/Loss (Raw)": 2.1737890243530273, "Pretrain/Step": 4033, "Pretrain/Step Time": 8.423861742019653} +{"Pretrain/Learning Rate": 4.5803087889836923e-05, "Pretrain/Loss": 2.057279109954834, "Pretrain/Loss (Raw)": 2.203350067138672, "Pretrain/Step": 4034, "Pretrain/Step Time": 8.432388380169868} +{"Pretrain/Learning Rate": 4.58007332618299e-05, "Pretrain/Loss": 2.0578606128692627, "Pretrain/Loss (Raw)": 2.075052261352539, "Pretrain/Step": 4035, "Pretrain/Step Time": 8.42618309520185} +{"Pretrain/Learning Rate": 4.579837803404839e-05, "Pretrain/Loss": 2.05794620513916, "Pretrain/Loss (Raw)": 2.025965690612793, "Pretrain/Step": 4036, "Pretrain/Step Time": 8.429767282679677} +{"Pretrain/Learning Rate": 4.579602220656032e-05, "Pretrain/Loss": 2.0593008995056152, "Pretrain/Loss (Raw)": 2.131516456604004, "Pretrain/Step": 4037, "Pretrain/Step Time": 8.433649057522416} +{"Pretrain/Learning Rate": 4.579366577943361e-05, "Pretrain/Loss": 2.0590085983276367, "Pretrain/Loss (Raw)": 1.943651795387268, "Pretrain/Step": 4038, "Pretrain/Step Time": 8.430026553571224} +{"Pretrain/Learning Rate": 4.57913087527362e-05, "Pretrain/Loss": 2.0572638511657715, "Pretrain/Loss (Raw)": 2.007937431335449, "Pretrain/Step": 4039, "Pretrain/Step Time": 8.432168325409293} +{"Pretrain/Learning Rate": 4.578895112653606e-05, "Pretrain/Loss": 2.05558443069458, "Pretrain/Loss (Raw)": 2.0942418575286865, "Pretrain/Step": 4040, "Pretrain/Step Time": 8.432876262813807} +{"Pretrain/Learning Rate": 4.578659290090117e-05, "Pretrain/Loss": 2.0541114807128906, "Pretrain/Loss (Raw)": 1.7232599258422852, "Pretrain/Step": 4041, "Pretrain/Step Time": 8.432317765429616} +{"Pretrain/Learning Rate": 4.578423407589953e-05, "Pretrain/Loss": 2.055482864379883, "Pretrain/Loss (Raw)": 2.2259905338287354, "Pretrain/Step": 4042, "Pretrain/Step Time": 8.433210192248225} +{"Pretrain/Learning Rate": 4.5781874651599155e-05, "Pretrain/Loss": 2.0527024269104004, "Pretrain/Loss (Raw)": 1.8181512355804443, "Pretrain/Step": 4043, "Pretrain/Step Time": 8.434352118521929} +{"Pretrain/Learning Rate": 4.577951462806807e-05, "Pretrain/Loss": 2.0506844520568848, "Pretrain/Loss (Raw)": 1.8846927881240845, "Pretrain/Step": 4044, "Pretrain/Step Time": 8.432187071070075} +{"Pretrain/Learning Rate": 4.577715400537433e-05, "Pretrain/Loss": 2.049086332321167, "Pretrain/Loss (Raw)": 1.9441474676132202, "Pretrain/Step": 4045, "Pretrain/Step Time": 8.434980457648635} +{"Pretrain/Learning Rate": 4.5774792783586004e-05, "Pretrain/Loss": 2.0503182411193848, "Pretrain/Loss (Raw)": 2.0612003803253174, "Pretrain/Step": 4046, "Pretrain/Step Time": 8.436039065942168} +{"Pretrain/Learning Rate": 4.577243096277117e-05, "Pretrain/Loss": 2.0461530685424805, "Pretrain/Loss (Raw)": 1.6225979328155518, "Pretrain/Step": 4047, "Pretrain/Step Time": 8.437872774899006} +{"Pretrain/Learning Rate": 4.5770068542997935e-05, "Pretrain/Loss": 2.046631336212158, "Pretrain/Loss (Raw)": 2.061213254928589, "Pretrain/Step": 4048, "Pretrain/Step Time": 8.432454723864794} +{"Pretrain/Learning Rate": 4.576770552433441e-05, "Pretrain/Loss": 2.046254873275757, "Pretrain/Loss (Raw)": 2.170185089111328, "Pretrain/Step": 4049, "Pretrain/Step Time": 8.434218663722277} +{"Pretrain/Learning Rate": 4.576534190684874e-05, "Pretrain/Loss": 2.045698642730713, "Pretrain/Loss (Raw)": 2.0487265586853027, "Pretrain/Step": 4050, "Pretrain/Step Time": 8.4328728672117} +{"Pretrain/Learning Rate": 4.5762977690609075e-05, "Pretrain/Loss": 2.0458199977874756, "Pretrain/Loss (Raw)": 2.1444895267486572, "Pretrain/Step": 4051, "Pretrain/Step Time": 8.433750187978148} +{"Pretrain/Learning Rate": 4.576061287568358e-05, "Pretrain/Loss": 2.04618501663208, "Pretrain/Loss (Raw)": 1.976875901222229, "Pretrain/Step": 4052, "Pretrain/Step Time": 8.436563676223159} +{"Pretrain/Learning Rate": 4.575824746214046e-05, "Pretrain/Loss": 2.0463287830352783, "Pretrain/Loss (Raw)": 2.1216349601745605, "Pretrain/Step": 4053, "Pretrain/Step Time": 8.437836417928338} +{"Pretrain/Learning Rate": 4.57558814500479e-05, "Pretrain/Loss": 2.046751022338867, "Pretrain/Loss (Raw)": 2.1174633502960205, "Pretrain/Step": 4054, "Pretrain/Step Time": 8.434556325897574} +{"Pretrain/Learning Rate": 4.5753514839474134e-05, "Pretrain/Loss": 2.045498847961426, "Pretrain/Loss (Raw)": 1.8483637571334839, "Pretrain/Step": 4055, "Pretrain/Step Time": 8.440702425315976} +{"Pretrain/Learning Rate": 4.5751147630487394e-05, "Pretrain/Loss": 2.0441133975982666, "Pretrain/Loss (Raw)": 2.016947031021118, "Pretrain/Step": 4056, "Pretrain/Step Time": 8.436581363901496} +{"Pretrain/Learning Rate": 4.574877982315594e-05, "Pretrain/Loss": 2.0427632331848145, "Pretrain/Loss (Raw)": 2.0432331562042236, "Pretrain/Step": 4057, "Pretrain/Step Time": 8.435359550639987} +{"Pretrain/Learning Rate": 4.574641141754805e-05, "Pretrain/Loss": 2.042574405670166, "Pretrain/Loss (Raw)": 2.0560779571533203, "Pretrain/Step": 4058, "Pretrain/Step Time": 8.438545601442456} +{"Pretrain/Learning Rate": 4.574404241373201e-05, "Pretrain/Loss": 2.0422656536102295, "Pretrain/Loss (Raw)": 1.9299674034118652, "Pretrain/Step": 4059, "Pretrain/Step Time": 8.435283089056611} +{"Pretrain/Learning Rate": 4.5741672811776136e-05, "Pretrain/Loss": 2.0413522720336914, "Pretrain/Loss (Raw)": 2.008490800857544, "Pretrain/Step": 4060, "Pretrain/Step Time": 8.436752509325743} +{"Pretrain/Learning Rate": 4.573930261174874e-05, "Pretrain/Loss": 2.040398597717285, "Pretrain/Loss (Raw)": 1.9832834005355835, "Pretrain/Step": 4061, "Pretrain/Step Time": 8.436880063265562} +{"Pretrain/Learning Rate": 4.5736931813718176e-05, "Pretrain/Loss": 2.043152332305908, "Pretrain/Loss (Raw)": 2.1701817512512207, "Pretrain/Step": 4062, "Pretrain/Step Time": 8.446779320016503} +{"Pretrain/Learning Rate": 4.5734560417752805e-05, "Pretrain/Loss": 2.0430381298065186, "Pretrain/Loss (Raw)": 2.0059194564819336, "Pretrain/Step": 4063, "Pretrain/Step Time": 8.444961156696081} +{"Pretrain/Learning Rate": 4.5732188423921e-05, "Pretrain/Loss": 2.04640531539917, "Pretrain/Loss (Raw)": 2.270659923553467, "Pretrain/Step": 4064, "Pretrain/Step Time": 8.44555776193738} +{"Pretrain/Learning Rate": 4.572981583229116e-05, "Pretrain/Loss": 2.047915458679199, "Pretrain/Loss (Raw)": 2.2455763816833496, "Pretrain/Step": 4065, "Pretrain/Step Time": 8.447598483413458} +{"Pretrain/Learning Rate": 4.5727442642931685e-05, "Pretrain/Loss": 2.0468015670776367, "Pretrain/Loss (Raw)": 2.0116889476776123, "Pretrain/Step": 4066, "Pretrain/Step Time": 8.450664639472961} +{"Pretrain/Learning Rate": 4.5725068855911024e-05, "Pretrain/Loss": 2.046708106994629, "Pretrain/Loss (Raw)": 2.046926498413086, "Pretrain/Step": 4067, "Pretrain/Step Time": 8.44684392772615} +{"Pretrain/Learning Rate": 4.57226944712976e-05, "Pretrain/Loss": 2.04719877243042, "Pretrain/Loss (Raw)": 2.052931547164917, "Pretrain/Step": 4068, "Pretrain/Step Time": 8.452086750417948} +{"Pretrain/Learning Rate": 4.57203194891599e-05, "Pretrain/Loss": 2.0467381477355957, "Pretrain/Loss (Raw)": 1.9751348495483398, "Pretrain/Step": 4069, "Pretrain/Step Time": 8.449875293299556} +{"Pretrain/Learning Rate": 4.57179439095664e-05, "Pretrain/Loss": 2.048396348953247, "Pretrain/Loss (Raw)": 2.2221131324768066, "Pretrain/Step": 4070, "Pretrain/Step Time": 8.44606576859951} +{"Pretrain/Learning Rate": 4.571556773258557e-05, "Pretrain/Loss": 2.0488975048065186, "Pretrain/Loss (Raw)": 2.098888874053955, "Pretrain/Step": 4071, "Pretrain/Step Time": 8.446060502901673} +{"Pretrain/Learning Rate": 4.571319095828597e-05, "Pretrain/Loss": 2.0511183738708496, "Pretrain/Loss (Raw)": 2.189404010772705, "Pretrain/Step": 4072, "Pretrain/Step Time": 8.444697400555015} +{"Pretrain/Learning Rate": 4.57108135867361e-05, "Pretrain/Loss": 2.0499520301818848, "Pretrain/Loss (Raw)": 1.9318451881408691, "Pretrain/Step": 4073, "Pretrain/Step Time": 8.44392367452383} +{"Pretrain/Learning Rate": 4.570843561800452e-05, "Pretrain/Loss": 2.0518276691436768, "Pretrain/Loss (Raw)": 2.0845155715942383, "Pretrain/Step": 4074, "Pretrain/Step Time": 8.444378715008497} +{"Pretrain/Learning Rate": 4.570605705215981e-05, "Pretrain/Loss": 2.054212808609009, "Pretrain/Loss (Raw)": 2.040473699569702, "Pretrain/Step": 4075, "Pretrain/Step Time": 8.45003804191947} +{"Pretrain/Learning Rate": 4.570367788927052e-05, "Pretrain/Loss": 2.0535058975219727, "Pretrain/Loss (Raw)": 1.999228835105896, "Pretrain/Step": 4076, "Pretrain/Step Time": 8.446230039000511} +{"Pretrain/Learning Rate": 4.570129812940529e-05, "Pretrain/Loss": 2.052673578262329, "Pretrain/Loss (Raw)": 1.9158929586410522, "Pretrain/Step": 4077, "Pretrain/Step Time": 8.449879275634885} +{"Pretrain/Learning Rate": 4.569891777263272e-05, "Pretrain/Loss": 2.0536625385284424, "Pretrain/Loss (Raw)": 2.252455711364746, "Pretrain/Step": 4078, "Pretrain/Step Time": 8.444660706445575} +{"Pretrain/Learning Rate": 4.569653681902144e-05, "Pretrain/Loss": 2.0531420707702637, "Pretrain/Loss (Raw)": 1.961662769317627, "Pretrain/Step": 4079, "Pretrain/Step Time": 8.444390911608934} +{"Pretrain/Learning Rate": 4.569415526864012e-05, "Pretrain/Loss": 2.0563912391662598, "Pretrain/Loss (Raw)": 2.2583673000335693, "Pretrain/Step": 4080, "Pretrain/Step Time": 8.446379728615284} +{"Pretrain/Learning Rate": 4.5691773121557415e-05, "Pretrain/Loss": 2.0593419075012207, "Pretrain/Loss (Raw)": 2.110546350479126, "Pretrain/Step": 4081, "Pretrain/Step Time": 8.445642901584506} +{"Pretrain/Learning Rate": 4.568939037784202e-05, "Pretrain/Loss": 2.056870937347412, "Pretrain/Loss (Raw)": 1.786594271659851, "Pretrain/Step": 4082, "Pretrain/Step Time": 8.444584196433425} +{"Pretrain/Learning Rate": 4.568700703756264e-05, "Pretrain/Loss": 2.054107666015625, "Pretrain/Loss (Raw)": 1.7724716663360596, "Pretrain/Step": 4083, "Pretrain/Step Time": 8.447104213759303} +{"Pretrain/Learning Rate": 4.568462310078799e-05, "Pretrain/Loss": 2.0552420616149902, "Pretrain/Loss (Raw)": 2.12601375579834, "Pretrain/Step": 4084, "Pretrain/Step Time": 8.44478869996965} +{"Pretrain/Learning Rate": 4.568223856758683e-05, "Pretrain/Loss": 2.0580520629882812, "Pretrain/Loss (Raw)": 2.3515865802764893, "Pretrain/Step": 4085, "Pretrain/Step Time": 8.44396840967238} +{"Pretrain/Learning Rate": 4.5679853438027884e-05, "Pretrain/Loss": 2.059483766555786, "Pretrain/Loss (Raw)": 2.154575824737549, "Pretrain/Step": 4086, "Pretrain/Step Time": 8.443152783438563} +{"Pretrain/Learning Rate": 4.567746771217995e-05, "Pretrain/Loss": 2.057694911956787, "Pretrain/Loss (Raw)": 1.899520993232727, "Pretrain/Step": 4087, "Pretrain/Step Time": 8.441055176779628} +{"Pretrain/Learning Rate": 4.5675081390111805e-05, "Pretrain/Loss": 2.057516098022461, "Pretrain/Loss (Raw)": 2.1256885528564453, "Pretrain/Step": 4088, "Pretrain/Step Time": 8.438096845522523} +{"Pretrain/Learning Rate": 4.567269447189228e-05, "Pretrain/Loss": 2.058128595352173, "Pretrain/Loss (Raw)": 2.122373104095459, "Pretrain/Step": 4089, "Pretrain/Step Time": 8.438501194119453} +{"Pretrain/Learning Rate": 4.5670306957590166e-05, "Pretrain/Loss": 2.054454803466797, "Pretrain/Loss (Raw)": 1.7688186168670654, "Pretrain/Step": 4090, "Pretrain/Step Time": 8.43937879614532} +{"Pretrain/Learning Rate": 4.5667918847274324e-05, "Pretrain/Loss": 2.0526344776153564, "Pretrain/Loss (Raw)": 2.004908323287964, "Pretrain/Step": 4091, "Pretrain/Step Time": 8.43962281383574} +{"Pretrain/Learning Rate": 4.566553014101361e-05, "Pretrain/Loss": 2.050956964492798, "Pretrain/Loss (Raw)": 1.924600601196289, "Pretrain/Step": 4092, "Pretrain/Step Time": 8.442078346386552} +{"Pretrain/Learning Rate": 4.566314083887692e-05, "Pretrain/Loss": 2.0485219955444336, "Pretrain/Loss (Raw)": 2.0556535720825195, "Pretrain/Step": 4093, "Pretrain/Step Time": 8.441231187433004} +{"Pretrain/Learning Rate": 4.5660750940933114e-05, "Pretrain/Loss": 2.0488946437835693, "Pretrain/Loss (Raw)": 2.14131498336792, "Pretrain/Step": 4094, "Pretrain/Step Time": 8.439831567928195} +{"Pretrain/Learning Rate": 4.565836044725112e-05, "Pretrain/Loss": 2.0520172119140625, "Pretrain/Loss (Raw)": 2.169964075088501, "Pretrain/Step": 4095, "Pretrain/Step Time": 8.439231611788273} +{"Pretrain/Learning Rate": 4.5655969357899874e-05, "Pretrain/Loss": 2.0514581203460693, "Pretrain/Loss (Raw)": 1.9846599102020264, "Pretrain/Step": 4096, "Pretrain/Step Time": 8.438032416626811} +{"Pretrain/Learning Rate": 4.565357767294831e-05, "Pretrain/Loss": 2.0520758628845215, "Pretrain/Loss (Raw)": 2.0130515098571777, "Pretrain/Step": 4097, "Pretrain/Step Time": 8.444653499871492} +{"Pretrain/Learning Rate": 4.565118539246539e-05, "Pretrain/Loss": 2.0499041080474854, "Pretrain/Loss (Raw)": 2.0786261558532715, "Pretrain/Step": 4098, "Pretrain/Step Time": 8.43927239254117} +{"Pretrain/Learning Rate": 4.56487925165201e-05, "Pretrain/Loss": 2.0507242679595947, "Pretrain/Loss (Raw)": 2.1507482528686523, "Pretrain/Step": 4099, "Pretrain/Step Time": 8.438988894224167} +{"Pretrain/Learning Rate": 4.5646399045181437e-05, "Pretrain/Loss": 2.0494472980499268, "Pretrain/Loss (Raw)": 1.9319775104522705, "Pretrain/Step": 4100, "Pretrain/Step Time": 8.441444892436266} +{"Pretrain/Learning Rate": 4.56440049785184e-05, "Pretrain/Loss": 2.0489015579223633, "Pretrain/Loss (Raw)": 2.0807526111602783, "Pretrain/Step": 4101, "Pretrain/Step Time": 8.443250816315413} +{"Pretrain/Learning Rate": 4.5641610316600046e-05, "Pretrain/Loss": 2.049191951751709, "Pretrain/Loss (Raw)": 2.1713457107543945, "Pretrain/Step": 4102, "Pretrain/Step Time": 8.44409878924489} +{"Pretrain/Learning Rate": 4.563921505949541e-05, "Pretrain/Loss": 2.0515589714050293, "Pretrain/Loss (Raw)": 2.3443498611450195, "Pretrain/Step": 4103, "Pretrain/Step Time": 8.447334334254265} +{"Pretrain/Learning Rate": 4.563681920727355e-05, "Pretrain/Loss": 2.051572799682617, "Pretrain/Loss (Raw)": 2.006639003753662, "Pretrain/Step": 4104, "Pretrain/Step Time": 8.44478939846158} +{"Pretrain/Learning Rate": 4.5634422760003556e-05, "Pretrain/Loss": 2.051271915435791, "Pretrain/Loss (Raw)": 2.1342380046844482, "Pretrain/Step": 4105, "Pretrain/Step Time": 8.44280911423266} +{"Pretrain/Learning Rate": 4.563202571775454e-05, "Pretrain/Loss": 2.052647113800049, "Pretrain/Loss (Raw)": 2.1788089275360107, "Pretrain/Step": 4106, "Pretrain/Step Time": 8.440758276730776} +{"Pretrain/Learning Rate": 4.5629628080595596e-05, "Pretrain/Loss": 2.052215814590454, "Pretrain/Loss (Raw)": 2.2030200958251953, "Pretrain/Step": 4107, "Pretrain/Step Time": 8.44760037586093} +{"Pretrain/Learning Rate": 4.562722984859587e-05, "Pretrain/Loss": 2.0530717372894287, "Pretrain/Loss (Raw)": 1.9800702333450317, "Pretrain/Step": 4108, "Pretrain/Step Time": 8.446390878409147} +{"Pretrain/Learning Rate": 4.562483102182452e-05, "Pretrain/Loss": 2.051631450653076, "Pretrain/Loss (Raw)": 2.047452449798584, "Pretrain/Step": 4109, "Pretrain/Step Time": 8.44148507155478} +{"Pretrain/Learning Rate": 4.56224316003507e-05, "Pretrain/Loss": 2.050740957260132, "Pretrain/Loss (Raw)": 2.0361247062683105, "Pretrain/Step": 4110, "Pretrain/Step Time": 8.440968239679933} +{"Pretrain/Learning Rate": 4.56200315842436e-05, "Pretrain/Loss": 2.0520405769348145, "Pretrain/Loss (Raw)": 2.2735435962677, "Pretrain/Step": 4111, "Pretrain/Step Time": 8.439345428720117} +{"Pretrain/Learning Rate": 4.5617630973572436e-05, "Pretrain/Loss": 2.0515174865722656, "Pretrain/Loss (Raw)": 1.9650561809539795, "Pretrain/Step": 4112, "Pretrain/Step Time": 8.438972059637308} +{"Pretrain/Learning Rate": 4.561522976840641e-05, "Pretrain/Loss": 2.050577163696289, "Pretrain/Loss (Raw)": 1.9465222358703613, "Pretrain/Step": 4113, "Pretrain/Step Time": 8.440398583188653} +{"Pretrain/Learning Rate": 4.561282796881476e-05, "Pretrain/Loss": 2.050262212753296, "Pretrain/Loss (Raw)": 1.9481858015060425, "Pretrain/Step": 4114, "Pretrain/Step Time": 8.436753945425153} +{"Pretrain/Learning Rate": 4.5610425574866755e-05, "Pretrain/Loss": 2.048250436782837, "Pretrain/Loss (Raw)": 1.9320343732833862, "Pretrain/Step": 4115, "Pretrain/Step Time": 8.438172243535519} +{"Pretrain/Learning Rate": 4.560802258663166e-05, "Pretrain/Loss": 2.0482213497161865, "Pretrain/Loss (Raw)": 2.0126655101776123, "Pretrain/Step": 4116, "Pretrain/Step Time": 8.441240584477782} +{"Pretrain/Learning Rate": 4.5605619004178754e-05, "Pretrain/Loss": 2.0489695072174072, "Pretrain/Loss (Raw)": 2.1038269996643066, "Pretrain/Step": 4117, "Pretrain/Step Time": 8.440121969208121} +{"Pretrain/Learning Rate": 4.5603214827577355e-05, "Pretrain/Loss": 2.0513386726379395, "Pretrain/Loss (Raw)": 2.308140993118286, "Pretrain/Step": 4118, "Pretrain/Step Time": 8.4434425663203} +{"Pretrain/Learning Rate": 4.560081005689678e-05, "Pretrain/Loss": 2.0530102252960205, "Pretrain/Loss (Raw)": 2.354036331176758, "Pretrain/Step": 4119, "Pretrain/Step Time": 8.439625792205334} +{"Pretrain/Learning Rate": 4.5598404692206375e-05, "Pretrain/Loss": 2.0556468963623047, "Pretrain/Loss (Raw)": 2.1338789463043213, "Pretrain/Step": 4120, "Pretrain/Step Time": 8.439706660807133} +{"Pretrain/Learning Rate": 4.559599873357548e-05, "Pretrain/Loss": 2.053769588470459, "Pretrain/Loss (Raw)": 1.8566279411315918, "Pretrain/Step": 4121, "Pretrain/Step Time": 8.439317481592298} +{"Pretrain/Learning Rate": 4.5593592181073494e-05, "Pretrain/Loss": 2.050154685974121, "Pretrain/Loss (Raw)": 1.6928642988204956, "Pretrain/Step": 4122, "Pretrain/Step Time": 8.443673828616738} +{"Pretrain/Learning Rate": 4.5591185034769785e-05, "Pretrain/Loss": 2.0502989292144775, "Pretrain/Loss (Raw)": 1.9658907651901245, "Pretrain/Step": 4123, "Pretrain/Step Time": 8.442914348095655} +{"Pretrain/Learning Rate": 4.558877729473378e-05, "Pretrain/Loss": 2.051966905593872, "Pretrain/Loss (Raw)": 2.0852746963500977, "Pretrain/Step": 4124, "Pretrain/Step Time": 8.443143861368299} +{"Pretrain/Learning Rate": 4.558636896103489e-05, "Pretrain/Loss": 2.05239200592041, "Pretrain/Loss (Raw)": 1.9949790239334106, "Pretrain/Step": 4125, "Pretrain/Step Time": 8.44479226320982} +{"Pretrain/Learning Rate": 4.5583960033742553e-05, "Pretrain/Loss": 2.0508036613464355, "Pretrain/Loss (Raw)": 1.598633050918579, "Pretrain/Step": 4126, "Pretrain/Step Time": 8.443547870963812} +{"Pretrain/Learning Rate": 4.558155051292625e-05, "Pretrain/Loss": 2.048144817352295, "Pretrain/Loss (Raw)": 1.9264326095581055, "Pretrain/Step": 4127, "Pretrain/Step Time": 8.445195831358433} +{"Pretrain/Learning Rate": 4.557914039865545e-05, "Pretrain/Loss": 2.046318769454956, "Pretrain/Loss (Raw)": 1.8350815773010254, "Pretrain/Step": 4128, "Pretrain/Step Time": 8.443125391378999} +{"Pretrain/Learning Rate": 4.5576729690999646e-05, "Pretrain/Loss": 2.0445404052734375, "Pretrain/Loss (Raw)": 1.9033523797988892, "Pretrain/Step": 4129, "Pretrain/Step Time": 8.44199982099235} +{"Pretrain/Learning Rate": 4.557431839002834e-05, "Pretrain/Loss": 2.042903423309326, "Pretrain/Loss (Raw)": 1.9211978912353516, "Pretrain/Step": 4130, "Pretrain/Step Time": 8.444839473813772} +{"Pretrain/Learning Rate": 4.557190649581107e-05, "Pretrain/Loss": 2.0408718585968018, "Pretrain/Loss (Raw)": 1.8219982385635376, "Pretrain/Step": 4131, "Pretrain/Step Time": 8.44535101391375} +{"Pretrain/Learning Rate": 4.556949400841737e-05, "Pretrain/Loss": 2.0402188301086426, "Pretrain/Loss (Raw)": 1.7488471269607544, "Pretrain/Step": 4132, "Pretrain/Step Time": 8.44663742557168} +{"Pretrain/Learning Rate": 4.556708092791682e-05, "Pretrain/Loss": 2.041213035583496, "Pretrain/Loss (Raw)": 2.22979474067688, "Pretrain/Step": 4133, "Pretrain/Step Time": 8.444271489977837} +{"Pretrain/Learning Rate": 4.556466725437899e-05, "Pretrain/Loss": 2.0412392616271973, "Pretrain/Loss (Raw)": 2.1027028560638428, "Pretrain/Step": 4134, "Pretrain/Step Time": 8.448083218187094} +{"Pretrain/Learning Rate": 4.556225298787348e-05, "Pretrain/Loss": 2.037954807281494, "Pretrain/Loss (Raw)": 1.734715461730957, "Pretrain/Step": 4135, "Pretrain/Step Time": 8.451289217919111} +{"Pretrain/Learning Rate": 4.555983812846989e-05, "Pretrain/Loss": 2.039719820022583, "Pretrain/Loss (Raw)": 2.2341670989990234, "Pretrain/Step": 4136, "Pretrain/Step Time": 8.45082662627101} +{"Pretrain/Learning Rate": 4.555742267623787e-05, "Pretrain/Loss": 2.0383896827697754, "Pretrain/Loss (Raw)": 1.8811672925949097, "Pretrain/Step": 4137, "Pretrain/Step Time": 8.450352935120463} +{"Pretrain/Learning Rate": 4.555500663124705e-05, "Pretrain/Loss": 2.0402157306671143, "Pretrain/Loss (Raw)": 2.0913805961608887, "Pretrain/Step": 4138, "Pretrain/Step Time": 8.450842641294003} +{"Pretrain/Learning Rate": 4.555258999356711e-05, "Pretrain/Loss": 2.04067063331604, "Pretrain/Loss (Raw)": 1.9455949068069458, "Pretrain/Step": 4139, "Pretrain/Step Time": 8.458140276372433} +{"Pretrain/Learning Rate": 4.555017276326773e-05, "Pretrain/Loss": 2.0391082763671875, "Pretrain/Loss (Raw)": 1.8773151636123657, "Pretrain/Step": 4140, "Pretrain/Step Time": 8.459180381149054} +{"Pretrain/Learning Rate": 4.55477549404186e-05, "Pretrain/Loss": 2.041132926940918, "Pretrain/Loss (Raw)": 2.2591378688812256, "Pretrain/Step": 4141, "Pretrain/Step Time": 8.457617681473494} +{"Pretrain/Learning Rate": 4.5545336525089444e-05, "Pretrain/Loss": 2.042410135269165, "Pretrain/Loss (Raw)": 2.1543266773223877, "Pretrain/Step": 4142, "Pretrain/Step Time": 8.454532204195857} +{"Pretrain/Learning Rate": 4.554291751734999e-05, "Pretrain/Loss": 2.044739007949829, "Pretrain/Loss (Raw)": 2.071167469024658, "Pretrain/Step": 4143, "Pretrain/Step Time": 8.455992937088013} +{"Pretrain/Learning Rate": 4.554049791727e-05, "Pretrain/Loss": 2.0427968502044678, "Pretrain/Loss (Raw)": 2.0701756477355957, "Pretrain/Step": 4144, "Pretrain/Step Time": 8.454621691256762} +{"Pretrain/Learning Rate": 4.553807772491922e-05, "Pretrain/Loss": 2.042349100112915, "Pretrain/Loss (Raw)": 1.9764573574066162, "Pretrain/Step": 4145, "Pretrain/Step Time": 8.4567346945405} +{"Pretrain/Learning Rate": 4.553565694036745e-05, "Pretrain/Loss": 2.041417121887207, "Pretrain/Loss (Raw)": 2.0015528202056885, "Pretrain/Step": 4146, "Pretrain/Step Time": 8.454924419522285} +{"Pretrain/Learning Rate": 4.55332355636845e-05, "Pretrain/Loss": 2.0408310890197754, "Pretrain/Loss (Raw)": 2.068882703781128, "Pretrain/Step": 4147, "Pretrain/Step Time": 8.452582228928804} +{"Pretrain/Learning Rate": 4.5530813594940164e-05, "Pretrain/Loss": 2.0420963764190674, "Pretrain/Loss (Raw)": 2.06528639793396, "Pretrain/Step": 4148, "Pretrain/Step Time": 8.453522393479943} +{"Pretrain/Learning Rate": 4.55283910342043e-05, "Pretrain/Loss": 2.041543960571289, "Pretrain/Loss (Raw)": 1.9766650199890137, "Pretrain/Step": 4149, "Pretrain/Step Time": 8.451602704823017} +{"Pretrain/Learning Rate": 4.552596788154675e-05, "Pretrain/Loss": 2.0394704341888428, "Pretrain/Loss (Raw)": 2.0183897018432617, "Pretrain/Step": 4150, "Pretrain/Step Time": 8.450321651995182} +{"Pretrain/Learning Rate": 4.552354413703738e-05, "Pretrain/Loss": 2.037898540496826, "Pretrain/Loss (Raw)": 1.8744419813156128, "Pretrain/Step": 4151, "Pretrain/Step Time": 8.455109955742955} +{"Pretrain/Learning Rate": 4.552111980074609e-05, "Pretrain/Loss": 2.0365867614746094, "Pretrain/Loss (Raw)": 2.0139236450195312, "Pretrain/Step": 4152, "Pretrain/Step Time": 8.45662914775312} +{"Pretrain/Learning Rate": 4.5518694872742774e-05, "Pretrain/Loss": 2.0398945808410645, "Pretrain/Loss (Raw)": 2.3850693702697754, "Pretrain/Step": 4153, "Pretrain/Step Time": 8.452847564592957} +{"Pretrain/Learning Rate": 4.551626935309736e-05, "Pretrain/Loss": 2.041199207305908, "Pretrain/Loss (Raw)": 2.193991184234619, "Pretrain/Step": 4154, "Pretrain/Step Time": 8.455532521009445} +{"Pretrain/Learning Rate": 4.5513843241879774e-05, "Pretrain/Loss": 2.0401971340179443, "Pretrain/Loss (Raw)": 2.055156946182251, "Pretrain/Step": 4155, "Pretrain/Step Time": 8.457005130127072} +{"Pretrain/Learning Rate": 4.551141653915999e-05, "Pretrain/Loss": 2.039717674255371, "Pretrain/Loss (Raw)": 2.031675100326538, "Pretrain/Step": 4156, "Pretrain/Step Time": 8.456781767308712} +{"Pretrain/Learning Rate": 4.550898924500796e-05, "Pretrain/Loss": 2.0368192195892334, "Pretrain/Loss (Raw)": 1.7220346927642822, "Pretrain/Step": 4157, "Pretrain/Step Time": 8.459233654662967} +{"Pretrain/Learning Rate": 4.550656135949369e-05, "Pretrain/Loss": 2.0356760025024414, "Pretrain/Loss (Raw)": 1.8785792589187622, "Pretrain/Step": 4158, "Pretrain/Step Time": 8.45801018923521} +{"Pretrain/Learning Rate": 4.550413288268717e-05, "Pretrain/Loss": 2.0354254245758057, "Pretrain/Loss (Raw)": 2.085411310195923, "Pretrain/Step": 4159, "Pretrain/Step Time": 8.45650938525796} +{"Pretrain/Learning Rate": 4.550170381465845e-05, "Pretrain/Loss": 2.0403146743774414, "Pretrain/Loss (Raw)": 2.779209852218628, "Pretrain/Step": 4160, "Pretrain/Step Time": 8.458763422444463} +{"Pretrain/Learning Rate": 4.5499274155477535e-05, "Pretrain/Loss": 2.038572072982788, "Pretrain/Loss (Raw)": 1.950703740119934, "Pretrain/Step": 4161, "Pretrain/Step Time": 8.46016493998468} +{"Pretrain/Learning Rate": 4.549684390521451e-05, "Pretrain/Loss": 2.0372138023376465, "Pretrain/Loss (Raw)": 2.029527425765991, "Pretrain/Step": 4162, "Pretrain/Step Time": 8.450707944110036} +{"Pretrain/Learning Rate": 4.549441306393943e-05, "Pretrain/Loss": 2.0371761322021484, "Pretrain/Loss (Raw)": 2.0702109336853027, "Pretrain/Step": 4163, "Pretrain/Step Time": 8.459749391302466} +{"Pretrain/Learning Rate": 4.5491981631722416e-05, "Pretrain/Loss": 2.036026954650879, "Pretrain/Loss (Raw)": 1.8788774013519287, "Pretrain/Step": 4164, "Pretrain/Step Time": 8.45186467282474} +{"Pretrain/Learning Rate": 4.548954960863354e-05, "Pretrain/Loss": 2.0356369018554688, "Pretrain/Loss (Raw)": 2.081561326980591, "Pretrain/Step": 4165, "Pretrain/Step Time": 8.4531220626086} +{"Pretrain/Learning Rate": 4.5487116994742954e-05, "Pretrain/Loss": 2.0372514724731445, "Pretrain/Loss (Raw)": 2.150334119796753, "Pretrain/Step": 4166, "Pretrain/Step Time": 8.456078903749585} +{"Pretrain/Learning Rate": 4.54846837901208e-05, "Pretrain/Loss": 2.036794662475586, "Pretrain/Loss (Raw)": 1.949477195739746, "Pretrain/Step": 4167, "Pretrain/Step Time": 8.455712409690022} +{"Pretrain/Learning Rate": 4.548224999483721e-05, "Pretrain/Loss": 2.0356125831604004, "Pretrain/Loss (Raw)": 1.942903757095337, "Pretrain/Step": 4168, "Pretrain/Step Time": 8.456887766718864} +{"Pretrain/Learning Rate": 4.5479815608962397e-05, "Pretrain/Loss": 2.037433624267578, "Pretrain/Loss (Raw)": 1.9563758373260498, "Pretrain/Step": 4169, "Pretrain/Step Time": 8.459493132308125} +{"Pretrain/Learning Rate": 4.547738063256653e-05, "Pretrain/Loss": 2.0373640060424805, "Pretrain/Loss (Raw)": 2.2170958518981934, "Pretrain/Step": 4170, "Pretrain/Step Time": 8.45565003529191} +{"Pretrain/Learning Rate": 4.5474945065719826e-05, "Pretrain/Loss": 2.0384600162506104, "Pretrain/Loss (Raw)": 1.958426594734192, "Pretrain/Step": 4171, "Pretrain/Step Time": 8.461044946685433} +{"Pretrain/Learning Rate": 4.547250890849252e-05, "Pretrain/Loss": 2.038501739501953, "Pretrain/Loss (Raw)": 1.890016794204712, "Pretrain/Step": 4172, "Pretrain/Step Time": 8.462381979450583} +{"Pretrain/Learning Rate": 4.547007216095485e-05, "Pretrain/Loss": 2.0407373905181885, "Pretrain/Loss (Raw)": 2.2303225994110107, "Pretrain/Step": 4173, "Pretrain/Step Time": 8.457691116258502} +{"Pretrain/Learning Rate": 4.546763482317708e-05, "Pretrain/Loss": 2.0393691062927246, "Pretrain/Loss (Raw)": 1.886080026626587, "Pretrain/Step": 4174, "Pretrain/Step Time": 8.460969058796763} +{"Pretrain/Learning Rate": 4.546519689522949e-05, "Pretrain/Loss": 2.041550397872925, "Pretrain/Loss (Raw)": 1.9018068313598633, "Pretrain/Step": 4175, "Pretrain/Step Time": 8.459725003689528} +{"Pretrain/Learning Rate": 4.546275837718237e-05, "Pretrain/Loss": 2.041938543319702, "Pretrain/Loss (Raw)": 2.1108689308166504, "Pretrain/Step": 4176, "Pretrain/Step Time": 8.460112858563662} +{"Pretrain/Learning Rate": 4.546031926910604e-05, "Pretrain/Loss": 2.0421478748321533, "Pretrain/Loss (Raw)": 2.1969714164733887, "Pretrain/Step": 4177, "Pretrain/Step Time": 8.464150428771973} +{"Pretrain/Learning Rate": 4.545787957107083e-05, "Pretrain/Loss": 2.040360450744629, "Pretrain/Loss (Raw)": 1.8199546337127686, "Pretrain/Step": 4178, "Pretrain/Step Time": 8.463594822213054} +{"Pretrain/Learning Rate": 4.545543928314708e-05, "Pretrain/Loss": 2.039966344833374, "Pretrain/Loss (Raw)": 2.09403657913208, "Pretrain/Step": 4179, "Pretrain/Step Time": 8.466524127870798} +{"Pretrain/Learning Rate": 4.545299840540517e-05, "Pretrain/Loss": 2.040511131286621, "Pretrain/Loss (Raw)": 2.0466179847717285, "Pretrain/Step": 4180, "Pretrain/Step Time": 8.465335428714752} +{"Pretrain/Learning Rate": 4.545055693791546e-05, "Pretrain/Loss": 2.0391154289245605, "Pretrain/Loss (Raw)": 1.9429931640625, "Pretrain/Step": 4181, "Pretrain/Step Time": 8.464557632803917} +{"Pretrain/Learning Rate": 4.544811488074835e-05, "Pretrain/Loss": 2.03944730758667, "Pretrain/Loss (Raw)": 2.159935474395752, "Pretrain/Step": 4182, "Pretrain/Step Time": 8.462520491331816} +{"Pretrain/Learning Rate": 4.544567223397427e-05, "Pretrain/Loss": 2.041686773300171, "Pretrain/Loss (Raw)": 2.1350152492523193, "Pretrain/Step": 4183, "Pretrain/Step Time": 8.46247156150639} +{"Pretrain/Learning Rate": 4.5443228997663644e-05, "Pretrain/Loss": 2.043221950531006, "Pretrain/Loss (Raw)": 2.213463306427002, "Pretrain/Step": 4184, "Pretrain/Step Time": 8.463632073253393} +{"Pretrain/Learning Rate": 4.5440785171886925e-05, "Pretrain/Loss": 2.0426597595214844, "Pretrain/Loss (Raw)": 1.9712342023849487, "Pretrain/Step": 4185, "Pretrain/Step Time": 8.466924959793687} +{"Pretrain/Learning Rate": 4.543834075671457e-05, "Pretrain/Loss": 2.043576240539551, "Pretrain/Loss (Raw)": 2.1733956336975098, "Pretrain/Step": 4186, "Pretrain/Step Time": 8.465511025860906} +{"Pretrain/Learning Rate": 4.543589575221707e-05, "Pretrain/Loss": 2.04295015335083, "Pretrain/Loss (Raw)": 1.8498303890228271, "Pretrain/Step": 4187, "Pretrain/Step Time": 8.464701984077692} +{"Pretrain/Learning Rate": 4.5433450158464924e-05, "Pretrain/Loss": 2.044137477874756, "Pretrain/Loss (Raw)": 2.1605029106140137, "Pretrain/Step": 4188, "Pretrain/Step Time": 8.468313701450825} +{"Pretrain/Learning Rate": 4.543100397552864e-05, "Pretrain/Loss": 2.044342041015625, "Pretrain/Loss (Raw)": 2.0094220638275146, "Pretrain/Step": 4189, "Pretrain/Step Time": 8.468753222376108} +{"Pretrain/Learning Rate": 4.542855720347877e-05, "Pretrain/Loss": 2.0427446365356445, "Pretrain/Loss (Raw)": 1.9657410383224487, "Pretrain/Step": 4190, "Pretrain/Step Time": 8.463493213057518} +{"Pretrain/Learning Rate": 4.542610984238585e-05, "Pretrain/Loss": 2.0414297580718994, "Pretrain/Loss (Raw)": 1.8376011848449707, "Pretrain/Step": 4191, "Pretrain/Step Time": 8.467074362561107} +{"Pretrain/Learning Rate": 4.542366189232045e-05, "Pretrain/Loss": 2.04007625579834, "Pretrain/Loss (Raw)": 2.0974011421203613, "Pretrain/Step": 4192, "Pretrain/Step Time": 8.461495840921998} +{"Pretrain/Learning Rate": 4.542121335335315e-05, "Pretrain/Loss": 2.0386078357696533, "Pretrain/Loss (Raw)": 2.0576345920562744, "Pretrain/Step": 4193, "Pretrain/Step Time": 8.458996411412954} +{"Pretrain/Learning Rate": 4.5418764225554575e-05, "Pretrain/Loss": 2.037114143371582, "Pretrain/Loss (Raw)": 1.8204883337020874, "Pretrain/Step": 4194, "Pretrain/Step Time": 8.462833158671856} +{"Pretrain/Learning Rate": 4.541631450899532e-05, "Pretrain/Loss": 2.038001537322998, "Pretrain/Loss (Raw)": 2.1605286598205566, "Pretrain/Step": 4195, "Pretrain/Step Time": 8.463462464511395} +{"Pretrain/Learning Rate": 4.541386420374603e-05, "Pretrain/Loss": 2.036832332611084, "Pretrain/Loss (Raw)": 1.9032784700393677, "Pretrain/Step": 4196, "Pretrain/Step Time": 8.459967376664281} +{"Pretrain/Learning Rate": 4.541141330987735e-05, "Pretrain/Loss": 2.038564920425415, "Pretrain/Loss (Raw)": 2.1968846321105957, "Pretrain/Step": 4197, "Pretrain/Step Time": 8.459709487855434} +{"Pretrain/Learning Rate": 4.540896182745996e-05, "Pretrain/Loss": 2.0356764793395996, "Pretrain/Loss (Raw)": 1.8524070978164673, "Pretrain/Step": 4198, "Pretrain/Step Time": 8.459188202396035} +{"Pretrain/Learning Rate": 4.5406509756564554e-05, "Pretrain/Loss": 2.034195899963379, "Pretrain/Loss (Raw)": 1.9093576669692993, "Pretrain/Step": 4199, "Pretrain/Step Time": 8.463662752881646} +{"Pretrain/Learning Rate": 4.540405709726181e-05, "Pretrain/Loss": 2.031771659851074, "Pretrain/Loss (Raw)": 1.8791277408599854, "Pretrain/Step": 4200, "Pretrain/Step Time": 8.465014159679413} +{"Pretrain/Learning Rate": 4.5401603849622467e-05, "Pretrain/Loss": 2.032285690307617, "Pretrain/Loss (Raw)": 1.9976259469985962, "Pretrain/Step": 4201, "Pretrain/Step Time": 8.465720338746905} +{"Pretrain/Learning Rate": 4.5399150013717265e-05, "Pretrain/Loss": 2.032788038253784, "Pretrain/Loss (Raw)": 2.148815870285034, "Pretrain/Step": 4202, "Pretrain/Step Time": 8.465770963579416} +{"Pretrain/Learning Rate": 4.539669558961694e-05, "Pretrain/Loss": 2.034511089324951, "Pretrain/Loss (Raw)": 2.261012315750122, "Pretrain/Step": 4203, "Pretrain/Step Time": 8.46328697539866} +{"Pretrain/Learning Rate": 4.539424057739229e-05, "Pretrain/Loss": 2.0333304405212402, "Pretrain/Loss (Raw)": 1.8481416702270508, "Pretrain/Step": 4204, "Pretrain/Step Time": 8.462962625548244} +{"Pretrain/Learning Rate": 4.5391784977114085e-05, "Pretrain/Loss": 2.0347766876220703, "Pretrain/Loss (Raw)": 2.100983142852783, "Pretrain/Step": 4205, "Pretrain/Step Time": 8.467996692284942} +{"Pretrain/Learning Rate": 4.538932878885313e-05, "Pretrain/Loss": 2.0347206592559814, "Pretrain/Loss (Raw)": 2.2452821731567383, "Pretrain/Step": 4206, "Pretrain/Step Time": 8.469998631626368} +{"Pretrain/Learning Rate": 4.538687201268027e-05, "Pretrain/Loss": 2.0355331897735596, "Pretrain/Loss (Raw)": 2.065642833709717, "Pretrain/Step": 4207, "Pretrain/Step Time": 8.46627219952643} +{"Pretrain/Learning Rate": 4.5384414648666305e-05, "Pretrain/Loss": 2.0331106185913086, "Pretrain/Loss (Raw)": 1.9483191967010498, "Pretrain/Step": 4208, "Pretrain/Step Time": 8.470128593966365} +{"Pretrain/Learning Rate": 4.538195669688213e-05, "Pretrain/Loss": 2.0324549674987793, "Pretrain/Loss (Raw)": 2.0266151428222656, "Pretrain/Step": 4209, "Pretrain/Step Time": 8.471755381673574} +{"Pretrain/Learning Rate": 4.537949815739859e-05, "Pretrain/Loss": 2.0375897884368896, "Pretrain/Loss (Raw)": 2.4438371658325195, "Pretrain/Step": 4210, "Pretrain/Step Time": 8.475622206926346} +{"Pretrain/Learning Rate": 4.5377039030286594e-05, "Pretrain/Loss": 2.040548801422119, "Pretrain/Loss (Raw)": 2.1512327194213867, "Pretrain/Step": 4211, "Pretrain/Step Time": 8.48118306323886} +{"Pretrain/Learning Rate": 4.5374579315617046e-05, "Pretrain/Loss": 2.039681911468506, "Pretrain/Loss (Raw)": 2.0150721073150635, "Pretrain/Step": 4212, "Pretrain/Step Time": 8.48025557026267} +{"Pretrain/Learning Rate": 4.537211901346086e-05, "Pretrain/Loss": 2.0364675521850586, "Pretrain/Loss (Raw)": 1.9401178359985352, "Pretrain/Step": 4213, "Pretrain/Step Time": 8.477163404226303} +{"Pretrain/Learning Rate": 4.536965812388899e-05, "Pretrain/Loss": 2.034236431121826, "Pretrain/Loss (Raw)": 1.8689998388290405, "Pretrain/Step": 4214, "Pretrain/Step Time": 8.477402513846755} +{"Pretrain/Learning Rate": 4.536719664697238e-05, "Pretrain/Loss": 2.035832166671753, "Pretrain/Loss (Raw)": 2.1037755012512207, "Pretrain/Step": 4215, "Pretrain/Step Time": 8.478926675394177} +{"Pretrain/Learning Rate": 4.536473458278202e-05, "Pretrain/Loss": 2.0356791019439697, "Pretrain/Loss (Raw)": 2.1060969829559326, "Pretrain/Step": 4216, "Pretrain/Step Time": 8.485111344605684} +{"Pretrain/Learning Rate": 4.536227193138889e-05, "Pretrain/Loss": 2.0354480743408203, "Pretrain/Loss (Raw)": 2.092791795730591, "Pretrain/Step": 4217, "Pretrain/Step Time": 8.481047756969929} +{"Pretrain/Learning Rate": 4.5359808692864e-05, "Pretrain/Loss": 2.0368285179138184, "Pretrain/Loss (Raw)": 1.9455132484436035, "Pretrain/Step": 4218, "Pretrain/Step Time": 8.482106296345592} +{"Pretrain/Learning Rate": 4.5357344867278384e-05, "Pretrain/Loss": 2.037397861480713, "Pretrain/Loss (Raw)": 2.0778021812438965, "Pretrain/Step": 4219, "Pretrain/Step Time": 8.482927216216922} +{"Pretrain/Learning Rate": 4.535488045470309e-05, "Pretrain/Loss": 2.037773609161377, "Pretrain/Loss (Raw)": 1.972699761390686, "Pretrain/Step": 4220, "Pretrain/Step Time": 8.481756178662181} +{"Pretrain/Learning Rate": 4.535241545520915e-05, "Pretrain/Loss": 2.0343871116638184, "Pretrain/Loss (Raw)": 1.622140884399414, "Pretrain/Step": 4221, "Pretrain/Step Time": 8.48100115917623} +{"Pretrain/Learning Rate": 4.5349949868867666e-05, "Pretrain/Loss": 2.03195858001709, "Pretrain/Loss (Raw)": 1.8304815292358398, "Pretrain/Step": 4222, "Pretrain/Step Time": 8.480783931910992} +{"Pretrain/Learning Rate": 4.534748369574972e-05, "Pretrain/Loss": 2.031581163406372, "Pretrain/Loss (Raw)": 2.1216611862182617, "Pretrain/Step": 4223, "Pretrain/Step Time": 8.47994221560657} +{"Pretrain/Learning Rate": 4.534501693592642e-05, "Pretrain/Loss": 2.0315208435058594, "Pretrain/Loss (Raw)": 1.9769330024719238, "Pretrain/Step": 4224, "Pretrain/Step Time": 8.476992379873991} +{"Pretrain/Learning Rate": 4.534254958946891e-05, "Pretrain/Loss": 2.032278060913086, "Pretrain/Loss (Raw)": 2.1099987030029297, "Pretrain/Step": 4225, "Pretrain/Step Time": 8.477497087791562} +{"Pretrain/Learning Rate": 4.5340081656448316e-05, "Pretrain/Loss": 2.0322420597076416, "Pretrain/Loss (Raw)": 2.073990821838379, "Pretrain/Step": 4226, "Pretrain/Step Time": 8.480678582563996} +{"Pretrain/Learning Rate": 4.533761313693582e-05, "Pretrain/Loss": 2.0306413173675537, "Pretrain/Loss (Raw)": 1.9458744525909424, "Pretrain/Step": 4227, "Pretrain/Step Time": 8.483306307345629} +{"Pretrain/Learning Rate": 4.533514403100258e-05, "Pretrain/Loss": 2.0316076278686523, "Pretrain/Loss (Raw)": 2.0556857585906982, "Pretrain/Step": 4228, "Pretrain/Step Time": 8.480831352993846} +{"Pretrain/Learning Rate": 4.5332674338719784e-05, "Pretrain/Loss": 2.0305728912353516, "Pretrain/Loss (Raw)": 1.94826340675354, "Pretrain/Step": 4229, "Pretrain/Step Time": 8.4802356492728} +{"Pretrain/Learning Rate": 4.5330204060158665e-05, "Pretrain/Loss": 2.030441999435425, "Pretrain/Loss (Raw)": 2.1546168327331543, "Pretrain/Step": 4230, "Pretrain/Step Time": 8.478083107620478} +{"Pretrain/Learning Rate": 4.532773319539045e-05, "Pretrain/Loss": 2.0283026695251465, "Pretrain/Loss (Raw)": 2.0705058574676514, "Pretrain/Step": 4231, "Pretrain/Step Time": 8.474149338901043} +{"Pretrain/Learning Rate": 4.5325261744486366e-05, "Pretrain/Loss": 2.028632402420044, "Pretrain/Loss (Raw)": 2.0488407611846924, "Pretrain/Step": 4232, "Pretrain/Step Time": 8.473294768482447} +{"Pretrain/Learning Rate": 4.53227897075177e-05, "Pretrain/Loss": 2.0280580520629883, "Pretrain/Loss (Raw)": 2.06074595451355, "Pretrain/Step": 4233, "Pretrain/Step Time": 8.484023842960596} +{"Pretrain/Learning Rate": 4.5320317084555715e-05, "Pretrain/Loss": 2.0276739597320557, "Pretrain/Loss (Raw)": 2.129624128341675, "Pretrain/Step": 4234, "Pretrain/Step Time": 8.480447700247169} +{"Pretrain/Learning Rate": 4.5317843875671706e-05, "Pretrain/Loss": 2.0262227058410645, "Pretrain/Loss (Raw)": 2.017272710800171, "Pretrain/Step": 4235, "Pretrain/Step Time": 8.478612566366792} +{"Pretrain/Learning Rate": 4.5315370080937e-05, "Pretrain/Loss": 2.02712082862854, "Pretrain/Loss (Raw)": 2.095024824142456, "Pretrain/Step": 4236, "Pretrain/Step Time": 8.477532969787717} +{"Pretrain/Learning Rate": 4.531289570042292e-05, "Pretrain/Loss": 2.0274956226348877, "Pretrain/Loss (Raw)": 2.0954084396362305, "Pretrain/Step": 4237, "Pretrain/Step Time": 8.479110965505242} +{"Pretrain/Learning Rate": 4.531042073420081e-05, "Pretrain/Loss": 2.0286548137664795, "Pretrain/Loss (Raw)": 2.1845130920410156, "Pretrain/Step": 4238, "Pretrain/Step Time": 8.479144860059023} +{"Pretrain/Learning Rate": 4.530794518234203e-05, "Pretrain/Loss": 2.028033494949341, "Pretrain/Loss (Raw)": 2.1940248012542725, "Pretrain/Step": 4239, "Pretrain/Step Time": 8.476971535012126} +{"Pretrain/Learning Rate": 4.530546904491797e-05, "Pretrain/Loss": 2.028843879699707, "Pretrain/Loss (Raw)": 2.068772077560425, "Pretrain/Step": 4240, "Pretrain/Step Time": 8.478885618969798} +{"Pretrain/Learning Rate": 4.530299232200002e-05, "Pretrain/Loss": 2.0306081771850586, "Pretrain/Loss (Raw)": 2.172362804412842, "Pretrain/Step": 4241, "Pretrain/Step Time": 8.47764396853745} +{"Pretrain/Learning Rate": 4.530051501365962e-05, "Pretrain/Loss": 2.0316381454467773, "Pretrain/Loss (Raw)": 2.0800108909606934, "Pretrain/Step": 4242, "Pretrain/Step Time": 8.48001030832529} +{"Pretrain/Learning Rate": 4.529803711996816e-05, "Pretrain/Loss": 2.0325491428375244, "Pretrain/Loss (Raw)": 2.0486533641815186, "Pretrain/Step": 4243, "Pretrain/Step Time": 8.475238198414445} +{"Pretrain/Learning Rate": 4.5295558640997115e-05, "Pretrain/Loss": 2.0329365730285645, "Pretrain/Loss (Raw)": 2.0622482299804688, "Pretrain/Step": 4244, "Pretrain/Step Time": 8.476560102775693} +{"Pretrain/Learning Rate": 4.529307957681794e-05, "Pretrain/Loss": 2.0310497283935547, "Pretrain/Loss (Raw)": 1.8623147010803223, "Pretrain/Step": 4245, "Pretrain/Step Time": 8.47097629122436} +{"Pretrain/Learning Rate": 4.529059992750213e-05, "Pretrain/Loss": 2.0295066833496094, "Pretrain/Loss (Raw)": 2.1106338500976562, "Pretrain/Step": 4246, "Pretrain/Step Time": 8.472419504076242} +{"Pretrain/Learning Rate": 4.528811969312117e-05, "Pretrain/Loss": 2.0273141860961914, "Pretrain/Loss (Raw)": 2.073380708694458, "Pretrain/Step": 4247, "Pretrain/Step Time": 8.47306015715003} +{"Pretrain/Learning Rate": 4.528563887374658e-05, "Pretrain/Loss": 2.025855302810669, "Pretrain/Loss (Raw)": 1.9471513032913208, "Pretrain/Step": 4248, "Pretrain/Step Time": 8.473040724173188} +{"Pretrain/Learning Rate": 4.528315746944989e-05, "Pretrain/Loss": 2.026787281036377, "Pretrain/Loss (Raw)": 1.9759008884429932, "Pretrain/Step": 4249, "Pretrain/Step Time": 8.469673652201891} +{"Pretrain/Learning Rate": 4.528067548030266e-05, "Pretrain/Loss": 2.0283701419830322, "Pretrain/Loss (Raw)": 1.8954771757125854, "Pretrain/Step": 4250, "Pretrain/Step Time": 8.471139373257756} +{"Pretrain/Learning Rate": 4.527819290637644e-05, "Pretrain/Loss": 2.029041290283203, "Pretrain/Loss (Raw)": 2.051832437515259, "Pretrain/Step": 4251, "Pretrain/Step Time": 8.472988059744239} +{"Pretrain/Learning Rate": 4.527570974774283e-05, "Pretrain/Loss": 2.0288805961608887, "Pretrain/Loss (Raw)": 2.0646812915802, "Pretrain/Step": 4252, "Pretrain/Step Time": 8.470175167545676} +{"Pretrain/Learning Rate": 4.527322600447342e-05, "Pretrain/Loss": 2.0311028957366943, "Pretrain/Loss (Raw)": 2.279442071914673, "Pretrain/Step": 4253, "Pretrain/Step Time": 8.47246577590704} +{"Pretrain/Learning Rate": 4.527074167663984e-05, "Pretrain/Loss": 2.0353596210479736, "Pretrain/Loss (Raw)": 2.1435017585754395, "Pretrain/Step": 4254, "Pretrain/Step Time": 8.46838690713048} +{"Pretrain/Learning Rate": 4.5268256764313696e-05, "Pretrain/Loss": 2.0369088649749756, "Pretrain/Loss (Raw)": 2.1247341632843018, "Pretrain/Step": 4255, "Pretrain/Step Time": 8.474070753902197} +{"Pretrain/Learning Rate": 4.526577126756667e-05, "Pretrain/Loss": 2.0392110347747803, "Pretrain/Loss (Raw)": 2.129757881164551, "Pretrain/Step": 4256, "Pretrain/Step Time": 8.473415615037084} +{"Pretrain/Learning Rate": 4.526328518647042e-05, "Pretrain/Loss": 2.0393784046173096, "Pretrain/Loss (Raw)": 1.9247758388519287, "Pretrain/Step": 4257, "Pretrain/Step Time": 8.47275180183351} +{"Pretrain/Learning Rate": 4.5260798521096614e-05, "Pretrain/Loss": 2.039875030517578, "Pretrain/Loss (Raw)": 1.9847534894943237, "Pretrain/Step": 4258, "Pretrain/Step Time": 8.467536557465792} +{"Pretrain/Learning Rate": 4.525831127151697e-05, "Pretrain/Loss": 2.0418529510498047, "Pretrain/Loss (Raw)": 2.0751895904541016, "Pretrain/Step": 4259, "Pretrain/Step Time": 8.4717584438622} +{"Pretrain/Learning Rate": 4.52558234378032e-05, "Pretrain/Loss": 2.045060873031616, "Pretrain/Loss (Raw)": 2.159430503845215, "Pretrain/Step": 4260, "Pretrain/Step Time": 8.47234209626913} +{"Pretrain/Learning Rate": 4.525333502002704e-05, "Pretrain/Loss": 2.042398452758789, "Pretrain/Loss (Raw)": 1.8890180587768555, "Pretrain/Step": 4261, "Pretrain/Step Time": 8.475709395483136} +{"Pretrain/Learning Rate": 4.5250846018260244e-05, "Pretrain/Loss": 2.043440341949463, "Pretrain/Loss (Raw)": 2.236070394515991, "Pretrain/Step": 4262, "Pretrain/Step Time": 8.47369067557156} +{"Pretrain/Learning Rate": 4.524835643257458e-05, "Pretrain/Loss": 2.045012950897217, "Pretrain/Loss (Raw)": 1.935996174812317, "Pretrain/Step": 4263, "Pretrain/Step Time": 8.467611907050014} +{"Pretrain/Learning Rate": 4.524586626304183e-05, "Pretrain/Loss": 2.0419936180114746, "Pretrain/Loss (Raw)": 1.8477154970169067, "Pretrain/Step": 4264, "Pretrain/Step Time": 8.466608701273799} +{"Pretrain/Learning Rate": 4.52433755097338e-05, "Pretrain/Loss": 2.042025327682495, "Pretrain/Loss (Raw)": 1.8852180242538452, "Pretrain/Step": 4265, "Pretrain/Step Time": 8.46804704144597} +{"Pretrain/Learning Rate": 4.524088417272231e-05, "Pretrain/Loss": 2.0406079292297363, "Pretrain/Loss (Raw)": 1.909940481185913, "Pretrain/Step": 4266, "Pretrain/Step Time": 8.468067485839128} +{"Pretrain/Learning Rate": 4.5238392252079196e-05, "Pretrain/Loss": 2.0438289642333984, "Pretrain/Loss (Raw)": 2.357896327972412, "Pretrain/Step": 4267, "Pretrain/Step Time": 8.463802114129066} +{"Pretrain/Learning Rate": 4.5235899747876305e-05, "Pretrain/Loss": 2.0446953773498535, "Pretrain/Loss (Raw)": 1.9882014989852905, "Pretrain/Step": 4268, "Pretrain/Step Time": 8.46420368552208} +{"Pretrain/Learning Rate": 4.5233406660185505e-05, "Pretrain/Loss": 2.0435714721679688, "Pretrain/Loss (Raw)": 2.115285634994507, "Pretrain/Step": 4269, "Pretrain/Step Time": 8.465082220733166} +{"Pretrain/Learning Rate": 4.523091298907869e-05, "Pretrain/Loss": 2.044041872024536, "Pretrain/Loss (Raw)": 2.2145612239837646, "Pretrain/Step": 4270, "Pretrain/Step Time": 8.469475708901882} +{"Pretrain/Learning Rate": 4.522841873462776e-05, "Pretrain/Loss": 2.04499888420105, "Pretrain/Loss (Raw)": 2.193650722503662, "Pretrain/Step": 4271, "Pretrain/Step Time": 8.465489473193884} +{"Pretrain/Learning Rate": 4.522592389690464e-05, "Pretrain/Loss": 2.0456981658935547, "Pretrain/Loss (Raw)": 2.159695863723755, "Pretrain/Step": 4272, "Pretrain/Step Time": 8.468825725838542} +{"Pretrain/Learning Rate": 4.522342847598127e-05, "Pretrain/Loss": 2.0469555854797363, "Pretrain/Loss (Raw)": 2.1374049186706543, "Pretrain/Step": 4273, "Pretrain/Step Time": 8.467851744964719} +{"Pretrain/Learning Rate": 4.522093247192959e-05, "Pretrain/Loss": 2.047268867492676, "Pretrain/Loss (Raw)": 2.0416476726531982, "Pretrain/Step": 4274, "Pretrain/Step Time": 8.462421126663685} +{"Pretrain/Learning Rate": 4.521843588482157e-05, "Pretrain/Loss": 2.0454280376434326, "Pretrain/Loss (Raw)": 1.8332613706588745, "Pretrain/Step": 4275, "Pretrain/Step Time": 8.461948931217194} +{"Pretrain/Learning Rate": 4.521593871472921e-05, "Pretrain/Loss": 2.0475616455078125, "Pretrain/Loss (Raw)": 2.3383703231811523, "Pretrain/Step": 4276, "Pretrain/Step Time": 8.461273241788149} +{"Pretrain/Learning Rate": 4.521344096172451e-05, "Pretrain/Loss": 2.0481033325195312, "Pretrain/Loss (Raw)": 2.0460364818573, "Pretrain/Step": 4277, "Pretrain/Step Time": 8.46324985101819} +{"Pretrain/Learning Rate": 4.521094262587948e-05, "Pretrain/Loss": 2.0473132133483887, "Pretrain/Loss (Raw)": 1.9172372817993164, "Pretrain/Step": 4278, "Pretrain/Step Time": 8.463984915986657} +{"Pretrain/Learning Rate": 4.520844370726618e-05, "Pretrain/Loss": 2.0482966899871826, "Pretrain/Loss (Raw)": 2.0003087520599365, "Pretrain/Step": 4279, "Pretrain/Step Time": 8.460055029019713} +{"Pretrain/Learning Rate": 4.520594420595664e-05, "Pretrain/Loss": 2.046966791152954, "Pretrain/Loss (Raw)": 1.8437108993530273, "Pretrain/Step": 4280, "Pretrain/Step Time": 8.459578773006797} +{"Pretrain/Learning Rate": 4.520344412202295e-05, "Pretrain/Loss": 2.044398069381714, "Pretrain/Loss (Raw)": 2.0562710762023926, "Pretrain/Step": 4281, "Pretrain/Step Time": 8.457471922039986} +{"Pretrain/Learning Rate": 4.520094345553719e-05, "Pretrain/Loss": 2.0421299934387207, "Pretrain/Loss (Raw)": 1.9036686420440674, "Pretrain/Step": 4282, "Pretrain/Step Time": 8.457523237913847} +{"Pretrain/Learning Rate": 4.5198442206571474e-05, "Pretrain/Loss": 2.041982889175415, "Pretrain/Loss (Raw)": 2.036343574523926, "Pretrain/Step": 4283, "Pretrain/Step Time": 8.464347921311855} +{"Pretrain/Learning Rate": 4.519594037519791e-05, "Pretrain/Loss": 2.041936159133911, "Pretrain/Loss (Raw)": 2.0256834030151367, "Pretrain/Step": 4284, "Pretrain/Step Time": 8.460228467360139} +{"Pretrain/Learning Rate": 4.519343796148864e-05, "Pretrain/Loss": 2.0441951751708984, "Pretrain/Loss (Raw)": 2.0112037658691406, "Pretrain/Step": 4285, "Pretrain/Step Time": 8.460152916610241} +{"Pretrain/Learning Rate": 4.519093496551582e-05, "Pretrain/Loss": 2.0452280044555664, "Pretrain/Loss (Raw)": 2.0107829570770264, "Pretrain/Step": 4286, "Pretrain/Step Time": 8.46183510683477} +{"Pretrain/Learning Rate": 4.518843138735162e-05, "Pretrain/Loss": 2.044309139251709, "Pretrain/Loss (Raw)": 1.967781662940979, "Pretrain/Step": 4287, "Pretrain/Step Time": 8.46073428913951} +{"Pretrain/Learning Rate": 4.5185927227068247e-05, "Pretrain/Loss": 2.0403378009796143, "Pretrain/Loss (Raw)": 2.270885467529297, "Pretrain/Step": 4288, "Pretrain/Step Time": 8.461371740326285} +{"Pretrain/Learning Rate": 4.5183422484737886e-05, "Pretrain/Loss": 2.040973424911499, "Pretrain/Loss (Raw)": 2.03206205368042, "Pretrain/Step": 4289, "Pretrain/Step Time": 8.46138946712017} +{"Pretrain/Learning Rate": 4.518091716043277e-05, "Pretrain/Loss": 2.040583610534668, "Pretrain/Loss (Raw)": 1.9796127080917358, "Pretrain/Step": 4290, "Pretrain/Step Time": 8.463517688214779} +{"Pretrain/Learning Rate": 4.5178411254225126e-05, "Pretrain/Loss": 2.039618968963623, "Pretrain/Loss (Raw)": 1.9467298984527588, "Pretrain/Step": 4291, "Pretrain/Step Time": 8.456923527643085} +{"Pretrain/Learning Rate": 4.517590476618722e-05, "Pretrain/Loss": 2.0414187908172607, "Pretrain/Loss (Raw)": 2.1092827320098877, "Pretrain/Step": 4292, "Pretrain/Step Time": 8.461420336738229} +{"Pretrain/Learning Rate": 4.517339769639133e-05, "Pretrain/Loss": 2.0400643348693848, "Pretrain/Loss (Raw)": 1.9081988334655762, "Pretrain/Step": 4293, "Pretrain/Step Time": 8.457432460039854} +{"Pretrain/Learning Rate": 4.517089004490973e-05, "Pretrain/Loss": 2.038679361343384, "Pretrain/Loss (Raw)": 1.9730491638183594, "Pretrain/Step": 4294, "Pretrain/Step Time": 8.461685417219996} +{"Pretrain/Learning Rate": 4.516838181181474e-05, "Pretrain/Loss": 2.039111614227295, "Pretrain/Loss (Raw)": 2.0047826766967773, "Pretrain/Step": 4295, "Pretrain/Step Time": 8.458715673536062} +{"Pretrain/Learning Rate": 4.516587299717867e-05, "Pretrain/Loss": 2.0395922660827637, "Pretrain/Loss (Raw)": 2.0044357776641846, "Pretrain/Step": 4296, "Pretrain/Step Time": 8.459870690479875} +{"Pretrain/Learning Rate": 4.5163363601073886e-05, "Pretrain/Loss": 2.041247844696045, "Pretrain/Loss (Raw)": 2.1682896614074707, "Pretrain/Step": 4297, "Pretrain/Step Time": 8.452219458296895} +{"Pretrain/Learning Rate": 4.516085362357271e-05, "Pretrain/Loss": 2.0381131172180176, "Pretrain/Loss (Raw)": 1.8158761262893677, "Pretrain/Step": 4298, "Pretrain/Step Time": 8.456504190340638} +{"Pretrain/Learning Rate": 4.5158343064747546e-05, "Pretrain/Loss": 2.0394723415374756, "Pretrain/Loss (Raw)": 2.1323792934417725, "Pretrain/Step": 4299, "Pretrain/Step Time": 8.452134786173701} +{"Pretrain/Learning Rate": 4.515583192467076e-05, "Pretrain/Loss": 2.041232109069824, "Pretrain/Loss (Raw)": 2.1152596473693848, "Pretrain/Step": 4300, "Pretrain/Step Time": 8.450974943116307} +{"Pretrain/Learning Rate": 4.515332020341477e-05, "Pretrain/Loss": 2.0384483337402344, "Pretrain/Loss (Raw)": 1.8740228414535522, "Pretrain/Step": 4301, "Pretrain/Step Time": 8.456231281161308} +{"Pretrain/Learning Rate": 4.5150807901052e-05, "Pretrain/Loss": 2.039369583129883, "Pretrain/Loss (Raw)": 2.004002094268799, "Pretrain/Step": 4302, "Pretrain/Step Time": 8.456533078104258} +{"Pretrain/Learning Rate": 4.514829501765489e-05, "Pretrain/Loss": 2.0408873558044434, "Pretrain/Loss (Raw)": 2.096052885055542, "Pretrain/Step": 4303, "Pretrain/Step Time": 8.452220195904374} +{"Pretrain/Learning Rate": 4.51457815532959e-05, "Pretrain/Loss": 2.040773868560791, "Pretrain/Loss (Raw)": 2.096378803253174, "Pretrain/Step": 4304, "Pretrain/Step Time": 8.455957951024175} +{"Pretrain/Learning Rate": 4.514326750804749e-05, "Pretrain/Loss": 2.0390360355377197, "Pretrain/Loss (Raw)": 1.9745007753372192, "Pretrain/Step": 4305, "Pretrain/Step Time": 8.451078986749053} +{"Pretrain/Learning Rate": 4.514075288198217e-05, "Pretrain/Loss": 2.040506362915039, "Pretrain/Loss (Raw)": 2.0081734657287598, "Pretrain/Step": 4306, "Pretrain/Step Time": 8.448483252897859} +{"Pretrain/Learning Rate": 4.5138237675172445e-05, "Pretrain/Loss": 2.0421533584594727, "Pretrain/Loss (Raw)": 2.3048183917999268, "Pretrain/Step": 4307, "Pretrain/Step Time": 8.442191218957305} +{"Pretrain/Learning Rate": 4.5135721887690827e-05, "Pretrain/Loss": 2.0402684211730957, "Pretrain/Loss (Raw)": 1.8053779602050781, "Pretrain/Step": 4308, "Pretrain/Step Time": 8.446406623348594} +{"Pretrain/Learning Rate": 4.513320551960986e-05, "Pretrain/Loss": 2.0410587787628174, "Pretrain/Loss (Raw)": 2.0441393852233887, "Pretrain/Step": 4309, "Pretrain/Step Time": 8.44696655496955} +{"Pretrain/Learning Rate": 4.513068857100211e-05, "Pretrain/Loss": 2.039950132369995, "Pretrain/Loss (Raw)": 2.0180442333221436, "Pretrain/Step": 4310, "Pretrain/Step Time": 8.449857983738184} +{"Pretrain/Learning Rate": 4.5128171041940145e-05, "Pretrain/Loss": 2.0395901203155518, "Pretrain/Loss (Raw)": 2.088921070098877, "Pretrain/Step": 4311, "Pretrain/Step Time": 8.444689122959971} +{"Pretrain/Learning Rate": 4.5125652932496555e-05, "Pretrain/Loss": 2.037879467010498, "Pretrain/Loss (Raw)": 1.9945080280303955, "Pretrain/Step": 4312, "Pretrain/Step Time": 8.443682134151459} +{"Pretrain/Learning Rate": 4.512313424274395e-05, "Pretrain/Loss": 2.037611484527588, "Pretrain/Loss (Raw)": 1.9369168281555176, "Pretrain/Step": 4313, "Pretrain/Step Time": 8.440457712858915} +{"Pretrain/Learning Rate": 4.512061497275496e-05, "Pretrain/Loss": 2.0373222827911377, "Pretrain/Loss (Raw)": 2.1363954544067383, "Pretrain/Step": 4314, "Pretrain/Step Time": 8.439770558848977} +{"Pretrain/Learning Rate": 4.511809512260222e-05, "Pretrain/Loss": 2.0407605171203613, "Pretrain/Loss (Raw)": 2.2899181842803955, "Pretrain/Step": 4315, "Pretrain/Step Time": 8.440666230395436} +{"Pretrain/Learning Rate": 4.511557469235839e-05, "Pretrain/Loss": 2.0396790504455566, "Pretrain/Loss (Raw)": 2.022063732147217, "Pretrain/Step": 4316, "Pretrain/Step Time": 8.440321596339345} +{"Pretrain/Learning Rate": 4.511305368209614e-05, "Pretrain/Loss": 2.0399577617645264, "Pretrain/Loss (Raw)": 2.045093536376953, "Pretrain/Step": 4317, "Pretrain/Step Time": 8.437606703490019} +{"Pretrain/Learning Rate": 4.511053209188817e-05, "Pretrain/Loss": 2.041008472442627, "Pretrain/Loss (Raw)": 2.100247383117676, "Pretrain/Step": 4318, "Pretrain/Step Time": 8.437278416007757} +{"Pretrain/Learning Rate": 4.510800992180717e-05, "Pretrain/Loss": 2.0423946380615234, "Pretrain/Loss (Raw)": 2.0150504112243652, "Pretrain/Step": 4319, "Pretrain/Step Time": 8.435999197885394} +{"Pretrain/Learning Rate": 4.51054871719259e-05, "Pretrain/Loss": 2.041532516479492, "Pretrain/Loss (Raw)": 1.987004280090332, "Pretrain/Step": 4320, "Pretrain/Step Time": 8.438277585431933} +{"Pretrain/Learning Rate": 4.510296384231707e-05, "Pretrain/Loss": 2.040492057800293, "Pretrain/Loss (Raw)": 1.9244767427444458, "Pretrain/Step": 4321, "Pretrain/Step Time": 8.438467182219028} +{"Pretrain/Learning Rate": 4.510043993305345e-05, "Pretrain/Loss": 2.0425338745117188, "Pretrain/Loss (Raw)": 2.0818352699279785, "Pretrain/Step": 4322, "Pretrain/Step Time": 8.438478957861662} +{"Pretrain/Learning Rate": 4.5097915444207817e-05, "Pretrain/Loss": 2.042959451675415, "Pretrain/Loss (Raw)": 2.214996576309204, "Pretrain/Step": 4323, "Pretrain/Step Time": 8.433502208441496} +{"Pretrain/Learning Rate": 4.5095390375852955e-05, "Pretrain/Loss": 2.044053554534912, "Pretrain/Loss (Raw)": 2.043348550796509, "Pretrain/Step": 4324, "Pretrain/Step Time": 8.433878105133772} +{"Pretrain/Learning Rate": 4.5092864728061686e-05, "Pretrain/Loss": 2.0429911613464355, "Pretrain/Loss (Raw)": 2.0608623027801514, "Pretrain/Step": 4325, "Pretrain/Step Time": 8.439022613689303} +{"Pretrain/Learning Rate": 4.5090338500906826e-05, "Pretrain/Loss": 2.0449647903442383, "Pretrain/Loss (Raw)": 2.105062246322632, "Pretrain/Step": 4326, "Pretrain/Step Time": 8.440420361235738} +{"Pretrain/Learning Rate": 4.5087811694461214e-05, "Pretrain/Loss": 2.0452914237976074, "Pretrain/Loss (Raw)": 1.9511739015579224, "Pretrain/Step": 4327, "Pretrain/Step Time": 8.43963405676186} +{"Pretrain/Learning Rate": 4.508528430879771e-05, "Pretrain/Loss": 2.045583724975586, "Pretrain/Loss (Raw)": 1.9165241718292236, "Pretrain/Step": 4328, "Pretrain/Step Time": 8.437468534335494} +{"Pretrain/Learning Rate": 4.5082756343989195e-05, "Pretrain/Loss": 2.045618772506714, "Pretrain/Loss (Raw)": 2.0021018981933594, "Pretrain/Step": 4329, "Pretrain/Step Time": 8.435865871608257} +{"Pretrain/Learning Rate": 4.508022780010856e-05, "Pretrain/Loss": 2.046746253967285, "Pretrain/Loss (Raw)": 2.293182134628296, "Pretrain/Step": 4330, "Pretrain/Step Time": 8.43670423142612} +{"Pretrain/Learning Rate": 4.507769867722871e-05, "Pretrain/Loss": 2.0461299419403076, "Pretrain/Loss (Raw)": 2.182115077972412, "Pretrain/Step": 4331, "Pretrain/Step Time": 8.4336267542094} +{"Pretrain/Learning Rate": 4.507516897542258e-05, "Pretrain/Loss": 2.0466561317443848, "Pretrain/Loss (Raw)": 1.9154727458953857, "Pretrain/Step": 4332, "Pretrain/Step Time": 8.440291969105601} +{"Pretrain/Learning Rate": 4.507263869476309e-05, "Pretrain/Loss": 2.050055742263794, "Pretrain/Loss (Raw)": 2.5361311435699463, "Pretrain/Step": 4333, "Pretrain/Step Time": 8.433282127603889} +{"Pretrain/Learning Rate": 4.5070107835323225e-05, "Pretrain/Loss": 2.0503487586975098, "Pretrain/Loss (Raw)": 2.2828028202056885, "Pretrain/Step": 4334, "Pretrain/Step Time": 8.430333185940981} +{"Pretrain/Learning Rate": 4.506757639717595e-05, "Pretrain/Loss": 2.0491676330566406, "Pretrain/Loss (Raw)": 1.9144771099090576, "Pretrain/Step": 4335, "Pretrain/Step Time": 8.436463998630643} +{"Pretrain/Learning Rate": 4.506504438039425e-05, "Pretrain/Loss": 2.0508131980895996, "Pretrain/Loss (Raw)": 2.1589205265045166, "Pretrain/Step": 4336, "Pretrain/Step Time": 8.431760504841805} +{"Pretrain/Learning Rate": 4.506251178505114e-05, "Pretrain/Loss": 2.052180051803589, "Pretrain/Loss (Raw)": 2.201578140258789, "Pretrain/Step": 4337, "Pretrain/Step Time": 8.428792040795088} +{"Pretrain/Learning Rate": 4.5059978611219644e-05, "Pretrain/Loss": 2.0495920181274414, "Pretrain/Loss (Raw)": 2.1125895977020264, "Pretrain/Step": 4338, "Pretrain/Step Time": 8.426958113908768} +{"Pretrain/Learning Rate": 4.505744485897281e-05, "Pretrain/Loss": 2.0491180419921875, "Pretrain/Loss (Raw)": 2.090555429458618, "Pretrain/Step": 4339, "Pretrain/Step Time": 8.422878500074148} +{"Pretrain/Learning Rate": 4.50549105283837e-05, "Pretrain/Loss": 2.0488593578338623, "Pretrain/Loss (Raw)": 1.981943964958191, "Pretrain/Step": 4340, "Pretrain/Step Time": 8.427037741988897} +{"Pretrain/Learning Rate": 4.5052375619525374e-05, "Pretrain/Loss": 2.0509068965911865, "Pretrain/Loss (Raw)": 2.2022135257720947, "Pretrain/Step": 4341, "Pretrain/Step Time": 8.429475096985698} +{"Pretrain/Learning Rate": 4.504984013247093e-05, "Pretrain/Loss": 2.0528512001037598, "Pretrain/Loss (Raw)": 2.1178572177886963, "Pretrain/Step": 4342, "Pretrain/Step Time": 8.432448893785477} +{"Pretrain/Learning Rate": 4.504730406729349e-05, "Pretrain/Loss": 2.0529961585998535, "Pretrain/Loss (Raw)": 2.122347593307495, "Pretrain/Step": 4343, "Pretrain/Step Time": 8.434443023055792} +{"Pretrain/Learning Rate": 4.504476742406616e-05, "Pretrain/Loss": 2.053248882293701, "Pretrain/Loss (Raw)": 2.1384189128875732, "Pretrain/Step": 4344, "Pretrain/Step Time": 8.431785618886352} +{"Pretrain/Learning Rate": 4.50422302028621e-05, "Pretrain/Loss": 2.0518722534179688, "Pretrain/Loss (Raw)": 1.9165856838226318, "Pretrain/Step": 4345, "Pretrain/Step Time": 8.434749471023679} +{"Pretrain/Learning Rate": 4.5039692403754456e-05, "Pretrain/Loss": 2.0533628463745117, "Pretrain/Loss (Raw)": 2.1363344192504883, "Pretrain/Step": 4346, "Pretrain/Step Time": 8.433894852176309} +{"Pretrain/Learning Rate": 4.503715402681641e-05, "Pretrain/Loss": 2.0542571544647217, "Pretrain/Loss (Raw)": 2.192281723022461, "Pretrain/Step": 4347, "Pretrain/Step Time": 8.430098719894886} +{"Pretrain/Learning Rate": 4.5034615072121154e-05, "Pretrain/Loss": 2.0583648681640625, "Pretrain/Loss (Raw)": 2.498486280441284, "Pretrain/Step": 4348, "Pretrain/Step Time": 8.43394366838038} +{"Pretrain/Learning Rate": 4.503207553974189e-05, "Pretrain/Loss": 2.0624730587005615, "Pretrain/Loss (Raw)": 2.147982120513916, "Pretrain/Step": 4349, "Pretrain/Step Time": 8.436943471431732} +{"Pretrain/Learning Rate": 4.502953542975186e-05, "Pretrain/Loss": 2.0637402534484863, "Pretrain/Loss (Raw)": 1.9926878213882446, "Pretrain/Step": 4350, "Pretrain/Step Time": 8.43616010248661} +{"Pretrain/Learning Rate": 4.502699474222429e-05, "Pretrain/Loss": 2.063230514526367, "Pretrain/Loss (Raw)": 2.0563926696777344, "Pretrain/Step": 4351, "Pretrain/Step Time": 8.442389206960797} +{"Pretrain/Learning Rate": 4.5024453477232444e-05, "Pretrain/Loss": 2.0638461112976074, "Pretrain/Loss (Raw)": 2.055755615234375, "Pretrain/Step": 4352, "Pretrain/Step Time": 8.44477898068726} +{"Pretrain/Learning Rate": 4.50219116348496e-05, "Pretrain/Loss": 2.0650582313537598, "Pretrain/Loss (Raw)": 2.2651467323303223, "Pretrain/Step": 4353, "Pretrain/Step Time": 8.441953467205167} +{"Pretrain/Learning Rate": 4.5019369215149045e-05, "Pretrain/Loss": 2.0652246475219727, "Pretrain/Loss (Raw)": 2.0952670574188232, "Pretrain/Step": 4354, "Pretrain/Step Time": 8.43920206092298} +{"Pretrain/Learning Rate": 4.501682621820409e-05, "Pretrain/Loss": 2.0666723251342773, "Pretrain/Loss (Raw)": 2.1311800479888916, "Pretrain/Step": 4355, "Pretrain/Step Time": 8.435891158878803} +{"Pretrain/Learning Rate": 4.5014282644088066e-05, "Pretrain/Loss": 2.0693228244781494, "Pretrain/Loss (Raw)": 2.3949501514434814, "Pretrain/Step": 4356, "Pretrain/Step Time": 8.434453209862113} +{"Pretrain/Learning Rate": 4.5011738492874315e-05, "Pretrain/Loss": 2.0687198638916016, "Pretrain/Loss (Raw)": 1.8710787296295166, "Pretrain/Step": 4357, "Pretrain/Step Time": 8.435262219980359} +{"Pretrain/Learning Rate": 4.5009193764636195e-05, "Pretrain/Loss": 2.0694289207458496, "Pretrain/Loss (Raw)": 2.2453842163085938, "Pretrain/Step": 4358, "Pretrain/Step Time": 8.44023047760129} +{"Pretrain/Learning Rate": 4.5006648459447064e-05, "Pretrain/Loss": 2.0696189403533936, "Pretrain/Loss (Raw)": 2.094832181930542, "Pretrain/Step": 4359, "Pretrain/Step Time": 8.440868277102709} +{"Pretrain/Learning Rate": 4.500410257738034e-05, "Pretrain/Loss": 2.069650411605835, "Pretrain/Loss (Raw)": 2.0528743267059326, "Pretrain/Step": 4360, "Pretrain/Step Time": 8.442137490957975} +{"Pretrain/Learning Rate": 4.5001556118509416e-05, "Pretrain/Loss": 2.068647861480713, "Pretrain/Loss (Raw)": 1.9324041604995728, "Pretrain/Step": 4361, "Pretrain/Step Time": 8.43295532464981} +{"Pretrain/Learning Rate": 4.499900908290772e-05, "Pretrain/Loss": 2.068244218826294, "Pretrain/Loss (Raw)": 2.077969551086426, "Pretrain/Step": 4362, "Pretrain/Step Time": 8.43433059193194} +{"Pretrain/Learning Rate": 4.4996461470648696e-05, "Pretrain/Loss": 2.0656604766845703, "Pretrain/Loss (Raw)": 1.6865715980529785, "Pretrain/Step": 4363, "Pretrain/Step Time": 8.432290134951472} +{"Pretrain/Learning Rate": 4.49939132818058e-05, "Pretrain/Loss": 2.06471586227417, "Pretrain/Loss (Raw)": 1.974084496498108, "Pretrain/Step": 4364, "Pretrain/Step Time": 8.432530200108886} +{"Pretrain/Learning Rate": 4.4991364516452514e-05, "Pretrain/Loss": 2.067171096801758, "Pretrain/Loss (Raw)": 2.4096930027008057, "Pretrain/Step": 4365, "Pretrain/Step Time": 8.435665905475616} +{"Pretrain/Learning Rate": 4.498881517466233e-05, "Pretrain/Loss": 2.066403388977051, "Pretrain/Loss (Raw)": 2.086244821548462, "Pretrain/Step": 4366, "Pretrain/Step Time": 8.438661001622677} +{"Pretrain/Learning Rate": 4.498626525650874e-05, "Pretrain/Loss": 2.0658085346221924, "Pretrain/Loss (Raw)": 2.1178953647613525, "Pretrain/Step": 4367, "Pretrain/Step Time": 8.443776499480009} +{"Pretrain/Learning Rate": 4.498371476206529e-05, "Pretrain/Loss": 2.066650867462158, "Pretrain/Loss (Raw)": 2.176551103591919, "Pretrain/Step": 4368, "Pretrain/Step Time": 8.439918434247375} +{"Pretrain/Learning Rate": 4.4981163691405505e-05, "Pretrain/Loss": 2.066025495529175, "Pretrain/Loss (Raw)": 2.092339277267456, "Pretrain/Step": 4369, "Pretrain/Step Time": 8.442212721332908} +{"Pretrain/Learning Rate": 4.4978612044602955e-05, "Pretrain/Loss": 2.0668752193450928, "Pretrain/Loss (Raw)": 2.188767194747925, "Pretrain/Step": 4370, "Pretrain/Step Time": 8.437558269128203} +{"Pretrain/Learning Rate": 4.497605982173121e-05, "Pretrain/Loss": 2.067707061767578, "Pretrain/Loss (Raw)": 2.1551568508148193, "Pretrain/Step": 4371, "Pretrain/Step Time": 8.435602143406868} +{"Pretrain/Learning Rate": 4.497350702286386e-05, "Pretrain/Loss": 2.067600965499878, "Pretrain/Loss (Raw)": 2.0486433506011963, "Pretrain/Step": 4372, "Pretrain/Step Time": 8.433533055707812} +{"Pretrain/Learning Rate": 4.4970953648074515e-05, "Pretrain/Loss": 2.0690183639526367, "Pretrain/Loss (Raw)": 2.043731927871704, "Pretrain/Step": 4373, "Pretrain/Step Time": 8.438457043841481} +{"Pretrain/Learning Rate": 4.4968399697436804e-05, "Pretrain/Loss": 2.0688185691833496, "Pretrain/Loss (Raw)": 2.0850894451141357, "Pretrain/Step": 4374, "Pretrain/Step Time": 8.43630189448595} +{"Pretrain/Learning Rate": 4.496584517102436e-05, "Pretrain/Loss": 2.0689234733581543, "Pretrain/Loss (Raw)": 2.0868124961853027, "Pretrain/Step": 4375, "Pretrain/Step Time": 8.44113989546895} +{"Pretrain/Learning Rate": 4.496329006891085e-05, "Pretrain/Loss": 2.0696163177490234, "Pretrain/Loss (Raw)": 2.0358099937438965, "Pretrain/Step": 4376, "Pretrain/Step Time": 8.443127885460854} +{"Pretrain/Learning Rate": 4.496073439116994e-05, "Pretrain/Loss": 2.069253921508789, "Pretrain/Loss (Raw)": 1.929505467414856, "Pretrain/Step": 4377, "Pretrain/Step Time": 8.443727327510715} +{"Pretrain/Learning Rate": 4.4958178137875326e-05, "Pretrain/Loss": 2.071171283721924, "Pretrain/Loss (Raw)": 2.1409196853637695, "Pretrain/Step": 4378, "Pretrain/Step Time": 8.43707985803485} +{"Pretrain/Learning Rate": 4.495562130910072e-05, "Pretrain/Loss": 2.069093704223633, "Pretrain/Loss (Raw)": 1.7858939170837402, "Pretrain/Step": 4379, "Pretrain/Step Time": 8.43503056652844} +{"Pretrain/Learning Rate": 4.4953063904919837e-05, "Pretrain/Loss": 2.068748712539673, "Pretrain/Loss (Raw)": 2.020521879196167, "Pretrain/Step": 4380, "Pretrain/Step Time": 8.436758037656546} +{"Pretrain/Learning Rate": 4.495050592540643e-05, "Pretrain/Loss": 2.0668458938598633, "Pretrain/Loss (Raw)": 2.0358726978302, "Pretrain/Step": 4381, "Pretrain/Step Time": 8.437249314039946} +{"Pretrain/Learning Rate": 4.4947947370634234e-05, "Pretrain/Loss": 2.0672290325164795, "Pretrain/Loss (Raw)": 2.1925418376922607, "Pretrain/Step": 4382, "Pretrain/Step Time": 8.44140432588756} +{"Pretrain/Learning Rate": 4.4945388240677045e-05, "Pretrain/Loss": 2.066948413848877, "Pretrain/Loss (Raw)": 2.0888168811798096, "Pretrain/Step": 4383, "Pretrain/Step Time": 8.43459441140294} +{"Pretrain/Learning Rate": 4.494282853560865e-05, "Pretrain/Loss": 2.0674543380737305, "Pretrain/Loss (Raw)": 2.1945221424102783, "Pretrain/Step": 4384, "Pretrain/Step Time": 8.436154011636972} +{"Pretrain/Learning Rate": 4.4940268255502847e-05, "Pretrain/Loss": 2.0684385299682617, "Pretrain/Loss (Raw)": 2.050764799118042, "Pretrain/Step": 4385, "Pretrain/Step Time": 8.43267883732915} +{"Pretrain/Learning Rate": 4.493770740043347e-05, "Pretrain/Loss": 2.0712778568267822, "Pretrain/Loss (Raw)": 2.348177194595337, "Pretrain/Step": 4386, "Pretrain/Step Time": 8.436126319691539} +{"Pretrain/Learning Rate": 4.493514597047436e-05, "Pretrain/Loss": 2.0717597007751465, "Pretrain/Loss (Raw)": 2.1368565559387207, "Pretrain/Step": 4387, "Pretrain/Step Time": 8.433316607028246} +{"Pretrain/Learning Rate": 4.493258396569936e-05, "Pretrain/Loss": 2.071176052093506, "Pretrain/Loss (Raw)": 2.0847129821777344, "Pretrain/Step": 4388, "Pretrain/Step Time": 8.4357237983495} +{"Pretrain/Learning Rate": 4.493002138618236e-05, "Pretrain/Loss": 2.0730795860290527, "Pretrain/Loss (Raw)": 2.1326887607574463, "Pretrain/Step": 4389, "Pretrain/Step Time": 8.431820226833224} +{"Pretrain/Learning Rate": 4.492745823199725e-05, "Pretrain/Loss": 2.071058988571167, "Pretrain/Loss (Raw)": 1.9774248600006104, "Pretrain/Step": 4390, "Pretrain/Step Time": 8.434555143117905} +{"Pretrain/Learning Rate": 4.492489450321791e-05, "Pretrain/Loss": 2.072701930999756, "Pretrain/Loss (Raw)": 2.1463024616241455, "Pretrain/Step": 4391, "Pretrain/Step Time": 8.437353832647204} +{"Pretrain/Learning Rate": 4.492233019991829e-05, "Pretrain/Loss": 2.0756547451019287, "Pretrain/Loss (Raw)": 2.2256886959075928, "Pretrain/Step": 4392, "Pretrain/Step Time": 8.444384204223752} +{"Pretrain/Learning Rate": 4.491976532217232e-05, "Pretrain/Loss": 2.078345775604248, "Pretrain/Loss (Raw)": 2.2296395301818848, "Pretrain/Step": 4393, "Pretrain/Step Time": 8.440766911953688} +{"Pretrain/Learning Rate": 4.491719987005397e-05, "Pretrain/Loss": 2.0798726081848145, "Pretrain/Loss (Raw)": 2.1053779125213623, "Pretrain/Step": 4394, "Pretrain/Step Time": 8.441671336069703} +{"Pretrain/Learning Rate": 4.49146338436372e-05, "Pretrain/Loss": 2.079068660736084, "Pretrain/Loss (Raw)": 2.255009412765503, "Pretrain/Step": 4395, "Pretrain/Step Time": 8.433966249227524} +{"Pretrain/Learning Rate": 4.4912067242996e-05, "Pretrain/Loss": 2.079671859741211, "Pretrain/Loss (Raw)": 2.065432071685791, "Pretrain/Step": 4396, "Pretrain/Step Time": 8.434507213532925} +{"Pretrain/Learning Rate": 4.490950006820438e-05, "Pretrain/Loss": 2.0791068077087402, "Pretrain/Loss (Raw)": 2.0429210662841797, "Pretrain/Step": 4397, "Pretrain/Step Time": 8.431644910946488} +{"Pretrain/Learning Rate": 4.490693231933636e-05, "Pretrain/Loss": 2.0787758827209473, "Pretrain/Loss (Raw)": 2.172211170196533, "Pretrain/Step": 4398, "Pretrain/Step Time": 8.43062107078731} +{"Pretrain/Learning Rate": 4.490436399646597e-05, "Pretrain/Loss": 2.0750813484191895, "Pretrain/Loss (Raw)": 1.7207530736923218, "Pretrain/Step": 4399, "Pretrain/Step Time": 8.440255338326097} +{"Pretrain/Learning Rate": 4.4901795099667294e-05, "Pretrain/Loss": 2.0716946125030518, "Pretrain/Loss (Raw)": 1.7261918783187866, "Pretrain/Step": 4400, "Pretrain/Step Time": 8.43881507217884} +{"Pretrain/Learning Rate": 4.489922562901437e-05, "Pretrain/Loss": 2.0702598094940186, "Pretrain/Loss (Raw)": 1.9537538290023804, "Pretrain/Step": 4401, "Pretrain/Step Time": 8.43458423577249} +{"Pretrain/Learning Rate": 4.489665558458132e-05, "Pretrain/Loss": 2.071709632873535, "Pretrain/Loss (Raw)": 2.227215528488159, "Pretrain/Step": 4402, "Pretrain/Step Time": 8.433836029842496} +{"Pretrain/Learning Rate": 4.4894084966442215e-05, "Pretrain/Loss": 2.074770450592041, "Pretrain/Loss (Raw)": 2.225055456161499, "Pretrain/Step": 4403, "Pretrain/Step Time": 8.432618826627731} +{"Pretrain/Learning Rate": 4.48915137746712e-05, "Pretrain/Loss": 2.072844982147217, "Pretrain/Loss (Raw)": 2.091886281967163, "Pretrain/Step": 4404, "Pretrain/Step Time": 8.434994906187057} +{"Pretrain/Learning Rate": 4.488894200934242e-05, "Pretrain/Loss": 2.0722947120666504, "Pretrain/Loss (Raw)": 1.975636601448059, "Pretrain/Step": 4405, "Pretrain/Step Time": 8.432252693921328} +{"Pretrain/Learning Rate": 4.488636967053e-05, "Pretrain/Loss": 2.0736680030822754, "Pretrain/Loss (Raw)": 2.092989206314087, "Pretrain/Step": 4406, "Pretrain/Step Time": 8.429878925904632} +{"Pretrain/Learning Rate": 4.488379675830814e-05, "Pretrain/Loss": 2.0741851329803467, "Pretrain/Loss (Raw)": 2.0665242671966553, "Pretrain/Step": 4407, "Pretrain/Step Time": 8.432284476235509} +{"Pretrain/Learning Rate": 4.488122327275101e-05, "Pretrain/Loss": 2.0746705532073975, "Pretrain/Loss (Raw)": 1.905835509300232, "Pretrain/Step": 4408, "Pretrain/Step Time": 8.43382503464818} +{"Pretrain/Learning Rate": 4.4878649213932836e-05, "Pretrain/Loss": 2.0751240253448486, "Pretrain/Loss (Raw)": 2.1143224239349365, "Pretrain/Step": 4409, "Pretrain/Step Time": 8.434929609298706} +{"Pretrain/Learning Rate": 4.487607458192781e-05, "Pretrain/Loss": 2.07572078704834, "Pretrain/Loss (Raw)": 1.9800676107406616, "Pretrain/Step": 4410, "Pretrain/Step Time": 8.435638349503279} +{"Pretrain/Learning Rate": 4.487349937681019e-05, "Pretrain/Loss": 2.0772457122802734, "Pretrain/Loss (Raw)": 2.231523275375366, "Pretrain/Step": 4411, "Pretrain/Step Time": 8.430518290027976} +{"Pretrain/Learning Rate": 4.4870923598654224e-05, "Pretrain/Loss": 2.076643943786621, "Pretrain/Loss (Raw)": 1.9486464262008667, "Pretrain/Step": 4412, "Pretrain/Step Time": 8.430992795154452} +{"Pretrain/Learning Rate": 4.486834724753419e-05, "Pretrain/Loss": 2.0759990215301514, "Pretrain/Loss (Raw)": 1.928657054901123, "Pretrain/Step": 4413, "Pretrain/Step Time": 8.432666298002005} +{"Pretrain/Learning Rate": 4.486577032352437e-05, "Pretrain/Loss": 2.075924873352051, "Pretrain/Loss (Raw)": 2.0012948513031006, "Pretrain/Step": 4414, "Pretrain/Step Time": 8.428657317534089} +{"Pretrain/Learning Rate": 4.486319282669906e-05, "Pretrain/Loss": 2.0769238471984863, "Pretrain/Loss (Raw)": 2.0956499576568604, "Pretrain/Step": 4415, "Pretrain/Step Time": 8.435550207272172} +{"Pretrain/Learning Rate": 4.486061475713259e-05, "Pretrain/Loss": 2.0745275020599365, "Pretrain/Loss (Raw)": 1.9641320705413818, "Pretrain/Step": 4416, "Pretrain/Step Time": 8.437377678230405} +{"Pretrain/Learning Rate": 4.4858036114899296e-05, "Pretrain/Loss": 2.075601577758789, "Pretrain/Loss (Raw)": 2.169564723968506, "Pretrain/Step": 4417, "Pretrain/Step Time": 8.434532450512052} +{"Pretrain/Learning Rate": 4.485545690007353e-05, "Pretrain/Loss": 2.0758376121520996, "Pretrain/Loss (Raw)": 2.0098350048065186, "Pretrain/Step": 4418, "Pretrain/Step Time": 8.436183169484138} +{"Pretrain/Learning Rate": 4.4852877112729666e-05, "Pretrain/Loss": 2.0781843662261963, "Pretrain/Loss (Raw)": 2.2470927238464355, "Pretrain/Step": 4419, "Pretrain/Step Time": 8.43716662377119} +{"Pretrain/Learning Rate": 4.485029675294207e-05, "Pretrain/Loss": 2.0786397457122803, "Pretrain/Loss (Raw)": 2.1675777435302734, "Pretrain/Step": 4420, "Pretrain/Step Time": 8.439812909811735} +{"Pretrain/Learning Rate": 4.4847715820785174e-05, "Pretrain/Loss": 2.0795044898986816, "Pretrain/Loss (Raw)": 2.0188779830932617, "Pretrain/Step": 4421, "Pretrain/Step Time": 8.439785024151206} +{"Pretrain/Learning Rate": 4.484513431633338e-05, "Pretrain/Loss": 2.080308437347412, "Pretrain/Loss (Raw)": 2.075960636138916, "Pretrain/Step": 4422, "Pretrain/Step Time": 8.435506856068969} +{"Pretrain/Learning Rate": 4.484255223966113e-05, "Pretrain/Loss": 2.0818533897399902, "Pretrain/Loss (Raw)": 2.2025375366210938, "Pretrain/Step": 4423, "Pretrain/Step Time": 8.439040118828416} +{"Pretrain/Learning Rate": 4.483996959084287e-05, "Pretrain/Loss": 2.083902597427368, "Pretrain/Loss (Raw)": 2.266735076904297, "Pretrain/Step": 4424, "Pretrain/Step Time": 8.43975323624909} +{"Pretrain/Learning Rate": 4.483738636995308e-05, "Pretrain/Loss": 2.0839684009552, "Pretrain/Loss (Raw)": 2.1767282485961914, "Pretrain/Step": 4425, "Pretrain/Step Time": 8.440668679773808} +{"Pretrain/Learning Rate": 4.483480257706624e-05, "Pretrain/Loss": 2.0854110717773438, "Pretrain/Loss (Raw)": 2.000519275665283, "Pretrain/Step": 4426, "Pretrain/Step Time": 8.437568390741944} +{"Pretrain/Learning Rate": 4.483221821225684e-05, "Pretrain/Loss": 2.0848875045776367, "Pretrain/Loss (Raw)": 2.0653796195983887, "Pretrain/Step": 4427, "Pretrain/Step Time": 8.440706828609109} +{"Pretrain/Learning Rate": 4.4829633275599414e-05, "Pretrain/Loss": 2.0848937034606934, "Pretrain/Loss (Raw)": 2.1160356998443604, "Pretrain/Step": 4428, "Pretrain/Step Time": 8.438816636800766} +{"Pretrain/Learning Rate": 4.4827047767168486e-05, "Pretrain/Loss": 2.0863494873046875, "Pretrain/Loss (Raw)": 2.060382604598999, "Pretrain/Step": 4429, "Pretrain/Step Time": 8.436205592006445} +{"Pretrain/Learning Rate": 4.482446168703862e-05, "Pretrain/Loss": 2.086477279663086, "Pretrain/Loss (Raw)": 2.020339012145996, "Pretrain/Step": 4430, "Pretrain/Step Time": 8.430758265778422} +{"Pretrain/Learning Rate": 4.482187503528438e-05, "Pretrain/Loss": 2.0871691703796387, "Pretrain/Loss (Raw)": 2.184634208679199, "Pretrain/Step": 4431, "Pretrain/Step Time": 8.440597139298916} +{"Pretrain/Learning Rate": 4.4819287811980336e-05, "Pretrain/Loss": 2.087700366973877, "Pretrain/Loss (Raw)": 2.1643543243408203, "Pretrain/Step": 4432, "Pretrain/Step Time": 8.442387472838163} +{"Pretrain/Learning Rate": 4.4816700017201105e-05, "Pretrain/Loss": 2.087395429611206, "Pretrain/Loss (Raw)": 1.9354758262634277, "Pretrain/Step": 4433, "Pretrain/Step Time": 8.4424670599401} +{"Pretrain/Learning Rate": 4.4814111651021295e-05, "Pretrain/Loss": 2.0887227058410645, "Pretrain/Loss (Raw)": 2.17806339263916, "Pretrain/Step": 4434, "Pretrain/Step Time": 8.445676576346159} +{"Pretrain/Learning Rate": 4.4811522713515553e-05, "Pretrain/Loss": 2.0853381156921387, "Pretrain/Loss (Raw)": 1.87159264087677, "Pretrain/Step": 4435, "Pretrain/Step Time": 8.44346440397203} +{"Pretrain/Learning Rate": 4.4808933204758506e-05, "Pretrain/Loss": 2.087409496307373, "Pretrain/Loss (Raw)": 2.070523500442505, "Pretrain/Step": 4436, "Pretrain/Step Time": 8.4411717094481} +{"Pretrain/Learning Rate": 4.480634312482484e-05, "Pretrain/Loss": 2.08725643157959, "Pretrain/Loss (Raw)": 2.024548292160034, "Pretrain/Step": 4437, "Pretrain/Step Time": 8.436212968081236} +{"Pretrain/Learning Rate": 4.480375247378924e-05, "Pretrain/Loss": 2.0888638496398926, "Pretrain/Loss (Raw)": 2.2237932682037354, "Pretrain/Step": 4438, "Pretrain/Step Time": 8.435401236638427} +{"Pretrain/Learning Rate": 4.4801161251726395e-05, "Pretrain/Loss": 2.0897216796875, "Pretrain/Loss (Raw)": 2.1987199783325195, "Pretrain/Step": 4439, "Pretrain/Step Time": 8.437127346172929} +{"Pretrain/Learning Rate": 4.479856945871103e-05, "Pretrain/Loss": 2.090379476547241, "Pretrain/Loss (Raw)": 2.078711986541748, "Pretrain/Step": 4440, "Pretrain/Step Time": 8.43971298262477} +{"Pretrain/Learning Rate": 4.479597709481785e-05, "Pretrain/Loss": 2.091334104537964, "Pretrain/Loss (Raw)": 2.059102773666382, "Pretrain/Step": 4441, "Pretrain/Step Time": 8.441920083016157} +{"Pretrain/Learning Rate": 4.479338416012165e-05, "Pretrain/Loss": 2.0913448333740234, "Pretrain/Loss (Raw)": 2.137753486633301, "Pretrain/Step": 4442, "Pretrain/Step Time": 8.440558090806007} +{"Pretrain/Learning Rate": 4.479079065469716e-05, "Pretrain/Loss": 2.088641405105591, "Pretrain/Loss (Raw)": 1.9439003467559814, "Pretrain/Step": 4443, "Pretrain/Step Time": 8.440822888165712} +{"Pretrain/Learning Rate": 4.4788196578619165e-05, "Pretrain/Loss": 2.0909523963928223, "Pretrain/Loss (Raw)": 2.3178672790527344, "Pretrain/Step": 4444, "Pretrain/Step Time": 8.436765979975462} +{"Pretrain/Learning Rate": 4.4785601931962484e-05, "Pretrain/Loss": 2.091362953186035, "Pretrain/Loss (Raw)": 2.0976505279541016, "Pretrain/Step": 4445, "Pretrain/Step Time": 8.440123874694109} +{"Pretrain/Learning Rate": 4.478300671480192e-05, "Pretrain/Loss": 2.0921266078948975, "Pretrain/Loss (Raw)": 2.197990894317627, "Pretrain/Step": 4446, "Pretrain/Step Time": 8.435807511210442} +{"Pretrain/Learning Rate": 4.47804109272123e-05, "Pretrain/Loss": 2.0931661128997803, "Pretrain/Loss (Raw)": 2.148087978363037, "Pretrain/Step": 4447, "Pretrain/Step Time": 8.442048134282231} +{"Pretrain/Learning Rate": 4.477781456926847e-05, "Pretrain/Loss": 2.093003034591675, "Pretrain/Loss (Raw)": 1.9661314487457275, "Pretrain/Step": 4448, "Pretrain/Step Time": 8.44315374828875} +{"Pretrain/Learning Rate": 4.4775217641045306e-05, "Pretrain/Loss": 2.093398332595825, "Pretrain/Loss (Raw)": 1.9750845432281494, "Pretrain/Step": 4449, "Pretrain/Step Time": 8.446685371920466} +{"Pretrain/Learning Rate": 4.477262014261768e-05, "Pretrain/Loss": 2.092043399810791, "Pretrain/Loss (Raw)": 1.9084440469741821, "Pretrain/Step": 4450, "Pretrain/Step Time": 8.44114456512034} +{"Pretrain/Learning Rate": 4.477002207406049e-05, "Pretrain/Loss": 2.091442584991455, "Pretrain/Loss (Raw)": 2.1380667686462402, "Pretrain/Step": 4451, "Pretrain/Step Time": 8.443726679310203} +{"Pretrain/Learning Rate": 4.476742343544865e-05, "Pretrain/Loss": 2.089728593826294, "Pretrain/Loss (Raw)": 1.823940634727478, "Pretrain/Step": 4452, "Pretrain/Step Time": 8.443529084324837} +{"Pretrain/Learning Rate": 4.4764824226857095e-05, "Pretrain/Loss": 2.089970350265503, "Pretrain/Loss (Raw)": 2.0918045043945312, "Pretrain/Step": 4453, "Pretrain/Step Time": 8.439380712807178} +{"Pretrain/Learning Rate": 4.476222444836076e-05, "Pretrain/Loss": 2.0920002460479736, "Pretrain/Loss (Raw)": 2.364896297454834, "Pretrain/Step": 4454, "Pretrain/Step Time": 8.438313027843833} +{"Pretrain/Learning Rate": 4.475962410003462e-05, "Pretrain/Loss": 2.091315746307373, "Pretrain/Loss (Raw)": 1.8635681867599487, "Pretrain/Step": 4455, "Pretrain/Step Time": 8.43425102159381} +{"Pretrain/Learning Rate": 4.475702318195364e-05, "Pretrain/Loss": 2.091989517211914, "Pretrain/Loss (Raw)": 2.0027506351470947, "Pretrain/Step": 4456, "Pretrain/Step Time": 8.43704567477107} +{"Pretrain/Learning Rate": 4.4754421694192835e-05, "Pretrain/Loss": 2.093187093734741, "Pretrain/Loss (Raw)": 2.1554038524627686, "Pretrain/Step": 4457, "Pretrain/Step Time": 8.439360490068793} +{"Pretrain/Learning Rate": 4.47518196368272e-05, "Pretrain/Loss": 2.0916054248809814, "Pretrain/Loss (Raw)": 2.090725898742676, "Pretrain/Step": 4458, "Pretrain/Step Time": 8.448389306664467} +{"Pretrain/Learning Rate": 4.4749217009931775e-05, "Pretrain/Loss": 2.091369152069092, "Pretrain/Loss (Raw)": 2.151872158050537, "Pretrain/Step": 4459, "Pretrain/Step Time": 8.44686035439372} +{"Pretrain/Learning Rate": 4.4746613813581595e-05, "Pretrain/Loss": 2.091872215270996, "Pretrain/Loss (Raw)": 1.979856014251709, "Pretrain/Step": 4460, "Pretrain/Step Time": 8.442385083064437} +{"Pretrain/Learning Rate": 4.474401004785173e-05, "Pretrain/Loss": 2.0869078636169434, "Pretrain/Loss (Raw)": 1.9007019996643066, "Pretrain/Step": 4461, "Pretrain/Step Time": 8.442346204072237} +{"Pretrain/Learning Rate": 4.4741405712817255e-05, "Pretrain/Loss": 2.087028741836548, "Pretrain/Loss (Raw)": 2.2982876300811768, "Pretrain/Step": 4462, "Pretrain/Step Time": 8.44386738166213} +{"Pretrain/Learning Rate": 4.4738800808553256e-05, "Pretrain/Loss": 2.0875916481018066, "Pretrain/Loss (Raw)": 1.9865057468414307, "Pretrain/Step": 4463, "Pretrain/Step Time": 8.445986852049828} +{"Pretrain/Learning Rate": 4.4736195335134854e-05, "Pretrain/Loss": 2.0876097679138184, "Pretrain/Loss (Raw)": 2.161224842071533, "Pretrain/Step": 4464, "Pretrain/Step Time": 8.445738684386015} +{"Pretrain/Learning Rate": 4.473358929263717e-05, "Pretrain/Loss": 2.087052822113037, "Pretrain/Loss (Raw)": 2.1303021907806396, "Pretrain/Step": 4465, "Pretrain/Step Time": 8.454653410241008} +{"Pretrain/Learning Rate": 4.473098268113536e-05, "Pretrain/Loss": 2.086519718170166, "Pretrain/Loss (Raw)": 2.044367551803589, "Pretrain/Step": 4466, "Pretrain/Step Time": 8.453435461968184} +{"Pretrain/Learning Rate": 4.472837550070456e-05, "Pretrain/Loss": 2.0848188400268555, "Pretrain/Loss (Raw)": 1.872832179069519, "Pretrain/Step": 4467, "Pretrain/Step Time": 8.450123442336917} +{"Pretrain/Learning Rate": 4.4725767751419964e-05, "Pretrain/Loss": 2.0866827964782715, "Pretrain/Loss (Raw)": 2.2205214500427246, "Pretrain/Step": 4468, "Pretrain/Step Time": 8.448073763400316} +{"Pretrain/Learning Rate": 4.472315943335677e-05, "Pretrain/Loss": 2.084857702255249, "Pretrain/Loss (Raw)": 1.9686129093170166, "Pretrain/Step": 4469, "Pretrain/Step Time": 8.445095513015985} +{"Pretrain/Learning Rate": 4.472055054659017e-05, "Pretrain/Loss": 2.0842318534851074, "Pretrain/Loss (Raw)": 2.0377817153930664, "Pretrain/Step": 4470, "Pretrain/Step Time": 8.441928746178746} +{"Pretrain/Learning Rate": 4.4717941091195395e-05, "Pretrain/Loss": 2.084486722946167, "Pretrain/Loss (Raw)": 2.1549293994903564, "Pretrain/Step": 4471, "Pretrain/Step Time": 8.4394187964499} +{"Pretrain/Learning Rate": 4.471533106724769e-05, "Pretrain/Loss": 2.085338592529297, "Pretrain/Loss (Raw)": 2.247464418411255, "Pretrain/Step": 4472, "Pretrain/Step Time": 8.439718155190349} +{"Pretrain/Learning Rate": 4.4712720474822314e-05, "Pretrain/Loss": 2.0854828357696533, "Pretrain/Loss (Raw)": 1.9350680112838745, "Pretrain/Step": 4473, "Pretrain/Step Time": 8.438430925831199} +{"Pretrain/Learning Rate": 4.471010931399454e-05, "Pretrain/Loss": 2.0831046104431152, "Pretrain/Loss (Raw)": 1.8319129943847656, "Pretrain/Step": 4474, "Pretrain/Step Time": 8.439146867021918} +{"Pretrain/Learning Rate": 4.470749758483966e-05, "Pretrain/Loss": 2.0809051990509033, "Pretrain/Loss (Raw)": 1.9107304811477661, "Pretrain/Step": 4475, "Pretrain/Step Time": 8.441294476389885} +{"Pretrain/Learning Rate": 4.470488528743298e-05, "Pretrain/Loss": 2.0774965286254883, "Pretrain/Loss (Raw)": 2.062222957611084, "Pretrain/Step": 4476, "Pretrain/Step Time": 8.436356598511338} +{"Pretrain/Learning Rate": 4.470227242184982e-05, "Pretrain/Loss": 2.077446460723877, "Pretrain/Loss (Raw)": 2.1415369510650635, "Pretrain/Step": 4477, "Pretrain/Step Time": 8.433923378586769} +{"Pretrain/Learning Rate": 4.469965898816553e-05, "Pretrain/Loss": 2.0767159461975098, "Pretrain/Loss (Raw)": 1.899207353591919, "Pretrain/Step": 4478, "Pretrain/Step Time": 8.438613843172789} +{"Pretrain/Learning Rate": 4.4697044986455454e-05, "Pretrain/Loss": 2.0778651237487793, "Pretrain/Loss (Raw)": 2.203476667404175, "Pretrain/Step": 4479, "Pretrain/Step Time": 8.43393538147211} +{"Pretrain/Learning Rate": 4.4694430416794975e-05, "Pretrain/Loss": 2.0798306465148926, "Pretrain/Loss (Raw)": 2.3073465824127197, "Pretrain/Step": 4480, "Pretrain/Step Time": 8.438123162835836} +{"Pretrain/Learning Rate": 4.469181527925948e-05, "Pretrain/Loss": 2.077834367752075, "Pretrain/Loss (Raw)": 2.009624481201172, "Pretrain/Step": 4481, "Pretrain/Step Time": 8.43605854921043} +{"Pretrain/Learning Rate": 4.468919957392437e-05, "Pretrain/Loss": 2.077012538909912, "Pretrain/Loss (Raw)": 1.9900786876678467, "Pretrain/Step": 4482, "Pretrain/Step Time": 8.43985247053206} +{"Pretrain/Learning Rate": 4.468658330086507e-05, "Pretrain/Loss": 2.0754284858703613, "Pretrain/Loss (Raw)": 1.9284056425094604, "Pretrain/Step": 4483, "Pretrain/Step Time": 8.440557261928916} +{"Pretrain/Learning Rate": 4.468396646015702e-05, "Pretrain/Loss": 2.073218822479248, "Pretrain/Loss (Raw)": 2.112105369567871, "Pretrain/Step": 4484, "Pretrain/Step Time": 8.442835872992873} +{"Pretrain/Learning Rate": 4.468134905187567e-05, "Pretrain/Loss": 2.074248790740967, "Pretrain/Loss (Raw)": 2.0029163360595703, "Pretrain/Step": 4485, "Pretrain/Step Time": 8.440848050639033} +{"Pretrain/Learning Rate": 4.46787310760965e-05, "Pretrain/Loss": 2.073185920715332, "Pretrain/Loss (Raw)": 2.109353542327881, "Pretrain/Step": 4486, "Pretrain/Step Time": 8.43567163683474} +{"Pretrain/Learning Rate": 4.467611253289499e-05, "Pretrain/Loss": 2.0734810829162598, "Pretrain/Loss (Raw)": 2.1325833797454834, "Pretrain/Step": 4487, "Pretrain/Step Time": 8.4367033559829} +{"Pretrain/Learning Rate": 4.4673493422346646e-05, "Pretrain/Loss": 2.0729641914367676, "Pretrain/Loss (Raw)": 1.9867517948150635, "Pretrain/Step": 4488, "Pretrain/Step Time": 8.435770304873586} +{"Pretrain/Learning Rate": 4.4670873744526984e-05, "Pretrain/Loss": 2.0737788677215576, "Pretrain/Loss (Raw)": 2.0366766452789307, "Pretrain/Step": 4489, "Pretrain/Step Time": 8.440312124788761} +{"Pretrain/Learning Rate": 4.466825349951155e-05, "Pretrain/Loss": 2.0739381313323975, "Pretrain/Loss (Raw)": 2.098339557647705, "Pretrain/Step": 4490, "Pretrain/Step Time": 8.441754024475813} +{"Pretrain/Learning Rate": 4.4665632687375886e-05, "Pretrain/Loss": 2.0749995708465576, "Pretrain/Loss (Raw)": 1.8224408626556396, "Pretrain/Step": 4491, "Pretrain/Step Time": 8.445318803191185} +{"Pretrain/Learning Rate": 4.466301130819557e-05, "Pretrain/Loss": 2.0736629962921143, "Pretrain/Loss (Raw)": 1.8030154705047607, "Pretrain/Step": 4492, "Pretrain/Step Time": 8.445382576435804} +{"Pretrain/Learning Rate": 4.466038936204618e-05, "Pretrain/Loss": 2.070105791091919, "Pretrain/Loss (Raw)": 1.9543458223342896, "Pretrain/Step": 4493, "Pretrain/Step Time": 8.441866356879473} +{"Pretrain/Learning Rate": 4.4657766849003334e-05, "Pretrain/Loss": 2.0690112113952637, "Pretrain/Loss (Raw)": 1.946152687072754, "Pretrain/Step": 4494, "Pretrain/Step Time": 8.438856003805995} +{"Pretrain/Learning Rate": 4.465514376914264e-05, "Pretrain/Loss": 2.067593574523926, "Pretrain/Loss (Raw)": 1.9364253282546997, "Pretrain/Step": 4495, "Pretrain/Step Time": 8.437951957806945} +{"Pretrain/Learning Rate": 4.465252012253972e-05, "Pretrain/Loss": 2.066239595413208, "Pretrain/Loss (Raw)": 2.00325345993042, "Pretrain/Step": 4496, "Pretrain/Step Time": 8.436517503112555} +{"Pretrain/Learning Rate": 4.464989590927023e-05, "Pretrain/Loss": 2.066486358642578, "Pretrain/Loss (Raw)": 2.123950481414795, "Pretrain/Step": 4497, "Pretrain/Step Time": 8.437800792977214} +{"Pretrain/Learning Rate": 4.464727112940986e-05, "Pretrain/Loss": 2.065422773361206, "Pretrain/Loss (Raw)": 2.052605152130127, "Pretrain/Step": 4498, "Pretrain/Step Time": 8.439032342284918} +{"Pretrain/Learning Rate": 4.464464578303427e-05, "Pretrain/Loss": 2.065523147583008, "Pretrain/Loss (Raw)": 2.1680123805999756, "Pretrain/Step": 4499, "Pretrain/Step Time": 8.443661831319332} +{"Pretrain/Learning Rate": 4.464201987021917e-05, "Pretrain/Loss": 2.0669729709625244, "Pretrain/Loss (Raw)": 2.23421311378479, "Pretrain/Step": 4500, "Pretrain/Step Time": 8.445735735818744} +{"Pretrain/Learning Rate": 4.4639393391040274e-05, "Pretrain/Loss": 2.06674861907959, "Pretrain/Loss (Raw)": 2.0149893760681152, "Pretrain/Step": 4501, "Pretrain/Step Time": 8.441022733226418} +{"Pretrain/Learning Rate": 4.463676634557331e-05, "Pretrain/Loss": 2.066312313079834, "Pretrain/Loss (Raw)": 2.0292651653289795, "Pretrain/Step": 4502, "Pretrain/Step Time": 8.44038661941886} +{"Pretrain/Learning Rate": 4.463413873389403e-05, "Pretrain/Loss": 2.0651702880859375, "Pretrain/Loss (Raw)": 1.940606951713562, "Pretrain/Step": 4503, "Pretrain/Step Time": 8.43808650225401} +{"Pretrain/Learning Rate": 4.46315105560782e-05, "Pretrain/Loss": 2.06503963470459, "Pretrain/Loss (Raw)": 2.019113302230835, "Pretrain/Step": 4504, "Pretrain/Step Time": 8.439319923520088} +{"Pretrain/Learning Rate": 4.4628881812201614e-05, "Pretrain/Loss": 2.0695903301239014, "Pretrain/Loss (Raw)": 2.512000799179077, "Pretrain/Step": 4505, "Pretrain/Step Time": 8.439372580498457} +{"Pretrain/Learning Rate": 4.462625250234005e-05, "Pretrain/Loss": 2.0691075325012207, "Pretrain/Loss (Raw)": 2.0791051387786865, "Pretrain/Step": 4506, "Pretrain/Step Time": 8.448396125808358} +{"Pretrain/Learning Rate": 4.462362262656933e-05, "Pretrain/Loss": 2.0715091228485107, "Pretrain/Loss (Raw)": 2.09332013130188, "Pretrain/Step": 4507, "Pretrain/Step Time": 8.454444201663136} +{"Pretrain/Learning Rate": 4.4620992184965294e-05, "Pretrain/Loss": 2.070723056793213, "Pretrain/Loss (Raw)": 1.9198994636535645, "Pretrain/Step": 4508, "Pretrain/Step Time": 8.451907513663173} +{"Pretrain/Learning Rate": 4.4618361177603774e-05, "Pretrain/Loss": 2.069286346435547, "Pretrain/Loss (Raw)": 1.851979374885559, "Pretrain/Step": 4509, "Pretrain/Step Time": 8.447261955589056} +{"Pretrain/Learning Rate": 4.461572960456064e-05, "Pretrain/Loss": 2.067659854888916, "Pretrain/Loss (Raw)": 1.9843196868896484, "Pretrain/Step": 4510, "Pretrain/Step Time": 8.444916024804115} +{"Pretrain/Learning Rate": 4.461309746591177e-05, "Pretrain/Loss": 2.069554567337036, "Pretrain/Loss (Raw)": 2.331362009048462, "Pretrain/Step": 4511, "Pretrain/Step Time": 8.445274349302053} +{"Pretrain/Learning Rate": 4.4610464761733054e-05, "Pretrain/Loss": 2.0688910484313965, "Pretrain/Loss (Raw)": 2.109591245651245, "Pretrain/Step": 4512, "Pretrain/Step Time": 8.448700189590454} +{"Pretrain/Learning Rate": 4.460783149210042e-05, "Pretrain/Loss": 2.0680429935455322, "Pretrain/Loss (Raw)": 1.942219614982605, "Pretrain/Step": 4513, "Pretrain/Step Time": 8.45130524970591} +{"Pretrain/Learning Rate": 4.460519765708979e-05, "Pretrain/Loss": 2.066044569015503, "Pretrain/Loss (Raw)": 2.092374086380005, "Pretrain/Step": 4514, "Pretrain/Step Time": 8.447886617854238} +{"Pretrain/Learning Rate": 4.4602563256777094e-05, "Pretrain/Loss": 2.0646138191223145, "Pretrain/Loss (Raw)": 1.9536913633346558, "Pretrain/Step": 4515, "Pretrain/Step Time": 8.448405433446169} +{"Pretrain/Learning Rate": 4.459992829123832e-05, "Pretrain/Loss": 2.0641987323760986, "Pretrain/Loss (Raw)": 2.0315916538238525, "Pretrain/Step": 4516, "Pretrain/Step Time": 8.44668392650783} +{"Pretrain/Learning Rate": 4.4597292760549425e-05, "Pretrain/Loss": 2.064236879348755, "Pretrain/Loss (Raw)": 2.1375646591186523, "Pretrain/Step": 4517, "Pretrain/Step Time": 8.447096521034837} +{"Pretrain/Learning Rate": 4.4594656664786404e-05, "Pretrain/Loss": 2.064180850982666, "Pretrain/Loss (Raw)": 1.9702893495559692, "Pretrain/Step": 4518, "Pretrain/Step Time": 8.444924203678966} +{"Pretrain/Learning Rate": 4.459202000402528e-05, "Pretrain/Loss": 2.063778877258301, "Pretrain/Loss (Raw)": 2.0948331356048584, "Pretrain/Step": 4519, "Pretrain/Step Time": 8.443592488765717} +{"Pretrain/Learning Rate": 4.458938277834206e-05, "Pretrain/Loss": 2.061336040496826, "Pretrain/Loss (Raw)": 1.913010835647583, "Pretrain/Step": 4520, "Pretrain/Step Time": 8.441015059128404} +{"Pretrain/Learning Rate": 4.458674498781281e-05, "Pretrain/Loss": 2.060224771499634, "Pretrain/Loss (Raw)": 2.087390661239624, "Pretrain/Step": 4521, "Pretrain/Step Time": 8.443811984732747} +{"Pretrain/Learning Rate": 4.458410663251357e-05, "Pretrain/Loss": 2.0591838359832764, "Pretrain/Loss (Raw)": 1.9721362590789795, "Pretrain/Step": 4522, "Pretrain/Step Time": 8.446352828294039} +{"Pretrain/Learning Rate": 4.458146771252041e-05, "Pretrain/Loss": 2.057922840118408, "Pretrain/Loss (Raw)": 2.09358286857605, "Pretrain/Step": 4523, "Pretrain/Step Time": 8.45260670222342} +{"Pretrain/Learning Rate": 4.4578828227909445e-05, "Pretrain/Loss": 2.0596344470977783, "Pretrain/Loss (Raw)": 2.2845218181610107, "Pretrain/Step": 4524, "Pretrain/Step Time": 8.450070098042488} +{"Pretrain/Learning Rate": 4.457618817875677e-05, "Pretrain/Loss": 2.060554027557373, "Pretrain/Loss (Raw)": 2.1606638431549072, "Pretrain/Step": 4525, "Pretrain/Step Time": 8.450828447937965} +{"Pretrain/Learning Rate": 4.457354756513851e-05, "Pretrain/Loss": 2.061044216156006, "Pretrain/Loss (Raw)": 2.2349448204040527, "Pretrain/Step": 4526, "Pretrain/Step Time": 8.449682103469968} +{"Pretrain/Learning Rate": 4.45709063871308e-05, "Pretrain/Loss": 2.0638866424560547, "Pretrain/Loss (Raw)": 2.0845797061920166, "Pretrain/Step": 4527, "Pretrain/Step Time": 8.443834327161312} +{"Pretrain/Learning Rate": 4.45682646448098e-05, "Pretrain/Loss": 2.066570281982422, "Pretrain/Loss (Raw)": 2.0696921348571777, "Pretrain/Step": 4528, "Pretrain/Step Time": 8.441358970478177} +{"Pretrain/Learning Rate": 4.456562233825169e-05, "Pretrain/Loss": 2.0686893463134766, "Pretrain/Loss (Raw)": 2.224977970123291, "Pretrain/Step": 4529, "Pretrain/Step Time": 8.446583423763514} +{"Pretrain/Learning Rate": 4.4562979467532645e-05, "Pretrain/Loss": 2.0657646656036377, "Pretrain/Loss (Raw)": 1.8528873920440674, "Pretrain/Step": 4530, "Pretrain/Step Time": 8.449204625561833} +{"Pretrain/Learning Rate": 4.456033603272888e-05, "Pretrain/Loss": 2.0645625591278076, "Pretrain/Loss (Raw)": 2.0711588859558105, "Pretrain/Step": 4531, "Pretrain/Step Time": 8.450757414102554} +{"Pretrain/Learning Rate": 4.455769203391662e-05, "Pretrain/Loss": 2.064929723739624, "Pretrain/Loss (Raw)": 2.1388731002807617, "Pretrain/Step": 4532, "Pretrain/Step Time": 8.447976808995008} +{"Pretrain/Learning Rate": 4.455504747117209e-05, "Pretrain/Loss": 2.0657668113708496, "Pretrain/Loss (Raw)": 2.0827901363372803, "Pretrain/Step": 4533, "Pretrain/Step Time": 8.448892952874303} +{"Pretrain/Learning Rate": 4.4552402344571556e-05, "Pretrain/Loss": 2.0647077560424805, "Pretrain/Loss (Raw)": 1.9574501514434814, "Pretrain/Step": 4534, "Pretrain/Step Time": 8.451688837260008} +{"Pretrain/Learning Rate": 4.4549756654191285e-05, "Pretrain/Loss": 2.0648276805877686, "Pretrain/Loss (Raw)": 2.0818827152252197, "Pretrain/Step": 4535, "Pretrain/Step Time": 8.450010878965259} +{"Pretrain/Learning Rate": 4.454711040010756e-05, "Pretrain/Loss": 2.0657243728637695, "Pretrain/Loss (Raw)": 2.020597457885742, "Pretrain/Step": 4536, "Pretrain/Step Time": 8.445789080113173} +{"Pretrain/Learning Rate": 4.454446358239669e-05, "Pretrain/Loss": 2.0663750171661377, "Pretrain/Loss (Raw)": 2.197605848312378, "Pretrain/Step": 4537, "Pretrain/Step Time": 8.449068425223231} +{"Pretrain/Learning Rate": 4.454181620113499e-05, "Pretrain/Loss": 2.0653162002563477, "Pretrain/Loss (Raw)": 1.8445303440093994, "Pretrain/Step": 4538, "Pretrain/Step Time": 8.448579436168075} +{"Pretrain/Learning Rate": 4.453916825639879e-05, "Pretrain/Loss": 2.065347194671631, "Pretrain/Loss (Raw)": 2.235503673553467, "Pretrain/Step": 4539, "Pretrain/Step Time": 8.446644451469183} +{"Pretrain/Learning Rate": 4.453651974826445e-05, "Pretrain/Loss": 2.0648064613342285, "Pretrain/Loss (Raw)": 1.879409909248352, "Pretrain/Step": 4540, "Pretrain/Step Time": 8.447413863614202} +{"Pretrain/Learning Rate": 4.4533870676808336e-05, "Pretrain/Loss": 2.066115379333496, "Pretrain/Loss (Raw)": 2.0962095260620117, "Pretrain/Step": 4541, "Pretrain/Step Time": 8.444335190579295} +{"Pretrain/Learning Rate": 4.453122104210683e-05, "Pretrain/Loss": 2.0688486099243164, "Pretrain/Loss (Raw)": 2.3511669635772705, "Pretrain/Step": 4542, "Pretrain/Step Time": 8.4460882935673} +{"Pretrain/Learning Rate": 4.452857084423634e-05, "Pretrain/Loss": 2.0688278675079346, "Pretrain/Loss (Raw)": 2.0929837226867676, "Pretrain/Step": 4543, "Pretrain/Step Time": 8.435787081718445} +{"Pretrain/Learning Rate": 4.452592008327327e-05, "Pretrain/Loss": 2.070997714996338, "Pretrain/Loss (Raw)": 2.2418789863586426, "Pretrain/Step": 4544, "Pretrain/Step Time": 8.434425162151456} +{"Pretrain/Learning Rate": 4.452326875929407e-05, "Pretrain/Loss": 2.0698142051696777, "Pretrain/Loss (Raw)": 2.0180656909942627, "Pretrain/Step": 4545, "Pretrain/Step Time": 8.437500627711415} +{"Pretrain/Learning Rate": 4.452061687237516e-05, "Pretrain/Loss": 2.0692355632781982, "Pretrain/Loss (Raw)": 1.9357776641845703, "Pretrain/Step": 4546, "Pretrain/Step Time": 8.438580917194486} +{"Pretrain/Learning Rate": 4.4517964422593036e-05, "Pretrain/Loss": 2.0663514137268066, "Pretrain/Loss (Raw)": 1.8779268264770508, "Pretrain/Step": 4547, "Pretrain/Step Time": 8.441783057525754} +{"Pretrain/Learning Rate": 4.451531141002416e-05, "Pretrain/Loss": 2.065861225128174, "Pretrain/Loss (Raw)": 2.104809045791626, "Pretrain/Step": 4548, "Pretrain/Step Time": 8.437091009691358} +{"Pretrain/Learning Rate": 4.451265783474505e-05, "Pretrain/Loss": 2.066352367401123, "Pretrain/Loss (Raw)": 2.0817501544952393, "Pretrain/Step": 4549, "Pretrain/Step Time": 8.43620540946722} +{"Pretrain/Learning Rate": 4.45100036968322e-05, "Pretrain/Loss": 2.0672173500061035, "Pretrain/Loss (Raw)": 2.186701774597168, "Pretrain/Step": 4550, "Pretrain/Step Time": 8.44015052728355} +{"Pretrain/Learning Rate": 4.450734899636214e-05, "Pretrain/Loss": 2.066403865814209, "Pretrain/Loss (Raw)": 2.0984086990356445, "Pretrain/Step": 4551, "Pretrain/Step Time": 8.436788611114025} +{"Pretrain/Learning Rate": 4.450469373341143e-05, "Pretrain/Loss": 2.064910888671875, "Pretrain/Loss (Raw)": 2.0756540298461914, "Pretrain/Step": 4552, "Pretrain/Step Time": 8.436573628336191} +{"Pretrain/Learning Rate": 4.4502037908056626e-05, "Pretrain/Loss": 2.0636491775512695, "Pretrain/Loss (Raw)": 2.0151939392089844, "Pretrain/Step": 4553, "Pretrain/Step Time": 8.443625761196017} +{"Pretrain/Learning Rate": 4.449938152037431e-05, "Pretrain/Loss": 2.0643439292907715, "Pretrain/Loss (Raw)": 2.0894370079040527, "Pretrain/Step": 4554, "Pretrain/Step Time": 8.443111084401608} +{"Pretrain/Learning Rate": 4.449672457044107e-05, "Pretrain/Loss": 2.0621275901794434, "Pretrain/Loss (Raw)": 1.7817057371139526, "Pretrain/Step": 4555, "Pretrain/Step Time": 8.441489296033978} +{"Pretrain/Learning Rate": 4.4494067058333514e-05, "Pretrain/Loss": 2.0605316162109375, "Pretrain/Loss (Raw)": 1.9117558002471924, "Pretrain/Step": 4556, "Pretrain/Step Time": 8.44767078757286} +{"Pretrain/Learning Rate": 4.4491408984128293e-05, "Pretrain/Loss": 2.063013792037964, "Pretrain/Loss (Raw)": 2.3780884742736816, "Pretrain/Step": 4557, "Pretrain/Step Time": 8.445075254887342} +{"Pretrain/Learning Rate": 4.448875034790202e-05, "Pretrain/Loss": 2.0650787353515625, "Pretrain/Loss (Raw)": 2.284684896469116, "Pretrain/Step": 4558, "Pretrain/Step Time": 8.44660597294569} +{"Pretrain/Learning Rate": 4.448609114973138e-05, "Pretrain/Loss": 2.062652587890625, "Pretrain/Loss (Raw)": 1.874090552330017, "Pretrain/Step": 4559, "Pretrain/Step Time": 8.439972039312124} +{"Pretrain/Learning Rate": 4.448343138969303e-05, "Pretrain/Loss": 2.065272331237793, "Pretrain/Loss (Raw)": 2.4996700286865234, "Pretrain/Step": 4560, "Pretrain/Step Time": 8.43598759174347} +{"Pretrain/Learning Rate": 4.448077106786367e-05, "Pretrain/Loss": 2.0655455589294434, "Pretrain/Loss (Raw)": 1.970418095588684, "Pretrain/Step": 4561, "Pretrain/Step Time": 8.435785816982388} +{"Pretrain/Learning Rate": 4.447811018432002e-05, "Pretrain/Loss": 2.0631508827209473, "Pretrain/Loss (Raw)": 1.8715723752975464, "Pretrain/Step": 4562, "Pretrain/Step Time": 8.437186492606997} +{"Pretrain/Learning Rate": 4.447544873913878e-05, "Pretrain/Loss": 2.065570831298828, "Pretrain/Loss (Raw)": 2.1813461780548096, "Pretrain/Step": 4563, "Pretrain/Step Time": 8.444158425554633} +{"Pretrain/Learning Rate": 4.447278673239672e-05, "Pretrain/Loss": 2.0649685859680176, "Pretrain/Loss (Raw)": 1.993432879447937, "Pretrain/Step": 4564, "Pretrain/Step Time": 8.441942740231752} +{"Pretrain/Learning Rate": 4.447012416417057e-05, "Pretrain/Loss": 2.064314603805542, "Pretrain/Loss (Raw)": 1.9408248662948608, "Pretrain/Step": 4565, "Pretrain/Step Time": 8.442449601367116} +{"Pretrain/Learning Rate": 4.4467461034537125e-05, "Pretrain/Loss": 2.0634799003601074, "Pretrain/Loss (Raw)": 2.1169514656066895, "Pretrain/Step": 4566, "Pretrain/Step Time": 8.443697966635227} +{"Pretrain/Learning Rate": 4.446479734357316e-05, "Pretrain/Loss": 2.063016414642334, "Pretrain/Loss (Raw)": 2.1394100189208984, "Pretrain/Step": 4567, "Pretrain/Step Time": 8.447558250278234} +{"Pretrain/Learning Rate": 4.4462133091355484e-05, "Pretrain/Loss": 2.0635766983032227, "Pretrain/Loss (Raw)": 2.1504006385803223, "Pretrain/Step": 4568, "Pretrain/Step Time": 8.447925791144371} +{"Pretrain/Learning Rate": 4.445946827796092e-05, "Pretrain/Loss": 2.064840316772461, "Pretrain/Loss (Raw)": 2.220828056335449, "Pretrain/Step": 4569, "Pretrain/Step Time": 8.450342439115047} +{"Pretrain/Learning Rate": 4.4456802903466304e-05, "Pretrain/Loss": 2.064492702484131, "Pretrain/Loss (Raw)": 2.093301296234131, "Pretrain/Step": 4570, "Pretrain/Step Time": 8.454896224662662} +{"Pretrain/Learning Rate": 4.44541369679485e-05, "Pretrain/Loss": 2.0649938583374023, "Pretrain/Loss (Raw)": 2.008046865463257, "Pretrain/Step": 4571, "Pretrain/Step Time": 8.452940881252289} +{"Pretrain/Learning Rate": 4.445147047148436e-05, "Pretrain/Loss": 2.0620670318603516, "Pretrain/Loss (Raw)": 1.9431967735290527, "Pretrain/Step": 4572, "Pretrain/Step Time": 8.455369159579277} +{"Pretrain/Learning Rate": 4.444880341415079e-05, "Pretrain/Loss": 2.061325788497925, "Pretrain/Loss (Raw)": 2.0027873516082764, "Pretrain/Step": 4573, "Pretrain/Step Time": 8.453850105404854} +{"Pretrain/Learning Rate": 4.444613579602469e-05, "Pretrain/Loss": 2.060669422149658, "Pretrain/Loss (Raw)": 2.1139895915985107, "Pretrain/Step": 4574, "Pretrain/Step Time": 8.456576818600297} +{"Pretrain/Learning Rate": 4.444346761718295e-05, "Pretrain/Loss": 2.058488368988037, "Pretrain/Loss (Raw)": 1.8689202070236206, "Pretrain/Step": 4575, "Pretrain/Step Time": 8.449107317253947} +{"Pretrain/Learning Rate": 4.444079887770255e-05, "Pretrain/Loss": 2.058687925338745, "Pretrain/Loss (Raw)": 1.9916564226150513, "Pretrain/Step": 4576, "Pretrain/Step Time": 8.449511369690299} +{"Pretrain/Learning Rate": 4.4438129577660414e-05, "Pretrain/Loss": 2.059743642807007, "Pretrain/Loss (Raw)": 2.110220193862915, "Pretrain/Step": 4577, "Pretrain/Step Time": 8.44540686532855} +{"Pretrain/Learning Rate": 4.443545971713351e-05, "Pretrain/Loss": 2.061614990234375, "Pretrain/Loss (Raw)": 2.148000478744507, "Pretrain/Step": 4578, "Pretrain/Step Time": 8.447283184155822} +{"Pretrain/Learning Rate": 4.443278929619883e-05, "Pretrain/Loss": 2.0603365898132324, "Pretrain/Loss (Raw)": 1.9744243621826172, "Pretrain/Step": 4579, "Pretrain/Step Time": 8.451790360733867} +{"Pretrain/Learning Rate": 4.443011831493337e-05, "Pretrain/Loss": 2.0641279220581055, "Pretrain/Loss (Raw)": 2.309203863143921, "Pretrain/Step": 4580, "Pretrain/Step Time": 8.448903663083911} +{"Pretrain/Learning Rate": 4.442744677341414e-05, "Pretrain/Loss": 2.064852714538574, "Pretrain/Loss (Raw)": 2.1846091747283936, "Pretrain/Step": 4581, "Pretrain/Step Time": 8.449892425909638} +{"Pretrain/Learning Rate": 4.442477467171819e-05, "Pretrain/Loss": 2.0623934268951416, "Pretrain/Loss (Raw)": 2.0500986576080322, "Pretrain/Step": 4582, "Pretrain/Step Time": 8.44830759242177} +{"Pretrain/Learning Rate": 4.4422102009922545e-05, "Pretrain/Loss": 2.0636463165283203, "Pretrain/Loss (Raw)": 2.023956537246704, "Pretrain/Step": 4583, "Pretrain/Step Time": 8.45147100649774} +{"Pretrain/Learning Rate": 4.441942878810428e-05, "Pretrain/Loss": 2.064396858215332, "Pretrain/Loss (Raw)": 2.0987815856933594, "Pretrain/Step": 4584, "Pretrain/Step Time": 8.45156549103558} +{"Pretrain/Learning Rate": 4.4416755006340484e-05, "Pretrain/Loss": 2.063749074935913, "Pretrain/Loss (Raw)": 2.0725021362304688, "Pretrain/Step": 4585, "Pretrain/Step Time": 8.454826172441244} +{"Pretrain/Learning Rate": 4.4414080664708235e-05, "Pretrain/Loss": 2.063107967376709, "Pretrain/Loss (Raw)": 2.008655071258545, "Pretrain/Step": 4586, "Pretrain/Step Time": 8.447551731020212} +{"Pretrain/Learning Rate": 4.4411405763284665e-05, "Pretrain/Loss": 2.0629656314849854, "Pretrain/Loss (Raw)": 2.1336677074432373, "Pretrain/Step": 4587, "Pretrain/Step Time": 8.450053758919239} +{"Pretrain/Learning Rate": 4.440873030214689e-05, "Pretrain/Loss": 2.065080404281616, "Pretrain/Loss (Raw)": 2.250534772872925, "Pretrain/Step": 4588, "Pretrain/Step Time": 8.44987127929926} +{"Pretrain/Learning Rate": 4.4406054281372055e-05, "Pretrain/Loss": 2.0671486854553223, "Pretrain/Loss (Raw)": 2.1654469966888428, "Pretrain/Step": 4589, "Pretrain/Step Time": 8.449064234271646} +{"Pretrain/Learning Rate": 4.440337770103734e-05, "Pretrain/Loss": 2.062772750854492, "Pretrain/Loss (Raw)": 1.7381905317306519, "Pretrain/Step": 4590, "Pretrain/Step Time": 8.453260105103254} +{"Pretrain/Learning Rate": 4.440070056121989e-05, "Pretrain/Loss": 2.062575101852417, "Pretrain/Loss (Raw)": 1.961180329322815, "Pretrain/Step": 4591, "Pretrain/Step Time": 8.447271130979061} +{"Pretrain/Learning Rate": 4.439802286199693e-05, "Pretrain/Loss": 2.06250262260437, "Pretrain/Loss (Raw)": 2.15195631980896, "Pretrain/Step": 4592, "Pretrain/Step Time": 8.44444072060287} +{"Pretrain/Learning Rate": 4.4395344603445644e-05, "Pretrain/Loss": 2.0630359649658203, "Pretrain/Loss (Raw)": 2.198554039001465, "Pretrain/Step": 4593, "Pretrain/Step Time": 8.441523689776659} +{"Pretrain/Learning Rate": 4.4392665785643276e-05, "Pretrain/Loss": 2.0611085891723633, "Pretrain/Loss (Raw)": 1.7976585626602173, "Pretrain/Step": 4594, "Pretrain/Step Time": 8.440274145454168} +{"Pretrain/Learning Rate": 4.438998640866705e-05, "Pretrain/Loss": 2.063037872314453, "Pretrain/Loss (Raw)": 2.1197903156280518, "Pretrain/Step": 4595, "Pretrain/Step Time": 8.443287178874016} +{"Pretrain/Learning Rate": 4.4387306472594244e-05, "Pretrain/Loss": 2.0625011920928955, "Pretrain/Loss (Raw)": 2.151827812194824, "Pretrain/Step": 4596, "Pretrain/Step Time": 8.443503636866808} +{"Pretrain/Learning Rate": 4.438462597750213e-05, "Pretrain/Loss": 2.062206983566284, "Pretrain/Loss (Raw)": 1.9309669733047485, "Pretrain/Step": 4597, "Pretrain/Step Time": 8.446472788229585} +{"Pretrain/Learning Rate": 4.438194492346798e-05, "Pretrain/Loss": 2.062534809112549, "Pretrain/Loss (Raw)": 2.0797042846679688, "Pretrain/Step": 4598, "Pretrain/Step Time": 8.447308350354433} +{"Pretrain/Learning Rate": 4.437926331056912e-05, "Pretrain/Loss": 2.061859607696533, "Pretrain/Loss (Raw)": 2.0685274600982666, "Pretrain/Step": 4599, "Pretrain/Step Time": 8.447072580456734} +{"Pretrain/Learning Rate": 4.4376581138882855e-05, "Pretrain/Loss": 2.059670925140381, "Pretrain/Loss (Raw)": 1.967341423034668, "Pretrain/Step": 4600, "Pretrain/Step Time": 8.445011662319303} +{"Pretrain/Learning Rate": 4.437389840848654e-05, "Pretrain/Loss": 2.059607744216919, "Pretrain/Loss (Raw)": 1.9269651174545288, "Pretrain/Step": 4601, "Pretrain/Step Time": 8.447022665292025} +{"Pretrain/Learning Rate": 4.437121511945752e-05, "Pretrain/Loss": 2.0603246688842773, "Pretrain/Loss (Raw)": 1.923685073852539, "Pretrain/Step": 4602, "Pretrain/Step Time": 8.447194159030914} +{"Pretrain/Learning Rate": 4.436853127187316e-05, "Pretrain/Loss": 2.0617434978485107, "Pretrain/Loss (Raw)": 2.0923385620117188, "Pretrain/Step": 4603, "Pretrain/Step Time": 8.453213645145297} +{"Pretrain/Learning Rate": 4.436584686581087e-05, "Pretrain/Loss": 2.0628914833068848, "Pretrain/Loss (Raw)": 2.2091498374938965, "Pretrain/Step": 4604, "Pretrain/Step Time": 8.453471835702658} +{"Pretrain/Learning Rate": 4.436316190134802e-05, "Pretrain/Loss": 2.0638716220855713, "Pretrain/Loss (Raw)": 2.267015218734741, "Pretrain/Step": 4605, "Pretrain/Step Time": 8.454366764053702} +{"Pretrain/Learning Rate": 4.4360476378562054e-05, "Pretrain/Loss": 2.0654547214508057, "Pretrain/Loss (Raw)": 2.101832628250122, "Pretrain/Step": 4606, "Pretrain/Step Time": 8.448489170521498} +{"Pretrain/Learning Rate": 4.43577902975304e-05, "Pretrain/Loss": 2.0643041133880615, "Pretrain/Loss (Raw)": 2.0561916828155518, "Pretrain/Step": 4607, "Pretrain/Step Time": 8.448279354721308} +{"Pretrain/Learning Rate": 4.435510365833051e-05, "Pretrain/Loss": 2.0623416900634766, "Pretrain/Loss (Raw)": 2.0561680793762207, "Pretrain/Step": 4608, "Pretrain/Step Time": 8.441835848614573} +{"Pretrain/Learning Rate": 4.435241646103986e-05, "Pretrain/Loss": 2.0624451637268066, "Pretrain/Loss (Raw)": 2.022874355316162, "Pretrain/Step": 4609, "Pretrain/Step Time": 8.44462126120925} +{"Pretrain/Learning Rate": 4.434972870573591e-05, "Pretrain/Loss": 2.063441753387451, "Pretrain/Loss (Raw)": 2.117609977722168, "Pretrain/Step": 4610, "Pretrain/Step Time": 8.439575089141726} +{"Pretrain/Learning Rate": 4.434704039249618e-05, "Pretrain/Loss": 2.0645546913146973, "Pretrain/Loss (Raw)": 2.0708720684051514, "Pretrain/Step": 4611, "Pretrain/Step Time": 8.443658540025353} +{"Pretrain/Learning Rate": 4.434435152139817e-05, "Pretrain/Loss": 2.0646910667419434, "Pretrain/Loss (Raw)": 2.129551887512207, "Pretrain/Step": 4612, "Pretrain/Step Time": 8.444987995550036} +{"Pretrain/Learning Rate": 4.434166209251943e-05, "Pretrain/Loss": 2.0654056072235107, "Pretrain/Loss (Raw)": 2.094404935836792, "Pretrain/Step": 4613, "Pretrain/Step Time": 8.446812653914094} +{"Pretrain/Learning Rate": 4.43389721059375e-05, "Pretrain/Loss": 2.065728187561035, "Pretrain/Loss (Raw)": 2.150644540786743, "Pretrain/Step": 4614, "Pretrain/Step Time": 8.44615570642054} +{"Pretrain/Learning Rate": 4.433628156172994e-05, "Pretrain/Loss": 2.0635416507720947, "Pretrain/Loss (Raw)": 1.852708101272583, "Pretrain/Step": 4615, "Pretrain/Step Time": 8.446861542761326} +{"Pretrain/Learning Rate": 4.4333590459974335e-05, "Pretrain/Loss": 2.0635733604431152, "Pretrain/Loss (Raw)": 1.990807294845581, "Pretrain/Step": 4616, "Pretrain/Step Time": 8.446436515077949} +{"Pretrain/Learning Rate": 4.433089880074827e-05, "Pretrain/Loss": 2.064115047454834, "Pretrain/Loss (Raw)": 2.106001377105713, "Pretrain/Step": 4617, "Pretrain/Step Time": 8.446513291448355} +{"Pretrain/Learning Rate": 4.4328206584129374e-05, "Pretrain/Loss": 2.0642683506011963, "Pretrain/Loss (Raw)": 2.1179699897766113, "Pretrain/Step": 4618, "Pretrain/Step Time": 8.44788788817823} +{"Pretrain/Learning Rate": 4.4325513810195264e-05, "Pretrain/Loss": 2.0648438930511475, "Pretrain/Loss (Raw)": 1.8961169719696045, "Pretrain/Step": 4619, "Pretrain/Step Time": 8.445110335946083} +{"Pretrain/Learning Rate": 4.432282047902358e-05, "Pretrain/Loss": 2.0680947303771973, "Pretrain/Loss (Raw)": 2.219120502471924, "Pretrain/Step": 4620, "Pretrain/Step Time": 8.44678301922977} +{"Pretrain/Learning Rate": 4.4320126590692e-05, "Pretrain/Loss": 2.068173885345459, "Pretrain/Loss (Raw)": 1.964457392692566, "Pretrain/Step": 4621, "Pretrain/Step Time": 8.449167193844914} +{"Pretrain/Learning Rate": 4.431743214527818e-05, "Pretrain/Loss": 2.0708370208740234, "Pretrain/Loss (Raw)": 2.287064552307129, "Pretrain/Step": 4622, "Pretrain/Step Time": 8.44744118116796} +{"Pretrain/Learning Rate": 4.431473714285983e-05, "Pretrain/Loss": 2.072789192199707, "Pretrain/Loss (Raw)": 2.186279296875, "Pretrain/Step": 4623, "Pretrain/Step Time": 8.444951724261045} +{"Pretrain/Learning Rate": 4.4312041583514645e-05, "Pretrain/Loss": 2.070885181427002, "Pretrain/Loss (Raw)": 1.7595340013504028, "Pretrain/Step": 4624, "Pretrain/Step Time": 8.451172420755029} +{"Pretrain/Learning Rate": 4.4309345467320365e-05, "Pretrain/Loss": 2.071413993835449, "Pretrain/Loss (Raw)": 2.1916611194610596, "Pretrain/Step": 4625, "Pretrain/Step Time": 8.447559604421258} +{"Pretrain/Learning Rate": 4.4306648794354706e-05, "Pretrain/Loss": 2.0720198154449463, "Pretrain/Loss (Raw)": 2.130126476287842, "Pretrain/Step": 4626, "Pretrain/Step Time": 8.447327468544245} +{"Pretrain/Learning Rate": 4.430395156469545e-05, "Pretrain/Loss": 2.0727670192718506, "Pretrain/Loss (Raw)": 2.263652801513672, "Pretrain/Step": 4627, "Pretrain/Step Time": 8.444977467879653} +{"Pretrain/Learning Rate": 4.430125377842035e-05, "Pretrain/Loss": 2.0717220306396484, "Pretrain/Loss (Raw)": 2.1004490852355957, "Pretrain/Step": 4628, "Pretrain/Step Time": 8.443031648173928} +{"Pretrain/Learning Rate": 4.429855543560721e-05, "Pretrain/Loss": 2.0718727111816406, "Pretrain/Loss (Raw)": 2.034282684326172, "Pretrain/Step": 4629, "Pretrain/Step Time": 8.443712908774614} +{"Pretrain/Learning Rate": 4.4295856536333825e-05, "Pretrain/Loss": 2.0712883472442627, "Pretrain/Loss (Raw)": 1.9544857740402222, "Pretrain/Step": 4630, "Pretrain/Step Time": 8.449178852140903} +{"Pretrain/Learning Rate": 4.429315708067802e-05, "Pretrain/Loss": 2.071568489074707, "Pretrain/Loss (Raw)": 1.9764785766601562, "Pretrain/Step": 4631, "Pretrain/Step Time": 8.44683955796063} +{"Pretrain/Learning Rate": 4.4290457068717636e-05, "Pretrain/Loss": 2.072247266769409, "Pretrain/Loss (Raw)": 2.10598087310791, "Pretrain/Step": 4632, "Pretrain/Step Time": 8.444210475310683} +{"Pretrain/Learning Rate": 4.428775650053052e-05, "Pretrain/Loss": 2.067183494567871, "Pretrain/Loss (Raw)": 1.8638559579849243, "Pretrain/Step": 4633, "Pretrain/Step Time": 8.44566042535007} +{"Pretrain/Learning Rate": 4.428505537619454e-05, "Pretrain/Loss": 2.066307783126831, "Pretrain/Loss (Raw)": 1.966977596282959, "Pretrain/Step": 4634, "Pretrain/Step Time": 8.443048493936658} +{"Pretrain/Learning Rate": 4.4282353695787584e-05, "Pretrain/Loss": 2.0673599243164062, "Pretrain/Loss (Raw)": 2.2279961109161377, "Pretrain/Step": 4635, "Pretrain/Step Time": 8.437429247424006} +{"Pretrain/Learning Rate": 4.427965145938755e-05, "Pretrain/Loss": 2.069558620452881, "Pretrain/Loss (Raw)": 2.201322317123413, "Pretrain/Step": 4636, "Pretrain/Step Time": 8.437146931886673} +{"Pretrain/Learning Rate": 4.427694866707236e-05, "Pretrain/Loss": 2.070261240005493, "Pretrain/Loss (Raw)": 1.9419441223144531, "Pretrain/Step": 4637, "Pretrain/Step Time": 8.439512079581618} +{"Pretrain/Learning Rate": 4.4274245318919946e-05, "Pretrain/Loss": 2.071333646774292, "Pretrain/Loss (Raw)": 2.1215808391571045, "Pretrain/Step": 4638, "Pretrain/Step Time": 8.443626530468464} +{"Pretrain/Learning Rate": 4.4271541415008255e-05, "Pretrain/Loss": 2.0684189796447754, "Pretrain/Loss (Raw)": 1.9582695960998535, "Pretrain/Step": 4639, "Pretrain/Step Time": 8.444503009319305} +{"Pretrain/Learning Rate": 4.426883695541525e-05, "Pretrain/Loss": 2.0678110122680664, "Pretrain/Loss (Raw)": 2.0317718982696533, "Pretrain/Step": 4640, "Pretrain/Step Time": 8.438882071524858} +{"Pretrain/Learning Rate": 4.426613194021892e-05, "Pretrain/Loss": 2.0711684226989746, "Pretrain/Loss (Raw)": 2.3719727993011475, "Pretrain/Step": 4641, "Pretrain/Step Time": 8.440660921856761} +{"Pretrain/Learning Rate": 4.426342636949725e-05, "Pretrain/Loss": 2.070725440979004, "Pretrain/Loss (Raw)": 2.0356805324554443, "Pretrain/Step": 4642, "Pretrain/Step Time": 8.43822731077671} +{"Pretrain/Learning Rate": 4.426072024332827e-05, "Pretrain/Loss": 2.0730862617492676, "Pretrain/Loss (Raw)": 2.255866765975952, "Pretrain/Step": 4643, "Pretrain/Step Time": 8.436530226841569} +{"Pretrain/Learning Rate": 4.425801356178999e-05, "Pretrain/Loss": 2.073309898376465, "Pretrain/Loss (Raw)": 2.0602240562438965, "Pretrain/Step": 4644, "Pretrain/Step Time": 8.44204705953598} +{"Pretrain/Learning Rate": 4.425530632496047e-05, "Pretrain/Loss": 2.0724127292633057, "Pretrain/Loss (Raw)": 2.0227248668670654, "Pretrain/Step": 4645, "Pretrain/Step Time": 8.44092615135014} +{"Pretrain/Learning Rate": 4.4252598532917763e-05, "Pretrain/Loss": 2.0717086791992188, "Pretrain/Loss (Raw)": 1.8801764249801636, "Pretrain/Step": 4646, "Pretrain/Step Time": 8.44781151600182} +{"Pretrain/Learning Rate": 4.424989018573996e-05, "Pretrain/Loss": 2.0709939002990723, "Pretrain/Loss (Raw)": 2.0033414363861084, "Pretrain/Step": 4647, "Pretrain/Step Time": 8.450277052819729} +{"Pretrain/Learning Rate": 4.424718128350513e-05, "Pretrain/Loss": 2.072490930557251, "Pretrain/Loss (Raw)": 2.104637861251831, "Pretrain/Step": 4648, "Pretrain/Step Time": 8.446893647313118} +{"Pretrain/Learning Rate": 4.42444718262914e-05, "Pretrain/Loss": 2.0722804069519043, "Pretrain/Loss (Raw)": 2.0604233741760254, "Pretrain/Step": 4649, "Pretrain/Step Time": 8.442462660372257} +{"Pretrain/Learning Rate": 4.42417618141769e-05, "Pretrain/Loss": 2.073814630508423, "Pretrain/Loss (Raw)": 2.168520450592041, "Pretrain/Step": 4650, "Pretrain/Step Time": 8.441185865551233} +{"Pretrain/Learning Rate": 4.423905124723975e-05, "Pretrain/Loss": 2.0711493492126465, "Pretrain/Loss (Raw)": 1.7524343729019165, "Pretrain/Step": 4651, "Pretrain/Step Time": 8.438828622922301} +{"Pretrain/Learning Rate": 4.423634012555813e-05, "Pretrain/Loss": 2.0701630115509033, "Pretrain/Loss (Raw)": 2.1582722663879395, "Pretrain/Step": 4652, "Pretrain/Step Time": 8.440491506829858} +{"Pretrain/Learning Rate": 4.4233628449210194e-05, "Pretrain/Loss": 2.0695390701293945, "Pretrain/Loss (Raw)": 2.0807905197143555, "Pretrain/Step": 4653, "Pretrain/Step Time": 8.44225987419486} +{"Pretrain/Learning Rate": 4.423091621827415e-05, "Pretrain/Loss": 2.068912982940674, "Pretrain/Loss (Raw)": 2.154836654663086, "Pretrain/Step": 4654, "Pretrain/Step Time": 8.438976589590311} +{"Pretrain/Learning Rate": 4.4228203432828184e-05, "Pretrain/Loss": 2.0687029361724854, "Pretrain/Loss (Raw)": 2.0576703548431396, "Pretrain/Step": 4655, "Pretrain/Step Time": 8.444251166656613} +{"Pretrain/Learning Rate": 4.422549009295054e-05, "Pretrain/Loss": 2.0672452449798584, "Pretrain/Loss (Raw)": 1.8831168413162231, "Pretrain/Step": 4656, "Pretrain/Step Time": 8.443596074357629} +{"Pretrain/Learning Rate": 4.4222776198719426e-05, "Pretrain/Loss": 2.0647692680358887, "Pretrain/Loss (Raw)": 1.9080148935317993, "Pretrain/Step": 4657, "Pretrain/Step Time": 8.438589319586754} +{"Pretrain/Learning Rate": 4.422006175021312e-05, "Pretrain/Loss": 2.067124843597412, "Pretrain/Loss (Raw)": 2.1544511318206787, "Pretrain/Step": 4658, "Pretrain/Step Time": 8.441768564283848} +{"Pretrain/Learning Rate": 4.421734674750988e-05, "Pretrain/Loss": 2.0672338008880615, "Pretrain/Loss (Raw)": 2.085078001022339, "Pretrain/Step": 4659, "Pretrain/Step Time": 8.440398110076785} +{"Pretrain/Learning Rate": 4.421463119068801e-05, "Pretrain/Loss": 2.0667405128479004, "Pretrain/Loss (Raw)": 2.0757343769073486, "Pretrain/Step": 4660, "Pretrain/Step Time": 8.441309349611402} +{"Pretrain/Learning Rate": 4.421191507982577e-05, "Pretrain/Loss": 2.0663623809814453, "Pretrain/Loss (Raw)": 2.034369707107544, "Pretrain/Step": 4661, "Pretrain/Step Time": 8.441890375688672} +{"Pretrain/Learning Rate": 4.420919841500152e-05, "Pretrain/Loss": 2.065498113632202, "Pretrain/Loss (Raw)": 1.8468643426895142, "Pretrain/Step": 4662, "Pretrain/Step Time": 8.447555903345346} +{"Pretrain/Learning Rate": 4.420648119629357e-05, "Pretrain/Loss": 2.064033031463623, "Pretrain/Loss (Raw)": 1.894336462020874, "Pretrain/Step": 4663, "Pretrain/Step Time": 8.449243450537324} +{"Pretrain/Learning Rate": 4.420376342378027e-05, "Pretrain/Loss": 2.0658376216888428, "Pretrain/Loss (Raw)": 2.2515993118286133, "Pretrain/Step": 4664, "Pretrain/Step Time": 8.448305618017912} +{"Pretrain/Learning Rate": 4.420104509753999e-05, "Pretrain/Loss": 2.0665321350097656, "Pretrain/Loss (Raw)": 2.2864797115325928, "Pretrain/Step": 4665, "Pretrain/Step Time": 8.45309673808515} +{"Pretrain/Learning Rate": 4.419832621765112e-05, "Pretrain/Loss": 2.0684616565704346, "Pretrain/Loss (Raw)": 2.0915255546569824, "Pretrain/Step": 4666, "Pretrain/Step Time": 8.452013418078423} +{"Pretrain/Learning Rate": 4.419560678419203e-05, "Pretrain/Loss": 2.067349910736084, "Pretrain/Loss (Raw)": 2.0932178497314453, "Pretrain/Step": 4667, "Pretrain/Step Time": 8.453026792034507} +{"Pretrain/Learning Rate": 4.419288679724117e-05, "Pretrain/Loss": 2.0674405097961426, "Pretrain/Loss (Raw)": 1.8909856081008911, "Pretrain/Step": 4668, "Pretrain/Step Time": 8.46184553578496} +{"Pretrain/Learning Rate": 4.419016625687694e-05, "Pretrain/Loss": 2.0668625831604004, "Pretrain/Loss (Raw)": 2.0222485065460205, "Pretrain/Step": 4669, "Pretrain/Step Time": 8.459983499720693} +{"Pretrain/Learning Rate": 4.418744516317779e-05, "Pretrain/Loss": 2.0658035278320312, "Pretrain/Loss (Raw)": 2.215592384338379, "Pretrain/Step": 4670, "Pretrain/Step Time": 8.46945621818304} +{"Pretrain/Learning Rate": 4.418472351622219e-05, "Pretrain/Loss": 2.0646533966064453, "Pretrain/Loss (Raw)": 1.9457752704620361, "Pretrain/Step": 4671, "Pretrain/Step Time": 8.47253667935729} +{"Pretrain/Learning Rate": 4.4182001316088614e-05, "Pretrain/Loss": 2.0648956298828125, "Pretrain/Loss (Raw)": 2.2728686332702637, "Pretrain/Step": 4672, "Pretrain/Step Time": 8.467627707868814} +{"Pretrain/Learning Rate": 4.4179278562855554e-05, "Pretrain/Loss": 2.063173294067383, "Pretrain/Loss (Raw)": 1.7976207733154297, "Pretrain/Step": 4673, "Pretrain/Step Time": 8.46600873209536} +{"Pretrain/Learning Rate": 4.4176555256601506e-05, "Pretrain/Loss": 2.0623390674591064, "Pretrain/Loss (Raw)": 1.8290152549743652, "Pretrain/Step": 4674, "Pretrain/Step Time": 8.465691504999995} +{"Pretrain/Learning Rate": 4.4173831397405015e-05, "Pretrain/Loss": 2.063105583190918, "Pretrain/Loss (Raw)": 1.9760081768035889, "Pretrain/Step": 4675, "Pretrain/Step Time": 8.463251829147339} +{"Pretrain/Learning Rate": 4.417110698534461e-05, "Pretrain/Loss": 2.063680648803711, "Pretrain/Loss (Raw)": 2.1784138679504395, "Pretrain/Step": 4676, "Pretrain/Step Time": 8.4673887565732} +{"Pretrain/Learning Rate": 4.416838202049885e-05, "Pretrain/Loss": 2.060830593109131, "Pretrain/Loss (Raw)": 1.7169535160064697, "Pretrain/Step": 4677, "Pretrain/Step Time": 8.467072462663054} +{"Pretrain/Learning Rate": 4.4165656502946307e-05, "Pretrain/Loss": 2.058074951171875, "Pretrain/Loss (Raw)": 1.834001064300537, "Pretrain/Step": 4678, "Pretrain/Step Time": 8.467820828780532} +{"Pretrain/Learning Rate": 4.416293043276557e-05, "Pretrain/Loss": 2.0614144802093506, "Pretrain/Loss (Raw)": 2.525846481323242, "Pretrain/Step": 4679, "Pretrain/Step Time": 8.46899976208806} +{"Pretrain/Learning Rate": 4.416020381003524e-05, "Pretrain/Loss": 2.0612471103668213, "Pretrain/Loss (Raw)": 2.054241895675659, "Pretrain/Step": 4680, "Pretrain/Step Time": 8.468758264556527} +{"Pretrain/Learning Rate": 4.415747663483394e-05, "Pretrain/Loss": 2.062607765197754, "Pretrain/Loss (Raw)": 2.1893680095672607, "Pretrain/Step": 4681, "Pretrain/Step Time": 8.463148891925812} +{"Pretrain/Learning Rate": 4.415474890724032e-05, "Pretrain/Loss": 2.06265926361084, "Pretrain/Loss (Raw)": 2.096010446548462, "Pretrain/Step": 4682, "Pretrain/Step Time": 8.461256919428706} +{"Pretrain/Learning Rate": 4.4152020627333e-05, "Pretrain/Loss": 2.0649333000183105, "Pretrain/Loss (Raw)": 2.0727696418762207, "Pretrain/Step": 4683, "Pretrain/Step Time": 8.46105109155178} +{"Pretrain/Learning Rate": 4.414929179519067e-05, "Pretrain/Loss": 2.066837787628174, "Pretrain/Loss (Raw)": 2.1555423736572266, "Pretrain/Step": 4684, "Pretrain/Step Time": 8.462327091023326} +{"Pretrain/Learning Rate": 4.414656241089202e-05, "Pretrain/Loss": 2.065375566482544, "Pretrain/Loss (Raw)": 2.1909236907958984, "Pretrain/Step": 4685, "Pretrain/Step Time": 8.46643159352243} +{"Pretrain/Learning Rate": 4.4143832474515734e-05, "Pretrain/Loss": 2.0623483657836914, "Pretrain/Loss (Raw)": 1.8971903324127197, "Pretrain/Step": 4686, "Pretrain/Step Time": 8.470209136605263} +{"Pretrain/Learning Rate": 4.414110198614054e-05, "Pretrain/Loss": 2.0617446899414062, "Pretrain/Loss (Raw)": 1.7968113422393799, "Pretrain/Step": 4687, "Pretrain/Step Time": 8.469431590288877} +{"Pretrain/Learning Rate": 4.413837094584516e-05, "Pretrain/Loss": 2.0562100410461426, "Pretrain/Loss (Raw)": 1.7912603616714478, "Pretrain/Step": 4688, "Pretrain/Step Time": 8.467551255598664} +{"Pretrain/Learning Rate": 4.413563935370833e-05, "Pretrain/Loss": 2.0580999851226807, "Pretrain/Loss (Raw)": 2.212327003479004, "Pretrain/Step": 4689, "Pretrain/Step Time": 8.468677170574665} +{"Pretrain/Learning Rate": 4.4132907209808846e-05, "Pretrain/Loss": 2.0587122440338135, "Pretrain/Loss (Raw)": 1.9499635696411133, "Pretrain/Step": 4690, "Pretrain/Step Time": 8.471457542851567} +{"Pretrain/Learning Rate": 4.413017451422548e-05, "Pretrain/Loss": 2.058784008026123, "Pretrain/Loss (Raw)": 2.1904900074005127, "Pretrain/Step": 4691, "Pretrain/Step Time": 8.46527467481792} +{"Pretrain/Learning Rate": 4.4127441267036995e-05, "Pretrain/Loss": 2.0598130226135254, "Pretrain/Loss (Raw)": 2.1251535415649414, "Pretrain/Step": 4692, "Pretrain/Step Time": 8.468095721676946} +{"Pretrain/Learning Rate": 4.412470746832224e-05, "Pretrain/Loss": 2.0617637634277344, "Pretrain/Loss (Raw)": 2.190516948699951, "Pretrain/Step": 4693, "Pretrain/Step Time": 8.4669548291713} +{"Pretrain/Learning Rate": 4.412197311816002e-05, "Pretrain/Loss": 2.0597643852233887, "Pretrain/Loss (Raw)": 1.8610516786575317, "Pretrain/Step": 4694, "Pretrain/Step Time": 8.468185931444168} +{"Pretrain/Learning Rate": 4.411923821662919e-05, "Pretrain/Loss": 2.058499813079834, "Pretrain/Loss (Raw)": 1.9775458574295044, "Pretrain/Step": 4695, "Pretrain/Step Time": 8.462407076731324} +{"Pretrain/Learning Rate": 4.41165027638086e-05, "Pretrain/Loss": 2.0582542419433594, "Pretrain/Loss (Raw)": 2.118954658508301, "Pretrain/Step": 4696, "Pretrain/Step Time": 8.460911242291331} +{"Pretrain/Learning Rate": 4.4113766759777134e-05, "Pretrain/Loss": 2.056303024291992, "Pretrain/Loss (Raw)": 1.9710956811904907, "Pretrain/Step": 4697, "Pretrain/Step Time": 8.462489617988467} +{"Pretrain/Learning Rate": 4.411103020461368e-05, "Pretrain/Loss": 2.0552875995635986, "Pretrain/Loss (Raw)": 1.9633158445358276, "Pretrain/Step": 4698, "Pretrain/Step Time": 8.457477882504463} +{"Pretrain/Learning Rate": 4.4108293098397134e-05, "Pretrain/Loss": 2.0551271438598633, "Pretrain/Loss (Raw)": 1.9874805212020874, "Pretrain/Step": 4699, "Pretrain/Step Time": 8.463273648172617} +{"Pretrain/Learning Rate": 4.410555544120643e-05, "Pretrain/Loss": 2.0560226440429688, "Pretrain/Loss (Raw)": 2.0578417778015137, "Pretrain/Step": 4700, "Pretrain/Step Time": 8.459394050762057} +{"Pretrain/Learning Rate": 4.41028172331205e-05, "Pretrain/Loss": 2.056641101837158, "Pretrain/Loss (Raw)": 2.081942081451416, "Pretrain/Step": 4701, "Pretrain/Step Time": 8.465317083522677} +{"Pretrain/Learning Rate": 4.410007847421831e-05, "Pretrain/Loss": 2.0572495460510254, "Pretrain/Loss (Raw)": 2.1919045448303223, "Pretrain/Step": 4702, "Pretrain/Step Time": 8.466756135225296} +{"Pretrain/Learning Rate": 4.4097339164578816e-05, "Pretrain/Loss": 2.058093547821045, "Pretrain/Loss (Raw)": 1.9769091606140137, "Pretrain/Step": 4703, "Pretrain/Step Time": 8.466081714257598} +{"Pretrain/Learning Rate": 4.4094599304281015e-05, "Pretrain/Loss": 2.057812213897705, "Pretrain/Loss (Raw)": 1.9556423425674438, "Pretrain/Step": 4704, "Pretrain/Step Time": 8.461708849295974} +{"Pretrain/Learning Rate": 4.409185889340389e-05, "Pretrain/Loss": 2.0563230514526367, "Pretrain/Loss (Raw)": 1.9196425676345825, "Pretrain/Step": 4705, "Pretrain/Step Time": 8.462534088641405} +{"Pretrain/Learning Rate": 4.4089117932026494e-05, "Pretrain/Loss": 2.0537643432617188, "Pretrain/Loss (Raw)": 1.8204939365386963, "Pretrain/Step": 4706, "Pretrain/Step Time": 8.460077404975891} +{"Pretrain/Learning Rate": 4.4086376420227824e-05, "Pretrain/Loss": 2.0559580326080322, "Pretrain/Loss (Raw)": 2.255183696746826, "Pretrain/Step": 4707, "Pretrain/Step Time": 8.462101427838206} +{"Pretrain/Learning Rate": 4.4083634358086945e-05, "Pretrain/Loss": 2.0538086891174316, "Pretrain/Loss (Raw)": 2.0340893268585205, "Pretrain/Step": 4708, "Pretrain/Step Time": 8.46163753978908} +{"Pretrain/Learning Rate": 4.408089174568293e-05, "Pretrain/Loss": 2.0529046058654785, "Pretrain/Loss (Raw)": 2.06888484954834, "Pretrain/Step": 4709, "Pretrain/Step Time": 8.463558999821544} +{"Pretrain/Learning Rate": 4.407814858309485e-05, "Pretrain/Loss": 2.052393913269043, "Pretrain/Loss (Raw)": 1.9847551584243774, "Pretrain/Step": 4710, "Pretrain/Step Time": 8.466781634837389} +{"Pretrain/Learning Rate": 4.4075404870401806e-05, "Pretrain/Loss": 2.0528042316436768, "Pretrain/Loss (Raw)": 2.076462984085083, "Pretrain/Step": 4711, "Pretrain/Step Time": 8.46800941042602} +{"Pretrain/Learning Rate": 4.40726606076829e-05, "Pretrain/Loss": 2.050868511199951, "Pretrain/Loss (Raw)": 1.851025104522705, "Pretrain/Step": 4712, "Pretrain/Step Time": 8.467974286526442} +{"Pretrain/Learning Rate": 4.406991579501728e-05, "Pretrain/Loss": 2.051246166229248, "Pretrain/Loss (Raw)": 2.120837450027466, "Pretrain/Step": 4713, "Pretrain/Step Time": 8.463405285030603} +{"Pretrain/Learning Rate": 4.406717043248408e-05, "Pretrain/Loss": 2.0508298873901367, "Pretrain/Loss (Raw)": 1.9553751945495605, "Pretrain/Step": 4714, "Pretrain/Step Time": 8.464834928512573} +{"Pretrain/Learning Rate": 4.406442452016246e-05, "Pretrain/Loss": 2.049440622329712, "Pretrain/Loss (Raw)": 1.9558167457580566, "Pretrain/Step": 4715, "Pretrain/Step Time": 8.464887242764235} +{"Pretrain/Learning Rate": 4.4061678058131605e-05, "Pretrain/Loss": 2.0476574897766113, "Pretrain/Loss (Raw)": 2.0222928524017334, "Pretrain/Step": 4716, "Pretrain/Step Time": 8.466078076511621} +{"Pretrain/Learning Rate": 4.40589310464707e-05, "Pretrain/Loss": 2.0451231002807617, "Pretrain/Loss (Raw)": 1.841055154800415, "Pretrain/Step": 4717, "Pretrain/Step Time": 8.46919777430594} +{"Pretrain/Learning Rate": 4.405618348525895e-05, "Pretrain/Loss": 2.0470898151397705, "Pretrain/Loss (Raw)": 1.989938497543335, "Pretrain/Step": 4718, "Pretrain/Step Time": 8.466932389885187} +{"Pretrain/Learning Rate": 4.405343537457558e-05, "Pretrain/Loss": 2.049099922180176, "Pretrain/Loss (Raw)": 2.2184531688690186, "Pretrain/Step": 4719, "Pretrain/Step Time": 8.466689497232437} +{"Pretrain/Learning Rate": 4.405068671449983e-05, "Pretrain/Loss": 2.0483977794647217, "Pretrain/Loss (Raw)": 2.0621042251586914, "Pretrain/Step": 4720, "Pretrain/Step Time": 8.469656728208065} +{"Pretrain/Learning Rate": 4.404793750511097e-05, "Pretrain/Loss": 2.046590805053711, "Pretrain/Loss (Raw)": 1.9672328233718872, "Pretrain/Step": 4721, "Pretrain/Step Time": 8.464692624285817} +{"Pretrain/Learning Rate": 4.4045187746488253e-05, "Pretrain/Loss": 2.049197196960449, "Pretrain/Loss (Raw)": 2.131317138671875, "Pretrain/Step": 4722, "Pretrain/Step Time": 8.468483688309789} +{"Pretrain/Learning Rate": 4.404243743871097e-05, "Pretrain/Loss": 2.049208164215088, "Pretrain/Loss (Raw)": 2.121177911758423, "Pretrain/Step": 4723, "Pretrain/Step Time": 8.471488486975431} +{"Pretrain/Learning Rate": 4.4039686581858434e-05, "Pretrain/Loss": 2.0481576919555664, "Pretrain/Loss (Raw)": 2.0173768997192383, "Pretrain/Step": 4724, "Pretrain/Step Time": 8.470188166946173} +{"Pretrain/Learning Rate": 4.4036935176009964e-05, "Pretrain/Loss": 2.050020694732666, "Pretrain/Loss (Raw)": 2.169419765472412, "Pretrain/Step": 4725, "Pretrain/Step Time": 8.465876063331962} +{"Pretrain/Learning Rate": 4.4034183221244877e-05, "Pretrain/Loss": 2.0492875576019287, "Pretrain/Loss (Raw)": 1.9858808517456055, "Pretrain/Step": 4726, "Pretrain/Step Time": 8.467227265238762} +{"Pretrain/Learning Rate": 4.4031430717642534e-05, "Pretrain/Loss": 2.0508337020874023, "Pretrain/Loss (Raw)": 2.2664151191711426, "Pretrain/Step": 4727, "Pretrain/Step Time": 8.477911099791527} +{"Pretrain/Learning Rate": 4.402867766528231e-05, "Pretrain/Loss": 2.051424503326416, "Pretrain/Loss (Raw)": 2.0429773330688477, "Pretrain/Step": 4728, "Pretrain/Step Time": 8.475662089884281} +{"Pretrain/Learning Rate": 4.4025924064243573e-05, "Pretrain/Loss": 2.0528688430786133, "Pretrain/Loss (Raw)": 2.1118342876434326, "Pretrain/Step": 4729, "Pretrain/Step Time": 8.476620998233557} +{"Pretrain/Learning Rate": 4.402316991460573e-05, "Pretrain/Loss": 2.053649663925171, "Pretrain/Loss (Raw)": 2.0236282348632812, "Pretrain/Step": 4730, "Pretrain/Step Time": 8.474547177553177} +{"Pretrain/Learning Rate": 4.4020415216448194e-05, "Pretrain/Loss": 2.054002523422241, "Pretrain/Loss (Raw)": 2.1374905109405518, "Pretrain/Step": 4731, "Pretrain/Step Time": 8.466797292232513} +{"Pretrain/Learning Rate": 4.40176599698504e-05, "Pretrain/Loss": 2.0522043704986572, "Pretrain/Loss (Raw)": 1.9790005683898926, "Pretrain/Step": 4732, "Pretrain/Step Time": 8.473409106954932} +{"Pretrain/Learning Rate": 4.401490417489178e-05, "Pretrain/Loss": 2.0497729778289795, "Pretrain/Loss (Raw)": 1.9557923078536987, "Pretrain/Step": 4733, "Pretrain/Step Time": 8.476949838921428} +{"Pretrain/Learning Rate": 4.4012147831651805e-05, "Pretrain/Loss": 2.0499074459075928, "Pretrain/Loss (Raw)": 2.119056224822998, "Pretrain/Step": 4734, "Pretrain/Step Time": 8.478700492531061} +{"Pretrain/Learning Rate": 4.400939094020995e-05, "Pretrain/Loss": 2.050961971282959, "Pretrain/Loss (Raw)": 2.1911673545837402, "Pretrain/Step": 4735, "Pretrain/Step Time": 8.485832342877984} +{"Pretrain/Learning Rate": 4.4006633500645705e-05, "Pretrain/Loss": 2.051586389541626, "Pretrain/Loss (Raw)": 2.1360912322998047, "Pretrain/Step": 4736, "Pretrain/Step Time": 8.485540356487036} +{"Pretrain/Learning Rate": 4.4003875513038585e-05, "Pretrain/Loss": 2.053091526031494, "Pretrain/Loss (Raw)": 2.215510845184326, "Pretrain/Step": 4737, "Pretrain/Step Time": 8.481564039364457} +{"Pretrain/Learning Rate": 4.400111697746811e-05, "Pretrain/Loss": 2.0531954765319824, "Pretrain/Loss (Raw)": 2.13092303276062, "Pretrain/Step": 4738, "Pretrain/Step Time": 8.481461726129055} +{"Pretrain/Learning Rate": 4.399835789401382e-05, "Pretrain/Loss": 2.052852153778076, "Pretrain/Loss (Raw)": 2.026937961578369, "Pretrain/Step": 4739, "Pretrain/Step Time": 8.478004677221179} +{"Pretrain/Learning Rate": 4.3995598262755276e-05, "Pretrain/Loss": 2.0519070625305176, "Pretrain/Loss (Raw)": 2.008610963821411, "Pretrain/Step": 4740, "Pretrain/Step Time": 8.478973101824522} +{"Pretrain/Learning Rate": 4.399283808377205e-05, "Pretrain/Loss": 2.053373336791992, "Pretrain/Loss (Raw)": 2.282060384750366, "Pretrain/Step": 4741, "Pretrain/Step Time": 8.476628156378865} +{"Pretrain/Learning Rate": 4.399007735714372e-05, "Pretrain/Loss": 2.052433967590332, "Pretrain/Loss (Raw)": 2.0304038524627686, "Pretrain/Step": 4742, "Pretrain/Step Time": 8.48038436472416} +{"Pretrain/Learning Rate": 4.3987316082949905e-05, "Pretrain/Loss": 2.0534019470214844, "Pretrain/Loss (Raw)": 1.9766039848327637, "Pretrain/Step": 4743, "Pretrain/Step Time": 8.483883414417505} +{"Pretrain/Learning Rate": 4.3984554261270206e-05, "Pretrain/Loss": 2.055800199508667, "Pretrain/Loss (Raw)": 2.2977752685546875, "Pretrain/Step": 4744, "Pretrain/Step Time": 8.483805702999234} +{"Pretrain/Learning Rate": 4.398179189218427e-05, "Pretrain/Loss": 2.0551204681396484, "Pretrain/Loss (Raw)": 2.0189921855926514, "Pretrain/Step": 4745, "Pretrain/Step Time": 8.477744786068797} +{"Pretrain/Learning Rate": 4.3979028975771754e-05, "Pretrain/Loss": 2.054306745529175, "Pretrain/Loss (Raw)": 2.0138330459594727, "Pretrain/Step": 4746, "Pretrain/Step Time": 8.479392394423485} +{"Pretrain/Learning Rate": 4.397626551211231e-05, "Pretrain/Loss": 2.053788661956787, "Pretrain/Loss (Raw)": 1.8297908306121826, "Pretrain/Step": 4747, "Pretrain/Step Time": 8.477149872109294} +{"Pretrain/Learning Rate": 4.397350150128563e-05, "Pretrain/Loss": 2.053407669067383, "Pretrain/Loss (Raw)": 2.1703555583953857, "Pretrain/Step": 4748, "Pretrain/Step Time": 8.477205511182547} +{"Pretrain/Learning Rate": 4.3970736943371406e-05, "Pretrain/Loss": 2.0532357692718506, "Pretrain/Loss (Raw)": 1.9424411058425903, "Pretrain/Step": 4749, "Pretrain/Step Time": 8.47611297853291} +{"Pretrain/Learning Rate": 4.396797183844936e-05, "Pretrain/Loss": 2.0517354011535645, "Pretrain/Loss (Raw)": 2.09503173828125, "Pretrain/Step": 4750, "Pretrain/Step Time": 8.482974106445909} +{"Pretrain/Learning Rate": 4.396520618659922e-05, "Pretrain/Loss": 2.0484514236450195, "Pretrain/Loss (Raw)": 1.7659419775009155, "Pretrain/Step": 4751, "Pretrain/Step Time": 8.482725951820612} +{"Pretrain/Learning Rate": 4.396243998790072e-05, "Pretrain/Loss": 2.050802230834961, "Pretrain/Loss (Raw)": 2.060431957244873, "Pretrain/Step": 4752, "Pretrain/Step Time": 8.483180904760957} +{"Pretrain/Learning Rate": 4.3959673242433635e-05, "Pretrain/Loss": 2.0497708320617676, "Pretrain/Loss (Raw)": 2.0596466064453125, "Pretrain/Step": 4753, "Pretrain/Step Time": 8.480730718001723} +{"Pretrain/Learning Rate": 4.395690595027774e-05, "Pretrain/Loss": 2.050931453704834, "Pretrain/Loss (Raw)": 2.278695583343506, "Pretrain/Step": 4754, "Pretrain/Step Time": 8.478732995688915} +{"Pretrain/Learning Rate": 4.395413811151282e-05, "Pretrain/Loss": 2.0492589473724365, "Pretrain/Loss (Raw)": 2.0495693683624268, "Pretrain/Step": 4755, "Pretrain/Step Time": 8.482849294319749} +{"Pretrain/Learning Rate": 4.39513697262187e-05, "Pretrain/Loss": 2.0491697788238525, "Pretrain/Loss (Raw)": 2.089019775390625, "Pretrain/Step": 4756, "Pretrain/Step Time": 8.482494693249464} +{"Pretrain/Learning Rate": 4.394860079447518e-05, "Pretrain/Loss": 2.0507946014404297, "Pretrain/Loss (Raw)": 2.2422778606414795, "Pretrain/Step": 4757, "Pretrain/Step Time": 8.484860435128212} +{"Pretrain/Learning Rate": 4.394583131636213e-05, "Pretrain/Loss": 2.052077293395996, "Pretrain/Loss (Raw)": 2.118652820587158, "Pretrain/Step": 4758, "Pretrain/Step Time": 8.481974832713604} +{"Pretrain/Learning Rate": 4.394306129195938e-05, "Pretrain/Loss": 2.0497324466705322, "Pretrain/Loss (Raw)": 1.676354169845581, "Pretrain/Step": 4759, "Pretrain/Step Time": 8.48160028271377} +{"Pretrain/Learning Rate": 4.394029072134681e-05, "Pretrain/Loss": 2.0482778549194336, "Pretrain/Loss (Raw)": 1.9197602272033691, "Pretrain/Step": 4760, "Pretrain/Step Time": 8.480436546728015} +{"Pretrain/Learning Rate": 4.393751960460431e-05, "Pretrain/Loss": 2.0510077476501465, "Pretrain/Loss (Raw)": 2.2132887840270996, "Pretrain/Step": 4761, "Pretrain/Step Time": 8.480699883773923} +{"Pretrain/Learning Rate": 4.393474794181179e-05, "Pretrain/Loss": 2.050956964492798, "Pretrain/Loss (Raw)": 1.9605063199996948, "Pretrain/Step": 4762, "Pretrain/Step Time": 8.477345187216997} +{"Pretrain/Learning Rate": 4.393197573304915e-05, "Pretrain/Loss": 2.0518269538879395, "Pretrain/Loss (Raw)": 2.339327812194824, "Pretrain/Step": 4763, "Pretrain/Step Time": 8.47847744077444} +{"Pretrain/Learning Rate": 4.3929202978396344e-05, "Pretrain/Loss": 2.049996852874756, "Pretrain/Loss (Raw)": 1.9670964479446411, "Pretrain/Step": 4764, "Pretrain/Step Time": 8.47932443395257} +{"Pretrain/Learning Rate": 4.392642967793331e-05, "Pretrain/Loss": 2.05224871635437, "Pretrain/Loss (Raw)": 2.2301621437072754, "Pretrain/Step": 4765, "Pretrain/Step Time": 8.484289525076747} +{"Pretrain/Learning Rate": 4.3923655831740016e-05, "Pretrain/Loss": 2.0490195751190186, "Pretrain/Loss (Raw)": 1.7082332372665405, "Pretrain/Step": 4766, "Pretrain/Step Time": 8.482751315459609} +{"Pretrain/Learning Rate": 4.3920881439896454e-05, "Pretrain/Loss": 2.049319267272949, "Pretrain/Loss (Raw)": 1.9966732263565063, "Pretrain/Step": 4767, "Pretrain/Step Time": 8.487988790497184} +{"Pretrain/Learning Rate": 4.3918106502482616e-05, "Pretrain/Loss": 2.049389362335205, "Pretrain/Loss (Raw)": 2.040703296661377, "Pretrain/Step": 4768, "Pretrain/Step Time": 8.48559520766139} +{"Pretrain/Learning Rate": 4.3915331019578503e-05, "Pretrain/Loss": 2.0482001304626465, "Pretrain/Loss (Raw)": 2.219749927520752, "Pretrain/Step": 4769, "Pretrain/Step Time": 8.48521988466382} +{"Pretrain/Learning Rate": 4.3912554991264164e-05, "Pretrain/Loss": 2.048440933227539, "Pretrain/Loss (Raw)": 2.066519021987915, "Pretrain/Step": 4770, "Pretrain/Step Time": 8.48605340719223} +{"Pretrain/Learning Rate": 4.390977841761963e-05, "Pretrain/Loss": 2.0481181144714355, "Pretrain/Loss (Raw)": 2.214550733566284, "Pretrain/Step": 4771, "Pretrain/Step Time": 8.49131372384727} +{"Pretrain/Learning Rate": 4.390700129872497e-05, "Pretrain/Loss": 2.0488648414611816, "Pretrain/Loss (Raw)": 2.1557743549346924, "Pretrain/Step": 4772, "Pretrain/Step Time": 8.483336139470339} +{"Pretrain/Learning Rate": 4.390422363466025e-05, "Pretrain/Loss": 2.0491433143615723, "Pretrain/Loss (Raw)": 2.0584044456481934, "Pretrain/Step": 4773, "Pretrain/Step Time": 8.488540159538388} +{"Pretrain/Learning Rate": 4.390144542550556e-05, "Pretrain/Loss": 2.050551414489746, "Pretrain/Loss (Raw)": 2.0604248046875, "Pretrain/Step": 4774, "Pretrain/Step Time": 8.485337296500802} +{"Pretrain/Learning Rate": 4.389866667134103e-05, "Pretrain/Loss": 2.051455497741699, "Pretrain/Loss (Raw)": 2.1190624237060547, "Pretrain/Step": 4775, "Pretrain/Step Time": 8.483866276219487} +{"Pretrain/Learning Rate": 4.389588737224676e-05, "Pretrain/Loss": 2.050118923187256, "Pretrain/Loss (Raw)": 1.9335412979125977, "Pretrain/Step": 4776, "Pretrain/Step Time": 8.482027187943459} +{"Pretrain/Learning Rate": 4.389310752830291e-05, "Pretrain/Loss": 2.050546169281006, "Pretrain/Loss (Raw)": 2.1151156425476074, "Pretrain/Step": 4777, "Pretrain/Step Time": 8.486812496557832} +{"Pretrain/Learning Rate": 4.3890327139589616e-05, "Pretrain/Loss": 2.0514183044433594, "Pretrain/Loss (Raw)": 2.2801671028137207, "Pretrain/Step": 4778, "Pretrain/Step Time": 8.48654261790216} +{"Pretrain/Learning Rate": 4.388754620618706e-05, "Pretrain/Loss": 2.054210662841797, "Pretrain/Loss (Raw)": 2.1098225116729736, "Pretrain/Step": 4779, "Pretrain/Step Time": 8.48548130132258} +{"Pretrain/Learning Rate": 4.388476472817541e-05, "Pretrain/Loss": 2.054706335067749, "Pretrain/Loss (Raw)": 2.2217319011688232, "Pretrain/Step": 4780, "Pretrain/Step Time": 8.483954368159175} +{"Pretrain/Learning Rate": 4.388198270563489e-05, "Pretrain/Loss": 2.052797317504883, "Pretrain/Loss (Raw)": 1.836445927619934, "Pretrain/Step": 4781, "Pretrain/Step Time": 8.487393947318196} +{"Pretrain/Learning Rate": 4.387920013864571e-05, "Pretrain/Loss": 2.052520990371704, "Pretrain/Loss (Raw)": 2.1194517612457275, "Pretrain/Step": 4782, "Pretrain/Step Time": 8.48983240313828} +{"Pretrain/Learning Rate": 4.3876417027288114e-05, "Pretrain/Loss": 2.0525052547454834, "Pretrain/Loss (Raw)": 2.055666208267212, "Pretrain/Step": 4783, "Pretrain/Step Time": 8.4872367978096} +{"Pretrain/Learning Rate": 4.387363337164233e-05, "Pretrain/Loss": 2.0538032054901123, "Pretrain/Loss (Raw)": 2.0492353439331055, "Pretrain/Step": 4784, "Pretrain/Step Time": 8.492563305422664} +{"Pretrain/Learning Rate": 4.387084917178863e-05, "Pretrain/Loss": 2.057772397994995, "Pretrain/Loss (Raw)": 2.416083574295044, "Pretrain/Step": 4785, "Pretrain/Step Time": 8.49375981092453} +{"Pretrain/Learning Rate": 4.38680644278073e-05, "Pretrain/Loss": 2.0565881729125977, "Pretrain/Loss (Raw)": 2.0028674602508545, "Pretrain/Step": 4786, "Pretrain/Step Time": 8.48845249414444} +{"Pretrain/Learning Rate": 4.3865279139778635e-05, "Pretrain/Loss": 2.0563111305236816, "Pretrain/Loss (Raw)": 2.0495963096618652, "Pretrain/Step": 4787, "Pretrain/Step Time": 8.489759657531977} +{"Pretrain/Learning Rate": 4.386249330778295e-05, "Pretrain/Loss": 2.056758165359497, "Pretrain/Loss (Raw)": 2.132974863052368, "Pretrain/Step": 4788, "Pretrain/Step Time": 8.48766009695828} +{"Pretrain/Learning Rate": 4.385970693190056e-05, "Pretrain/Loss": 2.0546069145202637, "Pretrain/Loss (Raw)": 1.7589831352233887, "Pretrain/Step": 4789, "Pretrain/Step Time": 8.490337142720819} +{"Pretrain/Learning Rate": 4.3856920012211814e-05, "Pretrain/Loss": 2.0556631088256836, "Pretrain/Loss (Raw)": 1.9821217060089111, "Pretrain/Step": 4790, "Pretrain/Step Time": 8.48340735398233} +{"Pretrain/Learning Rate": 4.3854132548797077e-05, "Pretrain/Loss": 2.0569868087768555, "Pretrain/Loss (Raw)": 2.0637474060058594, "Pretrain/Step": 4791, "Pretrain/Step Time": 8.482557812705636} +{"Pretrain/Learning Rate": 4.385134454173672e-05, "Pretrain/Loss": 2.0567917823791504, "Pretrain/Loss (Raw)": 2.2266008853912354, "Pretrain/Step": 4792, "Pretrain/Step Time": 8.486885383725166} +{"Pretrain/Learning Rate": 4.3848555991111126e-05, "Pretrain/Loss": 2.056204080581665, "Pretrain/Loss (Raw)": 2.211263418197632, "Pretrain/Step": 4793, "Pretrain/Step Time": 8.479338027536869} +{"Pretrain/Learning Rate": 4.3845766897000715e-05, "Pretrain/Loss": 2.056497573852539, "Pretrain/Loss (Raw)": 2.1291160583496094, "Pretrain/Step": 4794, "Pretrain/Step Time": 8.48330332711339} +{"Pretrain/Learning Rate": 4.38429772594859e-05, "Pretrain/Loss": 2.0570271015167236, "Pretrain/Loss (Raw)": 2.1609859466552734, "Pretrain/Step": 4795, "Pretrain/Step Time": 8.48238736949861} +{"Pretrain/Learning Rate": 4.384018707864712e-05, "Pretrain/Loss": 2.0599515438079834, "Pretrain/Loss (Raw)": 2.265315294265747, "Pretrain/Step": 4796, "Pretrain/Step Time": 8.474374543875456} +{"Pretrain/Learning Rate": 4.383739635456482e-05, "Pretrain/Loss": 2.061177968978882, "Pretrain/Loss (Raw)": 2.1792290210723877, "Pretrain/Step": 4797, "Pretrain/Step Time": 8.475377220660448} +{"Pretrain/Learning Rate": 4.383460508731948e-05, "Pretrain/Loss": 2.0600857734680176, "Pretrain/Loss (Raw)": 2.0757973194122314, "Pretrain/Step": 4798, "Pretrain/Step Time": 8.471884859725833} +{"Pretrain/Learning Rate": 4.383181327699158e-05, "Pretrain/Loss": 2.059581995010376, "Pretrain/Loss (Raw)": 1.8813005685806274, "Pretrain/Step": 4799, "Pretrain/Step Time": 8.476276183500886} +{"Pretrain/Learning Rate": 4.3829020923661624e-05, "Pretrain/Loss": 2.0585782527923584, "Pretrain/Loss (Raw)": 2.1443755626678467, "Pretrain/Step": 4800, "Pretrain/Step Time": 8.480663292109966} +{"Pretrain/Learning Rate": 4.382622802741012e-05, "Pretrain/Loss": 2.0612921714782715, "Pretrain/Loss (Raw)": 2.1450297832489014, "Pretrain/Step": 4801, "Pretrain/Step Time": 8.479634353891015} +{"Pretrain/Learning Rate": 4.3823434588317593e-05, "Pretrain/Loss": 2.061936378479004, "Pretrain/Loss (Raw)": 1.9114587306976318, "Pretrain/Step": 4802, "Pretrain/Step Time": 8.475568698719144} +{"Pretrain/Learning Rate": 4.3820640606464614e-05, "Pretrain/Loss": 2.0616507530212402, "Pretrain/Loss (Raw)": 1.9394524097442627, "Pretrain/Step": 4803, "Pretrain/Step Time": 8.474029691889882} +{"Pretrain/Learning Rate": 4.381784608193173e-05, "Pretrain/Loss": 2.0593771934509277, "Pretrain/Loss (Raw)": 1.8873789310455322, "Pretrain/Step": 4804, "Pretrain/Step Time": 8.472933229058981} +{"Pretrain/Learning Rate": 4.381505101479951e-05, "Pretrain/Loss": 2.0613975524902344, "Pretrain/Loss (Raw)": 1.9755891561508179, "Pretrain/Step": 4805, "Pretrain/Step Time": 8.475856812670827} +{"Pretrain/Learning Rate": 4.381225540514856e-05, "Pretrain/Loss": 2.0650148391723633, "Pretrain/Loss (Raw)": 2.296976327896118, "Pretrain/Step": 4806, "Pretrain/Step Time": 8.473046749830246} +{"Pretrain/Learning Rate": 4.3809459253059484e-05, "Pretrain/Loss": 2.061091899871826, "Pretrain/Loss (Raw)": 2.0237255096435547, "Pretrain/Step": 4807, "Pretrain/Step Time": 8.470655012875795} +{"Pretrain/Learning Rate": 4.380666255861292e-05, "Pretrain/Loss": 2.0608718395233154, "Pretrain/Loss (Raw)": 2.0260541439056396, "Pretrain/Step": 4808, "Pretrain/Step Time": 8.46871318668127} +{"Pretrain/Learning Rate": 4.3803865321889495e-05, "Pretrain/Loss": 2.060070514678955, "Pretrain/Loss (Raw)": 2.0867860317230225, "Pretrain/Step": 4809, "Pretrain/Step Time": 8.46796964108944} +{"Pretrain/Learning Rate": 4.380106754296987e-05, "Pretrain/Loss": 2.0599365234375, "Pretrain/Loss (Raw)": 2.078868865966797, "Pretrain/Step": 4810, "Pretrain/Step Time": 8.474409654736519} +{"Pretrain/Learning Rate": 4.379826922193471e-05, "Pretrain/Loss": 2.060157299041748, "Pretrain/Loss (Raw)": 2.10103702545166, "Pretrain/Step": 4811, "Pretrain/Step Time": 8.469939270988107} +{"Pretrain/Learning Rate": 4.379547035886472e-05, "Pretrain/Loss": 2.0602846145629883, "Pretrain/Loss (Raw)": 2.171851396560669, "Pretrain/Step": 4812, "Pretrain/Step Time": 8.466195218265057} +{"Pretrain/Learning Rate": 4.3792670953840586e-05, "Pretrain/Loss": 2.0580434799194336, "Pretrain/Loss (Raw)": 1.904056429862976, "Pretrain/Step": 4813, "Pretrain/Step Time": 8.463263822719455} +{"Pretrain/Learning Rate": 4.378987100694303e-05, "Pretrain/Loss": 2.059943437576294, "Pretrain/Loss (Raw)": 2.140376567840576, "Pretrain/Step": 4814, "Pretrain/Step Time": 8.461478095501661} +{"Pretrain/Learning Rate": 4.378707051825279e-05, "Pretrain/Loss": 2.0622692108154297, "Pretrain/Loss (Raw)": 2.09452748298645, "Pretrain/Step": 4815, "Pretrain/Step Time": 8.465409656986594} +{"Pretrain/Learning Rate": 4.378426948785062e-05, "Pretrain/Loss": 2.064983367919922, "Pretrain/Loss (Raw)": 2.1386847496032715, "Pretrain/Step": 4816, "Pretrain/Step Time": 8.468695065006614} +{"Pretrain/Learning Rate": 4.378146791581728e-05, "Pretrain/Loss": 2.062647819519043, "Pretrain/Loss (Raw)": 1.913356065750122, "Pretrain/Step": 4817, "Pretrain/Step Time": 8.470137756317854} +{"Pretrain/Learning Rate": 4.377866580223356e-05, "Pretrain/Loss": 2.0616455078125, "Pretrain/Loss (Raw)": 1.821685552597046, "Pretrain/Step": 4818, "Pretrain/Step Time": 8.466571556404233} +{"Pretrain/Learning Rate": 4.377586314718023e-05, "Pretrain/Loss": 2.0599892139434814, "Pretrain/Loss (Raw)": 1.9784650802612305, "Pretrain/Step": 4819, "Pretrain/Step Time": 8.466506708413363} +{"Pretrain/Learning Rate": 4.3773059950738136e-05, "Pretrain/Loss": 2.058412790298462, "Pretrain/Loss (Raw)": 1.9233580827713013, "Pretrain/Step": 4820, "Pretrain/Step Time": 8.465543247759342} +{"Pretrain/Learning Rate": 4.377025621298809e-05, "Pretrain/Loss": 2.0556845664978027, "Pretrain/Loss (Raw)": 1.841347098350525, "Pretrain/Step": 4821, "Pretrain/Step Time": 8.468537535518408} +{"Pretrain/Learning Rate": 4.376745193401094e-05, "Pretrain/Loss": 2.0588860511779785, "Pretrain/Loss (Raw)": 2.2708232402801514, "Pretrain/Step": 4822, "Pretrain/Step Time": 8.468064507469535} +{"Pretrain/Learning Rate": 4.376464711388755e-05, "Pretrain/Loss": 2.0585033893585205, "Pretrain/Loss (Raw)": 1.9285560846328735, "Pretrain/Step": 4823, "Pretrain/Step Time": 8.47004503570497} +{"Pretrain/Learning Rate": 4.376184175269878e-05, "Pretrain/Loss": 2.057671546936035, "Pretrain/Loss (Raw)": 2.0124902725219727, "Pretrain/Step": 4824, "Pretrain/Step Time": 8.468442808836699} +{"Pretrain/Learning Rate": 4.375903585052552e-05, "Pretrain/Loss": 2.0588531494140625, "Pretrain/Loss (Raw)": 2.122352361679077, "Pretrain/Step": 4825, "Pretrain/Step Time": 8.462638635188341} +{"Pretrain/Learning Rate": 4.37562294074487e-05, "Pretrain/Loss": 2.059788227081299, "Pretrain/Loss (Raw)": 2.0829720497131348, "Pretrain/Step": 4826, "Pretrain/Step Time": 8.465682107955217} +{"Pretrain/Learning Rate": 4.3753422423549224e-05, "Pretrain/Loss": 2.0606486797332764, "Pretrain/Loss (Raw)": 2.0976297855377197, "Pretrain/Step": 4827, "Pretrain/Step Time": 8.46251112781465} +{"Pretrain/Learning Rate": 4.375061489890803e-05, "Pretrain/Loss": 2.06117582321167, "Pretrain/Loss (Raw)": 2.125309944152832, "Pretrain/Step": 4828, "Pretrain/Step Time": 8.46262383274734} +{"Pretrain/Learning Rate": 4.374780683360608e-05, "Pretrain/Loss": 2.061544179916382, "Pretrain/Loss (Raw)": 2.129103660583496, "Pretrain/Step": 4829, "Pretrain/Step Time": 8.460513247177005} +{"Pretrain/Learning Rate": 4.374499822772433e-05, "Pretrain/Loss": 2.060394525527954, "Pretrain/Loss (Raw)": 2.0447423458099365, "Pretrain/Step": 4830, "Pretrain/Step Time": 8.456960855051875} +{"Pretrain/Learning Rate": 4.374218908134378e-05, "Pretrain/Loss": 2.0615782737731934, "Pretrain/Loss (Raw)": 2.1284401416778564, "Pretrain/Step": 4831, "Pretrain/Step Time": 8.461883330717683} +{"Pretrain/Learning Rate": 4.373937939454541e-05, "Pretrain/Loss": 2.062612771987915, "Pretrain/Loss (Raw)": 2.0880484580993652, "Pretrain/Step": 4832, "Pretrain/Step Time": 8.466809019446373} +{"Pretrain/Learning Rate": 4.373656916741025e-05, "Pretrain/Loss": 2.0623793601989746, "Pretrain/Loss (Raw)": 1.889791488647461, "Pretrain/Step": 4833, "Pretrain/Step Time": 8.466190312057734} +{"Pretrain/Learning Rate": 4.373375840001932e-05, "Pretrain/Loss": 2.0649232864379883, "Pretrain/Loss (Raw)": 2.1460752487182617, "Pretrain/Step": 4834, "Pretrain/Step Time": 8.470137313008308} +{"Pretrain/Learning Rate": 4.373094709245368e-05, "Pretrain/Loss": 2.0641214847564697, "Pretrain/Loss (Raw)": 2.15256667137146, "Pretrain/Step": 4835, "Pretrain/Step Time": 8.462533790618181} +{"Pretrain/Learning Rate": 4.372813524479438e-05, "Pretrain/Loss": 2.0635440349578857, "Pretrain/Loss (Raw)": 1.9601682424545288, "Pretrain/Step": 4836, "Pretrain/Step Time": 8.46984019689262} +{"Pretrain/Learning Rate": 4.3725322857122505e-05, "Pretrain/Loss": 2.062363624572754, "Pretrain/Loss (Raw)": 1.9177820682525635, "Pretrain/Step": 4837, "Pretrain/Step Time": 8.467492893338203} +{"Pretrain/Learning Rate": 4.372250992951915e-05, "Pretrain/Loss": 2.0620334148406982, "Pretrain/Loss (Raw)": 1.942516565322876, "Pretrain/Step": 4838, "Pretrain/Step Time": 8.463643753901124} +{"Pretrain/Learning Rate": 4.3719696462065414e-05, "Pretrain/Loss": 2.061784029006958, "Pretrain/Loss (Raw)": 2.0445334911346436, "Pretrain/Step": 4839, "Pretrain/Step Time": 8.463027566671371} +{"Pretrain/Learning Rate": 4.371688245484242e-05, "Pretrain/Loss": 2.062898635864258, "Pretrain/Loss (Raw)": 1.993721604347229, "Pretrain/Step": 4840, "Pretrain/Step Time": 8.461955664679408} +{"Pretrain/Learning Rate": 4.3714067907931335e-05, "Pretrain/Loss": 2.0619730949401855, "Pretrain/Loss (Raw)": 2.002361536026001, "Pretrain/Step": 4841, "Pretrain/Step Time": 8.463375171646476} +{"Pretrain/Learning Rate": 4.371125282141328e-05, "Pretrain/Loss": 2.062225580215454, "Pretrain/Loss (Raw)": 1.9876670837402344, "Pretrain/Step": 4842, "Pretrain/Step Time": 8.460773311555386} +{"Pretrain/Learning Rate": 4.370843719536945e-05, "Pretrain/Loss": 2.0641798973083496, "Pretrain/Loss (Raw)": 2.2059731483459473, "Pretrain/Step": 4843, "Pretrain/Step Time": 8.460715167224407} +{"Pretrain/Learning Rate": 4.3705621029881006e-05, "Pretrain/Loss": 2.0648763179779053, "Pretrain/Loss (Raw)": 2.1114284992218018, "Pretrain/Step": 4844, "Pretrain/Step Time": 8.459606165066361} +{"Pretrain/Learning Rate": 4.370280432502918e-05, "Pretrain/Loss": 2.066403388977051, "Pretrain/Loss (Raw)": 2.036511182785034, "Pretrain/Step": 4845, "Pretrain/Step Time": 8.463428795337677} +{"Pretrain/Learning Rate": 4.369998708089517e-05, "Pretrain/Loss": 2.0683257579803467, "Pretrain/Loss (Raw)": 2.2360293865203857, "Pretrain/Step": 4846, "Pretrain/Step Time": 8.461112961173058} +{"Pretrain/Learning Rate": 4.3697169297560215e-05, "Pretrain/Loss": 2.0658516883850098, "Pretrain/Loss (Raw)": 1.9017643928527832, "Pretrain/Step": 4847, "Pretrain/Step Time": 8.46481417492032} +{"Pretrain/Learning Rate": 4.369435097510557e-05, "Pretrain/Loss": 2.0662026405334473, "Pretrain/Loss (Raw)": 2.1070408821105957, "Pretrain/Step": 4848, "Pretrain/Step Time": 8.461643693968654} +{"Pretrain/Learning Rate": 4.369153211361249e-05, "Pretrain/Loss": 2.067845106124878, "Pretrain/Loss (Raw)": 2.17744779586792, "Pretrain/Step": 4849, "Pretrain/Step Time": 8.46673871204257} +{"Pretrain/Learning Rate": 4.3688712713162256e-05, "Pretrain/Loss": 2.0656399726867676, "Pretrain/Loss (Raw)": 1.849074363708496, "Pretrain/Step": 4850, "Pretrain/Step Time": 8.468931721523404} +{"Pretrain/Learning Rate": 4.368589277383617e-05, "Pretrain/Loss": 2.062797784805298, "Pretrain/Loss (Raw)": 1.7573585510253906, "Pretrain/Step": 4851, "Pretrain/Step Time": 8.465848535299301} +{"Pretrain/Learning Rate": 4.368307229571553e-05, "Pretrain/Loss": 2.062917709350586, "Pretrain/Loss (Raw)": 2.032731056213379, "Pretrain/Step": 4852, "Pretrain/Step Time": 8.464783864095807} +{"Pretrain/Learning Rate": 4.3680251278881676e-05, "Pretrain/Loss": 2.0615828037261963, "Pretrain/Loss (Raw)": 1.998550534248352, "Pretrain/Step": 4853, "Pretrain/Step Time": 8.469519797712564} +{"Pretrain/Learning Rate": 4.367742972341595e-05, "Pretrain/Loss": 2.063523769378662, "Pretrain/Loss (Raw)": 2.234326124191284, "Pretrain/Step": 4854, "Pretrain/Step Time": 8.465825028717518} +{"Pretrain/Learning Rate": 4.36746076293997e-05, "Pretrain/Loss": 2.065565824508667, "Pretrain/Loss (Raw)": 2.527808666229248, "Pretrain/Step": 4855, "Pretrain/Step Time": 8.457211434841156} +{"Pretrain/Learning Rate": 4.36717849969143e-05, "Pretrain/Loss": 2.0653903484344482, "Pretrain/Loss (Raw)": 2.020528793334961, "Pretrain/Step": 4856, "Pretrain/Step Time": 8.456303518265486} +{"Pretrain/Learning Rate": 4.366896182604115e-05, "Pretrain/Loss": 2.0659289360046387, "Pretrain/Loss (Raw)": 2.180741310119629, "Pretrain/Step": 4857, "Pretrain/Step Time": 8.459333883598447} +{"Pretrain/Learning Rate": 4.366613811686164e-05, "Pretrain/Loss": 2.065859079360962, "Pretrain/Loss (Raw)": 2.0146913528442383, "Pretrain/Step": 4858, "Pretrain/Step Time": 8.461908916011453} +{"Pretrain/Learning Rate": 4.3663313869457204e-05, "Pretrain/Loss": 2.0653953552246094, "Pretrain/Loss (Raw)": 2.078162431716919, "Pretrain/Step": 4859, "Pretrain/Step Time": 8.46495946496725} +{"Pretrain/Learning Rate": 4.366048908390926e-05, "Pretrain/Loss": 2.0663256645202637, "Pretrain/Loss (Raw)": 2.098062515258789, "Pretrain/Step": 4860, "Pretrain/Step Time": 8.456294430419803} +{"Pretrain/Learning Rate": 4.365766376029927e-05, "Pretrain/Loss": 2.0647377967834473, "Pretrain/Loss (Raw)": 1.7525594234466553, "Pretrain/Step": 4861, "Pretrain/Step Time": 8.456184079870582} +{"Pretrain/Learning Rate": 4.365483789870871e-05, "Pretrain/Loss": 2.0658910274505615, "Pretrain/Loss (Raw)": 2.2666592597961426, "Pretrain/Step": 4862, "Pretrain/Step Time": 8.458334809169173} +{"Pretrain/Learning Rate": 4.365201149921904e-05, "Pretrain/Loss": 2.066582202911377, "Pretrain/Loss (Raw)": 2.2796506881713867, "Pretrain/Step": 4863, "Pretrain/Step Time": 8.45810623280704} +{"Pretrain/Learning Rate": 4.364918456191177e-05, "Pretrain/Loss": 2.0647695064544678, "Pretrain/Loss (Raw)": 1.9040430784225464, "Pretrain/Step": 4864, "Pretrain/Step Time": 8.459387915208936} +{"Pretrain/Learning Rate": 4.3646357086868404e-05, "Pretrain/Loss": 2.0639801025390625, "Pretrain/Loss (Raw)": 2.114457845687866, "Pretrain/Step": 4865, "Pretrain/Step Time": 8.468100531026721} +{"Pretrain/Learning Rate": 4.364352907417048e-05, "Pretrain/Loss": 2.0631895065307617, "Pretrain/Loss (Raw)": 2.029754638671875, "Pretrain/Step": 4866, "Pretrain/Step Time": 8.469039445742965} +{"Pretrain/Learning Rate": 4.364070052389954e-05, "Pretrain/Loss": 2.063828706741333, "Pretrain/Loss (Raw)": 2.1087374687194824, "Pretrain/Step": 4867, "Pretrain/Step Time": 8.468868892639875} +{"Pretrain/Learning Rate": 4.3637871436137134e-05, "Pretrain/Loss": 2.064192056655884, "Pretrain/Loss (Raw)": 2.0551202297210693, "Pretrain/Step": 4868, "Pretrain/Step Time": 8.465511154383421} +{"Pretrain/Learning Rate": 4.363504181096485e-05, "Pretrain/Loss": 2.0602564811706543, "Pretrain/Loss (Raw)": 1.7783000469207764, "Pretrain/Step": 4869, "Pretrain/Step Time": 8.471701879054308} +{"Pretrain/Learning Rate": 4.363221164846427e-05, "Pretrain/Loss": 2.059617519378662, "Pretrain/Loss (Raw)": 1.9485995769500732, "Pretrain/Step": 4870, "Pretrain/Step Time": 8.469391951337457} +{"Pretrain/Learning Rate": 4.362938094871701e-05, "Pretrain/Loss": 2.0602211952209473, "Pretrain/Loss (Raw)": 2.053898572921753, "Pretrain/Step": 4871, "Pretrain/Step Time": 8.461703760549426} +{"Pretrain/Learning Rate": 4.362654971180467e-05, "Pretrain/Loss": 2.058824062347412, "Pretrain/Loss (Raw)": 2.1189701557159424, "Pretrain/Step": 4872, "Pretrain/Step Time": 8.46449725702405} +{"Pretrain/Learning Rate": 4.362371793780892e-05, "Pretrain/Loss": 2.058478832244873, "Pretrain/Loss (Raw)": 1.9747841358184814, "Pretrain/Step": 4873, "Pretrain/Step Time": 8.46712134219706} +{"Pretrain/Learning Rate": 4.362088562681137e-05, "Pretrain/Loss": 2.058694362640381, "Pretrain/Loss (Raw)": 2.0414035320281982, "Pretrain/Step": 4874, "Pretrain/Step Time": 8.463664436712861} +{"Pretrain/Learning Rate": 4.361805277889372e-05, "Pretrain/Loss": 2.0602874755859375, "Pretrain/Loss (Raw)": 2.0337398052215576, "Pretrain/Step": 4875, "Pretrain/Step Time": 8.472026301547885} +{"Pretrain/Learning Rate": 4.361521939413764e-05, "Pretrain/Loss": 2.059206247329712, "Pretrain/Loss (Raw)": 2.0319461822509766, "Pretrain/Step": 4876, "Pretrain/Step Time": 8.471406856551766} +{"Pretrain/Learning Rate": 4.361238547262484e-05, "Pretrain/Loss": 2.059286594390869, "Pretrain/Loss (Raw)": 1.952727198600769, "Pretrain/Step": 4877, "Pretrain/Step Time": 8.470724925398827} +{"Pretrain/Learning Rate": 4.360955101443701e-05, "Pretrain/Loss": 2.0604519844055176, "Pretrain/Loss (Raw)": 2.244175672531128, "Pretrain/Step": 4878, "Pretrain/Step Time": 8.472012419253588} +{"Pretrain/Learning Rate": 4.360671601965591e-05, "Pretrain/Loss": 2.0628244876861572, "Pretrain/Loss (Raw)": 2.0696377754211426, "Pretrain/Step": 4879, "Pretrain/Step Time": 8.472729044035077} +{"Pretrain/Learning Rate": 4.360388048836326e-05, "Pretrain/Loss": 2.0606260299682617, "Pretrain/Loss (Raw)": 1.7790380716323853, "Pretrain/Step": 4880, "Pretrain/Step Time": 8.4700241163373} +{"Pretrain/Learning Rate": 4.3601044420640836e-05, "Pretrain/Loss": 2.0610175132751465, "Pretrain/Loss (Raw)": 2.1097278594970703, "Pretrain/Step": 4881, "Pretrain/Step Time": 8.473694276064634} +{"Pretrain/Learning Rate": 4.3598207816570415e-05, "Pretrain/Loss": 2.0600271224975586, "Pretrain/Loss (Raw)": 2.1519453525543213, "Pretrain/Step": 4882, "Pretrain/Step Time": 8.473234664648771} +{"Pretrain/Learning Rate": 4.359537067623377e-05, "Pretrain/Loss": 2.060167074203491, "Pretrain/Loss (Raw)": 2.0674922466278076, "Pretrain/Step": 4883, "Pretrain/Step Time": 8.470292709767818} +{"Pretrain/Learning Rate": 4.359253299971273e-05, "Pretrain/Loss": 2.0592703819274902, "Pretrain/Loss (Raw)": 1.9742165803909302, "Pretrain/Step": 4884, "Pretrain/Step Time": 8.47473580762744} +{"Pretrain/Learning Rate": 4.35896947870891e-05, "Pretrain/Loss": 2.05781888961792, "Pretrain/Loss (Raw)": 2.056492805480957, "Pretrain/Step": 4885, "Pretrain/Step Time": 8.472586784511805} +{"Pretrain/Learning Rate": 4.358685603844473e-05, "Pretrain/Loss": 2.0572009086608887, "Pretrain/Loss (Raw)": 2.0395667552948, "Pretrain/Step": 4886, "Pretrain/Step Time": 8.469024870544672} +{"Pretrain/Learning Rate": 4.358401675386147e-05, "Pretrain/Loss": 2.0592236518859863, "Pretrain/Loss (Raw)": 1.9352644681930542, "Pretrain/Step": 4887, "Pretrain/Step Time": 8.476132288575172} +{"Pretrain/Learning Rate": 4.358117693342119e-05, "Pretrain/Loss": 2.06038761138916, "Pretrain/Loss (Raw)": 2.0687453746795654, "Pretrain/Step": 4888, "Pretrain/Step Time": 8.477002570405602} +{"Pretrain/Learning Rate": 4.357833657720577e-05, "Pretrain/Loss": 2.0583696365356445, "Pretrain/Loss (Raw)": 1.954983115196228, "Pretrain/Step": 4889, "Pretrain/Step Time": 8.476683851331472} +{"Pretrain/Learning Rate": 4.3575495685297105e-05, "Pretrain/Loss": 2.0584511756896973, "Pretrain/Loss (Raw)": 1.9709597826004028, "Pretrain/Step": 4890, "Pretrain/Step Time": 8.476858284324408} +{"Pretrain/Learning Rate": 4.357265425777712e-05, "Pretrain/Loss": 2.0561275482177734, "Pretrain/Loss (Raw)": 2.0418872833251953, "Pretrain/Step": 4891, "Pretrain/Step Time": 8.478103749454021} +{"Pretrain/Learning Rate": 4.3569812294727754e-05, "Pretrain/Loss": 2.0591700077056885, "Pretrain/Loss (Raw)": 2.3565499782562256, "Pretrain/Step": 4892, "Pretrain/Step Time": 8.480601666495204} +{"Pretrain/Learning Rate": 4.3566969796230927e-05, "Pretrain/Loss": 2.0577306747436523, "Pretrain/Loss (Raw)": 2.0458927154541016, "Pretrain/Step": 4893, "Pretrain/Step Time": 8.478541919961572} +{"Pretrain/Learning Rate": 4.3564126762368626e-05, "Pretrain/Loss": 2.059873104095459, "Pretrain/Loss (Raw)": 1.982490062713623, "Pretrain/Step": 4894, "Pretrain/Step Time": 8.480316573753953} +{"Pretrain/Learning Rate": 4.3561283193222804e-05, "Pretrain/Loss": 2.0606377124786377, "Pretrain/Loss (Raw)": 2.0945234298706055, "Pretrain/Step": 4895, "Pretrain/Step Time": 8.475376250222325} +{"Pretrain/Learning Rate": 4.355843908887548e-05, "Pretrain/Loss": 2.0603291988372803, "Pretrain/Loss (Raw)": 2.001225471496582, "Pretrain/Step": 4896, "Pretrain/Step Time": 8.476045144721866} +{"Pretrain/Learning Rate": 4.3555594449408635e-05, "Pretrain/Loss": 2.058793067932129, "Pretrain/Loss (Raw)": 2.023106098175049, "Pretrain/Step": 4897, "Pretrain/Step Time": 8.478878941386938} +{"Pretrain/Learning Rate": 4.3552749274904314e-05, "Pretrain/Loss": 2.0581181049346924, "Pretrain/Loss (Raw)": 1.9801392555236816, "Pretrain/Step": 4898, "Pretrain/Step Time": 8.482089081779122} +{"Pretrain/Learning Rate": 4.354990356544454e-05, "Pretrain/Loss": 2.05661940574646, "Pretrain/Loss (Raw)": 2.022724151611328, "Pretrain/Step": 4899, "Pretrain/Step Time": 8.47679695673287} +{"Pretrain/Learning Rate": 4.3547057321111374e-05, "Pretrain/Loss": 2.0555830001831055, "Pretrain/Loss (Raw)": 2.0230841636657715, "Pretrain/Step": 4900, "Pretrain/Step Time": 8.479904238134623} +{"Pretrain/Learning Rate": 4.354421054198688e-05, "Pretrain/Loss": 2.055551528930664, "Pretrain/Loss (Raw)": 2.0544145107269287, "Pretrain/Step": 4901, "Pretrain/Step Time": 8.483678778633475} +{"Pretrain/Learning Rate": 4.3541363228153164e-05, "Pretrain/Loss": 2.055499315261841, "Pretrain/Loss (Raw)": 2.0537221431732178, "Pretrain/Step": 4902, "Pretrain/Step Time": 8.480455715209246} +{"Pretrain/Learning Rate": 4.35385153796923e-05, "Pretrain/Loss": 2.0535926818847656, "Pretrain/Loss (Raw)": 1.875001072883606, "Pretrain/Step": 4903, "Pretrain/Step Time": 8.478082196787} +{"Pretrain/Learning Rate": 4.353566699668642e-05, "Pretrain/Loss": 2.0550668239593506, "Pretrain/Loss (Raw)": 2.1222479343414307, "Pretrain/Step": 4904, "Pretrain/Step Time": 8.479685068130493} +{"Pretrain/Learning Rate": 4.353281807921764e-05, "Pretrain/Loss": 2.0544826984405518, "Pretrain/Loss (Raw)": 2.040351390838623, "Pretrain/Step": 4905, "Pretrain/Step Time": 8.482819067314267} +{"Pretrain/Learning Rate": 4.3529968627368116e-05, "Pretrain/Loss": 2.0538957118988037, "Pretrain/Loss (Raw)": 2.2050271034240723, "Pretrain/Step": 4906, "Pretrain/Step Time": 8.483739947900176} +{"Pretrain/Learning Rate": 4.3527118641220016e-05, "Pretrain/Loss": 2.0531249046325684, "Pretrain/Loss (Raw)": 2.011140823364258, "Pretrain/Step": 4907, "Pretrain/Step Time": 8.48203052394092} +{"Pretrain/Learning Rate": 4.3524268120855506e-05, "Pretrain/Loss": 2.052194356918335, "Pretrain/Loss (Raw)": 2.1026597023010254, "Pretrain/Step": 4908, "Pretrain/Step Time": 8.484668182209134} +{"Pretrain/Learning Rate": 4.3521417066356784e-05, "Pretrain/Loss": 2.0532755851745605, "Pretrain/Loss (Raw)": 1.9748433828353882, "Pretrain/Step": 4909, "Pretrain/Step Time": 8.483262345194817} +{"Pretrain/Learning Rate": 4.351856547780606e-05, "Pretrain/Loss": 2.053818464279175, "Pretrain/Loss (Raw)": 2.1889188289642334, "Pretrain/Step": 4910, "Pretrain/Step Time": 8.482471810653806} +{"Pretrain/Learning Rate": 4.3515713355285554e-05, "Pretrain/Loss": 2.0551607608795166, "Pretrain/Loss (Raw)": 2.227470636367798, "Pretrain/Step": 4911, "Pretrain/Step Time": 8.481055375188589} +{"Pretrain/Learning Rate": 4.3512860698877505e-05, "Pretrain/Loss": 2.055051326751709, "Pretrain/Loss (Raw)": 2.03524112701416, "Pretrain/Step": 4912, "Pretrain/Step Time": 8.478015150874853} +{"Pretrain/Learning Rate": 4.351000750866417e-05, "Pretrain/Loss": 2.0539257526397705, "Pretrain/Loss (Raw)": 2.272005558013916, "Pretrain/Step": 4913, "Pretrain/Step Time": 8.476775102317333} +{"Pretrain/Learning Rate": 4.350715378472782e-05, "Pretrain/Loss": 2.0544843673706055, "Pretrain/Loss (Raw)": 2.0743629932403564, "Pretrain/Step": 4914, "Pretrain/Step Time": 8.48108446225524} +{"Pretrain/Learning Rate": 4.350429952715073e-05, "Pretrain/Loss": 2.0538668632507324, "Pretrain/Loss (Raw)": 1.9705637693405151, "Pretrain/Step": 4915, "Pretrain/Step Time": 8.480532774701715} +{"Pretrain/Learning Rate": 4.350144473601521e-05, "Pretrain/Loss": 2.0523617267608643, "Pretrain/Loss (Raw)": 1.9403212070465088, "Pretrain/Step": 4916, "Pretrain/Step Time": 8.485373808071017} +{"Pretrain/Learning Rate": 4.349858941140358e-05, "Pretrain/Loss": 2.056093692779541, "Pretrain/Loss (Raw)": 2.236694574356079, "Pretrain/Step": 4917, "Pretrain/Step Time": 8.482671473175287} +{"Pretrain/Learning Rate": 4.3495733553398156e-05, "Pretrain/Loss": 2.0567102432250977, "Pretrain/Loss (Raw)": 2.061028480529785, "Pretrain/Step": 4918, "Pretrain/Step Time": 8.484271122142673} +{"Pretrain/Learning Rate": 4.34928771620813e-05, "Pretrain/Loss": 2.0565290451049805, "Pretrain/Loss (Raw)": 2.040545701980591, "Pretrain/Step": 4919, "Pretrain/Step Time": 8.485453573986888} +{"Pretrain/Learning Rate": 4.349002023753537e-05, "Pretrain/Loss": 2.056086540222168, "Pretrain/Loss (Raw)": 2.1699721813201904, "Pretrain/Step": 4920, "Pretrain/Step Time": 8.485482500866055} +{"Pretrain/Learning Rate": 4.348716277984273e-05, "Pretrain/Loss": 2.0542616844177246, "Pretrain/Loss (Raw)": 1.97768235206604, "Pretrain/Step": 4921, "Pretrain/Step Time": 8.494507113471627} +{"Pretrain/Learning Rate": 4.3484304789085794e-05, "Pretrain/Loss": 2.054171323776245, "Pretrain/Loss (Raw)": 2.117537260055542, "Pretrain/Step": 4922, "Pretrain/Step Time": 8.490647818893194} +{"Pretrain/Learning Rate": 4.348144626534696e-05, "Pretrain/Loss": 2.0525765419006348, "Pretrain/Loss (Raw)": 1.9568374156951904, "Pretrain/Step": 4923, "Pretrain/Step Time": 8.490333395078778} +{"Pretrain/Learning Rate": 4.3478587208708646e-05, "Pretrain/Loss": 2.0496301651000977, "Pretrain/Loss (Raw)": 1.8881968259811401, "Pretrain/Step": 4924, "Pretrain/Step Time": 8.490788098424673} +{"Pretrain/Learning Rate": 4.3475727619253294e-05, "Pretrain/Loss": 2.0474956035614014, "Pretrain/Loss (Raw)": 1.9060109853744507, "Pretrain/Step": 4925, "Pretrain/Step Time": 8.494471285492182} +{"Pretrain/Learning Rate": 4.347286749706336e-05, "Pretrain/Loss": 2.0479846000671387, "Pretrain/Loss (Raw)": 2.138381004333496, "Pretrain/Step": 4926, "Pretrain/Step Time": 8.490706356242299} +{"Pretrain/Learning Rate": 4.3470006842221324e-05, "Pretrain/Loss": 2.049495220184326, "Pretrain/Loss (Raw)": 2.0746734142303467, "Pretrain/Step": 4927, "Pretrain/Step Time": 8.485438965260983} +{"Pretrain/Learning Rate": 4.346714565480966e-05, "Pretrain/Loss": 2.0504395961761475, "Pretrain/Loss (Raw)": 2.265241861343384, "Pretrain/Step": 4928, "Pretrain/Step Time": 8.48216769658029} +{"Pretrain/Learning Rate": 4.3464283934910864e-05, "Pretrain/Loss": 2.0477042198181152, "Pretrain/Loss (Raw)": 1.794911503791809, "Pretrain/Step": 4929, "Pretrain/Step Time": 8.48942494019866} +{"Pretrain/Learning Rate": 4.3461421682607455e-05, "Pretrain/Loss": 2.0488858222961426, "Pretrain/Loss (Raw)": 2.0626771450042725, "Pretrain/Step": 4930, "Pretrain/Step Time": 8.495044669136405} +{"Pretrain/Learning Rate": 4.345855889798197e-05, "Pretrain/Loss": 2.0484530925750732, "Pretrain/Loss (Raw)": 1.8840786218643188, "Pretrain/Step": 4931, "Pretrain/Step Time": 8.495031965896487} +{"Pretrain/Learning Rate": 4.345569558111695e-05, "Pretrain/Loss": 2.052415370941162, "Pretrain/Loss (Raw)": 2.394533395767212, "Pretrain/Step": 4932, "Pretrain/Step Time": 8.495392782613635} +{"Pretrain/Learning Rate": 4.345283173209497e-05, "Pretrain/Loss": 2.052614212036133, "Pretrain/Loss (Raw)": 2.0010528564453125, "Pretrain/Step": 4933, "Pretrain/Step Time": 8.492300108075142} +{"Pretrain/Learning Rate": 4.344996735099858e-05, "Pretrain/Loss": 2.0509815216064453, "Pretrain/Loss (Raw)": 2.0880041122436523, "Pretrain/Step": 4934, "Pretrain/Step Time": 8.488269567489624} +{"Pretrain/Learning Rate": 4.3447102437910394e-05, "Pretrain/Loss": 2.052126169204712, "Pretrain/Loss (Raw)": 2.1702373027801514, "Pretrain/Step": 4935, "Pretrain/Step Time": 8.490735752508044} +{"Pretrain/Learning Rate": 4.344423699291301e-05, "Pretrain/Loss": 2.0531675815582275, "Pretrain/Loss (Raw)": 2.1593546867370605, "Pretrain/Step": 4936, "Pretrain/Step Time": 8.494476659223437} +{"Pretrain/Learning Rate": 4.344137101608906e-05, "Pretrain/Loss": 2.0521039962768555, "Pretrain/Loss (Raw)": 1.9506648778915405, "Pretrain/Step": 4937, "Pretrain/Step Time": 8.495109280571342} +{"Pretrain/Learning Rate": 4.3438504507521175e-05, "Pretrain/Loss": 2.0520923137664795, "Pretrain/Loss (Raw)": 2.0773634910583496, "Pretrain/Step": 4938, "Pretrain/Step Time": 8.494120070710778} +{"Pretrain/Learning Rate": 4.343563746729201e-05, "Pretrain/Loss": 2.051572799682617, "Pretrain/Loss (Raw)": 2.0345096588134766, "Pretrain/Step": 4939, "Pretrain/Step Time": 8.49326092377305} +{"Pretrain/Learning Rate": 4.343276989548424e-05, "Pretrain/Loss": 2.051283121109009, "Pretrain/Loss (Raw)": 2.134793996810913, "Pretrain/Step": 4940, "Pretrain/Step Time": 8.497783994302154} +{"Pretrain/Learning Rate": 4.3429901792180535e-05, "Pretrain/Loss": 2.0532467365264893, "Pretrain/Loss (Raw)": 2.155411958694458, "Pretrain/Step": 4941, "Pretrain/Step Time": 8.497507002204657} +{"Pretrain/Learning Rate": 4.342703315746361e-05, "Pretrain/Loss": 2.052598237991333, "Pretrain/Loss (Raw)": 2.05735182762146, "Pretrain/Step": 4942, "Pretrain/Step Time": 8.495356485247612} +{"Pretrain/Learning Rate": 4.342416399141617e-05, "Pretrain/Loss": 2.0528385639190674, "Pretrain/Loss (Raw)": 2.125307559967041, "Pretrain/Step": 4943, "Pretrain/Step Time": 8.491579033434391} +{"Pretrain/Learning Rate": 4.342129429412096e-05, "Pretrain/Loss": 2.0522775650024414, "Pretrain/Loss (Raw)": 2.066857099533081, "Pretrain/Step": 4944, "Pretrain/Step Time": 8.49033984169364} +{"Pretrain/Learning Rate": 4.34184240656607e-05, "Pretrain/Loss": 2.053708076477051, "Pretrain/Loss (Raw)": 2.0964572429656982, "Pretrain/Step": 4945, "Pretrain/Step Time": 8.491986406967044} +{"Pretrain/Learning Rate": 4.341555330611817e-05, "Pretrain/Loss": 2.055344343185425, "Pretrain/Loss (Raw)": 2.0311312675476074, "Pretrain/Step": 4946, "Pretrain/Step Time": 8.49335246346891} +{"Pretrain/Learning Rate": 4.341268201557616e-05, "Pretrain/Loss": 2.0549135208129883, "Pretrain/Loss (Raw)": 1.9233182668685913, "Pretrain/Step": 4947, "Pretrain/Step Time": 8.499839168041945} +{"Pretrain/Learning Rate": 4.340981019411742e-05, "Pretrain/Loss": 2.0559349060058594, "Pretrain/Loss (Raw)": 2.054075241088867, "Pretrain/Step": 4948, "Pretrain/Step Time": 8.497499782592058} +{"Pretrain/Learning Rate": 4.340693784182479e-05, "Pretrain/Loss": 2.05816650390625, "Pretrain/Loss (Raw)": 2.1269984245300293, "Pretrain/Step": 4949, "Pretrain/Step Time": 8.49548544920981} +{"Pretrain/Learning Rate": 4.340406495878109e-05, "Pretrain/Loss": 2.0542776584625244, "Pretrain/Loss (Raw)": 1.7730622291564941, "Pretrain/Step": 4950, "Pretrain/Step Time": 8.495046624913812} +{"Pretrain/Learning Rate": 4.340119154506914e-05, "Pretrain/Loss": 2.0549521446228027, "Pretrain/Loss (Raw)": 2.0149147510528564, "Pretrain/Step": 4951, "Pretrain/Step Time": 8.494945021346211} +{"Pretrain/Learning Rate": 4.339831760077181e-05, "Pretrain/Loss": 2.0567102432250977, "Pretrain/Loss (Raw)": 2.237499237060547, "Pretrain/Step": 4952, "Pretrain/Step Time": 8.496798226609826} +{"Pretrain/Learning Rate": 4.3395443125971965e-05, "Pretrain/Loss": 2.0566511154174805, "Pretrain/Loss (Raw)": 2.1148159503936768, "Pretrain/Step": 4953, "Pretrain/Step Time": 8.497632252052426} +{"Pretrain/Learning Rate": 4.339256812075248e-05, "Pretrain/Loss": 2.0578699111938477, "Pretrain/Loss (Raw)": 2.2389819622039795, "Pretrain/Step": 4954, "Pretrain/Step Time": 8.496236836537719} +{"Pretrain/Learning Rate": 4.338969258519626e-05, "Pretrain/Loss": 2.057149648666382, "Pretrain/Loss (Raw)": 2.005413055419922, "Pretrain/Step": 4955, "Pretrain/Step Time": 8.494623463600874} +{"Pretrain/Learning Rate": 4.3386816519386224e-05, "Pretrain/Loss": 2.056218385696411, "Pretrain/Loss (Raw)": 2.006110191345215, "Pretrain/Step": 4956, "Pretrain/Step Time": 8.502962065860629} +{"Pretrain/Learning Rate": 4.338393992340529e-05, "Pretrain/Loss": 2.054985523223877, "Pretrain/Loss (Raw)": 1.9713200330734253, "Pretrain/Step": 4957, "Pretrain/Step Time": 8.497235966846347} +{"Pretrain/Learning Rate": 4.338106279733641e-05, "Pretrain/Loss": 2.0551605224609375, "Pretrain/Loss (Raw)": 2.067131757736206, "Pretrain/Step": 4958, "Pretrain/Step Time": 8.50182619690895} +{"Pretrain/Learning Rate": 4.337818514126254e-05, "Pretrain/Loss": 2.0535526275634766, "Pretrain/Loss (Raw)": 1.9226317405700684, "Pretrain/Step": 4959, "Pretrain/Step Time": 8.499986506998539} +{"Pretrain/Learning Rate": 4.337530695526666e-05, "Pretrain/Loss": 2.0532097816467285, "Pretrain/Loss (Raw)": 2.044158458709717, "Pretrain/Step": 4960, "Pretrain/Step Time": 8.49631585739553} +{"Pretrain/Learning Rate": 4.3372428239431753e-05, "Pretrain/Loss": 2.0546607971191406, "Pretrain/Loss (Raw)": 2.0755202770233154, "Pretrain/Step": 4961, "Pretrain/Step Time": 8.49983450397849} +{"Pretrain/Learning Rate": 4.336954899384084e-05, "Pretrain/Loss": 2.054673910140991, "Pretrain/Loss (Raw)": 2.147751569747925, "Pretrain/Step": 4962, "Pretrain/Step Time": 8.496058931574225} +{"Pretrain/Learning Rate": 4.3366669218576914e-05, "Pretrain/Loss": 2.057936191558838, "Pretrain/Loss (Raw)": 2.5701353549957275, "Pretrain/Step": 4963, "Pretrain/Step Time": 8.507527720183134} +{"Pretrain/Learning Rate": 4.336378891372304e-05, "Pretrain/Loss": 2.0576212406158447, "Pretrain/Loss (Raw)": 1.9198527336120605, "Pretrain/Step": 4964, "Pretrain/Step Time": 8.510504059493542} +{"Pretrain/Learning Rate": 4.336090807936226e-05, "Pretrain/Loss": 2.0583395957946777, "Pretrain/Loss (Raw)": 2.0097174644470215, "Pretrain/Step": 4965, "Pretrain/Step Time": 8.509683772921562} +{"Pretrain/Learning Rate": 4.335802671557764e-05, "Pretrain/Loss": 2.0590202808380127, "Pretrain/Loss (Raw)": 2.0296456813812256, "Pretrain/Step": 4966, "Pretrain/Step Time": 8.509535437449813} +{"Pretrain/Learning Rate": 4.3355144822452256e-05, "Pretrain/Loss": 2.0598909854888916, "Pretrain/Loss (Raw)": 2.1559898853302, "Pretrain/Step": 4967, "Pretrain/Step Time": 8.508971283212304} +{"Pretrain/Learning Rate": 4.335226240006921e-05, "Pretrain/Loss": 2.0597081184387207, "Pretrain/Loss (Raw)": 1.9703079462051392, "Pretrain/Step": 4968, "Pretrain/Step Time": 8.510175736621022} +{"Pretrain/Learning Rate": 4.334937944851162e-05, "Pretrain/Loss": 2.0589890480041504, "Pretrain/Loss (Raw)": 1.9103258848190308, "Pretrain/Step": 4969, "Pretrain/Step Time": 8.50970789603889} +{"Pretrain/Learning Rate": 4.33464959678626e-05, "Pretrain/Loss": 2.0612149238586426, "Pretrain/Loss (Raw)": 2.272592782974243, "Pretrain/Step": 4970, "Pretrain/Step Time": 8.51098232343793} +{"Pretrain/Learning Rate": 4.334361195820531e-05, "Pretrain/Loss": 2.0621299743652344, "Pretrain/Loss (Raw)": 2.3230693340301514, "Pretrain/Step": 4971, "Pretrain/Step Time": 8.51299381069839} +{"Pretrain/Learning Rate": 4.33407274196229e-05, "Pretrain/Loss": 2.060987710952759, "Pretrain/Loss (Raw)": 1.9652518033981323, "Pretrain/Step": 4972, "Pretrain/Step Time": 8.513735799118876} +{"Pretrain/Learning Rate": 4.333784235219854e-05, "Pretrain/Loss": 2.0626087188720703, "Pretrain/Loss (Raw)": 2.2439675331115723, "Pretrain/Step": 4973, "Pretrain/Step Time": 8.50800734385848} +{"Pretrain/Learning Rate": 4.3334956756015426e-05, "Pretrain/Loss": 2.061933994293213, "Pretrain/Loss (Raw)": 2.14972186088562, "Pretrain/Step": 4974, "Pretrain/Step Time": 8.51014538295567} +{"Pretrain/Learning Rate": 4.333207063115676e-05, "Pretrain/Loss": 2.063783645629883, "Pretrain/Loss (Raw)": 2.1384735107421875, "Pretrain/Step": 4975, "Pretrain/Step Time": 8.50927964784205} +{"Pretrain/Learning Rate": 4.3329183977705755e-05, "Pretrain/Loss": 2.062962532043457, "Pretrain/Loss (Raw)": 2.0019583702087402, "Pretrain/Step": 4976, "Pretrain/Step Time": 8.507752129808068} +{"Pretrain/Learning Rate": 4.332629679574566e-05, "Pretrain/Loss": 2.062605619430542, "Pretrain/Loss (Raw)": 2.1317524909973145, "Pretrain/Step": 4977, "Pretrain/Step Time": 8.508748792111874} +{"Pretrain/Learning Rate": 4.332340908535971e-05, "Pretrain/Loss": 2.063180685043335, "Pretrain/Loss (Raw)": 1.9227107763290405, "Pretrain/Step": 4978, "Pretrain/Step Time": 8.506875529885292} +{"Pretrain/Learning Rate": 4.3320520846631184e-05, "Pretrain/Loss": 2.0650339126586914, "Pretrain/Loss (Raw)": 1.9945143461227417, "Pretrain/Step": 4979, "Pretrain/Step Time": 8.508755538612604} +{"Pretrain/Learning Rate": 4.3317632079643345e-05, "Pretrain/Loss": 2.0642285346984863, "Pretrain/Loss (Raw)": 1.929704189300537, "Pretrain/Step": 4980, "Pretrain/Step Time": 8.510066842660308} +{"Pretrain/Learning Rate": 4.33147427844795e-05, "Pretrain/Loss": 2.065392017364502, "Pretrain/Loss (Raw)": 2.1474363803863525, "Pretrain/Step": 4981, "Pretrain/Step Time": 8.50734193250537} +{"Pretrain/Learning Rate": 4.3311852961222966e-05, "Pretrain/Loss": 2.063906669616699, "Pretrain/Loss (Raw)": 2.0441970825195312, "Pretrain/Step": 4982, "Pretrain/Step Time": 8.510488832369447} +{"Pretrain/Learning Rate": 4.330896260995705e-05, "Pretrain/Loss": 2.0603060722351074, "Pretrain/Loss (Raw)": 2.066955327987671, "Pretrain/Step": 4983, "Pretrain/Step Time": 8.509373117238283} +{"Pretrain/Learning Rate": 4.330607173076511e-05, "Pretrain/Loss": 2.060500144958496, "Pretrain/Loss (Raw)": 2.0453743934631348, "Pretrain/Step": 4984, "Pretrain/Step Time": 8.510342640802264} +{"Pretrain/Learning Rate": 4.33031803237305e-05, "Pretrain/Loss": 2.0605359077453613, "Pretrain/Loss (Raw)": 2.185288429260254, "Pretrain/Step": 4985, "Pretrain/Step Time": 8.505757676437497} +{"Pretrain/Learning Rate": 4.330028838893658e-05, "Pretrain/Loss": 2.0603322982788086, "Pretrain/Loss (Raw)": 1.9886516332626343, "Pretrain/Step": 4986, "Pretrain/Step Time": 8.50334345549345} +{"Pretrain/Learning Rate": 4.329739592646675e-05, "Pretrain/Loss": 2.0605363845825195, "Pretrain/Loss (Raw)": 2.104269504547119, "Pretrain/Step": 4987, "Pretrain/Step Time": 8.5093849375844} +{"Pretrain/Learning Rate": 4.32945029364044e-05, "Pretrain/Loss": 2.0579283237457275, "Pretrain/Loss (Raw)": 1.7642590999603271, "Pretrain/Step": 4988, "Pretrain/Step Time": 8.511186564341187} +{"Pretrain/Learning Rate": 4.3291609418832966e-05, "Pretrain/Loss": 2.060863494873047, "Pretrain/Loss (Raw)": 2.128239154815674, "Pretrain/Step": 4989, "Pretrain/Step Time": 8.507946589961648} +{"Pretrain/Learning Rate": 4.328871537383586e-05, "Pretrain/Loss": 2.0593619346618652, "Pretrain/Loss (Raw)": 2.074497699737549, "Pretrain/Step": 4990, "Pretrain/Step Time": 8.506609663367271} +{"Pretrain/Learning Rate": 4.3285820801496544e-05, "Pretrain/Loss": 2.0589663982391357, "Pretrain/Loss (Raw)": 2.2289998531341553, "Pretrain/Step": 4991, "Pretrain/Step Time": 8.498564146459103} +{"Pretrain/Learning Rate": 4.3282925701898473e-05, "Pretrain/Loss": 2.0614054203033447, "Pretrain/Loss (Raw)": 2.216226816177368, "Pretrain/Step": 4992, "Pretrain/Step Time": 8.50487799756229} +{"Pretrain/Learning Rate": 4.3280030075125135e-05, "Pretrain/Loss": 2.060821533203125, "Pretrain/Loss (Raw)": 2.0397326946258545, "Pretrain/Step": 4993, "Pretrain/Step Time": 8.500495042651892} +{"Pretrain/Learning Rate": 4.3277133921260006e-05, "Pretrain/Loss": 2.062075614929199, "Pretrain/Loss (Raw)": 2.1902811527252197, "Pretrain/Step": 4994, "Pretrain/Step Time": 8.503267107531428} +{"Pretrain/Learning Rate": 4.327423724038661e-05, "Pretrain/Loss": 2.0622477531433105, "Pretrain/Loss (Raw)": 2.130758762359619, "Pretrain/Step": 4995, "Pretrain/Step Time": 8.50735229998827} +{"Pretrain/Learning Rate": 4.327134003258847e-05, "Pretrain/Loss": 2.062488555908203, "Pretrain/Loss (Raw)": 2.0859475135803223, "Pretrain/Step": 4996, "Pretrain/Step Time": 8.508607771247625} +{"Pretrain/Learning Rate": 4.326844229794911e-05, "Pretrain/Loss": 2.0639684200286865, "Pretrain/Loss (Raw)": 1.967716097831726, "Pretrain/Step": 4997, "Pretrain/Step Time": 8.502848342061043} +{"Pretrain/Learning Rate": 4.326554403655211e-05, "Pretrain/Loss": 2.065509557723999, "Pretrain/Loss (Raw)": 2.1458754539489746, "Pretrain/Step": 4998, "Pretrain/Step Time": 8.503968169912696} +{"Pretrain/Learning Rate": 4.326264524848101e-05, "Pretrain/Loss": 2.0653088092803955, "Pretrain/Loss (Raw)": 2.0281786918640137, "Pretrain/Step": 4999, "Pretrain/Step Time": 8.50176483951509} +{"Pretrain/Learning Rate": 4.325974593381942e-05, "Pretrain/Loss": 2.064572334289551, "Pretrain/Loss (Raw)": 2.0246989727020264, "Pretrain/Step": 5000, "Pretrain/Step Time": 8.502319991588593} +{"Pretrain/Learning Rate": 4.325684609265092e-05, "Pretrain/Loss": 2.0645389556884766, "Pretrain/Loss (Raw)": 1.970512866973877, "Pretrain/Step": 5001, "Pretrain/Step Time": 9.596333999186754} +{"Pretrain/Learning Rate": 4.325394572505913e-05, "Pretrain/Loss": 2.064836025238037, "Pretrain/Loss (Raw)": 2.0794355869293213, "Pretrain/Step": 5002, "Pretrain/Step Time": 9.595657831057906} +{"Pretrain/Learning Rate": 4.3251044831127685e-05, "Pretrain/Loss": 2.062964916229248, "Pretrain/Loss (Raw)": 1.7942438125610352, "Pretrain/Step": 5003, "Pretrain/Step Time": 9.590224981307983} +{"Pretrain/Learning Rate": 4.324814341094023e-05, "Pretrain/Loss": 2.0625405311584473, "Pretrain/Loss (Raw)": 1.9776418209075928, "Pretrain/Step": 5004, "Pretrain/Step Time": 9.590972302481532} +{"Pretrain/Learning Rate": 4.324524146458043e-05, "Pretrain/Loss": 2.0629844665527344, "Pretrain/Loss (Raw)": 2.0095367431640625, "Pretrain/Step": 5005, "Pretrain/Step Time": 9.591466892510653} +{"Pretrain/Learning Rate": 4.324233899213195e-05, "Pretrain/Loss": 2.0620408058166504, "Pretrain/Loss (Raw)": 2.1233694553375244, "Pretrain/Step": 5006, "Pretrain/Step Time": 9.587917787954211} +{"Pretrain/Learning Rate": 4.323943599367848e-05, "Pretrain/Loss": 2.059891939163208, "Pretrain/Loss (Raw)": 1.7946070432662964, "Pretrain/Step": 5007, "Pretrain/Step Time": 9.58797904662788} +{"Pretrain/Learning Rate": 4.3236532469303733e-05, "Pretrain/Loss": 2.0619029998779297, "Pretrain/Loss (Raw)": 2.0364341735839844, "Pretrain/Step": 5008, "Pretrain/Step Time": 9.585002969950438} +{"Pretrain/Learning Rate": 4.323362841909144e-05, "Pretrain/Loss": 2.0615897178649902, "Pretrain/Loss (Raw)": 2.0696282386779785, "Pretrain/Step": 5009, "Pretrain/Step Time": 9.586084488779306} +{"Pretrain/Learning Rate": 4.3230723843125315e-05, "Pretrain/Loss": 2.0593175888061523, "Pretrain/Loss (Raw)": 1.8611401319503784, "Pretrain/Step": 5010, "Pretrain/Step Time": 9.588753804564476} +{"Pretrain/Learning Rate": 4.322781874148912e-05, "Pretrain/Loss": 2.0577104091644287, "Pretrain/Loss (Raw)": 1.8617650270462036, "Pretrain/Step": 5011, "Pretrain/Step Time": 9.591188631951809} +{"Pretrain/Learning Rate": 4.322491311426662e-05, "Pretrain/Loss": 2.059769868850708, "Pretrain/Loss (Raw)": 2.237830638885498, "Pretrain/Step": 5012, "Pretrain/Step Time": 9.592679357156157} +{"Pretrain/Learning Rate": 4.322200696154161e-05, "Pretrain/Loss": 2.061645030975342, "Pretrain/Loss (Raw)": 2.2965118885040283, "Pretrain/Step": 5013, "Pretrain/Step Time": 9.591323563829064} +{"Pretrain/Learning Rate": 4.3219100283397865e-05, "Pretrain/Loss": 2.0604395866394043, "Pretrain/Loss (Raw)": 1.8852685689926147, "Pretrain/Step": 5014, "Pretrain/Step Time": 9.592715097591281} +{"Pretrain/Learning Rate": 4.32161930799192e-05, "Pretrain/Loss": 2.0615615844726562, "Pretrain/Loss (Raw)": 2.0788841247558594, "Pretrain/Step": 5015, "Pretrain/Step Time": 9.585835348814726} +{"Pretrain/Learning Rate": 4.3213285351189456e-05, "Pretrain/Loss": 2.0612502098083496, "Pretrain/Loss (Raw)": 2.0288891792297363, "Pretrain/Step": 5016, "Pretrain/Step Time": 9.585933975875378} +{"Pretrain/Learning Rate": 4.3210377097292474e-05, "Pretrain/Loss": 2.0639610290527344, "Pretrain/Loss (Raw)": 2.301974058151245, "Pretrain/Step": 5017, "Pretrain/Step Time": 9.587374709546566} +{"Pretrain/Learning Rate": 4.32074683183121e-05, "Pretrain/Loss": 2.06473970413208, "Pretrain/Loss (Raw)": 2.0706257820129395, "Pretrain/Step": 5018, "Pretrain/Step Time": 9.5881785787642} +{"Pretrain/Learning Rate": 4.3204559014332215e-05, "Pretrain/Loss": 2.0646796226501465, "Pretrain/Loss (Raw)": 2.0341930389404297, "Pretrain/Step": 5019, "Pretrain/Step Time": 9.586251083761454} +{"Pretrain/Learning Rate": 4.32016491854367e-05, "Pretrain/Loss": 2.061431407928467, "Pretrain/Loss (Raw)": 1.9407455921173096, "Pretrain/Step": 5020, "Pretrain/Step Time": 9.588016079738736} +{"Pretrain/Learning Rate": 4.3198738831709465e-05, "Pretrain/Loss": 2.0599632263183594, "Pretrain/Loss (Raw)": 1.857990026473999, "Pretrain/Step": 5021, "Pretrain/Step Time": 9.58518691174686} +{"Pretrain/Learning Rate": 4.3195827953234424e-05, "Pretrain/Loss": 2.060676336288452, "Pretrain/Loss (Raw)": 2.073773145675659, "Pretrain/Step": 5022, "Pretrain/Step Time": 9.582769207656384} +{"Pretrain/Learning Rate": 4.3192916550095514e-05, "Pretrain/Loss": 2.0592355728149414, "Pretrain/Loss (Raw)": 1.9100804328918457, "Pretrain/Step": 5023, "Pretrain/Step Time": 9.581693129613996} +{"Pretrain/Learning Rate": 4.319000462237668e-05, "Pretrain/Loss": 2.058988094329834, "Pretrain/Loss (Raw)": 1.9695658683776855, "Pretrain/Step": 5024, "Pretrain/Step Time": 9.583725161850452} +{"Pretrain/Learning Rate": 4.318709217016188e-05, "Pretrain/Loss": 2.0576610565185547, "Pretrain/Loss (Raw)": 1.8532530069351196, "Pretrain/Step": 5025, "Pretrain/Step Time": 9.580037923529744} +{"Pretrain/Learning Rate": 4.3184179193535104e-05, "Pretrain/Loss": 2.057065010070801, "Pretrain/Loss (Raw)": 1.9038516283035278, "Pretrain/Step": 5026, "Pretrain/Step Time": 9.578100314363837} +{"Pretrain/Learning Rate": 4.318126569258034e-05, "Pretrain/Loss": 2.0581254959106445, "Pretrain/Loss (Raw)": 2.1584537029266357, "Pretrain/Step": 5027, "Pretrain/Step Time": 9.58316258341074} +{"Pretrain/Learning Rate": 4.3178351667381595e-05, "Pretrain/Loss": 2.0576014518737793, "Pretrain/Loss (Raw)": 1.9560065269470215, "Pretrain/Step": 5028, "Pretrain/Step Time": 9.583100298419595} +{"Pretrain/Learning Rate": 4.31754371180229e-05, "Pretrain/Loss": 2.0570011138916016, "Pretrain/Loss (Raw)": 1.977555274963379, "Pretrain/Step": 5029, "Pretrain/Step Time": 9.576357368379831} +{"Pretrain/Learning Rate": 4.317252204458828e-05, "Pretrain/Loss": 2.0576725006103516, "Pretrain/Loss (Raw)": 2.1396450996398926, "Pretrain/Step": 5030, "Pretrain/Step Time": 9.573344629257917} +{"Pretrain/Learning Rate": 4.31696064471618e-05, "Pretrain/Loss": 2.0590999126434326, "Pretrain/Loss (Raw)": 2.057734966278076, "Pretrain/Step": 5031, "Pretrain/Step Time": 9.575459111481905} +{"Pretrain/Learning Rate": 4.316669032582753e-05, "Pretrain/Loss": 2.0588531494140625, "Pretrain/Loss (Raw)": 2.090639114379883, "Pretrain/Step": 5032, "Pretrain/Step Time": 9.579289052635431} +{"Pretrain/Learning Rate": 4.3163773680669545e-05, "Pretrain/Loss": 2.0574936866760254, "Pretrain/Loss (Raw)": 1.8663607835769653, "Pretrain/Step": 5033, "Pretrain/Step Time": 9.573678569868207} +{"Pretrain/Learning Rate": 4.3160856511771955e-05, "Pretrain/Loss": 2.057529926300049, "Pretrain/Loss (Raw)": 2.2096898555755615, "Pretrain/Step": 5034, "Pretrain/Step Time": 9.575805515050888} +{"Pretrain/Learning Rate": 4.3157938819218865e-05, "Pretrain/Loss": 2.057079315185547, "Pretrain/Loss (Raw)": 1.9534499645233154, "Pretrain/Step": 5035, "Pretrain/Step Time": 9.577362203970551} +{"Pretrain/Learning Rate": 4.315502060309442e-05, "Pretrain/Loss": 2.0566182136535645, "Pretrain/Loss (Raw)": 2.043628454208374, "Pretrain/Step": 5036, "Pretrain/Step Time": 9.575259106233716} +{"Pretrain/Learning Rate": 4.3152101863482746e-05, "Pretrain/Loss": 2.0567846298217773, "Pretrain/Loss (Raw)": 1.996140956878662, "Pretrain/Step": 5037, "Pretrain/Step Time": 9.572609547525644} +{"Pretrain/Learning Rate": 4.314918260046801e-05, "Pretrain/Loss": 2.0563595294952393, "Pretrain/Loss (Raw)": 2.1345252990722656, "Pretrain/Step": 5038, "Pretrain/Step Time": 9.574640227481723} +{"Pretrain/Learning Rate": 4.31462628141344e-05, "Pretrain/Loss": 2.0548617839813232, "Pretrain/Loss (Raw)": 2.0357420444488525, "Pretrain/Step": 5039, "Pretrain/Step Time": 9.569796459749341} +{"Pretrain/Learning Rate": 4.314334250456609e-05, "Pretrain/Loss": 2.0539350509643555, "Pretrain/Loss (Raw)": 1.9166252613067627, "Pretrain/Step": 5040, "Pretrain/Step Time": 9.571967847645283} +{"Pretrain/Learning Rate": 4.314042167184728e-05, "Pretrain/Loss": 2.0521934032440186, "Pretrain/Loss (Raw)": 2.049069404602051, "Pretrain/Step": 5041, "Pretrain/Step Time": 9.574035491794348} +{"Pretrain/Learning Rate": 4.3137500316062204e-05, "Pretrain/Loss": 2.0513858795166016, "Pretrain/Loss (Raw)": 1.9710272550582886, "Pretrain/Step": 5042, "Pretrain/Step Time": 9.570724239572883} +{"Pretrain/Learning Rate": 4.313457843729509e-05, "Pretrain/Loss": 2.053530693054199, "Pretrain/Loss (Raw)": 2.245093822479248, "Pretrain/Step": 5043, "Pretrain/Step Time": 9.574962809681892} +{"Pretrain/Learning Rate": 4.3131656035630196e-05, "Pretrain/Loss": 2.0548171997070312, "Pretrain/Loss (Raw)": 2.1049695014953613, "Pretrain/Step": 5044, "Pretrain/Step Time": 9.573741007596254} +{"Pretrain/Learning Rate": 4.312873311115177e-05, "Pretrain/Loss": 2.052241325378418, "Pretrain/Loss (Raw)": 1.9069856405258179, "Pretrain/Step": 5045, "Pretrain/Step Time": 9.572383284568787} +{"Pretrain/Learning Rate": 4.3125809663944124e-05, "Pretrain/Loss": 2.050546407699585, "Pretrain/Loss (Raw)": 1.8440881967544556, "Pretrain/Step": 5046, "Pretrain/Step Time": 9.57530840113759} +{"Pretrain/Learning Rate": 4.3122885694091525e-05, "Pretrain/Loss": 2.051295757293701, "Pretrain/Loss (Raw)": 2.1364376544952393, "Pretrain/Step": 5047, "Pretrain/Step Time": 9.57244661822915} +{"Pretrain/Learning Rate": 4.3119961201678295e-05, "Pretrain/Loss": 2.050163745880127, "Pretrain/Loss (Raw)": 2.025097131729126, "Pretrain/Step": 5048, "Pretrain/Step Time": 9.571369970217347} +{"Pretrain/Learning Rate": 4.311703618678875e-05, "Pretrain/Loss": 2.051027297973633, "Pretrain/Loss (Raw)": 2.0882346630096436, "Pretrain/Step": 5049, "Pretrain/Step Time": 9.5623489767313} +{"Pretrain/Learning Rate": 4.3114110649507244e-05, "Pretrain/Loss": 2.0516467094421387, "Pretrain/Loss (Raw)": 2.196808338165283, "Pretrain/Step": 5050, "Pretrain/Step Time": 9.564264837652445} +{"Pretrain/Learning Rate": 4.311118458991813e-05, "Pretrain/Loss": 2.0524659156799316, "Pretrain/Loss (Raw)": 2.0616822242736816, "Pretrain/Step": 5051, "Pretrain/Step Time": 9.569334175437689} +{"Pretrain/Learning Rate": 4.310825800810577e-05, "Pretrain/Loss": 2.053745746612549, "Pretrain/Loss (Raw)": 2.052015542984009, "Pretrain/Step": 5052, "Pretrain/Step Time": 9.568821128457785} +{"Pretrain/Learning Rate": 4.310533090415455e-05, "Pretrain/Loss": 2.053837299346924, "Pretrain/Loss (Raw)": 1.917744517326355, "Pretrain/Step": 5053, "Pretrain/Step Time": 9.564637951552868} +{"Pretrain/Learning Rate": 4.310240327814889e-05, "Pretrain/Loss": 2.0521976947784424, "Pretrain/Loss (Raw)": 1.9285025596618652, "Pretrain/Step": 5054, "Pretrain/Step Time": 9.564545137807727} +{"Pretrain/Learning Rate": 4.309947513017318e-05, "Pretrain/Loss": 2.0528030395507812, "Pretrain/Loss (Raw)": 2.152179718017578, "Pretrain/Step": 5055, "Pretrain/Step Time": 9.567273927852511} +{"Pretrain/Learning Rate": 4.309654646031188e-05, "Pretrain/Loss": 2.050518035888672, "Pretrain/Loss (Raw)": 1.9727152585983276, "Pretrain/Step": 5056, "Pretrain/Step Time": 9.565533813089132} +{"Pretrain/Learning Rate": 4.309361726864941e-05, "Pretrain/Loss": 2.050313949584961, "Pretrain/Loss (Raw)": 1.7688096761703491, "Pretrain/Step": 5057, "Pretrain/Step Time": 9.559247804805636} +{"Pretrain/Learning Rate": 4.3090687555270234e-05, "Pretrain/Loss": 2.0497913360595703, "Pretrain/Loss (Raw)": 1.9958077669143677, "Pretrain/Step": 5058, "Pretrain/Step Time": 9.560320498421788} +{"Pretrain/Learning Rate": 4.308775732025885e-05, "Pretrain/Loss": 2.050548553466797, "Pretrain/Loss (Raw)": 1.9810113906860352, "Pretrain/Step": 5059, "Pretrain/Step Time": 9.56033737026155} +{"Pretrain/Learning Rate": 4.308482656369973e-05, "Pretrain/Loss": 2.0506796836853027, "Pretrain/Loss (Raw)": 2.411313772201538, "Pretrain/Step": 5060, "Pretrain/Step Time": 9.561727041378617} +{"Pretrain/Learning Rate": 4.3081895285677384e-05, "Pretrain/Loss": 2.051356554031372, "Pretrain/Loss (Raw)": 2.087677240371704, "Pretrain/Step": 5061, "Pretrain/Step Time": 9.563334465026855} +{"Pretrain/Learning Rate": 4.3078963486276334e-05, "Pretrain/Loss": 2.0519590377807617, "Pretrain/Loss (Raw)": 2.16513729095459, "Pretrain/Step": 5062, "Pretrain/Step Time": 9.565362537279725} +{"Pretrain/Learning Rate": 4.307603116558112e-05, "Pretrain/Loss": 2.0507893562316895, "Pretrain/Loss (Raw)": 2.020495891571045, "Pretrain/Step": 5063, "Pretrain/Step Time": 9.566019598394632} +{"Pretrain/Learning Rate": 4.307309832367629e-05, "Pretrain/Loss": 2.0498695373535156, "Pretrain/Loss (Raw)": 2.0416252613067627, "Pretrain/Step": 5064, "Pretrain/Step Time": 9.562427999451756} +{"Pretrain/Learning Rate": 4.30701649606464e-05, "Pretrain/Loss": 2.051145076751709, "Pretrain/Loss (Raw)": 2.113936185836792, "Pretrain/Step": 5065, "Pretrain/Step Time": 9.561220558360219} +{"Pretrain/Learning Rate": 4.306723107657605e-05, "Pretrain/Loss": 2.0500783920288086, "Pretrain/Loss (Raw)": 1.9408289194107056, "Pretrain/Step": 5066, "Pretrain/Step Time": 9.559234090149403} +{"Pretrain/Learning Rate": 4.306429667154983e-05, "Pretrain/Loss": 2.052339553833008, "Pretrain/Loss (Raw)": 2.323946714401245, "Pretrain/Step": 5067, "Pretrain/Step Time": 9.564824257045984} +{"Pretrain/Learning Rate": 4.306136174565235e-05, "Pretrain/Loss": 2.051985502243042, "Pretrain/Loss (Raw)": 2.0894668102264404, "Pretrain/Step": 5068, "Pretrain/Step Time": 9.55816913023591} +{"Pretrain/Learning Rate": 4.305842629896823e-05, "Pretrain/Loss": 2.0466299057006836, "Pretrain/Loss (Raw)": 1.4699175357818604, "Pretrain/Step": 5069, "Pretrain/Step Time": 9.559356668964028} +{"Pretrain/Learning Rate": 4.305549033158212e-05, "Pretrain/Loss": 2.0476059913635254, "Pretrain/Loss (Raw)": 2.182281970977783, "Pretrain/Step": 5070, "Pretrain/Step Time": 9.55816869623959} +{"Pretrain/Learning Rate": 4.305255384357868e-05, "Pretrain/Loss": 2.0480198860168457, "Pretrain/Loss (Raw)": 2.1782588958740234, "Pretrain/Step": 5071, "Pretrain/Step Time": 9.558110225945711} +{"Pretrain/Learning Rate": 4.304961683504257e-05, "Pretrain/Loss": 2.048478603363037, "Pretrain/Loss (Raw)": 2.1255877017974854, "Pretrain/Step": 5072, "Pretrain/Step Time": 9.56251891888678} +{"Pretrain/Learning Rate": 4.304667930605849e-05, "Pretrain/Loss": 2.04764986038208, "Pretrain/Loss (Raw)": 1.9903565645217896, "Pretrain/Step": 5073, "Pretrain/Step Time": 9.558309998363256} +{"Pretrain/Learning Rate": 4.304374125671113e-05, "Pretrain/Loss": 2.046222686767578, "Pretrain/Loss (Raw)": 1.8484747409820557, "Pretrain/Step": 5074, "Pretrain/Step Time": 9.556176101788878} +{"Pretrain/Learning Rate": 4.304080268708521e-05, "Pretrain/Loss": 2.0461645126342773, "Pretrain/Loss (Raw)": 1.915858507156372, "Pretrain/Step": 5075, "Pretrain/Step Time": 9.553166938945651} +{"Pretrain/Learning Rate": 4.303786359726546e-05, "Pretrain/Loss": 2.0450122356414795, "Pretrain/Loss (Raw)": 1.9065968990325928, "Pretrain/Step": 5076, "Pretrain/Step Time": 9.56476036272943} +{"Pretrain/Learning Rate": 4.3034923987336636e-05, "Pretrain/Loss": 2.043835163116455, "Pretrain/Loss (Raw)": 1.9763271808624268, "Pretrain/Step": 5077, "Pretrain/Step Time": 9.565977016463876} +{"Pretrain/Learning Rate": 4.3031983857383484e-05, "Pretrain/Loss": 2.0451693534851074, "Pretrain/Loss (Raw)": 1.9438263177871704, "Pretrain/Step": 5078, "Pretrain/Step Time": 9.56736491061747} +{"Pretrain/Learning Rate": 4.302904320749079e-05, "Pretrain/Loss": 2.0440561771392822, "Pretrain/Loss (Raw)": 1.8724294900894165, "Pretrain/Step": 5079, "Pretrain/Step Time": 9.569904575124383} +{"Pretrain/Learning Rate": 4.302610203774335e-05, "Pretrain/Loss": 2.0427346229553223, "Pretrain/Loss (Raw)": 2.068355083465576, "Pretrain/Step": 5080, "Pretrain/Step Time": 9.56770552508533} +{"Pretrain/Learning Rate": 4.302316034822597e-05, "Pretrain/Loss": 2.0437893867492676, "Pretrain/Loss (Raw)": 2.249842882156372, "Pretrain/Step": 5081, "Pretrain/Step Time": 9.56666591949761} +{"Pretrain/Learning Rate": 4.302021813902346e-05, "Pretrain/Loss": 2.0415310859680176, "Pretrain/Loss (Raw)": 1.949902892112732, "Pretrain/Step": 5082, "Pretrain/Step Time": 9.564398365095258} +{"Pretrain/Learning Rate": 4.301727541022066e-05, "Pretrain/Loss": 2.0407543182373047, "Pretrain/Loss (Raw)": 1.9059710502624512, "Pretrain/Step": 5083, "Pretrain/Step Time": 9.565715791657567} +{"Pretrain/Learning Rate": 4.301433216190244e-05, "Pretrain/Loss": 2.042273998260498, "Pretrain/Loss (Raw)": 2.20063853263855, "Pretrain/Step": 5084, "Pretrain/Step Time": 9.559413738548756} +{"Pretrain/Learning Rate": 4.3011388394153636e-05, "Pretrain/Loss": 2.0435843467712402, "Pretrain/Loss (Raw)": 2.1390492916107178, "Pretrain/Step": 5085, "Pretrain/Step Time": 9.562145674601197} +{"Pretrain/Learning Rate": 4.300844410705915e-05, "Pretrain/Loss": 2.04312801361084, "Pretrain/Loss (Raw)": 2.0087392330169678, "Pretrain/Step": 5086, "Pretrain/Step Time": 9.556679371744394} +{"Pretrain/Learning Rate": 4.300549930070387e-05, "Pretrain/Loss": 2.0456666946411133, "Pretrain/Loss (Raw)": 2.247560977935791, "Pretrain/Step": 5087, "Pretrain/Step Time": 9.561095774173737} +{"Pretrain/Learning Rate": 4.3002553975172714e-05, "Pretrain/Loss": 2.0451161861419678, "Pretrain/Loss (Raw)": 1.9736791849136353, "Pretrain/Step": 5088, "Pretrain/Step Time": 9.562102541327477} +{"Pretrain/Learning Rate": 4.299960813055061e-05, "Pretrain/Loss": 2.043858528137207, "Pretrain/Loss (Raw)": 1.9145339727401733, "Pretrain/Step": 5089, "Pretrain/Step Time": 9.559391777962446} +{"Pretrain/Learning Rate": 4.299666176692248e-05, "Pretrain/Loss": 2.042344808578491, "Pretrain/Loss (Raw)": 1.954030990600586, "Pretrain/Step": 5090, "Pretrain/Step Time": 9.56036907248199} +{"Pretrain/Learning Rate": 4.2993714884373303e-05, "Pretrain/Loss": 2.038278818130493, "Pretrain/Loss (Raw)": 2.049683094024658, "Pretrain/Step": 5091, "Pretrain/Step Time": 9.552310494706035} +{"Pretrain/Learning Rate": 4.299076748298805e-05, "Pretrain/Loss": 2.043487071990967, "Pretrain/Loss (Raw)": 2.586503744125366, "Pretrain/Step": 5092, "Pretrain/Step Time": 9.546407327055931} +{"Pretrain/Learning Rate": 4.2987819562851686e-05, "Pretrain/Loss": 2.0450081825256348, "Pretrain/Loss (Raw)": 2.2044079303741455, "Pretrain/Step": 5093, "Pretrain/Step Time": 9.546691933646798} +{"Pretrain/Learning Rate": 4.298487112404923e-05, "Pretrain/Loss": 2.0452418327331543, "Pretrain/Loss (Raw)": 2.0595648288726807, "Pretrain/Step": 5094, "Pretrain/Step Time": 9.557355463504791} +{"Pretrain/Learning Rate": 4.29819221666657e-05, "Pretrain/Loss": 2.04482364654541, "Pretrain/Loss (Raw)": 2.1024324893951416, "Pretrain/Step": 5095, "Pretrain/Step Time": 9.554434029385448} +{"Pretrain/Learning Rate": 4.297897269078611e-05, "Pretrain/Loss": 2.045360565185547, "Pretrain/Loss (Raw)": 2.0390512943267822, "Pretrain/Step": 5096, "Pretrain/Step Time": 9.554312914609909} +{"Pretrain/Learning Rate": 4.297602269649553e-05, "Pretrain/Loss": 2.0509719848632812, "Pretrain/Loss (Raw)": 2.6285977363586426, "Pretrain/Step": 5097, "Pretrain/Step Time": 9.55198178999126} +{"Pretrain/Learning Rate": 4.2973072183879e-05, "Pretrain/Loss": 2.0485763549804688, "Pretrain/Loss (Raw)": 1.9659305810928345, "Pretrain/Step": 5098, "Pretrain/Step Time": 9.552227851003408} +{"Pretrain/Learning Rate": 4.2970121153021606e-05, "Pretrain/Loss": 2.0451314449310303, "Pretrain/Loss (Raw)": 1.8821213245391846, "Pretrain/Step": 5099, "Pretrain/Step Time": 9.549725426360965} +{"Pretrain/Learning Rate": 4.296716960400843e-05, "Pretrain/Loss": 2.047548294067383, "Pretrain/Loss (Raw)": 2.274618625640869, "Pretrain/Step": 5100, "Pretrain/Step Time": 9.549357948824763} +{"Pretrain/Learning Rate": 4.296421753692459e-05, "Pretrain/Loss": 2.045691967010498, "Pretrain/Loss (Raw)": 2.0063889026641846, "Pretrain/Step": 5101, "Pretrain/Step Time": 9.549149580299854} +{"Pretrain/Learning Rate": 4.2961264951855205e-05, "Pretrain/Loss": 2.0465025901794434, "Pretrain/Loss (Raw)": 2.25343656539917, "Pretrain/Step": 5102, "Pretrain/Step Time": 9.55261392146349} +{"Pretrain/Learning Rate": 4.29583118488854e-05, "Pretrain/Loss": 2.046151638031006, "Pretrain/Loss (Raw)": 2.093571186065674, "Pretrain/Step": 5103, "Pretrain/Step Time": 9.55052293278277} +{"Pretrain/Learning Rate": 4.295535822810034e-05, "Pretrain/Loss": 2.047158718109131, "Pretrain/Loss (Raw)": 2.130854845046997, "Pretrain/Step": 5104, "Pretrain/Step Time": 9.55786014162004} +{"Pretrain/Learning Rate": 4.2952404089585176e-05, "Pretrain/Loss": 2.0463833808898926, "Pretrain/Loss (Raw)": 2.03251051902771, "Pretrain/Step": 5105, "Pretrain/Step Time": 9.555007055401802} +{"Pretrain/Learning Rate": 4.29494494334251e-05, "Pretrain/Loss": 2.0470564365386963, "Pretrain/Loss (Raw)": 2.0088908672332764, "Pretrain/Step": 5106, "Pretrain/Step Time": 9.550233764573932} +{"Pretrain/Learning Rate": 4.29464942597053e-05, "Pretrain/Loss": 2.0484213829040527, "Pretrain/Loss (Raw)": 2.169222831726074, "Pretrain/Step": 5107, "Pretrain/Step Time": 9.551392264664173} +{"Pretrain/Learning Rate": 4.294353856851099e-05, "Pretrain/Loss": 2.0488109588623047, "Pretrain/Loss (Raw)": 1.9795259237289429, "Pretrain/Step": 5108, "Pretrain/Step Time": 9.550055526196957} +{"Pretrain/Learning Rate": 4.29405823599274e-05, "Pretrain/Loss": 2.04807186126709, "Pretrain/Loss (Raw)": 2.0528652667999268, "Pretrain/Step": 5109, "Pretrain/Step Time": 9.556677803397179} +{"Pretrain/Learning Rate": 4.293762563403976e-05, "Pretrain/Loss": 2.048678398132324, "Pretrain/Loss (Raw)": 2.121802568435669, "Pretrain/Step": 5110, "Pretrain/Step Time": 9.555438319221139} +{"Pretrain/Learning Rate": 4.293466839093333e-05, "Pretrain/Loss": 2.0494651794433594, "Pretrain/Loss (Raw)": 2.167707681655884, "Pretrain/Step": 5111, "Pretrain/Step Time": 9.555417807772756} +{"Pretrain/Learning Rate": 4.2931710630693375e-05, "Pretrain/Loss": 2.04984450340271, "Pretrain/Loss (Raw)": 2.093900442123413, "Pretrain/Step": 5112, "Pretrain/Step Time": 9.560277238488197} +{"Pretrain/Learning Rate": 4.2928752353405195e-05, "Pretrain/Loss": 2.0487143993377686, "Pretrain/Loss (Raw)": 2.0406510829925537, "Pretrain/Step": 5113, "Pretrain/Step Time": 9.561011267825961} +{"Pretrain/Learning Rate": 4.292579355915407e-05, "Pretrain/Loss": 2.0495026111602783, "Pretrain/Loss (Raw)": 2.089542865753174, "Pretrain/Step": 5114, "Pretrain/Step Time": 9.562749646604061} +{"Pretrain/Learning Rate": 4.2922834248025336e-05, "Pretrain/Loss": 2.0491886138916016, "Pretrain/Loss (Raw)": 2.0640339851379395, "Pretrain/Step": 5115, "Pretrain/Step Time": 9.557841386646032} +{"Pretrain/Learning Rate": 4.29198744201043e-05, "Pretrain/Loss": 2.0507912635803223, "Pretrain/Loss (Raw)": 1.969440221786499, "Pretrain/Step": 5116, "Pretrain/Step Time": 9.557115521281958} +{"Pretrain/Learning Rate": 4.291691407547632e-05, "Pretrain/Loss": 2.050541877746582, "Pretrain/Loss (Raw)": 2.096315622329712, "Pretrain/Step": 5117, "Pretrain/Step Time": 9.560923585668206} +{"Pretrain/Learning Rate": 4.291395321422676e-05, "Pretrain/Loss": 2.050504207611084, "Pretrain/Loss (Raw)": 2.069650173187256, "Pretrain/Step": 5118, "Pretrain/Step Time": 9.561339864507318} +{"Pretrain/Learning Rate": 4.291099183644098e-05, "Pretrain/Loss": 2.0503997802734375, "Pretrain/Loss (Raw)": 2.215650796890259, "Pretrain/Step": 5119, "Pretrain/Step Time": 9.561838585883379} +{"Pretrain/Learning Rate": 4.2908029942204386e-05, "Pretrain/Loss": 2.0477805137634277, "Pretrain/Loss (Raw)": 1.880959391593933, "Pretrain/Step": 5120, "Pretrain/Step Time": 9.564822234213352} +{"Pretrain/Learning Rate": 4.2905067531602364e-05, "Pretrain/Loss": 2.0479228496551514, "Pretrain/Loss (Raw)": 2.0579440593719482, "Pretrain/Step": 5121, "Pretrain/Step Time": 9.559962473809719} +{"Pretrain/Learning Rate": 4.290210460472035e-05, "Pretrain/Loss": 2.0509867668151855, "Pretrain/Loss (Raw)": 2.5825119018554688, "Pretrain/Step": 5122, "Pretrain/Step Time": 9.560082590207458} +{"Pretrain/Learning Rate": 4.2899141161643766e-05, "Pretrain/Loss": 2.048758029937744, "Pretrain/Loss (Raw)": 1.8454360961914062, "Pretrain/Step": 5123, "Pretrain/Step Time": 9.555043270811439} +{"Pretrain/Learning Rate": 4.289617720245807e-05, "Pretrain/Loss": 2.0488805770874023, "Pretrain/Loss (Raw)": 2.1016252040863037, "Pretrain/Step": 5124, "Pretrain/Step Time": 9.55907061137259} +{"Pretrain/Learning Rate": 4.289321272724871e-05, "Pretrain/Loss": 2.049812078475952, "Pretrain/Loss (Raw)": 2.0869662761688232, "Pretrain/Step": 5125, "Pretrain/Step Time": 9.562028968706727} +{"Pretrain/Learning Rate": 4.2890247736101176e-05, "Pretrain/Loss": 2.0518343448638916, "Pretrain/Loss (Raw)": 2.4047155380249023, "Pretrain/Step": 5126, "Pretrain/Step Time": 9.562100321054459} +{"Pretrain/Learning Rate": 4.288728222910097e-05, "Pretrain/Loss": 2.0507543087005615, "Pretrain/Loss (Raw)": 1.8899375200271606, "Pretrain/Step": 5127, "Pretrain/Step Time": 9.567930387333035} +{"Pretrain/Learning Rate": 4.2884316206333576e-05, "Pretrain/Loss": 2.051586627960205, "Pretrain/Loss (Raw)": 2.131258726119995, "Pretrain/Step": 5128, "Pretrain/Step Time": 9.566595893353224} +{"Pretrain/Learning Rate": 4.288134966788454e-05, "Pretrain/Loss": 2.0507798194885254, "Pretrain/Loss (Raw)": 1.8672268390655518, "Pretrain/Step": 5129, "Pretrain/Step Time": 8.469437833875418} +{"Pretrain/Learning Rate": 4.287838261383939e-05, "Pretrain/Loss": 2.051783561706543, "Pretrain/Loss (Raw)": 2.207935094833374, "Pretrain/Step": 5130, "Pretrain/Step Time": 8.472843296825886} +{"Pretrain/Learning Rate": 4.287541504428368e-05, "Pretrain/Loss": 2.0509634017944336, "Pretrain/Loss (Raw)": 1.6892123222351074, "Pretrain/Step": 5131, "Pretrain/Step Time": 8.47019811347127} +{"Pretrain/Learning Rate": 4.287244695930299e-05, "Pretrain/Loss": 2.050764560699463, "Pretrain/Loss (Raw)": 1.9522058963775635, "Pretrain/Step": 5132, "Pretrain/Step Time": 8.471719436347485} +{"Pretrain/Learning Rate": 4.2869478358982876e-05, "Pretrain/Loss": 2.0508108139038086, "Pretrain/Loss (Raw)": 2.0154638290405273, "Pretrain/Step": 5133, "Pretrain/Step Time": 8.46850484982133} +{"Pretrain/Learning Rate": 4.2866509243408956e-05, "Pretrain/Loss": 2.0505151748657227, "Pretrain/Loss (Raw)": 2.0855190753936768, "Pretrain/Step": 5134, "Pretrain/Step Time": 8.467071371152997} +{"Pretrain/Learning Rate": 4.286353961266684e-05, "Pretrain/Loss": 2.0525128841400146, "Pretrain/Loss (Raw)": 2.0503382682800293, "Pretrain/Step": 5135, "Pretrain/Step Time": 8.467843659222126} +{"Pretrain/Learning Rate": 4.286056946684215e-05, "Pretrain/Loss": 2.0542526245117188, "Pretrain/Loss (Raw)": 2.2591071128845215, "Pretrain/Step": 5136, "Pretrain/Step Time": 8.475893760100007} +{"Pretrain/Learning Rate": 4.2857598806020536e-05, "Pretrain/Loss": 2.0522561073303223, "Pretrain/Loss (Raw)": 1.8140747547149658, "Pretrain/Step": 5137, "Pretrain/Step Time": 8.473576098680496} +{"Pretrain/Learning Rate": 4.285462763028764e-05, "Pretrain/Loss": 2.0538148880004883, "Pretrain/Loss (Raw)": 2.060671091079712, "Pretrain/Step": 5138, "Pretrain/Step Time": 8.473231447860599} +{"Pretrain/Learning Rate": 4.285165593972915e-05, "Pretrain/Loss": 2.0551066398620605, "Pretrain/Loss (Raw)": 2.0271100997924805, "Pretrain/Step": 5139, "Pretrain/Step Time": 8.471149619668722} +{"Pretrain/Learning Rate": 4.284868373443074e-05, "Pretrain/Loss": 2.0542731285095215, "Pretrain/Loss (Raw)": 2.131138324737549, "Pretrain/Step": 5140, "Pretrain/Step Time": 8.465463330969214} +{"Pretrain/Learning Rate": 4.2845711014478116e-05, "Pretrain/Loss": 2.051649570465088, "Pretrain/Loss (Raw)": 1.9606889486312866, "Pretrain/Step": 5141, "Pretrain/Step Time": 8.464857500046492} +{"Pretrain/Learning Rate": 4.2842737779957e-05, "Pretrain/Loss": 2.048973560333252, "Pretrain/Loss (Raw)": 1.542726993560791, "Pretrain/Step": 5142, "Pretrain/Step Time": 8.468293942511082} +{"Pretrain/Learning Rate": 4.283976403095312e-05, "Pretrain/Loss": 2.0462889671325684, "Pretrain/Loss (Raw)": 1.735266923904419, "Pretrain/Step": 5143, "Pretrain/Step Time": 8.46743381768465} +{"Pretrain/Learning Rate": 4.283678976755221e-05, "Pretrain/Loss": 2.0477828979492188, "Pretrain/Loss (Raw)": 2.220128297805786, "Pretrain/Step": 5144, "Pretrain/Step Time": 8.471243433654308} +{"Pretrain/Learning Rate": 4.283381498984006e-05, "Pretrain/Loss": 2.0462143421173096, "Pretrain/Loss (Raw)": 2.1011717319488525, "Pretrain/Step": 5145, "Pretrain/Step Time": 8.469315681606531} +{"Pretrain/Learning Rate": 4.283083969790241e-05, "Pretrain/Loss": 2.0479207038879395, "Pretrain/Loss (Raw)": 2.289046287536621, "Pretrain/Step": 5146, "Pretrain/Step Time": 8.466801965609193} +{"Pretrain/Learning Rate": 4.282786389182507e-05, "Pretrain/Loss": 2.0491743087768555, "Pretrain/Loss (Raw)": 2.194643259048462, "Pretrain/Step": 5147, "Pretrain/Step Time": 8.467264669016004} +{"Pretrain/Learning Rate": 4.282488757169385e-05, "Pretrain/Loss": 2.048328161239624, "Pretrain/Loss (Raw)": 1.8324692249298096, "Pretrain/Step": 5148, "Pretrain/Step Time": 8.465067621320486} +{"Pretrain/Learning Rate": 4.2821910737594554e-05, "Pretrain/Loss": 2.048292636871338, "Pretrain/Loss (Raw)": 1.853422999382019, "Pretrain/Step": 5149, "Pretrain/Step Time": 8.466114705428481} +{"Pretrain/Learning Rate": 4.281893338961304e-05, "Pretrain/Loss": 2.047732353210449, "Pretrain/Loss (Raw)": 2.0020575523376465, "Pretrain/Step": 5150, "Pretrain/Step Time": 8.46522900648415} +{"Pretrain/Learning Rate": 4.281595552783513e-05, "Pretrain/Loss": 2.0484838485717773, "Pretrain/Loss (Raw)": 2.006267547607422, "Pretrain/Step": 5151, "Pretrain/Step Time": 8.46566243097186} +{"Pretrain/Learning Rate": 4.28129771523467e-05, "Pretrain/Loss": 2.0492067337036133, "Pretrain/Loss (Raw)": 2.062121868133545, "Pretrain/Step": 5152, "Pretrain/Step Time": 8.465953195467591} +{"Pretrain/Learning Rate": 4.280999826323363e-05, "Pretrain/Loss": 2.049616813659668, "Pretrain/Loss (Raw)": 1.9057276248931885, "Pretrain/Step": 5153, "Pretrain/Step Time": 8.467943754047155} +{"Pretrain/Learning Rate": 4.280701886058183e-05, "Pretrain/Loss": 2.0517420768737793, "Pretrain/Loss (Raw)": 2.175852060317993, "Pretrain/Step": 5154, "Pretrain/Step Time": 8.467682672664523} +{"Pretrain/Learning Rate": 4.280403894447718e-05, "Pretrain/Loss": 2.0516772270202637, "Pretrain/Loss (Raw)": 2.1501827239990234, "Pretrain/Step": 5155, "Pretrain/Step Time": 8.462073866277933} +{"Pretrain/Learning Rate": 4.280105851500562e-05, "Pretrain/Loss": 2.0529961585998535, "Pretrain/Loss (Raw)": 2.1248342990875244, "Pretrain/Step": 5156, "Pretrain/Step Time": 8.463352419435978} +{"Pretrain/Learning Rate": 4.279807757225309e-05, "Pretrain/Loss": 2.052943706512451, "Pretrain/Loss (Raw)": 1.9708151817321777, "Pretrain/Step": 5157, "Pretrain/Step Time": 8.465378688648343} +{"Pretrain/Learning Rate": 4.279509611630555e-05, "Pretrain/Loss": 2.0541529655456543, "Pretrain/Loss (Raw)": 2.2944281101226807, "Pretrain/Step": 5158, "Pretrain/Step Time": 8.471267480403185} +{"Pretrain/Learning Rate": 4.279211414724894e-05, "Pretrain/Loss": 2.0544252395629883, "Pretrain/Loss (Raw)": 2.0926320552825928, "Pretrain/Step": 5159, "Pretrain/Step Time": 8.469081157818437} +{"Pretrain/Learning Rate": 4.2789131665169266e-05, "Pretrain/Loss": 2.05412220954895, "Pretrain/Loss (Raw)": 2.0518269538879395, "Pretrain/Step": 5160, "Pretrain/Step Time": 8.471503088250756} +{"Pretrain/Learning Rate": 4.2786148670152523e-05, "Pretrain/Loss": 2.0571255683898926, "Pretrain/Loss (Raw)": 2.250769853591919, "Pretrain/Step": 5161, "Pretrain/Step Time": 8.469821432605386} +{"Pretrain/Learning Rate": 4.278316516228472e-05, "Pretrain/Loss": 2.055459976196289, "Pretrain/Loss (Raw)": 1.9965150356292725, "Pretrain/Step": 5162, "Pretrain/Step Time": 8.463674880564213} +{"Pretrain/Learning Rate": 4.27801811416519e-05, "Pretrain/Loss": 2.056784152984619, "Pretrain/Loss (Raw)": 2.122934341430664, "Pretrain/Step": 5163, "Pretrain/Step Time": 8.469435280188918} +{"Pretrain/Learning Rate": 4.2777196608340076e-05, "Pretrain/Loss": 2.056802749633789, "Pretrain/Loss (Raw)": 2.0460243225097656, "Pretrain/Step": 5164, "Pretrain/Step Time": 8.470456102862954} +{"Pretrain/Learning Rate": 4.2774211562435316e-05, "Pretrain/Loss": 2.0567917823791504, "Pretrain/Loss (Raw)": 1.9947329759597778, "Pretrain/Step": 5165, "Pretrain/Step Time": 8.470895515754819} +{"Pretrain/Learning Rate": 4.277122600402371e-05, "Pretrain/Loss": 2.056189775466919, "Pretrain/Loss (Raw)": 2.0574684143066406, "Pretrain/Step": 5166, "Pretrain/Step Time": 8.469837108626962} +{"Pretrain/Learning Rate": 4.2768239933191324e-05, "Pretrain/Loss": 2.0551257133483887, "Pretrain/Loss (Raw)": 1.8995556831359863, "Pretrain/Step": 5167, "Pretrain/Step Time": 8.471758589148521} +{"Pretrain/Learning Rate": 4.2765253350024256e-05, "Pretrain/Loss": 2.0551552772521973, "Pretrain/Loss (Raw)": 1.9203990697860718, "Pretrain/Step": 5168, "Pretrain/Step Time": 8.468391276896} +{"Pretrain/Learning Rate": 4.276226625460865e-05, "Pretrain/Loss": 2.0544815063476562, "Pretrain/Loss (Raw)": 1.9628065824508667, "Pretrain/Step": 5169, "Pretrain/Step Time": 8.46750159189105} +{"Pretrain/Learning Rate": 4.27592786470306e-05, "Pretrain/Loss": 2.0556511878967285, "Pretrain/Loss (Raw)": 2.120778799057007, "Pretrain/Step": 5170, "Pretrain/Step Time": 8.474925396963954} +{"Pretrain/Learning Rate": 4.275629052737628e-05, "Pretrain/Loss": 2.0543923377990723, "Pretrain/Loss (Raw)": 2.083958148956299, "Pretrain/Step": 5171, "Pretrain/Step Time": 8.471731185913086} +{"Pretrain/Learning Rate": 4.275330189573183e-05, "Pretrain/Loss": 2.0544745922088623, "Pretrain/Loss (Raw)": 2.115492343902588, "Pretrain/Step": 5172, "Pretrain/Step Time": 8.470070488750935} +{"Pretrain/Learning Rate": 4.2750312752183454e-05, "Pretrain/Loss": 2.0558009147644043, "Pretrain/Loss (Raw)": 2.076749324798584, "Pretrain/Step": 5173, "Pretrain/Step Time": 8.472748957574368} +{"Pretrain/Learning Rate": 4.27473230968173e-05, "Pretrain/Loss": 2.0575740337371826, "Pretrain/Loss (Raw)": 2.0710322856903076, "Pretrain/Step": 5174, "Pretrain/Step Time": 8.471117429435253} +{"Pretrain/Learning Rate": 4.274433292971961e-05, "Pretrain/Loss": 2.057694435119629, "Pretrain/Loss (Raw)": 2.1518566608428955, "Pretrain/Step": 5175, "Pretrain/Step Time": 8.47562555782497} +{"Pretrain/Learning Rate": 4.274134225097659e-05, "Pretrain/Loss": 2.0583832263946533, "Pretrain/Loss (Raw)": 2.1132845878601074, "Pretrain/Step": 5176, "Pretrain/Step Time": 8.474277729168534} +{"Pretrain/Learning Rate": 4.2738351060674464e-05, "Pretrain/Loss": 2.056570529937744, "Pretrain/Loss (Raw)": 1.8562147617340088, "Pretrain/Step": 5177, "Pretrain/Step Time": 8.475406691432} +{"Pretrain/Learning Rate": 4.273535935889949e-05, "Pretrain/Loss": 2.0548367500305176, "Pretrain/Loss (Raw)": 1.9748685359954834, "Pretrain/Step": 5178, "Pretrain/Step Time": 8.47666623070836} +{"Pretrain/Learning Rate": 4.273236714573794e-05, "Pretrain/Loss": 2.0551271438598633, "Pretrain/Loss (Raw)": 2.0988411903381348, "Pretrain/Step": 5179, "Pretrain/Step Time": 8.4715375918895} +{"Pretrain/Learning Rate": 4.272937442127608e-05, "Pretrain/Loss": 2.053408145904541, "Pretrain/Loss (Raw)": 1.8319995403289795, "Pretrain/Step": 5180, "Pretrain/Step Time": 8.476841049268842} +{"Pretrain/Learning Rate": 4.2726381185600205e-05, "Pretrain/Loss": 2.0540380477905273, "Pretrain/Loss (Raw)": 1.9983657598495483, "Pretrain/Step": 5181, "Pretrain/Step Time": 8.479491962119937} +{"Pretrain/Learning Rate": 4.272338743879664e-05, "Pretrain/Loss": 2.055081367492676, "Pretrain/Loss (Raw)": 2.06204891204834, "Pretrain/Step": 5182, "Pretrain/Step Time": 8.480656864121556} +{"Pretrain/Learning Rate": 4.272039318095167e-05, "Pretrain/Loss": 2.054765224456787, "Pretrain/Loss (Raw)": 2.111698627471924, "Pretrain/Step": 5183, "Pretrain/Step Time": 8.478525457903743} +{"Pretrain/Learning Rate": 4.271739841215166e-05, "Pretrain/Loss": 2.05393123626709, "Pretrain/Loss (Raw)": 1.8659894466400146, "Pretrain/Step": 5184, "Pretrain/Step Time": 8.481099193915725} +{"Pretrain/Learning Rate": 4.271440313248297e-05, "Pretrain/Loss": 2.0568509101867676, "Pretrain/Loss (Raw)": 2.1425297260284424, "Pretrain/Step": 5185, "Pretrain/Step Time": 8.481326391920447} +{"Pretrain/Learning Rate": 4.2711407342031936e-05, "Pretrain/Loss": 2.058426856994629, "Pretrain/Loss (Raw)": 2.1975345611572266, "Pretrain/Step": 5186, "Pretrain/Step Time": 8.477400975301862} +{"Pretrain/Learning Rate": 4.270841104088497e-05, "Pretrain/Loss": 2.0603551864624023, "Pretrain/Loss (Raw)": 2.2278153896331787, "Pretrain/Step": 5187, "Pretrain/Step Time": 8.475837273523211} +{"Pretrain/Learning Rate": 4.270541422912845e-05, "Pretrain/Loss": 2.0572452545166016, "Pretrain/Loss (Raw)": 2.0132696628570557, "Pretrain/Step": 5188, "Pretrain/Step Time": 8.479460436850786} +{"Pretrain/Learning Rate": 4.27024169068488e-05, "Pretrain/Loss": 2.0570452213287354, "Pretrain/Loss (Raw)": 2.0620508193969727, "Pretrain/Step": 5189, "Pretrain/Step Time": 8.484003562480211} +{"Pretrain/Learning Rate": 4.2699419074132424e-05, "Pretrain/Loss": 2.053913116455078, "Pretrain/Loss (Raw)": 1.7642178535461426, "Pretrain/Step": 5190, "Pretrain/Step Time": 8.483061702921987} +{"Pretrain/Learning Rate": 4.2696420731065776e-05, "Pretrain/Loss": 2.051204204559326, "Pretrain/Loss (Raw)": 1.67376708984375, "Pretrain/Step": 5191, "Pretrain/Step Time": 8.481663355603814} +{"Pretrain/Learning Rate": 4.269342187773532e-05, "Pretrain/Loss": 2.0520284175872803, "Pretrain/Loss (Raw)": 2.14713191986084, "Pretrain/Step": 5192, "Pretrain/Step Time": 8.488199902698398} +{"Pretrain/Learning Rate": 4.2690422514227516e-05, "Pretrain/Loss": 2.0514323711395264, "Pretrain/Loss (Raw)": 2.0376291275024414, "Pretrain/Step": 5193, "Pretrain/Step Time": 8.487401278689504} +{"Pretrain/Learning Rate": 4.268742264062885e-05, "Pretrain/Loss": 2.0542688369750977, "Pretrain/Loss (Raw)": 2.303914785385132, "Pretrain/Step": 5194, "Pretrain/Step Time": 8.495228020474315} +{"Pretrain/Learning Rate": 4.2684422257025827e-05, "Pretrain/Loss": 2.053241729736328, "Pretrain/Loss (Raw)": 2.192462682723999, "Pretrain/Step": 5195, "Pretrain/Step Time": 8.489819582551718} +{"Pretrain/Learning Rate": 4.268142136350494e-05, "Pretrain/Loss": 2.05212140083313, "Pretrain/Loss (Raw)": 1.946077585220337, "Pretrain/Step": 5196, "Pretrain/Step Time": 8.494646364822984} +{"Pretrain/Learning Rate": 4.267841996015274e-05, "Pretrain/Loss": 2.0557522773742676, "Pretrain/Loss (Raw)": 1.9346903562545776, "Pretrain/Step": 5197, "Pretrain/Step Time": 8.49643318541348} +{"Pretrain/Learning Rate": 4.267541804705577e-05, "Pretrain/Loss": 2.055739641189575, "Pretrain/Loss (Raw)": 2.1806223392486572, "Pretrain/Step": 5198, "Pretrain/Step Time": 8.497673373669386} +{"Pretrain/Learning Rate": 4.2672415624300575e-05, "Pretrain/Loss": 2.0544872283935547, "Pretrain/Loss (Raw)": 2.017941951751709, "Pretrain/Step": 5199, "Pretrain/Step Time": 8.498912051320076} +{"Pretrain/Learning Rate": 4.266941269197373e-05, "Pretrain/Loss": 2.054004192352295, "Pretrain/Loss (Raw)": 2.0637810230255127, "Pretrain/Step": 5200, "Pretrain/Step Time": 8.496176762506366} +{"Pretrain/Learning Rate": 4.266640925016182e-05, "Pretrain/Loss": 2.0543322563171387, "Pretrain/Loss (Raw)": 2.032351493835449, "Pretrain/Step": 5201, "Pretrain/Step Time": 8.497346805408597} +{"Pretrain/Learning Rate": 4.266340529895147e-05, "Pretrain/Loss": 2.052093505859375, "Pretrain/Loss (Raw)": 1.5618900060653687, "Pretrain/Step": 5202, "Pretrain/Step Time": 8.499221475794911} +{"Pretrain/Learning Rate": 4.266040083842927e-05, "Pretrain/Loss": 2.0565881729125977, "Pretrain/Loss (Raw)": 2.491196870803833, "Pretrain/Step": 5203, "Pretrain/Step Time": 8.494157647714019} +{"Pretrain/Learning Rate": 4.2657395868681865e-05, "Pretrain/Loss": 2.059441566467285, "Pretrain/Loss (Raw)": 2.2718465328216553, "Pretrain/Step": 5204, "Pretrain/Step Time": 8.488165404647589} +{"Pretrain/Learning Rate": 4.26543903897959e-05, "Pretrain/Loss": 2.0615477561950684, "Pretrain/Loss (Raw)": 2.245905637741089, "Pretrain/Step": 5205, "Pretrain/Step Time": 8.488773562014103} +{"Pretrain/Learning Rate": 4.265138440185803e-05, "Pretrain/Loss": 2.063106060028076, "Pretrain/Loss (Raw)": 2.1433002948760986, "Pretrain/Step": 5206, "Pretrain/Step Time": 8.489359242841601} +{"Pretrain/Learning Rate": 4.264837790495493e-05, "Pretrain/Loss": 2.0619263648986816, "Pretrain/Loss (Raw)": 1.7214041948318481, "Pretrain/Step": 5207, "Pretrain/Step Time": 8.489016892388463} +{"Pretrain/Learning Rate": 4.26453708991733e-05, "Pretrain/Loss": 2.060762405395508, "Pretrain/Loss (Raw)": 1.919376254081726, "Pretrain/Step": 5208, "Pretrain/Step Time": 8.492121012881398} +{"Pretrain/Learning Rate": 4.264236338459984e-05, "Pretrain/Loss": 2.0600011348724365, "Pretrain/Loss (Raw)": 2.1523854732513428, "Pretrain/Step": 5209, "Pretrain/Step Time": 8.496046874672174} +{"Pretrain/Learning Rate": 4.2639355361321264e-05, "Pretrain/Loss": 2.0597352981567383, "Pretrain/Loss (Raw)": 1.9159036874771118, "Pretrain/Step": 5210, "Pretrain/Step Time": 8.496684795245528} +{"Pretrain/Learning Rate": 4.2636346829424314e-05, "Pretrain/Loss": 2.0613067150115967, "Pretrain/Loss (Raw)": 2.107095241546631, "Pretrain/Step": 5211, "Pretrain/Step Time": 8.499558666720986} +{"Pretrain/Learning Rate": 4.263333778899574e-05, "Pretrain/Loss": 2.057260036468506, "Pretrain/Loss (Raw)": 1.6826719045639038, "Pretrain/Step": 5212, "Pretrain/Step Time": 8.497221929952502} +{"Pretrain/Learning Rate": 4.2630328240122294e-05, "Pretrain/Loss": 2.056318998336792, "Pretrain/Loss (Raw)": 2.018596649169922, "Pretrain/Step": 5213, "Pretrain/Step Time": 8.499672662466764} +{"Pretrain/Learning Rate": 4.262731818289077e-05, "Pretrain/Loss": 2.056612968444824, "Pretrain/Loss (Raw)": 2.0463476181030273, "Pretrain/Step": 5214, "Pretrain/Step Time": 8.500324698165059} +{"Pretrain/Learning Rate": 4.2624307617387946e-05, "Pretrain/Loss": 2.0537257194519043, "Pretrain/Loss (Raw)": 1.8780103921890259, "Pretrain/Step": 5215, "Pretrain/Step Time": 8.494697788730264} +{"Pretrain/Learning Rate": 4.262129654370064e-05, "Pretrain/Loss": 2.053439140319824, "Pretrain/Loss (Raw)": 1.9370074272155762, "Pretrain/Step": 5216, "Pretrain/Step Time": 8.49362000823021} +{"Pretrain/Learning Rate": 4.261828496191567e-05, "Pretrain/Loss": 2.05511474609375, "Pretrain/Loss (Raw)": 2.128995656967163, "Pretrain/Step": 5217, "Pretrain/Step Time": 8.497707810252905} +{"Pretrain/Learning Rate": 4.261527287211987e-05, "Pretrain/Loss": 2.055882215499878, "Pretrain/Loss (Raw)": 2.052274465560913, "Pretrain/Step": 5218, "Pretrain/Step Time": 8.495322806760669} +{"Pretrain/Learning Rate": 4.26122602744001e-05, "Pretrain/Loss": 2.057859420776367, "Pretrain/Loss (Raw)": 2.3027398586273193, "Pretrain/Step": 5219, "Pretrain/Step Time": 8.496052591130137} +{"Pretrain/Learning Rate": 4.260924716884321e-05, "Pretrain/Loss": 2.053311347961426, "Pretrain/Loss (Raw)": 2.0043692588806152, "Pretrain/Step": 5220, "Pretrain/Step Time": 8.4929252974689} +{"Pretrain/Learning Rate": 4.26062335555361e-05, "Pretrain/Loss": 2.050492286682129, "Pretrain/Loss (Raw)": 1.8435829877853394, "Pretrain/Step": 5221, "Pretrain/Step Time": 8.494450544938445} +{"Pretrain/Learning Rate": 4.2603219434565664e-05, "Pretrain/Loss": 2.051509380340576, "Pretrain/Loss (Raw)": 2.1897671222686768, "Pretrain/Step": 5222, "Pretrain/Step Time": 8.488573994487524} +{"Pretrain/Learning Rate": 4.2600204806018796e-05, "Pretrain/Loss": 2.05039644241333, "Pretrain/Loss (Raw)": 1.9599474668502808, "Pretrain/Step": 5223, "Pretrain/Step Time": 8.492295799776912} +{"Pretrain/Learning Rate": 4.259718966998243e-05, "Pretrain/Loss": 2.0514743328094482, "Pretrain/Loss (Raw)": 2.1770107746124268, "Pretrain/Step": 5224, "Pretrain/Step Time": 8.490582393482327} +{"Pretrain/Learning Rate": 4.259417402654351e-05, "Pretrain/Loss": 2.047560453414917, "Pretrain/Loss (Raw)": 2.1276257038116455, "Pretrain/Step": 5225, "Pretrain/Step Time": 8.492782730609179} +{"Pretrain/Learning Rate": 4.259115787578898e-05, "Pretrain/Loss": 2.0523247718811035, "Pretrain/Loss (Raw)": 2.5758004188537598, "Pretrain/Step": 5226, "Pretrain/Step Time": 8.491566244512796} +{"Pretrain/Learning Rate": 4.2588141217805813e-05, "Pretrain/Loss": 2.0549986362457275, "Pretrain/Loss (Raw)": 2.2243425846099854, "Pretrain/Step": 5227, "Pretrain/Step Time": 8.491933749988675} +{"Pretrain/Learning Rate": 4.258512405268099e-05, "Pretrain/Loss": 2.0524871349334717, "Pretrain/Loss (Raw)": 1.9531694650650024, "Pretrain/Step": 5228, "Pretrain/Step Time": 8.490159699693322} +{"Pretrain/Learning Rate": 4.258210638050152e-05, "Pretrain/Loss": 2.0536468029022217, "Pretrain/Loss (Raw)": 2.1548008918762207, "Pretrain/Step": 5229, "Pretrain/Step Time": 8.497124541550875} +{"Pretrain/Learning Rate": 4.25790882013544e-05, "Pretrain/Loss": 2.049710750579834, "Pretrain/Loss (Raw)": 1.749625325202942, "Pretrain/Step": 5230, "Pretrain/Step Time": 8.491511998698115} +{"Pretrain/Learning Rate": 4.257606951532667e-05, "Pretrain/Loss": 2.0483429431915283, "Pretrain/Loss (Raw)": 1.9184988737106323, "Pretrain/Step": 5231, "Pretrain/Step Time": 8.488387918099761} +{"Pretrain/Learning Rate": 4.257305032250536e-05, "Pretrain/Loss": 2.0499703884124756, "Pretrain/Loss (Raw)": 2.3391659259796143, "Pretrain/Step": 5232, "Pretrain/Step Time": 8.485905414447188} +{"Pretrain/Learning Rate": 4.2570030622977536e-05, "Pretrain/Loss": 2.048583507537842, "Pretrain/Loss (Raw)": 1.854978084564209, "Pretrain/Step": 5233, "Pretrain/Step Time": 8.488803118467331} +{"Pretrain/Learning Rate": 4.256701041683027e-05, "Pretrain/Loss": 2.05007266998291, "Pretrain/Loss (Raw)": 2.1995248794555664, "Pretrain/Step": 5234, "Pretrain/Step Time": 8.488236349076033} +{"Pretrain/Learning Rate": 4.256398970415063e-05, "Pretrain/Loss": 2.0482044219970703, "Pretrain/Loss (Raw)": 1.9300531148910522, "Pretrain/Step": 5235, "Pretrain/Step Time": 8.491028720512986} +{"Pretrain/Learning Rate": 4.2560968485025737e-05, "Pretrain/Loss": 2.048757553100586, "Pretrain/Loss (Raw)": 2.0503556728363037, "Pretrain/Step": 5236, "Pretrain/Step Time": 8.490812085568905} +{"Pretrain/Learning Rate": 4.25579467595427e-05, "Pretrain/Loss": 2.0486559867858887, "Pretrain/Loss (Raw)": 2.039844036102295, "Pretrain/Step": 5237, "Pretrain/Step Time": 8.486251829192042} +{"Pretrain/Learning Rate": 4.2554924527788635e-05, "Pretrain/Loss": 2.0486254692077637, "Pretrain/Loss (Raw)": 2.117924928665161, "Pretrain/Step": 5238, "Pretrain/Step Time": 8.487828643992543} +{"Pretrain/Learning Rate": 4.25519017898507e-05, "Pretrain/Loss": 2.0450925827026367, "Pretrain/Loss (Raw)": 1.7154839038848877, "Pretrain/Step": 5239, "Pretrain/Step Time": 8.49425420165062} +{"Pretrain/Learning Rate": 4.254887854581606e-05, "Pretrain/Loss": 2.0449459552764893, "Pretrain/Loss (Raw)": 2.0751302242279053, "Pretrain/Step": 5240, "Pretrain/Step Time": 8.492450848221779} +{"Pretrain/Learning Rate": 4.2545854795771865e-05, "Pretrain/Loss": 2.044564962387085, "Pretrain/Loss (Raw)": 1.9918855428695679, "Pretrain/Step": 5241, "Pretrain/Step Time": 8.491609314456582} +{"Pretrain/Learning Rate": 4.2542830539805326e-05, "Pretrain/Loss": 2.0426759719848633, "Pretrain/Loss (Raw)": 1.847765326499939, "Pretrain/Step": 5242, "Pretrain/Step Time": 8.491057747974992} +{"Pretrain/Learning Rate": 4.2539805778003634e-05, "Pretrain/Loss": 2.0423450469970703, "Pretrain/Loss (Raw)": 2.0216596126556396, "Pretrain/Step": 5243, "Pretrain/Step Time": 8.487662848085165} +{"Pretrain/Learning Rate": 4.2536780510454005e-05, "Pretrain/Loss": 2.0437827110290527, "Pretrain/Loss (Raw)": 2.1534640789031982, "Pretrain/Step": 5244, "Pretrain/Step Time": 8.49246366508305} +{"Pretrain/Learning Rate": 4.253375473724367e-05, "Pretrain/Loss": 2.0418894290924072, "Pretrain/Loss (Raw)": 1.8539756536483765, "Pretrain/Step": 5245, "Pretrain/Step Time": 8.48872122913599} +{"Pretrain/Learning Rate": 4.253072845845988e-05, "Pretrain/Loss": 2.041294574737549, "Pretrain/Loss (Raw)": 1.9935190677642822, "Pretrain/Step": 5246, "Pretrain/Step Time": 8.48689111508429} +{"Pretrain/Learning Rate": 4.2527701674189897e-05, "Pretrain/Loss": 2.040933847427368, "Pretrain/Loss (Raw)": 2.169462203979492, "Pretrain/Step": 5247, "Pretrain/Step Time": 8.491532392799854} +{"Pretrain/Learning Rate": 4.252467438452099e-05, "Pretrain/Loss": 2.0429372787475586, "Pretrain/Loss (Raw)": 2.1374051570892334, "Pretrain/Step": 5248, "Pretrain/Step Time": 8.484054142609239} +{"Pretrain/Learning Rate": 4.252164658954045e-05, "Pretrain/Loss": 2.0444111824035645, "Pretrain/Loss (Raw)": 2.246598720550537, "Pretrain/Step": 5249, "Pretrain/Step Time": 8.486910136416554} +{"Pretrain/Learning Rate": 4.2518618289335585e-05, "Pretrain/Loss": 2.04079008102417, "Pretrain/Loss (Raw)": 2.1190123558044434, "Pretrain/Step": 5250, "Pretrain/Step Time": 8.486644826829433} +{"Pretrain/Learning Rate": 4.25155894839937e-05, "Pretrain/Loss": 2.041107177734375, "Pretrain/Loss (Raw)": 1.8860474824905396, "Pretrain/Step": 5251, "Pretrain/Step Time": 8.483984962105751} +{"Pretrain/Learning Rate": 4.2512560173602154e-05, "Pretrain/Loss": 2.0444846153259277, "Pretrain/Loss (Raw)": 2.533936023712158, "Pretrain/Step": 5252, "Pretrain/Step Time": 8.486228363588452} +{"Pretrain/Learning Rate": 4.2509530358248274e-05, "Pretrain/Loss": 2.044081211090088, "Pretrain/Loss (Raw)": 2.0353174209594727, "Pretrain/Step": 5253, "Pretrain/Step Time": 8.484462449327111} +{"Pretrain/Learning Rate": 4.250650003801944e-05, "Pretrain/Loss": 2.0414812564849854, "Pretrain/Loss (Raw)": 2.0719218254089355, "Pretrain/Step": 5254, "Pretrain/Step Time": 8.484245648607612} +{"Pretrain/Learning Rate": 4.2503469213003e-05, "Pretrain/Loss": 2.0435171127319336, "Pretrain/Loss (Raw)": 2.1505322456359863, "Pretrain/Step": 5255, "Pretrain/Step Time": 8.481079317629337} +{"Pretrain/Learning Rate": 4.250043788328638e-05, "Pretrain/Loss": 2.0424227714538574, "Pretrain/Loss (Raw)": 1.9911925792694092, "Pretrain/Step": 5256, "Pretrain/Step Time": 8.48524497076869} +{"Pretrain/Learning Rate": 4.249740604895696e-05, "Pretrain/Loss": 2.042515516281128, "Pretrain/Loss (Raw)": 1.8790642023086548, "Pretrain/Step": 5257, "Pretrain/Step Time": 8.489638825878501} +{"Pretrain/Learning Rate": 4.249437371010218e-05, "Pretrain/Loss": 2.040435314178467, "Pretrain/Loss (Raw)": 1.9416825771331787, "Pretrain/Step": 5258, "Pretrain/Step Time": 8.486788712441921} +{"Pretrain/Learning Rate": 4.249134086680946e-05, "Pretrain/Loss": 2.0423483848571777, "Pretrain/Loss (Raw)": 1.9341093301773071, "Pretrain/Step": 5259, "Pretrain/Step Time": 8.48603887297213} +{"Pretrain/Learning Rate": 4.2488307519166257e-05, "Pretrain/Loss": 2.0449912548065186, "Pretrain/Loss (Raw)": 2.2904608249664307, "Pretrain/Step": 5260, "Pretrain/Step Time": 8.484724374487996} +{"Pretrain/Learning Rate": 4.248527366726005e-05, "Pretrain/Loss": 2.0446228981018066, "Pretrain/Loss (Raw)": 1.968326449394226, "Pretrain/Step": 5261, "Pretrain/Step Time": 8.48781355470419} +{"Pretrain/Learning Rate": 4.248223931117829e-05, "Pretrain/Loss": 2.048445701599121, "Pretrain/Loss (Raw)": 2.574815511703491, "Pretrain/Step": 5262, "Pretrain/Step Time": 8.488637447357178} +{"Pretrain/Learning Rate": 4.247920445100848e-05, "Pretrain/Loss": 2.0482888221740723, "Pretrain/Loss (Raw)": 2.030290126800537, "Pretrain/Step": 5263, "Pretrain/Step Time": 8.488231463357806} +{"Pretrain/Learning Rate": 4.247616908683814e-05, "Pretrain/Loss": 2.0474987030029297, "Pretrain/Loss (Raw)": 2.157945156097412, "Pretrain/Step": 5264, "Pretrain/Step Time": 8.486612677574158} +{"Pretrain/Learning Rate": 4.247313321875478e-05, "Pretrain/Loss": 2.048158645629883, "Pretrain/Loss (Raw)": 1.898546576499939, "Pretrain/Step": 5265, "Pretrain/Step Time": 8.488060241565108} +{"Pretrain/Learning Rate": 4.2470096846845944e-05, "Pretrain/Loss": 2.045999526977539, "Pretrain/Loss (Raw)": 1.784325361251831, "Pretrain/Step": 5266, "Pretrain/Step Time": 8.490469504147768} +{"Pretrain/Learning Rate": 4.246705997119918e-05, "Pretrain/Loss": 2.047011137008667, "Pretrain/Loss (Raw)": 2.15659761428833, "Pretrain/Step": 5267, "Pretrain/Step Time": 8.487888038158417} +{"Pretrain/Learning Rate": 4.2464022591902055e-05, "Pretrain/Loss": 2.046786308288574, "Pretrain/Loss (Raw)": 2.102358818054199, "Pretrain/Step": 5268, "Pretrain/Step Time": 8.486916191875935} +{"Pretrain/Learning Rate": 4.246098470904215e-05, "Pretrain/Loss": 2.0469822883605957, "Pretrain/Loss (Raw)": 1.9857721328735352, "Pretrain/Step": 5269, "Pretrain/Step Time": 8.49037453532219} +{"Pretrain/Learning Rate": 4.2457946322707055e-05, "Pretrain/Loss": 2.047999382019043, "Pretrain/Loss (Raw)": 1.6729260683059692, "Pretrain/Step": 5270, "Pretrain/Step Time": 8.490427665412426} +{"Pretrain/Learning Rate": 4.245490743298439e-05, "Pretrain/Loss": 2.0526270866394043, "Pretrain/Loss (Raw)": 2.3275794982910156, "Pretrain/Step": 5271, "Pretrain/Step Time": 8.49118953384459} +{"Pretrain/Learning Rate": 4.245186803996177e-05, "Pretrain/Loss": 2.0523321628570557, "Pretrain/Loss (Raw)": 2.1823863983154297, "Pretrain/Step": 5272, "Pretrain/Step Time": 8.490986132994294} +{"Pretrain/Learning Rate": 4.244882814372685e-05, "Pretrain/Loss": 2.0513548851013184, "Pretrain/Loss (Raw)": 1.9760916233062744, "Pretrain/Step": 5273, "Pretrain/Step Time": 8.498762743547559} +{"Pretrain/Learning Rate": 4.244578774436726e-05, "Pretrain/Loss": 2.049076557159424, "Pretrain/Loss (Raw)": 1.9974437952041626, "Pretrain/Step": 5274, "Pretrain/Step Time": 8.497149819508195} +{"Pretrain/Learning Rate": 4.2442746841970684e-05, "Pretrain/Loss": 2.0485827922821045, "Pretrain/Loss (Raw)": 2.1314303874969482, "Pretrain/Step": 5275, "Pretrain/Step Time": 8.496739733964205} +{"Pretrain/Learning Rate": 4.243970543662479e-05, "Pretrain/Loss": 2.048516273498535, "Pretrain/Loss (Raw)": 1.8239256143569946, "Pretrain/Step": 5276, "Pretrain/Step Time": 8.497412139549851} +{"Pretrain/Learning Rate": 4.2436663528417295e-05, "Pretrain/Loss": 2.04899263381958, "Pretrain/Loss (Raw)": 1.9144245386123657, "Pretrain/Step": 5277, "Pretrain/Step Time": 8.493849106132984} +{"Pretrain/Learning Rate": 4.24336211174359e-05, "Pretrain/Loss": 2.0484907627105713, "Pretrain/Loss (Raw)": 1.9378056526184082, "Pretrain/Step": 5278, "Pretrain/Step Time": 8.494552846997976} +{"Pretrain/Learning Rate": 4.243057820376831e-05, "Pretrain/Loss": 2.0490307807922363, "Pretrain/Loss (Raw)": 2.075382709503174, "Pretrain/Step": 5279, "Pretrain/Step Time": 8.498125465586782} +{"Pretrain/Learning Rate": 4.242753478750231e-05, "Pretrain/Loss": 2.0487542152404785, "Pretrain/Loss (Raw)": 2.0267295837402344, "Pretrain/Step": 5280, "Pretrain/Step Time": 8.498415546491742} +{"Pretrain/Learning Rate": 4.2424490868725616e-05, "Pretrain/Loss": 2.049531936645508, "Pretrain/Loss (Raw)": 2.005279541015625, "Pretrain/Step": 5281, "Pretrain/Step Time": 8.496487185359001} +{"Pretrain/Learning Rate": 4.2421446447526015e-05, "Pretrain/Loss": 2.050330638885498, "Pretrain/Loss (Raw)": 2.2780840396881104, "Pretrain/Step": 5282, "Pretrain/Step Time": 8.502732312306762} +{"Pretrain/Learning Rate": 4.241840152399129e-05, "Pretrain/Loss": 2.049415111541748, "Pretrain/Loss (Raw)": 2.033003807067871, "Pretrain/Step": 5283, "Pretrain/Step Time": 8.503288956359029} +{"Pretrain/Learning Rate": 4.241535609820922e-05, "Pretrain/Loss": 2.0503759384155273, "Pretrain/Loss (Raw)": 2.2478129863739014, "Pretrain/Step": 5284, "Pretrain/Step Time": 8.499772058799863} +{"Pretrain/Learning Rate": 4.241231017026766e-05, "Pretrain/Loss": 2.054131031036377, "Pretrain/Loss (Raw)": 2.4514482021331787, "Pretrain/Step": 5285, "Pretrain/Step Time": 8.49756489880383} +{"Pretrain/Learning Rate": 4.240926374025439e-05, "Pretrain/Loss": 2.0539002418518066, "Pretrain/Loss (Raw)": 2.2649192810058594, "Pretrain/Step": 5286, "Pretrain/Step Time": 8.497534334659576} +{"Pretrain/Learning Rate": 4.240621680825729e-05, "Pretrain/Loss": 2.05313777923584, "Pretrain/Loss (Raw)": 1.9950076341629028, "Pretrain/Step": 5287, "Pretrain/Step Time": 8.497945543378592} +{"Pretrain/Learning Rate": 4.2403169374364184e-05, "Pretrain/Loss": 2.052180767059326, "Pretrain/Loss (Raw)": 1.9293326139450073, "Pretrain/Step": 5288, "Pretrain/Step Time": 8.49787949025631} +{"Pretrain/Learning Rate": 4.2400121438662966e-05, "Pretrain/Loss": 2.0511698722839355, "Pretrain/Loss (Raw)": 2.121405601501465, "Pretrain/Step": 5289, "Pretrain/Step Time": 8.50316995754838} +{"Pretrain/Learning Rate": 4.239707300124151e-05, "Pretrain/Loss": 2.050370216369629, "Pretrain/Loss (Raw)": 1.89415442943573, "Pretrain/Step": 5290, "Pretrain/Step Time": 8.50577723607421} +{"Pretrain/Learning Rate": 4.239402406218772e-05, "Pretrain/Loss": 2.0500121116638184, "Pretrain/Loss (Raw)": 2.0770840644836426, "Pretrain/Step": 5291, "Pretrain/Step Time": 8.497742781415582} +{"Pretrain/Learning Rate": 4.23909746215895e-05, "Pretrain/Loss": 2.048394203186035, "Pretrain/Loss (Raw)": 1.838905692100525, "Pretrain/Step": 5292, "Pretrain/Step Time": 8.499305563047528} +{"Pretrain/Learning Rate": 4.23879246795348e-05, "Pretrain/Loss": 2.0497000217437744, "Pretrain/Loss (Raw)": 2.161903142929077, "Pretrain/Step": 5293, "Pretrain/Step Time": 8.500419087707996} +{"Pretrain/Learning Rate": 4.2384874236111535e-05, "Pretrain/Loss": 2.047428607940674, "Pretrain/Loss (Raw)": 1.7667301893234253, "Pretrain/Step": 5294, "Pretrain/Step Time": 8.499236136674881} +{"Pretrain/Learning Rate": 4.238182329140768e-05, "Pretrain/Loss": 2.0474321842193604, "Pretrain/Loss (Raw)": 1.900020718574524, "Pretrain/Step": 5295, "Pretrain/Step Time": 8.504909129813313} +{"Pretrain/Learning Rate": 4.237877184551122e-05, "Pretrain/Loss": 2.051133394241333, "Pretrain/Loss (Raw)": 2.3941500186920166, "Pretrain/Step": 5296, "Pretrain/Step Time": 8.50255087390542} +{"Pretrain/Learning Rate": 4.237571989851011e-05, "Pretrain/Loss": 2.051931858062744, "Pretrain/Loss (Raw)": 2.065002918243408, "Pretrain/Step": 5297, "Pretrain/Step Time": 8.505074553191662} +{"Pretrain/Learning Rate": 4.2372667450492364e-05, "Pretrain/Loss": 2.049564838409424, "Pretrain/Loss (Raw)": 1.817782998085022, "Pretrain/Step": 5298, "Pretrain/Step Time": 8.499800853431225} +{"Pretrain/Learning Rate": 4.236961450154601e-05, "Pretrain/Loss": 2.0491652488708496, "Pretrain/Loss (Raw)": 2.0328049659729004, "Pretrain/Step": 5299, "Pretrain/Step Time": 8.501935301348567} +{"Pretrain/Learning Rate": 4.2366561051759055e-05, "Pretrain/Loss": 2.048231840133667, "Pretrain/Loss (Raw)": 1.9960358142852783, "Pretrain/Step": 5300, "Pretrain/Step Time": 8.501919411122799} +{"Pretrain/Learning Rate": 4.2363507101219564e-05, "Pretrain/Loss": 2.047224283218384, "Pretrain/Loss (Raw)": 1.9477828741073608, "Pretrain/Step": 5301, "Pretrain/Step Time": 8.50124592334032} +{"Pretrain/Learning Rate": 4.236045265001558e-05, "Pretrain/Loss": 2.0470926761627197, "Pretrain/Loss (Raw)": 2.0541961193084717, "Pretrain/Step": 5302, "Pretrain/Step Time": 8.50136436149478} +{"Pretrain/Learning Rate": 4.235739769823519e-05, "Pretrain/Loss": 2.0478458404541016, "Pretrain/Loss (Raw)": 2.2482354640960693, "Pretrain/Step": 5303, "Pretrain/Step Time": 8.502678241580725} +{"Pretrain/Learning Rate": 4.235434224596647e-05, "Pretrain/Loss": 2.047513008117676, "Pretrain/Loss (Raw)": 2.0707123279571533, "Pretrain/Step": 5304, "Pretrain/Step Time": 8.505403906106949} +{"Pretrain/Learning Rate": 4.235128629329752e-05, "Pretrain/Loss": 2.0500283241271973, "Pretrain/Loss (Raw)": 2.178166151046753, "Pretrain/Step": 5305, "Pretrain/Step Time": 8.509032994508743} +{"Pretrain/Learning Rate": 4.2348229840316465e-05, "Pretrain/Loss": 2.050689220428467, "Pretrain/Loss (Raw)": 2.0594468116760254, "Pretrain/Step": 5306, "Pretrain/Step Time": 8.506703993305564} +{"Pretrain/Learning Rate": 4.2345172887111435e-05, "Pretrain/Loss": 2.049269676208496, "Pretrain/Loss (Raw)": 1.9171373844146729, "Pretrain/Step": 5307, "Pretrain/Step Time": 8.508066594600677} +{"Pretrain/Learning Rate": 4.234211543377057e-05, "Pretrain/Loss": 2.0495848655700684, "Pretrain/Loss (Raw)": 1.8723548650741577, "Pretrain/Step": 5308, "Pretrain/Step Time": 8.503643814474344} +{"Pretrain/Learning Rate": 4.233905748038203e-05, "Pretrain/Loss": 2.0492963790893555, "Pretrain/Loss (Raw)": 1.961445927619934, "Pretrain/Step": 5309, "Pretrain/Step Time": 8.501951994374394} +{"Pretrain/Learning Rate": 4.233599902703399e-05, "Pretrain/Loss": 2.0484910011291504, "Pretrain/Loss (Raw)": 1.9589641094207764, "Pretrain/Step": 5310, "Pretrain/Step Time": 8.499610951170325} +{"Pretrain/Learning Rate": 4.2332940073814644e-05, "Pretrain/Loss": 2.048491954803467, "Pretrain/Loss (Raw)": 2.1117982864379883, "Pretrain/Step": 5311, "Pretrain/Step Time": 8.499203011393547} +{"Pretrain/Learning Rate": 4.2329880620812193e-05, "Pretrain/Loss": 2.0495100021362305, "Pretrain/Loss (Raw)": 1.9963072538375854, "Pretrain/Step": 5312, "Pretrain/Step Time": 8.505179712548852} +{"Pretrain/Learning Rate": 4.232682066811484e-05, "Pretrain/Loss": 2.0475029945373535, "Pretrain/Loss (Raw)": 1.8856174945831299, "Pretrain/Step": 5313, "Pretrain/Step Time": 8.508588811382651} +{"Pretrain/Learning Rate": 4.2323760215810836e-05, "Pretrain/Loss": 2.0463995933532715, "Pretrain/Loss (Raw)": 2.05629825592041, "Pretrain/Step": 5314, "Pretrain/Step Time": 8.508815359324217} +{"Pretrain/Learning Rate": 4.2320699263988416e-05, "Pretrain/Loss": 2.0457334518432617, "Pretrain/Loss (Raw)": 2.1425585746765137, "Pretrain/Step": 5315, "Pretrain/Step Time": 8.511592356488109} +{"Pretrain/Learning Rate": 4.231763781273584e-05, "Pretrain/Loss": 2.0456337928771973, "Pretrain/Loss (Raw)": 2.000546455383301, "Pretrain/Step": 5316, "Pretrain/Step Time": 8.504459792748094} +{"Pretrain/Learning Rate": 4.2314575862141394e-05, "Pretrain/Loss": 2.046562433242798, "Pretrain/Loss (Raw)": 2.1808838844299316, "Pretrain/Step": 5317, "Pretrain/Step Time": 8.500499000772834} +{"Pretrain/Learning Rate": 4.231151341229335e-05, "Pretrain/Loss": 2.0493757724761963, "Pretrain/Loss (Raw)": 2.1243433952331543, "Pretrain/Step": 5318, "Pretrain/Step Time": 8.501369742676616} +{"Pretrain/Learning Rate": 4.230845046328002e-05, "Pretrain/Loss": 2.052452802658081, "Pretrain/Loss (Raw)": 2.0676190853118896, "Pretrain/Step": 5319, "Pretrain/Step Time": 8.503217475488782} +{"Pretrain/Learning Rate": 4.230538701518973e-05, "Pretrain/Loss": 2.052161931991577, "Pretrain/Loss (Raw)": 2.10990571975708, "Pretrain/Step": 5320, "Pretrain/Step Time": 8.496839053928852} +{"Pretrain/Learning Rate": 4.23023230681108e-05, "Pretrain/Loss": 2.0517287254333496, "Pretrain/Loss (Raw)": 1.9821757078170776, "Pretrain/Step": 5321, "Pretrain/Step Time": 8.506469164043665} +{"Pretrain/Learning Rate": 4.229925862213158e-05, "Pretrain/Loss": 2.049408435821533, "Pretrain/Loss (Raw)": 2.0069193840026855, "Pretrain/Step": 5322, "Pretrain/Step Time": 8.497389558702707} +{"Pretrain/Learning Rate": 4.229619367734044e-05, "Pretrain/Loss": 2.04862642288208, "Pretrain/Loss (Raw)": 2.0923633575439453, "Pretrain/Step": 5323, "Pretrain/Step Time": 8.501820530742407} +{"Pretrain/Learning Rate": 4.229312823382574e-05, "Pretrain/Loss": 2.048954486846924, "Pretrain/Loss (Raw)": 1.9880973100662231, "Pretrain/Step": 5324, "Pretrain/Step Time": 8.497600788250566} +{"Pretrain/Learning Rate": 4.229006229167588e-05, "Pretrain/Loss": 2.0492594242095947, "Pretrain/Loss (Raw)": 1.9736918210983276, "Pretrain/Step": 5325, "Pretrain/Step Time": 8.49430969543755} +{"Pretrain/Learning Rate": 4.228699585097927e-05, "Pretrain/Loss": 2.0485634803771973, "Pretrain/Loss (Raw)": 2.0915465354919434, "Pretrain/Step": 5326, "Pretrain/Step Time": 8.493977719917893} +{"Pretrain/Learning Rate": 4.228392891182432e-05, "Pretrain/Loss": 2.0478854179382324, "Pretrain/Loss (Raw)": 1.9311256408691406, "Pretrain/Step": 5327, "Pretrain/Step Time": 8.496812775731087} +{"Pretrain/Learning Rate": 4.2280861474299464e-05, "Pretrain/Loss": 2.052164077758789, "Pretrain/Loss (Raw)": 2.611462354660034, "Pretrain/Step": 5328, "Pretrain/Step Time": 8.498249121010303} +{"Pretrain/Learning Rate": 4.227779353849314e-05, "Pretrain/Loss": 2.0523252487182617, "Pretrain/Loss (Raw)": 2.0529677867889404, "Pretrain/Step": 5329, "Pretrain/Step Time": 8.500002341344953} +{"Pretrain/Learning Rate": 4.227472510449383e-05, "Pretrain/Loss": 2.0547256469726562, "Pretrain/Loss (Raw)": 1.8691473007202148, "Pretrain/Step": 5330, "Pretrain/Step Time": 8.49998969770968} +{"Pretrain/Learning Rate": 4.227165617238999e-05, "Pretrain/Loss": 2.0508804321289062, "Pretrain/Loss (Raw)": 1.9990383386611938, "Pretrain/Step": 5331, "Pretrain/Step Time": 8.50273577682674} +{"Pretrain/Learning Rate": 4.226858674227012e-05, "Pretrain/Loss": 2.048405170440674, "Pretrain/Loss (Raw)": 1.955031394958496, "Pretrain/Step": 5332, "Pretrain/Step Time": 8.49941160902381} +{"Pretrain/Learning Rate": 4.2265516814222734e-05, "Pretrain/Loss": 2.047121286392212, "Pretrain/Loss (Raw)": 2.0815255641937256, "Pretrain/Step": 5333, "Pretrain/Step Time": 8.500782765448093} +{"Pretrain/Learning Rate": 4.226244638833634e-05, "Pretrain/Loss": 2.0463485717773438, "Pretrain/Loss (Raw)": 2.04439377784729, "Pretrain/Step": 5334, "Pretrain/Step Time": 8.497069954872131} +{"Pretrain/Learning Rate": 4.225937546469947e-05, "Pretrain/Loss": 2.048495292663574, "Pretrain/Loss (Raw)": 1.9962034225463867, "Pretrain/Step": 5335, "Pretrain/Step Time": 8.494059979915619} +{"Pretrain/Learning Rate": 4.2256304043400676e-05, "Pretrain/Loss": 2.0500919818878174, "Pretrain/Loss (Raw)": 2.1237401962280273, "Pretrain/Step": 5336, "Pretrain/Step Time": 8.492308083921671} +{"Pretrain/Learning Rate": 4.225323212452852e-05, "Pretrain/Loss": 2.0486972332000732, "Pretrain/Loss (Raw)": 1.9738632440567017, "Pretrain/Step": 5337, "Pretrain/Step Time": 8.49582415446639} +{"Pretrain/Learning Rate": 4.225015970817158e-05, "Pretrain/Loss": 2.0505831241607666, "Pretrain/Loss (Raw)": 2.1573073863983154, "Pretrain/Step": 5338, "Pretrain/Step Time": 8.49692676961422} +{"Pretrain/Learning Rate": 4.2247086794418445e-05, "Pretrain/Loss": 2.049461841583252, "Pretrain/Loss (Raw)": 1.9635586738586426, "Pretrain/Step": 5339, "Pretrain/Step Time": 8.492320878431201} +{"Pretrain/Learning Rate": 4.224401338335772e-05, "Pretrain/Loss": 2.051630973815918, "Pretrain/Loss (Raw)": 1.9603248834609985, "Pretrain/Step": 5340, "Pretrain/Step Time": 8.492671752348542} +{"Pretrain/Learning Rate": 4.224093947507802e-05, "Pretrain/Loss": 2.0485739707946777, "Pretrain/Loss (Raw)": 1.6273163557052612, "Pretrain/Step": 5341, "Pretrain/Step Time": 8.492871331050992} +{"Pretrain/Learning Rate": 4.2237865069667994e-05, "Pretrain/Loss": 2.0479142665863037, "Pretrain/Loss (Raw)": 1.961897373199463, "Pretrain/Step": 5342, "Pretrain/Step Time": 8.493162207305431} +{"Pretrain/Learning Rate": 4.2234790167216274e-05, "Pretrain/Loss": 2.0512003898620605, "Pretrain/Loss (Raw)": 2.298617362976074, "Pretrain/Step": 5343, "Pretrain/Step Time": 8.494722736999393} +{"Pretrain/Learning Rate": 4.223171476781154e-05, "Pretrain/Loss": 2.051117181777954, "Pretrain/Loss (Raw)": 1.9263612031936646, "Pretrain/Step": 5344, "Pretrain/Step Time": 8.49797104485333} +{"Pretrain/Learning Rate": 4.222863887154245e-05, "Pretrain/Loss": 2.0485002994537354, "Pretrain/Loss (Raw)": 1.794043779373169, "Pretrain/Step": 5345, "Pretrain/Step Time": 8.498491615056992} +{"Pretrain/Learning Rate": 4.22255624784977e-05, "Pretrain/Loss": 2.0474679470062256, "Pretrain/Loss (Raw)": 1.9201464653015137, "Pretrain/Step": 5346, "Pretrain/Step Time": 8.50384727306664} +{"Pretrain/Learning Rate": 4.2222485588766005e-05, "Pretrain/Loss": 2.045828342437744, "Pretrain/Loss (Raw)": 2.0928471088409424, "Pretrain/Step": 5347, "Pretrain/Step Time": 8.50170730240643} +{"Pretrain/Learning Rate": 4.221940820243607e-05, "Pretrain/Loss": 2.0473105907440186, "Pretrain/Loss (Raw)": 2.194106340408325, "Pretrain/Step": 5348, "Pretrain/Step Time": 8.504164619371295} +{"Pretrain/Learning Rate": 4.221633031959665e-05, "Pretrain/Loss": 2.0483484268188477, "Pretrain/Loss (Raw)": 1.9764050245285034, "Pretrain/Step": 5349, "Pretrain/Step Time": 8.501219067722559} +{"Pretrain/Learning Rate": 4.2213251940336476e-05, "Pretrain/Loss": 2.048189878463745, "Pretrain/Loss (Raw)": 2.169494390487671, "Pretrain/Step": 5350, "Pretrain/Step Time": 8.499554647132754} +{"Pretrain/Learning Rate": 4.2210173064744316e-05, "Pretrain/Loss": 2.0477938652038574, "Pretrain/Loss (Raw)": 1.9092581272125244, "Pretrain/Step": 5351, "Pretrain/Step Time": 8.502778980880976} +{"Pretrain/Learning Rate": 4.220709369290895e-05, "Pretrain/Loss": 2.047353744506836, "Pretrain/Loss (Raw)": 2.120689868927002, "Pretrain/Step": 5352, "Pretrain/Step Time": 8.502225771546364} +{"Pretrain/Learning Rate": 4.220401382491917e-05, "Pretrain/Loss": 2.048036575317383, "Pretrain/Loss (Raw)": 2.2150027751922607, "Pretrain/Step": 5353, "Pretrain/Step Time": 8.506223760545254} +{"Pretrain/Learning Rate": 4.220093346086378e-05, "Pretrain/Loss": 2.044786214828491, "Pretrain/Loss (Raw)": 2.1597542762756348, "Pretrain/Step": 5354, "Pretrain/Step Time": 8.501966958865523} +{"Pretrain/Learning Rate": 4.219785260083159e-05, "Pretrain/Loss": 2.043635845184326, "Pretrain/Loss (Raw)": 2.0771148204803467, "Pretrain/Step": 5355, "Pretrain/Step Time": 8.50456446222961} +{"Pretrain/Learning Rate": 4.219477124491146e-05, "Pretrain/Loss": 2.044867515563965, "Pretrain/Loss (Raw)": 2.1108362674713135, "Pretrain/Step": 5356, "Pretrain/Step Time": 8.506078701466322} +{"Pretrain/Learning Rate": 4.219168939319221e-05, "Pretrain/Loss": 2.045630931854248, "Pretrain/Loss (Raw)": 2.2525129318237305, "Pretrain/Step": 5357, "Pretrain/Step Time": 8.500371925532818} +{"Pretrain/Learning Rate": 4.218860704576272e-05, "Pretrain/Loss": 2.0474979877471924, "Pretrain/Loss (Raw)": 1.9885919094085693, "Pretrain/Step": 5358, "Pretrain/Step Time": 8.499626515433192} +{"Pretrain/Learning Rate": 4.2185524202711854e-05, "Pretrain/Loss": 2.0476815700531006, "Pretrain/Loss (Raw)": 1.941992998123169, "Pretrain/Step": 5359, "Pretrain/Step Time": 8.504486912861466} +{"Pretrain/Learning Rate": 4.2182440864128526e-05, "Pretrain/Loss": 2.044840097427368, "Pretrain/Loss (Raw)": 1.975451111793518, "Pretrain/Step": 5360, "Pretrain/Step Time": 8.504416693001986} +{"Pretrain/Learning Rate": 4.217935703010162e-05, "Pretrain/Loss": 2.047396421432495, "Pretrain/Loss (Raw)": 2.182191848754883, "Pretrain/Step": 5361, "Pretrain/Step Time": 8.501896785572171} +{"Pretrain/Learning Rate": 4.217627270072006e-05, "Pretrain/Loss": 2.0481090545654297, "Pretrain/Loss (Raw)": 2.290745258331299, "Pretrain/Step": 5362, "Pretrain/Step Time": 8.504803948104382} +{"Pretrain/Learning Rate": 4.2173187876072803e-05, "Pretrain/Loss": 2.049375534057617, "Pretrain/Loss (Raw)": 2.0921688079833984, "Pretrain/Step": 5363, "Pretrain/Step Time": 8.499452577903867} +{"Pretrain/Learning Rate": 4.217010255624877e-05, "Pretrain/Loss": 2.0490665435791016, "Pretrain/Loss (Raw)": 2.0107922554016113, "Pretrain/Step": 5364, "Pretrain/Step Time": 8.500703647732735} +{"Pretrain/Learning Rate": 4.216701674133693e-05, "Pretrain/Loss": 2.0503015518188477, "Pretrain/Loss (Raw)": 2.197923183441162, "Pretrain/Step": 5365, "Pretrain/Step Time": 8.50049426779151} +{"Pretrain/Learning Rate": 4.216393043142627e-05, "Pretrain/Loss": 2.049206256866455, "Pretrain/Loss (Raw)": 1.9777206182479858, "Pretrain/Step": 5366, "Pretrain/Step Time": 8.499573377892375} +{"Pretrain/Learning Rate": 4.216084362660577e-05, "Pretrain/Loss": 2.050570487976074, "Pretrain/Loss (Raw)": 1.890121340751648, "Pretrain/Step": 5367, "Pretrain/Step Time": 8.495585421100259} +{"Pretrain/Learning Rate": 4.2157756326964446e-05, "Pretrain/Loss": 2.051349639892578, "Pretrain/Loss (Raw)": 2.1748604774475098, "Pretrain/Step": 5368, "Pretrain/Step Time": 8.49453185684979} +{"Pretrain/Learning Rate": 4.2154668532591316e-05, "Pretrain/Loss": 2.051873207092285, "Pretrain/Loss (Raw)": 2.058896541595459, "Pretrain/Step": 5369, "Pretrain/Step Time": 8.4915572963655} +{"Pretrain/Learning Rate": 4.2151580243575407e-05, "Pretrain/Loss": 2.0540778636932373, "Pretrain/Loss (Raw)": 2.1299667358398438, "Pretrain/Step": 5370, "Pretrain/Step Time": 8.496206590905786} +{"Pretrain/Learning Rate": 4.214849146000577e-05, "Pretrain/Loss": 2.0543973445892334, "Pretrain/Loss (Raw)": 2.0625524520874023, "Pretrain/Step": 5371, "Pretrain/Step Time": 8.496458664536476} +{"Pretrain/Learning Rate": 4.214540218197148e-05, "Pretrain/Loss": 2.0543718338012695, "Pretrain/Loss (Raw)": 2.1501994132995605, "Pretrain/Step": 5372, "Pretrain/Step Time": 8.492266593500972} +{"Pretrain/Learning Rate": 4.21423124095616e-05, "Pretrain/Loss": 2.0565476417541504, "Pretrain/Loss (Raw)": 2.1324985027313232, "Pretrain/Step": 5373, "Pretrain/Step Time": 8.49113342165947} +{"Pretrain/Learning Rate": 4.2139222142865224e-05, "Pretrain/Loss": 2.0555598735809326, "Pretrain/Loss (Raw)": 1.8670614957809448, "Pretrain/Step": 5374, "Pretrain/Step Time": 8.48947754316032} +{"Pretrain/Learning Rate": 4.213613138197147e-05, "Pretrain/Loss": 2.0527281761169434, "Pretrain/Loss (Raw)": 1.807025671005249, "Pretrain/Step": 5375, "Pretrain/Step Time": 8.488213634118438} +{"Pretrain/Learning Rate": 4.213304012696943e-05, "Pretrain/Loss": 2.0522475242614746, "Pretrain/Loss (Raw)": 2.075855255126953, "Pretrain/Step": 5376, "Pretrain/Step Time": 8.488937813788652} +{"Pretrain/Learning Rate": 4.212994837794827e-05, "Pretrain/Loss": 2.0511395931243896, "Pretrain/Loss (Raw)": 2.104790687561035, "Pretrain/Step": 5377, "Pretrain/Step Time": 8.486584931612015} +{"Pretrain/Learning Rate": 4.2126856134997114e-05, "Pretrain/Loss": 2.0502989292144775, "Pretrain/Loss (Raw)": 2.011388063430786, "Pretrain/Step": 5378, "Pretrain/Step Time": 8.484777888283134} +{"Pretrain/Learning Rate": 4.212376339820515e-05, "Pretrain/Loss": 2.0515592098236084, "Pretrain/Loss (Raw)": 2.0473990440368652, "Pretrain/Step": 5379, "Pretrain/Step Time": 8.48775321431458} +{"Pretrain/Learning Rate": 4.212067016766153e-05, "Pretrain/Loss": 2.048299551010132, "Pretrain/Loss (Raw)": 2.116680145263672, "Pretrain/Step": 5380, "Pretrain/Step Time": 8.48400929197669} +{"Pretrain/Learning Rate": 4.211757644345545e-05, "Pretrain/Loss": 2.0500588417053223, "Pretrain/Loss (Raw)": 2.2605249881744385, "Pretrain/Step": 5381, "Pretrain/Step Time": 8.486181639134884} +{"Pretrain/Learning Rate": 4.2114482225676136e-05, "Pretrain/Loss": 2.0505545139312744, "Pretrain/Loss (Raw)": 2.135359525680542, "Pretrain/Step": 5382, "Pretrain/Step Time": 8.486647428944707} +{"Pretrain/Learning Rate": 4.211138751441278e-05, "Pretrain/Loss": 2.0524485111236572, "Pretrain/Loss (Raw)": 2.392974376678467, "Pretrain/Step": 5383, "Pretrain/Step Time": 8.484880793839693} +{"Pretrain/Learning Rate": 4.2108292309754626e-05, "Pretrain/Loss": 2.0520987510681152, "Pretrain/Loss (Raw)": 1.9464069604873657, "Pretrain/Step": 5384, "Pretrain/Step Time": 8.488352112472057} +{"Pretrain/Learning Rate": 4.210519661179093e-05, "Pretrain/Loss": 2.0538876056671143, "Pretrain/Loss (Raw)": 2.1080312728881836, "Pretrain/Step": 5385, "Pretrain/Step Time": 8.484961248934269} +{"Pretrain/Learning Rate": 4.2102100420610945e-05, "Pretrain/Loss": 2.054161310195923, "Pretrain/Loss (Raw)": 1.9767252206802368, "Pretrain/Step": 5386, "Pretrain/Step Time": 8.481816831976175} +{"Pretrain/Learning Rate": 4.2099003736303955e-05, "Pretrain/Loss": 2.0561647415161133, "Pretrain/Loss (Raw)": 2.1905455589294434, "Pretrain/Step": 5387, "Pretrain/Step Time": 8.490028662607074} +{"Pretrain/Learning Rate": 4.209590655895924e-05, "Pretrain/Loss": 2.0553035736083984, "Pretrain/Loss (Raw)": 2.180232524871826, "Pretrain/Step": 5388, "Pretrain/Step Time": 8.489626105874777} +{"Pretrain/Learning Rate": 4.209280888866612e-05, "Pretrain/Loss": 2.056014060974121, "Pretrain/Loss (Raw)": 2.0592541694641113, "Pretrain/Step": 5389, "Pretrain/Step Time": 8.490072645246983} +{"Pretrain/Learning Rate": 4.20897107255139e-05, "Pretrain/Loss": 2.053744316101074, "Pretrain/Loss (Raw)": 2.284291982650757, "Pretrain/Step": 5390, "Pretrain/Step Time": 8.48685523495078} +{"Pretrain/Learning Rate": 4.208661206959191e-05, "Pretrain/Loss": 2.053743600845337, "Pretrain/Loss (Raw)": 2.0302155017852783, "Pretrain/Step": 5391, "Pretrain/Step Time": 8.488832427188754} +{"Pretrain/Learning Rate": 4.208351292098952e-05, "Pretrain/Loss": 2.0527830123901367, "Pretrain/Loss (Raw)": 2.034968376159668, "Pretrain/Step": 5392, "Pretrain/Step Time": 8.485837139189243} +{"Pretrain/Learning Rate": 4.208041327979607e-05, "Pretrain/Loss": 2.054915428161621, "Pretrain/Loss (Raw)": 2.1715054512023926, "Pretrain/Step": 5393, "Pretrain/Step Time": 8.487872902303934} +{"Pretrain/Learning Rate": 4.207731314610095e-05, "Pretrain/Loss": 2.0568490028381348, "Pretrain/Loss (Raw)": 2.031831979751587, "Pretrain/Step": 5394, "Pretrain/Step Time": 8.482300033792853} +{"Pretrain/Learning Rate": 4.207421251999354e-05, "Pretrain/Loss": 2.0566883087158203, "Pretrain/Loss (Raw)": 2.13604474067688, "Pretrain/Step": 5395, "Pretrain/Step Time": 8.486875524744391} +{"Pretrain/Learning Rate": 4.2071111401563244e-05, "Pretrain/Loss": 2.0584716796875, "Pretrain/Loss (Raw)": 2.3306026458740234, "Pretrain/Step": 5396, "Pretrain/Step Time": 8.487647270783782} +{"Pretrain/Learning Rate": 4.2068009790899493e-05, "Pretrain/Loss": 2.060793161392212, "Pretrain/Loss (Raw)": 2.282935380935669, "Pretrain/Step": 5397, "Pretrain/Step Time": 8.486267104744911} +{"Pretrain/Learning Rate": 4.206490768809171e-05, "Pretrain/Loss": 2.062272071838379, "Pretrain/Loss (Raw)": 1.8622307777404785, "Pretrain/Step": 5398, "Pretrain/Step Time": 8.485945610329509} +{"Pretrain/Learning Rate": 4.2061805093229343e-05, "Pretrain/Loss": 2.058854579925537, "Pretrain/Loss (Raw)": 1.8901199102401733, "Pretrain/Step": 5399, "Pretrain/Step Time": 8.490087829530239} +{"Pretrain/Learning Rate": 4.205870200640185e-05, "Pretrain/Loss": 2.0548529624938965, "Pretrain/Loss (Raw)": 1.6701693534851074, "Pretrain/Step": 5400, "Pretrain/Step Time": 8.486221246421337} +{"Pretrain/Learning Rate": 4.2055598427698715e-05, "Pretrain/Loss": 2.053999900817871, "Pretrain/Loss (Raw)": 1.866921067237854, "Pretrain/Step": 5401, "Pretrain/Step Time": 8.485017543658614} +{"Pretrain/Learning Rate": 4.205249435720943e-05, "Pretrain/Loss": 2.0535950660705566, "Pretrain/Loss (Raw)": 1.945600152015686, "Pretrain/Step": 5402, "Pretrain/Step Time": 8.488531241193414} +{"Pretrain/Learning Rate": 4.204938979502347e-05, "Pretrain/Loss": 2.0513789653778076, "Pretrain/Loss (Raw)": 1.8477939367294312, "Pretrain/Step": 5403, "Pretrain/Step Time": 8.492256922647357} +{"Pretrain/Learning Rate": 4.204628474123039e-05, "Pretrain/Loss": 2.05320405960083, "Pretrain/Loss (Raw)": 2.0575332641601562, "Pretrain/Step": 5404, "Pretrain/Step Time": 8.489229125902057} +{"Pretrain/Learning Rate": 4.2043179195919703e-05, "Pretrain/Loss": 2.0545694828033447, "Pretrain/Loss (Raw)": 2.0891952514648438, "Pretrain/Step": 5405, "Pretrain/Step Time": 8.497521288692951} +{"Pretrain/Learning Rate": 4.204007315918096e-05, "Pretrain/Loss": 2.054746150970459, "Pretrain/Loss (Raw)": 1.9604122638702393, "Pretrain/Step": 5406, "Pretrain/Step Time": 8.496631087735295} +{"Pretrain/Learning Rate": 4.203696663110372e-05, "Pretrain/Loss": 2.055715560913086, "Pretrain/Loss (Raw)": 2.1994893550872803, "Pretrain/Step": 5407, "Pretrain/Step Time": 8.491237808018923} +{"Pretrain/Learning Rate": 4.203385961177756e-05, "Pretrain/Loss": 2.0551047325134277, "Pretrain/Loss (Raw)": 1.9485275745391846, "Pretrain/Step": 5408, "Pretrain/Step Time": 8.4907330814749} +{"Pretrain/Learning Rate": 4.203075210129206e-05, "Pretrain/Loss": 2.057450771331787, "Pretrain/Loss (Raw)": 2.3055553436279297, "Pretrain/Step": 5409, "Pretrain/Step Time": 8.495208637788892} +{"Pretrain/Learning Rate": 4.2027644099736826e-05, "Pretrain/Loss": 2.0571093559265137, "Pretrain/Loss (Raw)": 2.2344281673431396, "Pretrain/Step": 5410, "Pretrain/Step Time": 8.488506527617574} +{"Pretrain/Learning Rate": 4.202453560720149e-05, "Pretrain/Loss": 2.0583739280700684, "Pretrain/Loss (Raw)": 2.194829225540161, "Pretrain/Step": 5411, "Pretrain/Step Time": 8.492084633558989} +{"Pretrain/Learning Rate": 4.2021426623775664e-05, "Pretrain/Loss": 2.0554521083831787, "Pretrain/Loss (Raw)": 1.8738327026367188, "Pretrain/Step": 5412, "Pretrain/Step Time": 8.494533950462937} +{"Pretrain/Learning Rate": 4.2018317149549004e-05, "Pretrain/Loss": 2.0536820888519287, "Pretrain/Loss (Raw)": 2.2248880863189697, "Pretrain/Step": 5413, "Pretrain/Step Time": 8.496764725074172} +{"Pretrain/Learning Rate": 4.201520718461116e-05, "Pretrain/Loss": 2.053199291229248, "Pretrain/Loss (Raw)": 2.2031471729278564, "Pretrain/Step": 5414, "Pretrain/Step Time": 8.49099737033248} +{"Pretrain/Learning Rate": 4.201209672905182e-05, "Pretrain/Loss": 2.0547728538513184, "Pretrain/Loss (Raw)": 2.196382761001587, "Pretrain/Step": 5415, "Pretrain/Step Time": 8.494070364162326} +{"Pretrain/Learning Rate": 4.2008985782960654e-05, "Pretrain/Loss": 2.056086778640747, "Pretrain/Loss (Raw)": 2.0975213050842285, "Pretrain/Step": 5416, "Pretrain/Step Time": 8.489363357424736} +{"Pretrain/Learning Rate": 4.200587434642738e-05, "Pretrain/Loss": 2.054267644882202, "Pretrain/Loss (Raw)": 1.888577938079834, "Pretrain/Step": 5417, "Pretrain/Step Time": 8.49006668664515} +{"Pretrain/Learning Rate": 4.200276241954171e-05, "Pretrain/Loss": 2.053549289703369, "Pretrain/Loss (Raw)": 1.8021883964538574, "Pretrain/Step": 5418, "Pretrain/Step Time": 8.490771021693945} +{"Pretrain/Learning Rate": 4.199965000239336e-05, "Pretrain/Loss": 2.0532970428466797, "Pretrain/Loss (Raw)": 2.0448005199432373, "Pretrain/Step": 5419, "Pretrain/Step Time": 8.500092098489404} +{"Pretrain/Learning Rate": 4.1996537095072094e-05, "Pretrain/Loss": 2.0555827617645264, "Pretrain/Loss (Raw)": 2.1314735412597656, "Pretrain/Step": 5420, "Pretrain/Step Time": 8.500492559745908} +{"Pretrain/Learning Rate": 4.1993423697667665e-05, "Pretrain/Loss": 2.0552988052368164, "Pretrain/Loss (Raw)": 2.125575065612793, "Pretrain/Step": 5421, "Pretrain/Step Time": 8.499023223295808} +{"Pretrain/Learning Rate": 4.199030981026985e-05, "Pretrain/Loss": 2.058101177215576, "Pretrain/Loss (Raw)": 2.1254231929779053, "Pretrain/Step": 5422, "Pretrain/Step Time": 8.49944468215108} +{"Pretrain/Learning Rate": 4.1987195432968416e-05, "Pretrain/Loss": 2.0580551624298096, "Pretrain/Loss (Raw)": 1.8941409587860107, "Pretrain/Step": 5423, "Pretrain/Step Time": 8.49367631599307} +{"Pretrain/Learning Rate": 4.198408056585318e-05, "Pretrain/Loss": 2.0592751502990723, "Pretrain/Loss (Raw)": 2.5503129959106445, "Pretrain/Step": 5424, "Pretrain/Step Time": 8.499495266005397} +{"Pretrain/Learning Rate": 4.198096520901395e-05, "Pretrain/Loss": 2.0572314262390137, "Pretrain/Loss (Raw)": 1.8033806085586548, "Pretrain/Step": 5425, "Pretrain/Step Time": 8.495546288788319} +{"Pretrain/Learning Rate": 4.197784936254057e-05, "Pretrain/Loss": 2.0574822425842285, "Pretrain/Loss (Raw)": 1.8498822450637817, "Pretrain/Step": 5426, "Pretrain/Step Time": 8.496277892962098} +{"Pretrain/Learning Rate": 4.197473302652286e-05, "Pretrain/Loss": 2.0558412075042725, "Pretrain/Loss (Raw)": 1.8227778673171997, "Pretrain/Step": 5427, "Pretrain/Step Time": 8.49460351653397} +{"Pretrain/Learning Rate": 4.1971616201050704e-05, "Pretrain/Loss": 2.055454730987549, "Pretrain/Loss (Raw)": 1.9465733766555786, "Pretrain/Step": 5428, "Pretrain/Step Time": 8.493224056437612} +{"Pretrain/Learning Rate": 4.1968498886213945e-05, "Pretrain/Loss": 2.056565284729004, "Pretrain/Loss (Raw)": 2.0899062156677246, "Pretrain/Step": 5429, "Pretrain/Step Time": 8.49421920068562} +{"Pretrain/Learning Rate": 4.1965381082102495e-05, "Pretrain/Loss": 2.0559935569763184, "Pretrain/Loss (Raw)": 1.9810106754302979, "Pretrain/Step": 5430, "Pretrain/Step Time": 8.493036421015859} +{"Pretrain/Learning Rate": 4.1962262788806235e-05, "Pretrain/Loss": 2.052853584289551, "Pretrain/Loss (Raw)": 1.846347451210022, "Pretrain/Step": 5431, "Pretrain/Step Time": 8.488350253552198} +{"Pretrain/Learning Rate": 4.1959144006415085e-05, "Pretrain/Loss": 2.051583766937256, "Pretrain/Loss (Raw)": 1.908156394958496, "Pretrain/Step": 5432, "Pretrain/Step Time": 8.488158663734794} +{"Pretrain/Learning Rate": 4.1956024735018974e-05, "Pretrain/Loss": 2.049718141555786, "Pretrain/Loss (Raw)": 1.9393815994262695, "Pretrain/Step": 5433, "Pretrain/Step Time": 8.483940659090877} +{"Pretrain/Learning Rate": 4.195290497470784e-05, "Pretrain/Loss": 2.0466694831848145, "Pretrain/Loss (Raw)": 1.6692321300506592, "Pretrain/Step": 5434, "Pretrain/Step Time": 8.48160146549344} +{"Pretrain/Learning Rate": 4.194978472557164e-05, "Pretrain/Loss": 2.0486607551574707, "Pretrain/Loss (Raw)": 2.171989917755127, "Pretrain/Step": 5435, "Pretrain/Step Time": 8.484919579699636} +{"Pretrain/Learning Rate": 4.1946663987700354e-05, "Pretrain/Loss": 2.049251079559326, "Pretrain/Loss (Raw)": 1.9479252099990845, "Pretrain/Step": 5436, "Pretrain/Step Time": 8.489308441057801} +{"Pretrain/Learning Rate": 4.194354276118395e-05, "Pretrain/Loss": 2.049954891204834, "Pretrain/Loss (Raw)": 2.0515525341033936, "Pretrain/Step": 5437, "Pretrain/Step Time": 8.489963112398982} +{"Pretrain/Learning Rate": 4.194042104611244e-05, "Pretrain/Loss": 2.050985097885132, "Pretrain/Loss (Raw)": 2.090815305709839, "Pretrain/Step": 5438, "Pretrain/Step Time": 8.490695420652628} +{"Pretrain/Learning Rate": 4.1937298842575836e-05, "Pretrain/Loss": 2.0497827529907227, "Pretrain/Loss (Raw)": 1.9579219818115234, "Pretrain/Step": 5439, "Pretrain/Step Time": 8.489429580047727} +{"Pretrain/Learning Rate": 4.193417615066415e-05, "Pretrain/Loss": 2.0477583408355713, "Pretrain/Loss (Raw)": 1.7371792793273926, "Pretrain/Step": 5440, "Pretrain/Step Time": 8.489242469891906} +{"Pretrain/Learning Rate": 4.193105297046744e-05, "Pretrain/Loss": 2.0488080978393555, "Pretrain/Loss (Raw)": 2.0199787616729736, "Pretrain/Step": 5441, "Pretrain/Step Time": 8.48612055554986} +{"Pretrain/Learning Rate": 4.192792930207575e-05, "Pretrain/Loss": 2.0488786697387695, "Pretrain/Loss (Raw)": 2.0653200149536133, "Pretrain/Step": 5442, "Pretrain/Step Time": 8.487453347072005} +{"Pretrain/Learning Rate": 4.192480514557915e-05, "Pretrain/Loss": 2.048039674758911, "Pretrain/Loss (Raw)": 2.0351779460906982, "Pretrain/Step": 5443, "Pretrain/Step Time": 8.489019529893994} +{"Pretrain/Learning Rate": 4.192168050106773e-05, "Pretrain/Loss": 2.046041965484619, "Pretrain/Loss (Raw)": 1.7448183298110962, "Pretrain/Step": 5444, "Pretrain/Step Time": 8.491096135228872} +{"Pretrain/Learning Rate": 4.191855536863157e-05, "Pretrain/Loss": 2.0450053215026855, "Pretrain/Loss (Raw)": 2.0482053756713867, "Pretrain/Step": 5445, "Pretrain/Step Time": 8.490928186103702} +{"Pretrain/Learning Rate": 4.1915429748360807e-05, "Pretrain/Loss": 2.043794870376587, "Pretrain/Loss (Raw)": 1.9694169759750366, "Pretrain/Step": 5446, "Pretrain/Step Time": 8.491980889812112} +{"Pretrain/Learning Rate": 4.191230364034555e-05, "Pretrain/Loss": 2.044353485107422, "Pretrain/Loss (Raw)": 2.1391232013702393, "Pretrain/Step": 5447, "Pretrain/Step Time": 8.489853469654918} +{"Pretrain/Learning Rate": 4.190917704467593e-05, "Pretrain/Loss": 2.042780637741089, "Pretrain/Loss (Raw)": 1.9085713624954224, "Pretrain/Step": 5448, "Pretrain/Step Time": 8.492723874747753} +{"Pretrain/Learning Rate": 4.190604996144212e-05, "Pretrain/Loss": 2.042983293533325, "Pretrain/Loss (Raw)": 2.008113384246826, "Pretrain/Step": 5449, "Pretrain/Step Time": 8.485482694581151} +{"Pretrain/Learning Rate": 4.1902922390734274e-05, "Pretrain/Loss": 2.0431911945343018, "Pretrain/Loss (Raw)": 2.0335488319396973, "Pretrain/Step": 5450, "Pretrain/Step Time": 8.487967517226934} +{"Pretrain/Learning Rate": 4.189979433264257e-05, "Pretrain/Loss": 2.043971061706543, "Pretrain/Loss (Raw)": 2.192161798477173, "Pretrain/Step": 5451, "Pretrain/Step Time": 8.487586867064238} +{"Pretrain/Learning Rate": 4.189666578725722e-05, "Pretrain/Loss": 2.0454764366149902, "Pretrain/Loss (Raw)": 2.1807820796966553, "Pretrain/Step": 5452, "Pretrain/Step Time": 8.488245429471135} +{"Pretrain/Learning Rate": 4.1893536754668415e-05, "Pretrain/Loss": 2.0455305576324463, "Pretrain/Loss (Raw)": 1.9806243181228638, "Pretrain/Step": 5453, "Pretrain/Step Time": 8.49608270637691} +{"Pretrain/Learning Rate": 4.18904072349664e-05, "Pretrain/Loss": 2.0446202754974365, "Pretrain/Loss (Raw)": 1.9750349521636963, "Pretrain/Step": 5454, "Pretrain/Step Time": 8.49594296142459} +{"Pretrain/Learning Rate": 4.188727722824138e-05, "Pretrain/Loss": 2.0449161529541016, "Pretrain/Loss (Raw)": 1.9689669609069824, "Pretrain/Step": 5455, "Pretrain/Step Time": 8.49128219857812} +{"Pretrain/Learning Rate": 4.188414673458364e-05, "Pretrain/Loss": 2.0407814979553223, "Pretrain/Loss (Raw)": 2.082251787185669, "Pretrain/Step": 5456, "Pretrain/Step Time": 8.486529678106308} +{"Pretrain/Learning Rate": 4.188101575408343e-05, "Pretrain/Loss": 2.0440196990966797, "Pretrain/Loss (Raw)": 2.4674339294433594, "Pretrain/Step": 5457, "Pretrain/Step Time": 8.488008318468928} +{"Pretrain/Learning Rate": 4.187788428683103e-05, "Pretrain/Loss": 2.0451622009277344, "Pretrain/Loss (Raw)": 2.0154051780700684, "Pretrain/Step": 5458, "Pretrain/Step Time": 8.488807892426848} +{"Pretrain/Learning Rate": 4.1874752332916735e-05, "Pretrain/Loss": 2.045897960662842, "Pretrain/Loss (Raw)": 2.093221664428711, "Pretrain/Step": 5459, "Pretrain/Step Time": 8.488922329619527} +{"Pretrain/Learning Rate": 4.187161989243085e-05, "Pretrain/Loss": 2.0470142364501953, "Pretrain/Loss (Raw)": 2.097907543182373, "Pretrain/Step": 5460, "Pretrain/Step Time": 8.487595999613404} +{"Pretrain/Learning Rate": 4.186848696546371e-05, "Pretrain/Loss": 2.0469470024108887, "Pretrain/Loss (Raw)": 2.0729174613952637, "Pretrain/Step": 5461, "Pretrain/Step Time": 8.484373746439815} +{"Pretrain/Learning Rate": 4.186535355210562e-05, "Pretrain/Loss": 2.046403646469116, "Pretrain/Loss (Raw)": 1.9748743772506714, "Pretrain/Step": 5462, "Pretrain/Step Time": 8.489603571593761} +{"Pretrain/Learning Rate": 4.186221965244697e-05, "Pretrain/Loss": 2.0467543601989746, "Pretrain/Loss (Raw)": 2.0410523414611816, "Pretrain/Step": 5463, "Pretrain/Step Time": 8.49401169270277} +{"Pretrain/Learning Rate": 4.185908526657809e-05, "Pretrain/Loss": 2.0470709800720215, "Pretrain/Loss (Raw)": 2.1643054485321045, "Pretrain/Step": 5464, "Pretrain/Step Time": 8.493546007201076} +{"Pretrain/Learning Rate": 4.1855950394589374e-05, "Pretrain/Loss": 2.047394275665283, "Pretrain/Loss (Raw)": 2.015249013900757, "Pretrain/Step": 5465, "Pretrain/Step Time": 8.486864071339369} +{"Pretrain/Learning Rate": 4.185281503657121e-05, "Pretrain/Loss": 2.046943187713623, "Pretrain/Loss (Raw)": 2.09957218170166, "Pretrain/Step": 5466, "Pretrain/Step Time": 8.489350639283657} +{"Pretrain/Learning Rate": 4.184967919261401e-05, "Pretrain/Loss": 2.0486223697662354, "Pretrain/Loss (Raw)": 2.1784749031066895, "Pretrain/Step": 5467, "Pretrain/Step Time": 8.49171551503241} +{"Pretrain/Learning Rate": 4.184654286280818e-05, "Pretrain/Loss": 2.047579050064087, "Pretrain/Loss (Raw)": 1.8267790079116821, "Pretrain/Step": 5468, "Pretrain/Step Time": 8.493472561240196} +{"Pretrain/Learning Rate": 4.1843406047244174e-05, "Pretrain/Loss": 2.051069498062134, "Pretrain/Loss (Raw)": 2.074087142944336, "Pretrain/Step": 5469, "Pretrain/Step Time": 8.493933057412505} +{"Pretrain/Learning Rate": 4.1840268746012416e-05, "Pretrain/Loss": 2.0511722564697266, "Pretrain/Loss (Raw)": 1.9750518798828125, "Pretrain/Step": 5470, "Pretrain/Step Time": 8.49453928694129} +{"Pretrain/Learning Rate": 4.1837130959203394e-05, "Pretrain/Loss": 2.050506114959717, "Pretrain/Loss (Raw)": 2.213357448577881, "Pretrain/Step": 5471, "Pretrain/Step Time": 8.49150513857603} +{"Pretrain/Learning Rate": 4.183399268690756e-05, "Pretrain/Loss": 2.0533499717712402, "Pretrain/Loss (Raw)": 2.2903685569763184, "Pretrain/Step": 5472, "Pretrain/Step Time": 8.49021746404469} +{"Pretrain/Learning Rate": 4.183085392921542e-05, "Pretrain/Loss": 2.055479049682617, "Pretrain/Loss (Raw)": 2.0665884017944336, "Pretrain/Step": 5473, "Pretrain/Step Time": 8.484614785760641} +{"Pretrain/Learning Rate": 4.1827714686217465e-05, "Pretrain/Loss": 2.0552315711975098, "Pretrain/Loss (Raw)": 1.8884531259536743, "Pretrain/Step": 5474, "Pretrain/Step Time": 8.480759229511023} +{"Pretrain/Learning Rate": 4.1824574958004226e-05, "Pretrain/Loss": 2.054368734359741, "Pretrain/Loss (Raw)": 1.9824028015136719, "Pretrain/Step": 5475, "Pretrain/Step Time": 8.48010952025652} +{"Pretrain/Learning Rate": 4.182143474466622e-05, "Pretrain/Loss": 2.0537161827087402, "Pretrain/Loss (Raw)": 2.1105544567108154, "Pretrain/Step": 5476, "Pretrain/Step Time": 8.477720191702247} +{"Pretrain/Learning Rate": 4.181829404629401e-05, "Pretrain/Loss": 2.053154468536377, "Pretrain/Loss (Raw)": 1.9045408964157104, "Pretrain/Step": 5477, "Pretrain/Step Time": 8.482957178726792} +{"Pretrain/Learning Rate": 4.181515286297815e-05, "Pretrain/Loss": 2.051748752593994, "Pretrain/Loss (Raw)": 1.9895601272583008, "Pretrain/Step": 5478, "Pretrain/Step Time": 8.483158243820071} +{"Pretrain/Learning Rate": 4.1812011194809205e-05, "Pretrain/Loss": 2.0528483390808105, "Pretrain/Loss (Raw)": 2.050006628036499, "Pretrain/Step": 5479, "Pretrain/Step Time": 8.479647971689701} +{"Pretrain/Learning Rate": 4.1808869041877764e-05, "Pretrain/Loss": 2.0497822761535645, "Pretrain/Loss (Raw)": 1.7282437086105347, "Pretrain/Step": 5480, "Pretrain/Step Time": 8.481594873592257} +{"Pretrain/Learning Rate": 4.180572640427444e-05, "Pretrain/Loss": 2.048731803894043, "Pretrain/Loss (Raw)": 2.0805368423461914, "Pretrain/Step": 5481, "Pretrain/Step Time": 8.478303492069244} +{"Pretrain/Learning Rate": 4.180258328208985e-05, "Pretrain/Loss": 2.0469093322753906, "Pretrain/Loss (Raw)": 1.9264423847198486, "Pretrain/Step": 5482, "Pretrain/Step Time": 8.484772484749556} +{"Pretrain/Learning Rate": 4.1799439675414604e-05, "Pretrain/Loss": 2.0470502376556396, "Pretrain/Loss (Raw)": 2.095170259475708, "Pretrain/Step": 5483, "Pretrain/Step Time": 8.483804630115628} +{"Pretrain/Learning Rate": 4.1796295584339365e-05, "Pretrain/Loss": 2.0470669269561768, "Pretrain/Loss (Raw)": 2.1129772663116455, "Pretrain/Step": 5484, "Pretrain/Step Time": 8.482974652200937} +{"Pretrain/Learning Rate": 4.1793151008954776e-05, "Pretrain/Loss": 2.044811248779297, "Pretrain/Loss (Raw)": 1.9637911319732666, "Pretrain/Step": 5485, "Pretrain/Step Time": 8.481874275952578} +{"Pretrain/Learning Rate": 4.179000594935152e-05, "Pretrain/Loss": 2.0444626808166504, "Pretrain/Loss (Raw)": 1.943952202796936, "Pretrain/Step": 5486, "Pretrain/Step Time": 8.490717872977257} +{"Pretrain/Learning Rate": 4.1786860405620275e-05, "Pretrain/Loss": 2.0426156520843506, "Pretrain/Loss (Raw)": 1.7055860757827759, "Pretrain/Step": 5487, "Pretrain/Step Time": 8.489534160122275} +{"Pretrain/Learning Rate": 4.178371437785176e-05, "Pretrain/Loss": 2.0422170162200928, "Pretrain/Loss (Raw)": 1.9244407415390015, "Pretrain/Step": 5488, "Pretrain/Step Time": 8.485333297401667} +{"Pretrain/Learning Rate": 4.178056786613666e-05, "Pretrain/Loss": 2.041146755218506, "Pretrain/Loss (Raw)": 2.0451836585998535, "Pretrain/Step": 5489, "Pretrain/Step Time": 8.484218336641788} +{"Pretrain/Learning Rate": 4.177742087056571e-05, "Pretrain/Loss": 2.0401339530944824, "Pretrain/Loss (Raw)": 2.1611368656158447, "Pretrain/Step": 5490, "Pretrain/Step Time": 8.4872679207474} +{"Pretrain/Learning Rate": 4.177427339122966e-05, "Pretrain/Loss": 2.037282705307007, "Pretrain/Loss (Raw)": 1.7271878719329834, "Pretrain/Step": 5491, "Pretrain/Step Time": 8.4863569624722} +{"Pretrain/Learning Rate": 4.177112542821927e-05, "Pretrain/Loss": 2.0377910137176514, "Pretrain/Loss (Raw)": 2.0758588314056396, "Pretrain/Step": 5492, "Pretrain/Step Time": 8.486855942755938} +{"Pretrain/Learning Rate": 4.176797698162529e-05, "Pretrain/Loss": 2.0363879203796387, "Pretrain/Loss (Raw)": 2.0183141231536865, "Pretrain/Step": 5493, "Pretrain/Step Time": 8.487482361495495} +{"Pretrain/Learning Rate": 4.176482805153852e-05, "Pretrain/Loss": 2.0344038009643555, "Pretrain/Loss (Raw)": 1.7237606048583984, "Pretrain/Step": 5494, "Pretrain/Step Time": 8.484894236549735} +{"Pretrain/Learning Rate": 4.176167863804975e-05, "Pretrain/Loss": 2.0359981060028076, "Pretrain/Loss (Raw)": 2.094177007675171, "Pretrain/Step": 5495, "Pretrain/Step Time": 8.485064608976245} +{"Pretrain/Learning Rate": 4.1758528741249794e-05, "Pretrain/Loss": 2.034487247467041, "Pretrain/Loss (Raw)": 1.9814891815185547, "Pretrain/Step": 5496, "Pretrain/Step Time": 8.48327224701643} +{"Pretrain/Learning Rate": 4.175537836122948e-05, "Pretrain/Loss": 2.0337069034576416, "Pretrain/Loss (Raw)": 1.9589955806732178, "Pretrain/Step": 5497, "Pretrain/Step Time": 8.48478228598833} +{"Pretrain/Learning Rate": 4.1752227498079636e-05, "Pretrain/Loss": 2.0324583053588867, "Pretrain/Loss (Raw)": 1.970144271850586, "Pretrain/Step": 5498, "Pretrain/Step Time": 8.483102234080434} +{"Pretrain/Learning Rate": 4.1749076151891125e-05, "Pretrain/Loss": 2.0337982177734375, "Pretrain/Loss (Raw)": 2.234072208404541, "Pretrain/Step": 5499, "Pretrain/Step Time": 8.4830525778234} +{"Pretrain/Learning Rate": 4.174592432275481e-05, "Pretrain/Loss": 2.0332353115081787, "Pretrain/Loss (Raw)": 2.0781686305999756, "Pretrain/Step": 5500, "Pretrain/Step Time": 8.483057467266917} +{"Pretrain/Learning Rate": 4.1742772010761574e-05, "Pretrain/Loss": 2.033222198486328, "Pretrain/Loss (Raw)": 2.1308059692382812, "Pretrain/Step": 5501, "Pretrain/Step Time": 8.487343428656459} +{"Pretrain/Learning Rate": 4.17396192160023e-05, "Pretrain/Loss": 2.0353784561157227, "Pretrain/Loss (Raw)": 2.143045663833618, "Pretrain/Step": 5502, "Pretrain/Step Time": 8.491153687238693} +{"Pretrain/Learning Rate": 4.1736465938567915e-05, "Pretrain/Loss": 2.0367794036865234, "Pretrain/Loss (Raw)": 1.9863425493240356, "Pretrain/Step": 5503, "Pretrain/Step Time": 8.490779362618923} +{"Pretrain/Learning Rate": 4.1733312178549336e-05, "Pretrain/Loss": 2.036870002746582, "Pretrain/Loss (Raw)": 2.0874733924865723, "Pretrain/Step": 5504, "Pretrain/Step Time": 8.492823051288724} +{"Pretrain/Learning Rate": 4.1730157936037494e-05, "Pretrain/Loss": 2.036865711212158, "Pretrain/Loss (Raw)": 2.1042234897613525, "Pretrain/Step": 5505, "Pretrain/Step Time": 8.49381204135716} +{"Pretrain/Learning Rate": 4.172700321112334e-05, "Pretrain/Loss": 2.03590726852417, "Pretrain/Loss (Raw)": 1.888711929321289, "Pretrain/Step": 5506, "Pretrain/Step Time": 8.494688879698515} +{"Pretrain/Learning Rate": 4.172384800389784e-05, "Pretrain/Loss": 2.0358173847198486, "Pretrain/Loss (Raw)": 2.0359046459198, "Pretrain/Step": 5507, "Pretrain/Step Time": 8.49933572113514} +{"Pretrain/Learning Rate": 4.172069231445197e-05, "Pretrain/Loss": 2.036442756652832, "Pretrain/Loss (Raw)": 2.1967499256134033, "Pretrain/Step": 5508, "Pretrain/Step Time": 8.497267756611109} +{"Pretrain/Learning Rate": 4.171753614287673e-05, "Pretrain/Loss": 2.0340147018432617, "Pretrain/Loss (Raw)": 1.9497170448303223, "Pretrain/Step": 5509, "Pretrain/Step Time": 8.495938874781132} +{"Pretrain/Learning Rate": 4.171437948926312e-05, "Pretrain/Loss": 2.035017728805542, "Pretrain/Loss (Raw)": 2.2637393474578857, "Pretrain/Step": 5510, "Pretrain/Step Time": 8.493388241156936} +{"Pretrain/Learning Rate": 4.171122235370216e-05, "Pretrain/Loss": 2.032410144805908, "Pretrain/Loss (Raw)": 2.0591647624969482, "Pretrain/Step": 5511, "Pretrain/Step Time": 8.498316852375865} +{"Pretrain/Learning Rate": 4.170806473628488e-05, "Pretrain/Loss": 2.0330071449279785, "Pretrain/Loss (Raw)": 2.022883653640747, "Pretrain/Step": 5512, "Pretrain/Step Time": 8.491200575605035} +{"Pretrain/Learning Rate": 4.1704906637102334e-05, "Pretrain/Loss": 2.0327720642089844, "Pretrain/Loss (Raw)": 2.077923536300659, "Pretrain/Step": 5513, "Pretrain/Step Time": 8.494970008730888} +{"Pretrain/Learning Rate": 4.170174805624558e-05, "Pretrain/Loss": 2.033296585083008, "Pretrain/Loss (Raw)": 2.043862819671631, "Pretrain/Step": 5514, "Pretrain/Step Time": 8.496001157909632} +{"Pretrain/Learning Rate": 4.1698588993805706e-05, "Pretrain/Loss": 2.0316085815429688, "Pretrain/Loss (Raw)": 1.9744846820831299, "Pretrain/Step": 5515, "Pretrain/Step Time": 8.48804660141468} +{"Pretrain/Learning Rate": 4.169542944987378e-05, "Pretrain/Loss": 2.0310325622558594, "Pretrain/Loss (Raw)": 2.106497049331665, "Pretrain/Step": 5516, "Pretrain/Step Time": 8.49009881541133} +{"Pretrain/Learning Rate": 4.169226942454091e-05, "Pretrain/Loss": 2.0333518981933594, "Pretrain/Loss (Raw)": 2.356151819229126, "Pretrain/Step": 5517, "Pretrain/Step Time": 8.490774193778634} +{"Pretrain/Learning Rate": 4.1689108917898226e-05, "Pretrain/Loss": 2.0309677124023438, "Pretrain/Loss (Raw)": 1.97908616065979, "Pretrain/Step": 5518, "Pretrain/Step Time": 8.490932136774063} +{"Pretrain/Learning Rate": 4.168594793003685e-05, "Pretrain/Loss": 2.031221389770508, "Pretrain/Loss (Raw)": 2.062659502029419, "Pretrain/Step": 5519, "Pretrain/Step Time": 8.490161115303636} +{"Pretrain/Learning Rate": 4.168278646104793e-05, "Pretrain/Loss": 2.0313875675201416, "Pretrain/Loss (Raw)": 2.0562798976898193, "Pretrain/Step": 5520, "Pretrain/Step Time": 8.487578021362424} +{"Pretrain/Learning Rate": 4.167962451102262e-05, "Pretrain/Loss": 2.029297351837158, "Pretrain/Loss (Raw)": 1.9039428234100342, "Pretrain/Step": 5521, "Pretrain/Step Time": 8.484679469838738} +{"Pretrain/Learning Rate": 4.167646208005209e-05, "Pretrain/Loss": 2.0282177925109863, "Pretrain/Loss (Raw)": 1.8936564922332764, "Pretrain/Step": 5522, "Pretrain/Step Time": 8.487922022119164} +{"Pretrain/Learning Rate": 4.1673299168227544e-05, "Pretrain/Loss": 2.02740478515625, "Pretrain/Loss (Raw)": 2.031987428665161, "Pretrain/Step": 5523, "Pretrain/Step Time": 8.484820386394858} +{"Pretrain/Learning Rate": 4.167013577564016e-05, "Pretrain/Loss": 2.0256175994873047, "Pretrain/Loss (Raw)": 2.1018588542938232, "Pretrain/Step": 5524, "Pretrain/Step Time": 8.482041338458657} +{"Pretrain/Learning Rate": 4.166697190238117e-05, "Pretrain/Loss": 2.0231752395629883, "Pretrain/Loss (Raw)": 1.9703141450881958, "Pretrain/Step": 5525, "Pretrain/Step Time": 8.48751325532794} +{"Pretrain/Learning Rate": 4.1663807548541794e-05, "Pretrain/Loss": 2.022893190383911, "Pretrain/Loss (Raw)": 1.8261146545410156, "Pretrain/Step": 5526, "Pretrain/Step Time": 8.484498279169202} +{"Pretrain/Learning Rate": 4.166064271421327e-05, "Pretrain/Loss": 2.023461103439331, "Pretrain/Loss (Raw)": 1.9627975225448608, "Pretrain/Step": 5527, "Pretrain/Step Time": 8.482580706477165} +{"Pretrain/Learning Rate": 4.165747739948686e-05, "Pretrain/Loss": 2.025055408477783, "Pretrain/Loss (Raw)": 1.8742426633834839, "Pretrain/Step": 5528, "Pretrain/Step Time": 8.48338808491826} +{"Pretrain/Learning Rate": 4.165431160445383e-05, "Pretrain/Loss": 2.027010440826416, "Pretrain/Loss (Raw)": 2.117168664932251, "Pretrain/Step": 5529, "Pretrain/Step Time": 8.4827681183815} +{"Pretrain/Learning Rate": 4.1651145329205475e-05, "Pretrain/Loss": 2.0274276733398438, "Pretrain/Loss (Raw)": 1.999014139175415, "Pretrain/Step": 5530, "Pretrain/Step Time": 8.48325315117836} +{"Pretrain/Learning Rate": 4.164797857383308e-05, "Pretrain/Loss": 2.027678966522217, "Pretrain/Loss (Raw)": 1.8799655437469482, "Pretrain/Step": 5531, "Pretrain/Step Time": 8.479387059807777} +{"Pretrain/Learning Rate": 4.164481133842795e-05, "Pretrain/Loss": 2.026412010192871, "Pretrain/Loss (Raw)": 1.8953378200531006, "Pretrain/Step": 5532, "Pretrain/Step Time": 8.483169490471482} +{"Pretrain/Learning Rate": 4.164164362308143e-05, "Pretrain/Loss": 2.0260443687438965, "Pretrain/Loss (Raw)": 2.042152166366577, "Pretrain/Step": 5533, "Pretrain/Step Time": 8.479597486555576} +{"Pretrain/Learning Rate": 4.1638475427884835e-05, "Pretrain/Loss": 2.0259881019592285, "Pretrain/Loss (Raw)": 1.9531810283660889, "Pretrain/Step": 5534, "Pretrain/Step Time": 8.483169194310904} +{"Pretrain/Learning Rate": 4.163530675292954e-05, "Pretrain/Loss": 2.025249481201172, "Pretrain/Loss (Raw)": 2.104990005493164, "Pretrain/Step": 5535, "Pretrain/Step Time": 8.486945739015937} +{"Pretrain/Learning Rate": 4.16321375983069e-05, "Pretrain/Loss": 2.02616548538208, "Pretrain/Loss (Raw)": 2.06575870513916, "Pretrain/Step": 5536, "Pretrain/Step Time": 8.487732449546456} +{"Pretrain/Learning Rate": 4.162896796410829e-05, "Pretrain/Loss": 2.0239052772521973, "Pretrain/Loss (Raw)": 2.016226291656494, "Pretrain/Step": 5537, "Pretrain/Step Time": 8.482832442969084} +{"Pretrain/Learning Rate": 4.162579785042512e-05, "Pretrain/Loss": 2.0226478576660156, "Pretrain/Loss (Raw)": 2.073478937149048, "Pretrain/Step": 5538, "Pretrain/Step Time": 8.487486595287919} +{"Pretrain/Learning Rate": 4.1622627257348786e-05, "Pretrain/Loss": 2.021775245666504, "Pretrain/Loss (Raw)": 2.083139657974243, "Pretrain/Step": 5539, "Pretrain/Step Time": 8.483520055189729} +{"Pretrain/Learning Rate": 4.1619456184970715e-05, "Pretrain/Loss": 2.024923324584961, "Pretrain/Loss (Raw)": 2.2768216133117676, "Pretrain/Step": 5540, "Pretrain/Step Time": 8.483253272250295} +{"Pretrain/Learning Rate": 4.1616284633382344e-05, "Pretrain/Loss": 2.022580146789551, "Pretrain/Loss (Raw)": 1.924953818321228, "Pretrain/Step": 5541, "Pretrain/Step Time": 8.482318555936217} +{"Pretrain/Learning Rate": 4.1613112602675105e-05, "Pretrain/Loss": 2.0204391479492188, "Pretrain/Loss (Raw)": 1.9290748834609985, "Pretrain/Step": 5542, "Pretrain/Step Time": 8.483886314556003} +{"Pretrain/Learning Rate": 4.160994009294049e-05, "Pretrain/Loss": 2.0172975063323975, "Pretrain/Loss (Raw)": 1.7942754030227661, "Pretrain/Step": 5543, "Pretrain/Step Time": 8.481052290648222} +{"Pretrain/Learning Rate": 4.160676710426996e-05, "Pretrain/Loss": 2.016390323638916, "Pretrain/Loss (Raw)": 1.9813711643218994, "Pretrain/Step": 5544, "Pretrain/Step Time": 8.482480958104134} +{"Pretrain/Learning Rate": 4.1603593636755e-05, "Pretrain/Loss": 2.016834259033203, "Pretrain/Loss (Raw)": 1.9454216957092285, "Pretrain/Step": 5545, "Pretrain/Step Time": 8.482022240757942} +{"Pretrain/Learning Rate": 4.160041969048714e-05, "Pretrain/Loss": 2.0185861587524414, "Pretrain/Loss (Raw)": 2.0264179706573486, "Pretrain/Step": 5546, "Pretrain/Step Time": 8.479729041457176} +{"Pretrain/Learning Rate": 4.159724526555786e-05, "Pretrain/Loss": 2.018364906311035, "Pretrain/Loss (Raw)": 2.0165019035339355, "Pretrain/Step": 5547, "Pretrain/Step Time": 8.47181624546647} +{"Pretrain/Learning Rate": 4.1594070362058724e-05, "Pretrain/Loss": 2.0174691677093506, "Pretrain/Loss (Raw)": 2.0168159008026123, "Pretrain/Step": 5548, "Pretrain/Step Time": 8.475112097337842} +{"Pretrain/Learning Rate": 4.159089498008126e-05, "Pretrain/Loss": 2.0160398483276367, "Pretrain/Loss (Raw)": 1.9426023960113525, "Pretrain/Step": 5549, "Pretrain/Step Time": 8.480025701224804} +{"Pretrain/Learning Rate": 4.158771911971704e-05, "Pretrain/Loss": 2.0140814781188965, "Pretrain/Loss (Raw)": 1.8747665882110596, "Pretrain/Step": 5550, "Pretrain/Step Time": 8.480505844578147} +{"Pretrain/Learning Rate": 4.1584542781057635e-05, "Pretrain/Loss": 2.0176596641540527, "Pretrain/Loss (Raw)": 2.352173328399658, "Pretrain/Step": 5551, "Pretrain/Step Time": 8.480031033977866} +{"Pretrain/Learning Rate": 4.1581365964194625e-05, "Pretrain/Loss": 2.0123798847198486, "Pretrain/Loss (Raw)": 1.874467372894287, "Pretrain/Step": 5552, "Pretrain/Step Time": 8.483537202700973} +{"Pretrain/Learning Rate": 4.157818866921962e-05, "Pretrain/Loss": 2.015198230743408, "Pretrain/Loss (Raw)": 2.1641128063201904, "Pretrain/Step": 5553, "Pretrain/Step Time": 8.48669907823205} +{"Pretrain/Learning Rate": 4.157501089622423e-05, "Pretrain/Loss": 2.015808343887329, "Pretrain/Loss (Raw)": 1.927993655204773, "Pretrain/Step": 5554, "Pretrain/Step Time": 8.483156654983759} +{"Pretrain/Learning Rate": 4.157183264530009e-05, "Pretrain/Loss": 2.0203471183776855, "Pretrain/Loss (Raw)": 2.403728485107422, "Pretrain/Step": 5555, "Pretrain/Step Time": 8.4815657697618} +{"Pretrain/Learning Rate": 4.156865391653883e-05, "Pretrain/Loss": 2.0203919410705566, "Pretrain/Loss (Raw)": 1.9523512125015259, "Pretrain/Step": 5556, "Pretrain/Step Time": 8.48365337587893} +{"Pretrain/Learning Rate": 4.156547471003211e-05, "Pretrain/Loss": 2.017792224884033, "Pretrain/Loss (Raw)": 1.757095217704773, "Pretrain/Step": 5557, "Pretrain/Step Time": 8.484480621293187} +{"Pretrain/Learning Rate": 4.1562295025871625e-05, "Pretrain/Loss": 2.0180182456970215, "Pretrain/Loss (Raw)": 2.0099356174468994, "Pretrain/Step": 5558, "Pretrain/Step Time": 8.486698247492313} +{"Pretrain/Learning Rate": 4.155911486414902e-05, "Pretrain/Loss": 2.0193817615509033, "Pretrain/Loss (Raw)": 2.0209197998046875, "Pretrain/Step": 5559, "Pretrain/Step Time": 8.48660528473556} +{"Pretrain/Learning Rate": 4.155593422495602e-05, "Pretrain/Loss": 2.0211987495422363, "Pretrain/Loss (Raw)": 2.140726327896118, "Pretrain/Step": 5560, "Pretrain/Step Time": 8.485413113608956} +{"Pretrain/Learning Rate": 4.155275310838432e-05, "Pretrain/Loss": 2.0229249000549316, "Pretrain/Loss (Raw)": 2.160309076309204, "Pretrain/Step": 5561, "Pretrain/Step Time": 8.486677875742316} +{"Pretrain/Learning Rate": 4.1549571514525664e-05, "Pretrain/Loss": 2.0256707668304443, "Pretrain/Loss (Raw)": 2.0207011699676514, "Pretrain/Step": 5562, "Pretrain/Step Time": 8.485384298488498} +{"Pretrain/Learning Rate": 4.154638944347178e-05, "Pretrain/Loss": 2.025402545928955, "Pretrain/Loss (Raw)": 2.1376821994781494, "Pretrain/Step": 5563, "Pretrain/Step Time": 8.482632026076317} +{"Pretrain/Learning Rate": 4.154320689531441e-05, "Pretrain/Loss": 2.0251083374023438, "Pretrain/Loss (Raw)": 1.910244345664978, "Pretrain/Step": 5564, "Pretrain/Step Time": 8.477818191051483} +{"Pretrain/Learning Rate": 4.154002387014534e-05, "Pretrain/Loss": 2.024435043334961, "Pretrain/Loss (Raw)": 1.9653881788253784, "Pretrain/Step": 5565, "Pretrain/Step Time": 8.48241033218801} +{"Pretrain/Learning Rate": 4.153684036805634e-05, "Pretrain/Loss": 2.0242884159088135, "Pretrain/Loss (Raw)": 2.0720365047454834, "Pretrain/Step": 5566, "Pretrain/Step Time": 8.481816846877337} +{"Pretrain/Learning Rate": 4.15336563891392e-05, "Pretrain/Loss": 2.025358200073242, "Pretrain/Loss (Raw)": 2.0948374271392822, "Pretrain/Step": 5567, "Pretrain/Step Time": 8.485923485830426} +{"Pretrain/Learning Rate": 4.1530471933485737e-05, "Pretrain/Loss": 2.0272326469421387, "Pretrain/Loss (Raw)": 1.977129578590393, "Pretrain/Step": 5568, "Pretrain/Step Time": 8.479895737022161} +{"Pretrain/Learning Rate": 4.152728700118777e-05, "Pretrain/Loss": 2.030376672744751, "Pretrain/Loss (Raw)": 2.422405958175659, "Pretrain/Step": 5569, "Pretrain/Step Time": 8.482972972095013} +{"Pretrain/Learning Rate": 4.1524101592337134e-05, "Pretrain/Loss": 2.02966570854187, "Pretrain/Loss (Raw)": 1.9743175506591797, "Pretrain/Step": 5570, "Pretrain/Step Time": 8.481924559921026} +{"Pretrain/Learning Rate": 4.152091570702568e-05, "Pretrain/Loss": 2.02933931350708, "Pretrain/Loss (Raw)": 1.9934061765670776, "Pretrain/Step": 5571, "Pretrain/Step Time": 8.480369566008449} +{"Pretrain/Learning Rate": 4.1517729345345256e-05, "Pretrain/Loss": 2.031325578689575, "Pretrain/Loss (Raw)": 1.9990590810775757, "Pretrain/Step": 5572, "Pretrain/Step Time": 8.479837669059634} +{"Pretrain/Learning Rate": 4.1514542507387764e-05, "Pretrain/Loss": 2.0318589210510254, "Pretrain/Loss (Raw)": 2.1164748668670654, "Pretrain/Step": 5573, "Pretrain/Step Time": 8.477976206690073} +{"Pretrain/Learning Rate": 4.151135519324507e-05, "Pretrain/Loss": 2.0323739051818848, "Pretrain/Loss (Raw)": 2.035339832305908, "Pretrain/Step": 5574, "Pretrain/Step Time": 8.478065431118011} +{"Pretrain/Learning Rate": 4.15081674030091e-05, "Pretrain/Loss": 2.032371997833252, "Pretrain/Loss (Raw)": 2.1388661861419678, "Pretrain/Step": 5575, "Pretrain/Step Time": 8.481784364208579} +{"Pretrain/Learning Rate": 4.150497913677176e-05, "Pretrain/Loss": 2.0352768898010254, "Pretrain/Loss (Raw)": 2.28043270111084, "Pretrain/Step": 5576, "Pretrain/Step Time": 8.476641777902842} +{"Pretrain/Learning Rate": 4.1501790394624975e-05, "Pretrain/Loss": 2.034513473510742, "Pretrain/Loss (Raw)": 1.9103875160217285, "Pretrain/Step": 5577, "Pretrain/Step Time": 8.478317821398377} +{"Pretrain/Learning Rate": 4.1498601176660694e-05, "Pretrain/Loss": 2.035338878631592, "Pretrain/Loss (Raw)": 2.1391725540161133, "Pretrain/Step": 5578, "Pretrain/Step Time": 8.475943643599749} +{"Pretrain/Learning Rate": 4.149541148297088e-05, "Pretrain/Loss": 2.0347824096679688, "Pretrain/Loss (Raw)": 2.120950222015381, "Pretrain/Step": 5579, "Pretrain/Step Time": 8.473083388060331} +{"Pretrain/Learning Rate": 4.149222131364751e-05, "Pretrain/Loss": 2.0347537994384766, "Pretrain/Loss (Raw)": 2.177124261856079, "Pretrain/Step": 5580, "Pretrain/Step Time": 8.47809294424951} +{"Pretrain/Learning Rate": 4.1489030668782565e-05, "Pretrain/Loss": 2.0337021350860596, "Pretrain/Loss (Raw)": 1.8460029363632202, "Pretrain/Step": 5581, "Pretrain/Step Time": 8.472912827506661} +{"Pretrain/Learning Rate": 4.1485839548468045e-05, "Pretrain/Loss": 2.038250207901001, "Pretrain/Loss (Raw)": 2.5571951866149902, "Pretrain/Step": 5582, "Pretrain/Step Time": 8.478201691061258} +{"Pretrain/Learning Rate": 4.148264795279596e-05, "Pretrain/Loss": 2.037956953048706, "Pretrain/Loss (Raw)": 1.9314159154891968, "Pretrain/Step": 5583, "Pretrain/Step Time": 8.482788544148207} +{"Pretrain/Learning Rate": 4.147945588185834e-05, "Pretrain/Loss": 2.038321018218994, "Pretrain/Loss (Raw)": 2.128887176513672, "Pretrain/Step": 5584, "Pretrain/Step Time": 8.48393914476037} +{"Pretrain/Learning Rate": 4.1476263335747225e-05, "Pretrain/Loss": 2.0326530933380127, "Pretrain/Loss (Raw)": 1.7419108152389526, "Pretrain/Step": 5585, "Pretrain/Step Time": 8.482487816363573} +{"Pretrain/Learning Rate": 4.1473070314554676e-05, "Pretrain/Loss": 2.033095359802246, "Pretrain/Loss (Raw)": 2.0719926357269287, "Pretrain/Step": 5586, "Pretrain/Step Time": 8.480869140475988} +{"Pretrain/Learning Rate": 4.1469876818372756e-05, "Pretrain/Loss": 2.034891128540039, "Pretrain/Loss (Raw)": 2.3230984210968018, "Pretrain/Step": 5587, "Pretrain/Step Time": 8.480928964912891} +{"Pretrain/Learning Rate": 4.146668284729355e-05, "Pretrain/Loss": 2.038115978240967, "Pretrain/Loss (Raw)": 2.51068115234375, "Pretrain/Step": 5588, "Pretrain/Step Time": 8.481262605637312} +{"Pretrain/Learning Rate": 4.146348840140915e-05, "Pretrain/Loss": 2.0343122482299805, "Pretrain/Loss (Raw)": 1.586066484451294, "Pretrain/Step": 5589, "Pretrain/Step Time": 8.481869544833899} +{"Pretrain/Learning Rate": 4.146029348081167e-05, "Pretrain/Loss": 2.036334276199341, "Pretrain/Loss (Raw)": 2.233680486679077, "Pretrain/Step": 5590, "Pretrain/Step Time": 8.481183037161827} +{"Pretrain/Learning Rate": 4.145709808559323e-05, "Pretrain/Loss": 2.036166191101074, "Pretrain/Loss (Raw)": 2.0195155143737793, "Pretrain/Step": 5591, "Pretrain/Step Time": 8.478193273767829} +{"Pretrain/Learning Rate": 4.145390221584597e-05, "Pretrain/Loss": 2.038769483566284, "Pretrain/Loss (Raw)": 2.4975523948669434, "Pretrain/Step": 5592, "Pretrain/Step Time": 8.478806482627988} +{"Pretrain/Learning Rate": 4.145070587166203e-05, "Pretrain/Loss": 2.038389205932617, "Pretrain/Loss (Raw)": 1.9665815830230713, "Pretrain/Step": 5593, "Pretrain/Step Time": 8.480319947004318} +{"Pretrain/Learning Rate": 4.1447509053133595e-05, "Pretrain/Loss": 2.0382184982299805, "Pretrain/Loss (Raw)": 2.0777106285095215, "Pretrain/Step": 5594, "Pretrain/Step Time": 8.482554508373141} +{"Pretrain/Learning Rate": 4.144431176035283e-05, "Pretrain/Loss": 2.039802074432373, "Pretrain/Loss (Raw)": 2.381171703338623, "Pretrain/Step": 5595, "Pretrain/Step Time": 8.48188566043973} +{"Pretrain/Learning Rate": 4.1441113993411924e-05, "Pretrain/Loss": 2.04068660736084, "Pretrain/Loss (Raw)": 1.9399839639663696, "Pretrain/Step": 5596, "Pretrain/Step Time": 8.479763956740499} +{"Pretrain/Learning Rate": 4.143791575240309e-05, "Pretrain/Loss": 2.0403225421905518, "Pretrain/Loss (Raw)": 2.0274853706359863, "Pretrain/Step": 5597, "Pretrain/Step Time": 8.48120465874672} +{"Pretrain/Learning Rate": 4.143471703741853e-05, "Pretrain/Loss": 2.042736768722534, "Pretrain/Loss (Raw)": 2.2840960025787354, "Pretrain/Step": 5598, "Pretrain/Step Time": 8.485541505739093} +{"Pretrain/Learning Rate": 4.14315178485505e-05, "Pretrain/Loss": 2.0413310527801514, "Pretrain/Loss (Raw)": 2.033411979675293, "Pretrain/Step": 5599, "Pretrain/Step Time": 8.488932747393847} +{"Pretrain/Learning Rate": 4.142831818589125e-05, "Pretrain/Loss": 2.0379128456115723, "Pretrain/Loss (Raw)": 1.8528496026992798, "Pretrain/Step": 5600, "Pretrain/Step Time": 8.485814318060875} +{"Pretrain/Learning Rate": 4.142511804953301e-05, "Pretrain/Loss": 2.0378000736236572, "Pretrain/Loss (Raw)": 2.0521416664123535, "Pretrain/Step": 5601, "Pretrain/Step Time": 8.48950612358749} +{"Pretrain/Learning Rate": 4.142191743956807e-05, "Pretrain/Loss": 2.039041042327881, "Pretrain/Loss (Raw)": 2.047330141067505, "Pretrain/Step": 5602, "Pretrain/Step Time": 8.492403667420149} +{"Pretrain/Learning Rate": 4.1418716356088715e-05, "Pretrain/Loss": 2.040156602859497, "Pretrain/Loss (Raw)": 2.1251680850982666, "Pretrain/Step": 5603, "Pretrain/Step Time": 8.494125783443451} +{"Pretrain/Learning Rate": 4.1415514799187256e-05, "Pretrain/Loss": 2.039226531982422, "Pretrain/Loss (Raw)": 1.9915008544921875, "Pretrain/Step": 5604, "Pretrain/Step Time": 8.496929930523038} +{"Pretrain/Learning Rate": 4.1412312768955994e-05, "Pretrain/Loss": 2.0385324954986572, "Pretrain/Loss (Raw)": 1.8156991004943848, "Pretrain/Step": 5605, "Pretrain/Step Time": 8.493379356339574} +{"Pretrain/Learning Rate": 4.1409110265487275e-05, "Pretrain/Loss": 2.039426803588867, "Pretrain/Loss (Raw)": 2.104050397872925, "Pretrain/Step": 5606, "Pretrain/Step Time": 8.49521630257368} +{"Pretrain/Learning Rate": 4.140590728887341e-05, "Pretrain/Loss": 2.03849720954895, "Pretrain/Loss (Raw)": 1.9309988021850586, "Pretrain/Step": 5607, "Pretrain/Step Time": 8.494312128052115} +{"Pretrain/Learning Rate": 4.1402703839206794e-05, "Pretrain/Loss": 2.04103684425354, "Pretrain/Loss (Raw)": 2.0533182621002197, "Pretrain/Step": 5608, "Pretrain/Step Time": 8.492038201540709} +{"Pretrain/Learning Rate": 4.139949991657976e-05, "Pretrain/Loss": 2.0406484603881836, "Pretrain/Loss (Raw)": 2.0308234691619873, "Pretrain/Step": 5609, "Pretrain/Step Time": 8.492017425596714} +{"Pretrain/Learning Rate": 4.1396295521084717e-05, "Pretrain/Loss": 2.0416207313537598, "Pretrain/Loss (Raw)": 2.0509159564971924, "Pretrain/Step": 5610, "Pretrain/Step Time": 8.490156691521406} +{"Pretrain/Learning Rate": 4.139309065281404e-05, "Pretrain/Loss": 2.040848731994629, "Pretrain/Loss (Raw)": 1.9963611364364624, "Pretrain/Step": 5611, "Pretrain/Step Time": 8.488253638148308} +{"Pretrain/Learning Rate": 4.138988531186016e-05, "Pretrain/Loss": 2.041238784790039, "Pretrain/Loss (Raw)": 2.162869691848755, "Pretrain/Step": 5612, "Pretrain/Step Time": 8.489978877827525} +{"Pretrain/Learning Rate": 4.138667949831549e-05, "Pretrain/Loss": 2.0425071716308594, "Pretrain/Loss (Raw)": 2.126152276992798, "Pretrain/Step": 5613, "Pretrain/Step Time": 8.493840876966715} +{"Pretrain/Learning Rate": 4.138347321227247e-05, "Pretrain/Loss": 2.042144775390625, "Pretrain/Loss (Raw)": 1.897559404373169, "Pretrain/Step": 5614, "Pretrain/Step Time": 8.491630239412189} +{"Pretrain/Learning Rate": 4.1380266453823544e-05, "Pretrain/Loss": 2.044038772583008, "Pretrain/Loss (Raw)": 1.9479990005493164, "Pretrain/Step": 5615, "Pretrain/Step Time": 8.489706486463547} +{"Pretrain/Learning Rate": 4.137705922306119e-05, "Pretrain/Loss": 2.0447068214416504, "Pretrain/Loss (Raw)": 2.009962558746338, "Pretrain/Step": 5616, "Pretrain/Step Time": 8.493954068049788} +{"Pretrain/Learning Rate": 4.137385152007786e-05, "Pretrain/Loss": 2.0454611778259277, "Pretrain/Loss (Raw)": 2.141756296157837, "Pretrain/Step": 5617, "Pretrain/Step Time": 8.4912432115525} +{"Pretrain/Learning Rate": 4.1370643344966085e-05, "Pretrain/Loss": 2.043851852416992, "Pretrain/Loss (Raw)": 1.9551478624343872, "Pretrain/Step": 5618, "Pretrain/Step Time": 8.48746839351952} +{"Pretrain/Learning Rate": 4.136743469781834e-05, "Pretrain/Loss": 2.0479488372802734, "Pretrain/Loss (Raw)": 2.2516090869903564, "Pretrain/Step": 5619, "Pretrain/Step Time": 8.49287211149931} +{"Pretrain/Learning Rate": 4.136422557872716e-05, "Pretrain/Loss": 2.0463030338287354, "Pretrain/Loss (Raw)": 1.865168809890747, "Pretrain/Step": 5620, "Pretrain/Step Time": 8.490712650120258} +{"Pretrain/Learning Rate": 4.136101598778507e-05, "Pretrain/Loss": 2.046800136566162, "Pretrain/Loss (Raw)": 2.081979990005493, "Pretrain/Step": 5621, "Pretrain/Step Time": 8.4914829172194} +{"Pretrain/Learning Rate": 4.1357805925084614e-05, "Pretrain/Loss": 2.048354148864746, "Pretrain/Loss (Raw)": 1.9226552248001099, "Pretrain/Step": 5622, "Pretrain/Step Time": 8.492689544335008} +{"Pretrain/Learning Rate": 4.1354595390718353e-05, "Pretrain/Loss": 2.048001527786255, "Pretrain/Loss (Raw)": 2.0490305423736572, "Pretrain/Step": 5623, "Pretrain/Step Time": 8.492803437635303} +{"Pretrain/Learning Rate": 4.1351384384778867e-05, "Pretrain/Loss": 2.0468342304229736, "Pretrain/Loss (Raw)": 1.8320789337158203, "Pretrain/Step": 5624, "Pretrain/Step Time": 8.494792096316814} +{"Pretrain/Learning Rate": 4.134817290735874e-05, "Pretrain/Loss": 2.0467777252197266, "Pretrain/Loss (Raw)": 1.9517533779144287, "Pretrain/Step": 5625, "Pretrain/Step Time": 8.496950345113873} +{"Pretrain/Learning Rate": 4.134496095855057e-05, "Pretrain/Loss": 2.047497034072876, "Pretrain/Loss (Raw)": 2.062229871749878, "Pretrain/Step": 5626, "Pretrain/Step Time": 8.489430097863078} +{"Pretrain/Learning Rate": 4.1341748538446975e-05, "Pretrain/Loss": 2.0451536178588867, "Pretrain/Loss (Raw)": 1.9340883493423462, "Pretrain/Step": 5627, "Pretrain/Step Time": 8.496165053918958} +{"Pretrain/Learning Rate": 4.133853564714058e-05, "Pretrain/Loss": 2.0450339317321777, "Pretrain/Loss (Raw)": 2.0628654956817627, "Pretrain/Step": 5628, "Pretrain/Step Time": 8.498816786333919} +{"Pretrain/Learning Rate": 4.133532228472403e-05, "Pretrain/Loss": 2.0429162979125977, "Pretrain/Loss (Raw)": 1.8597629070281982, "Pretrain/Step": 5629, "Pretrain/Step Time": 8.495247127488256} +{"Pretrain/Learning Rate": 4.133210845128998e-05, "Pretrain/Loss": 2.0427372455596924, "Pretrain/Loss (Raw)": 2.1201083660125732, "Pretrain/Step": 5630, "Pretrain/Step Time": 8.495902173221111} +{"Pretrain/Learning Rate": 4.1328894146931085e-05, "Pretrain/Loss": 2.0444352626800537, "Pretrain/Loss (Raw)": 2.203688859939575, "Pretrain/Step": 5631, "Pretrain/Step Time": 8.499879958108068} +{"Pretrain/Learning Rate": 4.1325679371740045e-05, "Pretrain/Loss": 2.0454108715057373, "Pretrain/Loss (Raw)": 2.2123782634735107, "Pretrain/Step": 5632, "Pretrain/Step Time": 8.495414013043046} +{"Pretrain/Learning Rate": 4.1322464125809544e-05, "Pretrain/Loss": 2.0445542335510254, "Pretrain/Loss (Raw)": 1.9945803880691528, "Pretrain/Step": 5633, "Pretrain/Step Time": 8.496619582176208} +{"Pretrain/Learning Rate": 4.13192484092323e-05, "Pretrain/Loss": 2.0455563068389893, "Pretrain/Loss (Raw)": 2.0169644355773926, "Pretrain/Step": 5634, "Pretrain/Step Time": 8.496445981785655} +{"Pretrain/Learning Rate": 4.131603222210104e-05, "Pretrain/Loss": 2.0445401668548584, "Pretrain/Loss (Raw)": 1.9058284759521484, "Pretrain/Step": 5635, "Pretrain/Step Time": 8.489384623244405} +{"Pretrain/Learning Rate": 4.131281556450849e-05, "Pretrain/Loss": 2.0431296825408936, "Pretrain/Loss (Raw)": 2.016207218170166, "Pretrain/Step": 5636, "Pretrain/Step Time": 8.491148814558983} +{"Pretrain/Learning Rate": 4.13095984365474e-05, "Pretrain/Loss": 2.0435709953308105, "Pretrain/Loss (Raw)": 2.0062062740325928, "Pretrain/Step": 5637, "Pretrain/Step Time": 8.493487594649196} +{"Pretrain/Learning Rate": 4.1306380838310534e-05, "Pretrain/Loss": 2.041682481765747, "Pretrain/Loss (Raw)": 2.0220212936401367, "Pretrain/Step": 5638, "Pretrain/Step Time": 8.494672995060682} +{"Pretrain/Learning Rate": 4.130316276989068e-05, "Pretrain/Loss": 2.040372371673584, "Pretrain/Loss (Raw)": 1.8914598226547241, "Pretrain/Step": 5639, "Pretrain/Step Time": 8.489903911948204} +{"Pretrain/Learning Rate": 4.129994423138062e-05, "Pretrain/Loss": 2.0423638820648193, "Pretrain/Loss (Raw)": 2.2778103351593018, "Pretrain/Step": 5640, "Pretrain/Step Time": 8.489277275279164} +{"Pretrain/Learning Rate": 4.129672522287315e-05, "Pretrain/Loss": 2.0433106422424316, "Pretrain/Loss (Raw)": 2.1990864276885986, "Pretrain/Step": 5641, "Pretrain/Step Time": 8.491275114938617} +{"Pretrain/Learning Rate": 4.12935057444611e-05, "Pretrain/Loss": 2.041748285293579, "Pretrain/Loss (Raw)": 1.8438879251480103, "Pretrain/Step": 5642, "Pretrain/Step Time": 8.493877151980996} +{"Pretrain/Learning Rate": 4.1290285796237295e-05, "Pretrain/Loss": 2.041625499725342, "Pretrain/Loss (Raw)": 1.9587773084640503, "Pretrain/Step": 5643, "Pretrain/Step Time": 8.495670814067125} +{"Pretrain/Learning Rate": 4.128706537829459e-05, "Pretrain/Loss": 2.040316104888916, "Pretrain/Loss (Raw)": 1.9388848543167114, "Pretrain/Step": 5644, "Pretrain/Step Time": 8.493675181642175} +{"Pretrain/Learning Rate": 4.1283844490725834e-05, "Pretrain/Loss": 2.0381643772125244, "Pretrain/Loss (Raw)": 2.0807344913482666, "Pretrain/Step": 5645, "Pretrain/Step Time": 8.493503086268902} +{"Pretrain/Learning Rate": 4.1280623133623895e-05, "Pretrain/Loss": 2.038094997406006, "Pretrain/Loss (Raw)": 1.9701862335205078, "Pretrain/Step": 5646, "Pretrain/Step Time": 8.493407923728228} +{"Pretrain/Learning Rate": 4.127740130708167e-05, "Pretrain/Loss": 2.037229537963867, "Pretrain/Loss (Raw)": 1.951870322227478, "Pretrain/Step": 5647, "Pretrain/Step Time": 8.497419500723481} +{"Pretrain/Learning Rate": 4.127417901119205e-05, "Pretrain/Loss": 2.038116931915283, "Pretrain/Loss (Raw)": 2.169912576675415, "Pretrain/Step": 5648, "Pretrain/Step Time": 8.500779511407018} +{"Pretrain/Learning Rate": 4.127095624604795e-05, "Pretrain/Loss": 2.0395712852478027, "Pretrain/Loss (Raw)": 2.0900778770446777, "Pretrain/Step": 5649, "Pretrain/Step Time": 8.50083433277905} +{"Pretrain/Learning Rate": 4.1267733011742304e-05, "Pretrain/Loss": 2.0409200191497803, "Pretrain/Loss (Raw)": 2.0663065910339355, "Pretrain/Step": 5650, "Pretrain/Step Time": 8.500634081661701} +{"Pretrain/Learning Rate": 4.1264509308368046e-05, "Pretrain/Loss": 2.0414371490478516, "Pretrain/Loss (Raw)": 2.0981650352478027, "Pretrain/Step": 5651, "Pretrain/Step Time": 8.501323753967881} +{"Pretrain/Learning Rate": 4.1261285136018126e-05, "Pretrain/Loss": 2.0408213138580322, "Pretrain/Loss (Raw)": 2.023031711578369, "Pretrain/Step": 5652, "Pretrain/Step Time": 8.50251823849976} +{"Pretrain/Learning Rate": 4.125806049478551e-05, "Pretrain/Loss": 2.0396909713745117, "Pretrain/Loss (Raw)": 1.8256527185440063, "Pretrain/Step": 5653, "Pretrain/Step Time": 8.496696341782808} +{"Pretrain/Learning Rate": 4.125483538476318e-05, "Pretrain/Loss": 2.0413737297058105, "Pretrain/Loss (Raw)": 2.041506290435791, "Pretrain/Step": 5654, "Pretrain/Step Time": 8.502628928050399} +{"Pretrain/Learning Rate": 4.125160980604413e-05, "Pretrain/Loss": 2.041229724884033, "Pretrain/Loss (Raw)": 1.944351315498352, "Pretrain/Step": 5655, "Pretrain/Step Time": 8.500384975224733} +{"Pretrain/Learning Rate": 4.124838375872136e-05, "Pretrain/Loss": 2.0442392826080322, "Pretrain/Loss (Raw)": 2.259472370147705, "Pretrain/Step": 5656, "Pretrain/Step Time": 8.500968648120761} +{"Pretrain/Learning Rate": 4.124515724288791e-05, "Pretrain/Loss": 2.048287868499756, "Pretrain/Loss (Raw)": 2.6353838443756104, "Pretrain/Step": 5657, "Pretrain/Step Time": 8.494506657123566} +{"Pretrain/Learning Rate": 4.1241930258636805e-05, "Pretrain/Loss": 2.0482091903686523, "Pretrain/Loss (Raw)": 1.988965392112732, "Pretrain/Step": 5658, "Pretrain/Step Time": 8.49886878579855} +{"Pretrain/Learning Rate": 4.123870280606109e-05, "Pretrain/Loss": 2.0505614280700684, "Pretrain/Loss (Raw)": 2.1810524463653564, "Pretrain/Step": 5659, "Pretrain/Step Time": 8.498400516808033} +{"Pretrain/Learning Rate": 4.123547488525382e-05, "Pretrain/Loss": 2.0523343086242676, "Pretrain/Loss (Raw)": 2.1222620010375977, "Pretrain/Step": 5660, "Pretrain/Step Time": 8.497699992731214} +{"Pretrain/Learning Rate": 4.123224649630808e-05, "Pretrain/Loss": 2.052119731903076, "Pretrain/Loss (Raw)": 2.0146656036376953, "Pretrain/Step": 5661, "Pretrain/Step Time": 8.492365593090653} +{"Pretrain/Learning Rate": 4.1229017639316956e-05, "Pretrain/Loss": 2.053534746170044, "Pretrain/Loss (Raw)": 2.1343088150024414, "Pretrain/Step": 5662, "Pretrain/Step Time": 8.490869130939245} +{"Pretrain/Learning Rate": 4.1225788314373556e-05, "Pretrain/Loss": 2.05316162109375, "Pretrain/Loss (Raw)": 2.0572400093078613, "Pretrain/Step": 5663, "Pretrain/Step Time": 8.49433228559792} +{"Pretrain/Learning Rate": 4.122255852157098e-05, "Pretrain/Loss": 2.0541298389434814, "Pretrain/Loss (Raw)": 2.189681053161621, "Pretrain/Step": 5664, "Pretrain/Step Time": 8.491676740348339} +{"Pretrain/Learning Rate": 4.1219328261002364e-05, "Pretrain/Loss": 2.055544853210449, "Pretrain/Loss (Raw)": 2.1973652839660645, "Pretrain/Step": 5665, "Pretrain/Step Time": 8.497745456174016} +{"Pretrain/Learning Rate": 4.121609753276085e-05, "Pretrain/Loss": 2.055009365081787, "Pretrain/Loss (Raw)": 2.004897356033325, "Pretrain/Step": 5666, "Pretrain/Step Time": 8.495855621993542} +{"Pretrain/Learning Rate": 4.12128663369396e-05, "Pretrain/Loss": 2.0508365631103516, "Pretrain/Loss (Raw)": 1.5490258932113647, "Pretrain/Step": 5667, "Pretrain/Step Time": 8.49617162719369} +{"Pretrain/Learning Rate": 4.120963467363178e-05, "Pretrain/Loss": 2.0475704669952393, "Pretrain/Loss (Raw)": 1.8587665557861328, "Pretrain/Step": 5668, "Pretrain/Step Time": 8.495688425377011} +{"Pretrain/Learning Rate": 4.1206402542930566e-05, "Pretrain/Loss": 2.0489859580993652, "Pretrain/Loss (Raw)": 2.1061463356018066, "Pretrain/Step": 5669, "Pretrain/Step Time": 8.49159430898726} +{"Pretrain/Learning Rate": 4.120316994492917e-05, "Pretrain/Loss": 2.0495996475219727, "Pretrain/Loss (Raw)": 2.007645606994629, "Pretrain/Step": 5670, "Pretrain/Step Time": 8.495515696704388} +{"Pretrain/Learning Rate": 4.119993687972078e-05, "Pretrain/Loss": 2.052048683166504, "Pretrain/Loss (Raw)": 2.107725143432617, "Pretrain/Step": 5671, "Pretrain/Step Time": 8.494889387860894} +{"Pretrain/Learning Rate": 4.119670334739864e-05, "Pretrain/Loss": 2.0528223514556885, "Pretrain/Loss (Raw)": 2.080413818359375, "Pretrain/Step": 5672, "Pretrain/Step Time": 8.495079204440117} +{"Pretrain/Learning Rate": 4.119346934805597e-05, "Pretrain/Loss": 2.0517067909240723, "Pretrain/Loss (Raw)": 1.8026372194290161, "Pretrain/Step": 5673, "Pretrain/Step Time": 8.493568738922477} +{"Pretrain/Learning Rate": 4.119023488178602e-05, "Pretrain/Loss": 2.0520520210266113, "Pretrain/Loss (Raw)": 2.0705721378326416, "Pretrain/Step": 5674, "Pretrain/Step Time": 8.498958807438612} +{"Pretrain/Learning Rate": 4.118699994868207e-05, "Pretrain/Loss": 2.0519888401031494, "Pretrain/Loss (Raw)": 2.008427381515503, "Pretrain/Step": 5675, "Pretrain/Step Time": 8.4981648940593} +{"Pretrain/Learning Rate": 4.118376454883739e-05, "Pretrain/Loss": 2.055591583251953, "Pretrain/Loss (Raw)": 2.4779722690582275, "Pretrain/Step": 5676, "Pretrain/Step Time": 8.496282074600458} +{"Pretrain/Learning Rate": 4.118052868234526e-05, "Pretrain/Loss": 2.054298162460327, "Pretrain/Loss (Raw)": 1.7770335674285889, "Pretrain/Step": 5677, "Pretrain/Step Time": 8.494898308068514} +{"Pretrain/Learning Rate": 4.1177292349299e-05, "Pretrain/Loss": 2.0553359985351562, "Pretrain/Loss (Raw)": 2.007636785507202, "Pretrain/Step": 5678, "Pretrain/Step Time": 8.496318263933063} +{"Pretrain/Learning Rate": 4.1174055549791915e-05, "Pretrain/Loss": 2.0542917251586914, "Pretrain/Loss (Raw)": 2.2184762954711914, "Pretrain/Step": 5679, "Pretrain/Step Time": 8.49539689347148} +{"Pretrain/Learning Rate": 4.117081828391733e-05, "Pretrain/Loss": 2.054565191268921, "Pretrain/Loss (Raw)": 1.9094812870025635, "Pretrain/Step": 5680, "Pretrain/Step Time": 8.494296124204993} +{"Pretrain/Learning Rate": 4.116758055176862e-05, "Pretrain/Loss": 2.054456949234009, "Pretrain/Loss (Raw)": 2.150261640548706, "Pretrain/Step": 5681, "Pretrain/Step Time": 8.491427537053823} +{"Pretrain/Learning Rate": 4.116434235343911e-05, "Pretrain/Loss": 2.0537028312683105, "Pretrain/Loss (Raw)": 1.831470012664795, "Pretrain/Step": 5682, "Pretrain/Step Time": 8.497713435441256} +{"Pretrain/Learning Rate": 4.1161103689022186e-05, "Pretrain/Loss": 2.0496439933776855, "Pretrain/Loss (Raw)": 1.8842183351516724, "Pretrain/Step": 5683, "Pretrain/Step Time": 8.496971637010574} +{"Pretrain/Learning Rate": 4.115786455861124e-05, "Pretrain/Loss": 2.0496420860290527, "Pretrain/Loss (Raw)": 1.9520986080169678, "Pretrain/Step": 5684, "Pretrain/Step Time": 8.496317148208618} +{"Pretrain/Learning Rate": 4.1154624962299637e-05, "Pretrain/Loss": 2.052517890930176, "Pretrain/Loss (Raw)": 2.125194787979126, "Pretrain/Step": 5685, "Pretrain/Step Time": 8.494737720116973} +{"Pretrain/Learning Rate": 4.1151384900180826e-05, "Pretrain/Loss": 2.0554347038269043, "Pretrain/Loss (Raw)": 2.3832976818084717, "Pretrain/Step": 5686, "Pretrain/Step Time": 8.491109618917108} +{"Pretrain/Learning Rate": 4.1148144372348216e-05, "Pretrain/Loss": 2.0554962158203125, "Pretrain/Loss (Raw)": 2.028783082962036, "Pretrain/Step": 5687, "Pretrain/Step Time": 8.489683194085956} +{"Pretrain/Learning Rate": 4.114490337889525e-05, "Pretrain/Loss": 2.0537354946136475, "Pretrain/Loss (Raw)": 1.9153549671173096, "Pretrain/Step": 5688, "Pretrain/Step Time": 8.49129786528647} +{"Pretrain/Learning Rate": 4.114166191991537e-05, "Pretrain/Loss": 2.0537261962890625, "Pretrain/Loss (Raw)": 2.159095048904419, "Pretrain/Step": 5689, "Pretrain/Step Time": 8.492157693952322} +{"Pretrain/Learning Rate": 4.113841999550205e-05, "Pretrain/Loss": 2.0524115562438965, "Pretrain/Loss (Raw)": 1.8524281978607178, "Pretrain/Step": 5690, "Pretrain/Step Time": 8.49547348357737} +{"Pretrain/Learning Rate": 4.1135177605748764e-05, "Pretrain/Loss": 2.052656650543213, "Pretrain/Loss (Raw)": 2.1690633296966553, "Pretrain/Step": 5691, "Pretrain/Step Time": 8.494294729083776} +{"Pretrain/Learning Rate": 4.1131934750749016e-05, "Pretrain/Loss": 2.053562641143799, "Pretrain/Loss (Raw)": 2.026195764541626, "Pretrain/Step": 5692, "Pretrain/Step Time": 8.493840971961617} +{"Pretrain/Learning Rate": 4.112869143059629e-05, "Pretrain/Loss": 2.0545060634613037, "Pretrain/Loss (Raw)": 2.0861403942108154, "Pretrain/Step": 5693, "Pretrain/Step Time": 8.495111983269453} +{"Pretrain/Learning Rate": 4.1125447645384116e-05, "Pretrain/Loss": 2.0530614852905273, "Pretrain/Loss (Raw)": 1.8871654272079468, "Pretrain/Step": 5694, "Pretrain/Step Time": 8.496424106881022} +{"Pretrain/Learning Rate": 4.1122203395206036e-05, "Pretrain/Loss": 2.050171136856079, "Pretrain/Loss (Raw)": 1.7248603105545044, "Pretrain/Step": 5695, "Pretrain/Step Time": 8.49335229024291} +{"Pretrain/Learning Rate": 4.111895868015559e-05, "Pretrain/Loss": 2.0508482456207275, "Pretrain/Loss (Raw)": 2.0637993812561035, "Pretrain/Step": 5696, "Pretrain/Step Time": 8.496265282854438} +{"Pretrain/Learning Rate": 4.111571350032632e-05, "Pretrain/Loss": 2.047309160232544, "Pretrain/Loss (Raw)": 1.9693880081176758, "Pretrain/Step": 5697, "Pretrain/Step Time": 8.497511129826307} +{"Pretrain/Learning Rate": 4.111246785581181e-05, "Pretrain/Loss": 2.04691743850708, "Pretrain/Loss (Raw)": 1.9242055416107178, "Pretrain/Step": 5698, "Pretrain/Step Time": 8.497055873274803} +{"Pretrain/Learning Rate": 4.110922174670566e-05, "Pretrain/Loss": 2.0481629371643066, "Pretrain/Loss (Raw)": 2.1527998447418213, "Pretrain/Step": 5699, "Pretrain/Step Time": 8.496283521875739} +{"Pretrain/Learning Rate": 4.110597517310145e-05, "Pretrain/Loss": 2.0478217601776123, "Pretrain/Loss (Raw)": 1.9554001092910767, "Pretrain/Step": 5700, "Pretrain/Step Time": 8.491355517879128} +{"Pretrain/Learning Rate": 4.11027281350928e-05, "Pretrain/Loss": 2.0486817359924316, "Pretrain/Loss (Raw)": 2.2265515327453613, "Pretrain/Step": 5701, "Pretrain/Step Time": 8.496132418513298} +{"Pretrain/Learning Rate": 4.109948063277335e-05, "Pretrain/Loss": 2.0472733974456787, "Pretrain/Loss (Raw)": 1.8550972938537598, "Pretrain/Step": 5702, "Pretrain/Step Time": 8.49296503700316} +{"Pretrain/Learning Rate": 4.1096232666236715e-05, "Pretrain/Loss": 2.0470070838928223, "Pretrain/Loss (Raw)": 2.1047630310058594, "Pretrain/Step": 5703, "Pretrain/Step Time": 8.49333692342043} +{"Pretrain/Learning Rate": 4.109298423557655e-05, "Pretrain/Loss": 2.045116662979126, "Pretrain/Loss (Raw)": 2.038442611694336, "Pretrain/Step": 5704, "Pretrain/Step Time": 8.494418511167169} +{"Pretrain/Learning Rate": 4.1089735340886536e-05, "Pretrain/Loss": 2.0454273223876953, "Pretrain/Loss (Raw)": 1.950140357017517, "Pretrain/Step": 5705, "Pretrain/Step Time": 8.493721421808004} +{"Pretrain/Learning Rate": 4.108648598226035e-05, "Pretrain/Loss": 2.044994354248047, "Pretrain/Loss (Raw)": 2.0837621688842773, "Pretrain/Step": 5706, "Pretrain/Step Time": 8.493539677932858} +{"Pretrain/Learning Rate": 4.108323615979168e-05, "Pretrain/Loss": 2.0478453636169434, "Pretrain/Loss (Raw)": 2.485884666442871, "Pretrain/Step": 5707, "Pretrain/Step Time": 8.496503250673413} +{"Pretrain/Learning Rate": 4.107998587357423e-05, "Pretrain/Loss": 2.047879695892334, "Pretrain/Loss (Raw)": 2.1815176010131836, "Pretrain/Step": 5708, "Pretrain/Step Time": 8.493390448391438} +{"Pretrain/Learning Rate": 4.107673512370172e-05, "Pretrain/Loss": 2.048616886138916, "Pretrain/Loss (Raw)": 1.940353274345398, "Pretrain/Step": 5709, "Pretrain/Step Time": 8.494066897779703} +{"Pretrain/Learning Rate": 4.107348391026789e-05, "Pretrain/Loss": 2.042832374572754, "Pretrain/Loss (Raw)": 1.8167954683303833, "Pretrain/Step": 5710, "Pretrain/Step Time": 8.486877487972379} +{"Pretrain/Learning Rate": 4.107023223336649e-05, "Pretrain/Loss": 2.043919324874878, "Pretrain/Loss (Raw)": 2.0705580711364746, "Pretrain/Step": 5711, "Pretrain/Step Time": 8.48634871467948} +{"Pretrain/Learning Rate": 4.1066980093091256e-05, "Pretrain/Loss": 2.043478488922119, "Pretrain/Loss (Raw)": 2.072457790374756, "Pretrain/Step": 5712, "Pretrain/Step Time": 8.486982382833958} +{"Pretrain/Learning Rate": 4.106372748953599e-05, "Pretrain/Loss": 2.0450754165649414, "Pretrain/Loss (Raw)": 1.9462933540344238, "Pretrain/Step": 5713, "Pretrain/Step Time": 8.48790768161416} +{"Pretrain/Learning Rate": 4.106047442279446e-05, "Pretrain/Loss": 2.0445218086242676, "Pretrain/Loss (Raw)": 2.001154661178589, "Pretrain/Step": 5714, "Pretrain/Step Time": 8.48749454319477} +{"Pretrain/Learning Rate": 4.105722089296048e-05, "Pretrain/Loss": 2.0425896644592285, "Pretrain/Loss (Raw)": 2.075766086578369, "Pretrain/Step": 5715, "Pretrain/Step Time": 8.489178735762835} +{"Pretrain/Learning Rate": 4.105396690012784e-05, "Pretrain/Loss": 2.0393247604370117, "Pretrain/Loss (Raw)": 2.0927789211273193, "Pretrain/Step": 5716, "Pretrain/Step Time": 8.489148704335093} +{"Pretrain/Learning Rate": 4.105071244439039e-05, "Pretrain/Loss": 2.0423378944396973, "Pretrain/Loss (Raw)": 1.971750020980835, "Pretrain/Step": 5717, "Pretrain/Step Time": 8.487772973254323} +{"Pretrain/Learning Rate": 4.104745752584197e-05, "Pretrain/Loss": 2.0393617153167725, "Pretrain/Loss (Raw)": 1.852750539779663, "Pretrain/Step": 5718, "Pretrain/Step Time": 8.486045081168413} +{"Pretrain/Learning Rate": 4.1044202144576416e-05, "Pretrain/Loss": 2.04025936126709, "Pretrain/Loss (Raw)": 2.134397268295288, "Pretrain/Step": 5719, "Pretrain/Step Time": 8.488236613571644} +{"Pretrain/Learning Rate": 4.1040946300687604e-05, "Pretrain/Loss": 2.0346429347991943, "Pretrain/Loss (Raw)": 1.7786482572555542, "Pretrain/Step": 5720, "Pretrain/Step Time": 8.485570879653096} +{"Pretrain/Learning Rate": 4.103768999426941e-05, "Pretrain/Loss": 2.0367817878723145, "Pretrain/Loss (Raw)": 2.240360975265503, "Pretrain/Step": 5721, "Pretrain/Step Time": 8.487120846286416} +{"Pretrain/Learning Rate": 4.103443322541574e-05, "Pretrain/Loss": 2.0338242053985596, "Pretrain/Loss (Raw)": 1.6991145610809326, "Pretrain/Step": 5722, "Pretrain/Step Time": 8.482693176716566} +{"Pretrain/Learning Rate": 4.103117599422049e-05, "Pretrain/Loss": 2.031385898590088, "Pretrain/Loss (Raw)": 2.0690712928771973, "Pretrain/Step": 5723, "Pretrain/Step Time": 8.484602658078074} +{"Pretrain/Learning Rate": 4.102791830077758e-05, "Pretrain/Loss": 2.031491279602051, "Pretrain/Loss (Raw)": 1.9534980058670044, "Pretrain/Step": 5724, "Pretrain/Step Time": 8.48698647506535} +{"Pretrain/Learning Rate": 4.102466014518094e-05, "Pretrain/Loss": 2.033045768737793, "Pretrain/Loss (Raw)": 2.2264297008514404, "Pretrain/Step": 5725, "Pretrain/Step Time": 8.481537330895662} +{"Pretrain/Learning Rate": 4.1021401527524526e-05, "Pretrain/Loss": 2.0308127403259277, "Pretrain/Loss (Raw)": 1.998315691947937, "Pretrain/Step": 5726, "Pretrain/Step Time": 8.484904559329152} +{"Pretrain/Learning Rate": 4.1018142447902296e-05, "Pretrain/Loss": 2.0307369232177734, "Pretrain/Loss (Raw)": 2.023695468902588, "Pretrain/Step": 5727, "Pretrain/Step Time": 8.480909749865532} +{"Pretrain/Learning Rate": 4.101488290640821e-05, "Pretrain/Loss": 2.031125545501709, "Pretrain/Loss (Raw)": 1.9025944471359253, "Pretrain/Step": 5728, "Pretrain/Step Time": 8.484063552692533} +{"Pretrain/Learning Rate": 4.1011622903136275e-05, "Pretrain/Loss": 2.031686544418335, "Pretrain/Loss (Raw)": 2.1239399909973145, "Pretrain/Step": 5729, "Pretrain/Step Time": 8.485496260225773} +{"Pretrain/Learning Rate": 4.100836243818048e-05, "Pretrain/Loss": 2.031245231628418, "Pretrain/Loss (Raw)": 1.9908533096313477, "Pretrain/Step": 5730, "Pretrain/Step Time": 8.485307231545448} +{"Pretrain/Learning Rate": 4.100510151163484e-05, "Pretrain/Loss": 2.0340585708618164, "Pretrain/Loss (Raw)": 2.4852590560913086, "Pretrain/Step": 5731, "Pretrain/Step Time": 8.490936310961843} +{"Pretrain/Learning Rate": 4.100184012359337e-05, "Pretrain/Loss": 2.0340144634246826, "Pretrain/Loss (Raw)": 1.9858732223510742, "Pretrain/Step": 5732, "Pretrain/Step Time": 8.485699879005551} +{"Pretrain/Learning Rate": 4.099857827415013e-05, "Pretrain/Loss": 2.0360538959503174, "Pretrain/Loss (Raw)": 2.0767319202423096, "Pretrain/Step": 5733, "Pretrain/Step Time": 8.486950038000941} +{"Pretrain/Learning Rate": 4.099531596339916e-05, "Pretrain/Loss": 2.0361199378967285, "Pretrain/Loss (Raw)": 2.1125259399414062, "Pretrain/Step": 5734, "Pretrain/Step Time": 8.484086165204644} +{"Pretrain/Learning Rate": 4.099205319143453e-05, "Pretrain/Loss": 2.037259101867676, "Pretrain/Loss (Raw)": 2.0767970085144043, "Pretrain/Step": 5735, "Pretrain/Step Time": 8.483347879722714} +{"Pretrain/Learning Rate": 4.098878995835033e-05, "Pretrain/Loss": 2.037566900253296, "Pretrain/Loss (Raw)": 2.09271240234375, "Pretrain/Step": 5736, "Pretrain/Step Time": 8.489551709964871} +{"Pretrain/Learning Rate": 4.0985526264240636e-05, "Pretrain/Loss": 2.0372400283813477, "Pretrain/Loss (Raw)": 1.9889795780181885, "Pretrain/Step": 5737, "Pretrain/Step Time": 8.486465847119689} +{"Pretrain/Learning Rate": 4.0982262109199554e-05, "Pretrain/Loss": 2.0364418029785156, "Pretrain/Loss (Raw)": 1.948729395866394, "Pretrain/Step": 5738, "Pretrain/Step Time": 8.486408980563283} +{"Pretrain/Learning Rate": 4.097899749332122e-05, "Pretrain/Loss": 2.0411338806152344, "Pretrain/Loss (Raw)": 2.596970319747925, "Pretrain/Step": 5739, "Pretrain/Step Time": 8.488288583233953} +{"Pretrain/Learning Rate": 4.097573241669975e-05, "Pretrain/Loss": 2.040160655975342, "Pretrain/Loss (Raw)": 2.0382866859436035, "Pretrain/Step": 5740, "Pretrain/Step Time": 8.486592315137386} +{"Pretrain/Learning Rate": 4.09724668794293e-05, "Pretrain/Loss": 2.0377612113952637, "Pretrain/Loss (Raw)": 1.8190292119979858, "Pretrain/Step": 5741, "Pretrain/Step Time": 8.484911609441042} +{"Pretrain/Learning Rate": 4.0969200881604035e-05, "Pretrain/Loss": 2.0409021377563477, "Pretrain/Loss (Raw)": 2.2996156215667725, "Pretrain/Step": 5742, "Pretrain/Step Time": 8.484543649479747} +{"Pretrain/Learning Rate": 4.096593442331812e-05, "Pretrain/Loss": 2.0409555435180664, "Pretrain/Loss (Raw)": 1.9548301696777344, "Pretrain/Step": 5743, "Pretrain/Step Time": 8.489417620003223} +{"Pretrain/Learning Rate": 4.096266750466573e-05, "Pretrain/Loss": 2.043766975402832, "Pretrain/Loss (Raw)": 2.369835376739502, "Pretrain/Step": 5744, "Pretrain/Step Time": 8.48414846137166} +{"Pretrain/Learning Rate": 4.0959400125741085e-05, "Pretrain/Loss": 2.044301986694336, "Pretrain/Loss (Raw)": 2.2101988792419434, "Pretrain/Step": 5745, "Pretrain/Step Time": 8.488690013065934} +{"Pretrain/Learning Rate": 4.095613228663838e-05, "Pretrain/Loss": 2.0447635650634766, "Pretrain/Loss (Raw)": 2.0142524242401123, "Pretrain/Step": 5746, "Pretrain/Step Time": 8.495050020515919} +{"Pretrain/Learning Rate": 4.0952863987451865e-05, "Pretrain/Loss": 2.0432889461517334, "Pretrain/Loss (Raw)": 2.0628490447998047, "Pretrain/Step": 5747, "Pretrain/Step Time": 8.495980616658926} +{"Pretrain/Learning Rate": 4.094959522827574e-05, "Pretrain/Loss": 2.0445704460144043, "Pretrain/Loss (Raw)": 2.0292060375213623, "Pretrain/Step": 5748, "Pretrain/Step Time": 8.496808277443051} +{"Pretrain/Learning Rate": 4.0946326009204296e-05, "Pretrain/Loss": 2.043707847595215, "Pretrain/Loss (Raw)": 1.9715644121170044, "Pretrain/Step": 5749, "Pretrain/Step Time": 8.491958558559418} +{"Pretrain/Learning Rate": 4.094305633033178e-05, "Pretrain/Loss": 2.0446481704711914, "Pretrain/Loss (Raw)": 2.0430140495300293, "Pretrain/Step": 5750, "Pretrain/Step Time": 8.494385158643126} +{"Pretrain/Learning Rate": 4.093978619175247e-05, "Pretrain/Loss": 2.0442285537719727, "Pretrain/Loss (Raw)": 1.9953093528747559, "Pretrain/Step": 5751, "Pretrain/Step Time": 8.491366973146796} +{"Pretrain/Learning Rate": 4.093651559356067e-05, "Pretrain/Loss": 2.045104503631592, "Pretrain/Loss (Raw)": 1.9442005157470703, "Pretrain/Step": 5752, "Pretrain/Step Time": 8.49991286918521} +{"Pretrain/Learning Rate": 4.093324453585067e-05, "Pretrain/Loss": 2.04586124420166, "Pretrain/Loss (Raw)": 2.0486321449279785, "Pretrain/Step": 5753, "Pretrain/Step Time": 8.497119536623359} +{"Pretrain/Learning Rate": 4.0929973018716794e-05, "Pretrain/Loss": 2.046795606613159, "Pretrain/Loss (Raw)": 2.1818268299102783, "Pretrain/Step": 5754, "Pretrain/Step Time": 8.500934429466724} +{"Pretrain/Learning Rate": 4.0926701042253376e-05, "Pretrain/Loss": 2.046168804168701, "Pretrain/Loss (Raw)": 1.8538578748703003, "Pretrain/Step": 5755, "Pretrain/Step Time": 8.4967894051224} +{"Pretrain/Learning Rate": 4.092342860655477e-05, "Pretrain/Loss": 2.0460026264190674, "Pretrain/Loss (Raw)": 2.0415940284729004, "Pretrain/Step": 5756, "Pretrain/Step Time": 8.496125802397728} +{"Pretrain/Learning Rate": 4.0920155711715326e-05, "Pretrain/Loss": 2.048088312149048, "Pretrain/Loss (Raw)": 2.126723051071167, "Pretrain/Step": 5757, "Pretrain/Step Time": 8.495750388130546} +{"Pretrain/Learning Rate": 4.0916882357829406e-05, "Pretrain/Loss": 2.045647144317627, "Pretrain/Loss (Raw)": 1.8076651096343994, "Pretrain/Step": 5758, "Pretrain/Step Time": 8.495016010478139} +{"Pretrain/Learning Rate": 4.09136085449914e-05, "Pretrain/Loss": 2.042807102203369, "Pretrain/Loss (Raw)": 1.8401504755020142, "Pretrain/Step": 5759, "Pretrain/Step Time": 8.494442647323012} +{"Pretrain/Learning Rate": 4.091033427329572e-05, "Pretrain/Loss": 2.041419506072998, "Pretrain/Loss (Raw)": 2.034742832183838, "Pretrain/Step": 5760, "Pretrain/Step Time": 8.495370883494616} +{"Pretrain/Learning Rate": 4.0907059542836766e-05, "Pretrain/Loss": 2.0426597595214844, "Pretrain/Loss (Raw)": 2.1533541679382324, "Pretrain/Step": 5761, "Pretrain/Step Time": 8.495192160829902} +{"Pretrain/Learning Rate": 4.090378435370896e-05, "Pretrain/Loss": 2.0414958000183105, "Pretrain/Loss (Raw)": 1.8679864406585693, "Pretrain/Step": 5762, "Pretrain/Step Time": 8.495578117668629} +{"Pretrain/Learning Rate": 4.090050870600675e-05, "Pretrain/Loss": 2.040069580078125, "Pretrain/Loss (Raw)": 1.7232657670974731, "Pretrain/Step": 5763, "Pretrain/Step Time": 8.503119939938188} +{"Pretrain/Learning Rate": 4.089723259982458e-05, "Pretrain/Loss": 2.039310932159424, "Pretrain/Loss (Raw)": 1.919087290763855, "Pretrain/Step": 5764, "Pretrain/Step Time": 8.504246084019542} +{"Pretrain/Learning Rate": 4.089395603525691e-05, "Pretrain/Loss": 2.0393028259277344, "Pretrain/Loss (Raw)": 2.0051896572113037, "Pretrain/Step": 5765, "Pretrain/Step Time": 8.500460578128695} +{"Pretrain/Learning Rate": 4.0890679012398225e-05, "Pretrain/Loss": 2.0403518676757812, "Pretrain/Loss (Raw)": 2.1562771797180176, "Pretrain/Step": 5766, "Pretrain/Step Time": 8.498343469575047} +{"Pretrain/Learning Rate": 4.088740153134301e-05, "Pretrain/Loss": 2.0429911613464355, "Pretrain/Loss (Raw)": 2.229273557662964, "Pretrain/Step": 5767, "Pretrain/Step Time": 8.504860445857048} +{"Pretrain/Learning Rate": 4.088412359218577e-05, "Pretrain/Loss": 2.0415713787078857, "Pretrain/Loss (Raw)": 2.096081018447876, "Pretrain/Step": 5768, "Pretrain/Step Time": 8.505333350971341} +{"Pretrain/Learning Rate": 4.0880845195021035e-05, "Pretrain/Loss": 2.041217803955078, "Pretrain/Loss (Raw)": 2.153839588165283, "Pretrain/Step": 5769, "Pretrain/Step Time": 8.50131269544363} +{"Pretrain/Learning Rate": 4.087756633994331e-05, "Pretrain/Loss": 2.0426268577575684, "Pretrain/Loss (Raw)": 2.0242457389831543, "Pretrain/Step": 5770, "Pretrain/Step Time": 8.500283548608422} +{"Pretrain/Learning Rate": 4.087428702704716e-05, "Pretrain/Loss": 2.0446181297302246, "Pretrain/Loss (Raw)": 2.213665008544922, "Pretrain/Step": 5771, "Pretrain/Step Time": 8.501243956387043} +{"Pretrain/Learning Rate": 4.087100725642713e-05, "Pretrain/Loss": 2.045546054840088, "Pretrain/Loss (Raw)": 2.0576584339141846, "Pretrain/Step": 5772, "Pretrain/Step Time": 8.501033276319504} +{"Pretrain/Learning Rate": 4.08677270281778e-05, "Pretrain/Loss": 2.0439300537109375, "Pretrain/Loss (Raw)": 1.8738945722579956, "Pretrain/Step": 5773, "Pretrain/Step Time": 8.502388834953308} +{"Pretrain/Learning Rate": 4.086444634239375e-05, "Pretrain/Loss": 2.0454840660095215, "Pretrain/Loss (Raw)": 2.169084072113037, "Pretrain/Step": 5774, "Pretrain/Step Time": 8.503575855866075} +{"Pretrain/Learning Rate": 4.086116519916956e-05, "Pretrain/Loss": 2.045536994934082, "Pretrain/Loss (Raw)": 1.9586527347564697, "Pretrain/Step": 5775, "Pretrain/Step Time": 8.50322112813592} +{"Pretrain/Learning Rate": 4.085788359859986e-05, "Pretrain/Loss": 2.04415225982666, "Pretrain/Loss (Raw)": 1.9926872253417969, "Pretrain/Step": 5776, "Pretrain/Step Time": 8.501932060346007} +{"Pretrain/Learning Rate": 4.085460154077927e-05, "Pretrain/Loss": 2.0445046424865723, "Pretrain/Loss (Raw)": 2.135165214538574, "Pretrain/Step": 5777, "Pretrain/Step Time": 8.500490233302116} +{"Pretrain/Learning Rate": 4.085131902580242e-05, "Pretrain/Loss": 2.043673038482666, "Pretrain/Loss (Raw)": 1.9598655700683594, "Pretrain/Step": 5778, "Pretrain/Step Time": 8.50116297416389} +{"Pretrain/Learning Rate": 4.084803605376395e-05, "Pretrain/Loss": 2.043099880218506, "Pretrain/Loss (Raw)": 2.024790048599243, "Pretrain/Step": 5779, "Pretrain/Step Time": 8.499435221776366} +{"Pretrain/Learning Rate": 4.084475262475854e-05, "Pretrain/Loss": 2.0451409816741943, "Pretrain/Loss (Raw)": 2.2842929363250732, "Pretrain/Step": 5780, "Pretrain/Step Time": 8.50506516546011} +{"Pretrain/Learning Rate": 4.084146873888086e-05, "Pretrain/Loss": 2.0478322505950928, "Pretrain/Loss (Raw)": 2.1701455116271973, "Pretrain/Step": 5781, "Pretrain/Step Time": 8.508809637278318} +{"Pretrain/Learning Rate": 4.0838184396225595e-05, "Pretrain/Loss": 2.0479207038879395, "Pretrain/Loss (Raw)": 2.0528109073638916, "Pretrain/Step": 5782, "Pretrain/Step Time": 8.501641312614083} +{"Pretrain/Learning Rate": 4.083489959688744e-05, "Pretrain/Loss": 2.0489675998687744, "Pretrain/Loss (Raw)": 2.078350782394409, "Pretrain/Step": 5783, "Pretrain/Step Time": 8.5039973706007} +{"Pretrain/Learning Rate": 4.0831614340961135e-05, "Pretrain/Loss": 2.0472187995910645, "Pretrain/Loss (Raw)": 2.0356242656707764, "Pretrain/Step": 5784, "Pretrain/Step Time": 8.50527168251574} +{"Pretrain/Learning Rate": 4.082832862854138e-05, "Pretrain/Loss": 2.0428013801574707, "Pretrain/Loss (Raw)": 2.0699825286865234, "Pretrain/Step": 5785, "Pretrain/Step Time": 8.50429704785347} +{"Pretrain/Learning Rate": 4.082504245972292e-05, "Pretrain/Loss": 2.0443942546844482, "Pretrain/Loss (Raw)": 2.1928229331970215, "Pretrain/Step": 5786, "Pretrain/Step Time": 8.498505370691419} +{"Pretrain/Learning Rate": 4.082175583460053e-05, "Pretrain/Loss": 2.0436325073242188, "Pretrain/Loss (Raw)": 2.083561897277832, "Pretrain/Step": 5787, "Pretrain/Step Time": 8.497297959402204} +{"Pretrain/Learning Rate": 4.0818468753268956e-05, "Pretrain/Loss": 2.044193744659424, "Pretrain/Loss (Raw)": 2.1941049098968506, "Pretrain/Step": 5788, "Pretrain/Step Time": 8.497684055939317} +{"Pretrain/Learning Rate": 4.0815181215822995e-05, "Pretrain/Loss": 2.044827461242676, "Pretrain/Loss (Raw)": 2.0957608222961426, "Pretrain/Step": 5789, "Pretrain/Step Time": 8.497994339093566} +{"Pretrain/Learning Rate": 4.081189322235742e-05, "Pretrain/Loss": 2.0431625843048096, "Pretrain/Loss (Raw)": 1.9212242364883423, "Pretrain/Step": 5790, "Pretrain/Step Time": 8.501704161986709} +{"Pretrain/Learning Rate": 4.0808604772967063e-05, "Pretrain/Loss": 2.0423688888549805, "Pretrain/Loss (Raw)": 1.955657958984375, "Pretrain/Step": 5791, "Pretrain/Step Time": 8.497055523097515} +{"Pretrain/Learning Rate": 4.080531586774673e-05, "Pretrain/Loss": 2.0406384468078613, "Pretrain/Loss (Raw)": 1.9681836366653442, "Pretrain/Step": 5792, "Pretrain/Step Time": 8.499128157272935} +{"Pretrain/Learning Rate": 4.080202650679125e-05, "Pretrain/Loss": 2.0415890216827393, "Pretrain/Loss (Raw)": 2.319023370742798, "Pretrain/Step": 5793, "Pretrain/Step Time": 8.497170869261026} +{"Pretrain/Learning Rate": 4.079873669019548e-05, "Pretrain/Loss": 2.0420007705688477, "Pretrain/Loss (Raw)": 2.057590961456299, "Pretrain/Step": 5794, "Pretrain/Step Time": 8.496245935559273} +{"Pretrain/Learning Rate": 4.0795446418054275e-05, "Pretrain/Loss": 2.0443027019500732, "Pretrain/Loss (Raw)": 1.8436839580535889, "Pretrain/Step": 5795, "Pretrain/Step Time": 8.497698076069355} +{"Pretrain/Learning Rate": 4.07921556904625e-05, "Pretrain/Loss": 2.047006368637085, "Pretrain/Loss (Raw)": 2.2048370838165283, "Pretrain/Step": 5796, "Pretrain/Step Time": 8.496216218918562} +{"Pretrain/Learning Rate": 4.078886450751506e-05, "Pretrain/Loss": 2.0448899269104004, "Pretrain/Loss (Raw)": 1.8352211713790894, "Pretrain/Step": 5797, "Pretrain/Step Time": 8.50023689866066} +{"Pretrain/Learning Rate": 4.078557286930683e-05, "Pretrain/Loss": 2.0452005863189697, "Pretrain/Loss (Raw)": 2.047438859939575, "Pretrain/Step": 5798, "Pretrain/Step Time": 8.501733418554068} +{"Pretrain/Learning Rate": 4.078228077593275e-05, "Pretrain/Loss": 2.045545816421509, "Pretrain/Loss (Raw)": 2.1519036293029785, "Pretrain/Step": 5799, "Pretrain/Step Time": 8.50221411883831} +{"Pretrain/Learning Rate": 4.077898822748771e-05, "Pretrain/Loss": 2.043294906616211, "Pretrain/Loss (Raw)": 1.7922961711883545, "Pretrain/Step": 5800, "Pretrain/Step Time": 8.502446744590998} +{"Pretrain/Learning Rate": 4.077569522406668e-05, "Pretrain/Loss": 2.0462000370025635, "Pretrain/Loss (Raw)": 2.174497604370117, "Pretrain/Step": 5801, "Pretrain/Step Time": 8.50031115859747} +{"Pretrain/Learning Rate": 4.07724017657646e-05, "Pretrain/Loss": 2.0434513092041016, "Pretrain/Loss (Raw)": 1.7187479734420776, "Pretrain/Step": 5802, "Pretrain/Step Time": 8.498257290571928} +{"Pretrain/Learning Rate": 4.076910785267644e-05, "Pretrain/Loss": 2.0434510707855225, "Pretrain/Loss (Raw)": 2.0083799362182617, "Pretrain/Step": 5803, "Pretrain/Step Time": 8.497460471466184} +{"Pretrain/Learning Rate": 4.0765813484897154e-05, "Pretrain/Loss": 2.0346999168395996, "Pretrain/Loss (Raw)": 1.3578226566314697, "Pretrain/Step": 5804, "Pretrain/Step Time": 8.495273787528276} +{"Pretrain/Learning Rate": 4.0762518662521765e-05, "Pretrain/Loss": 2.0367813110351562, "Pretrain/Loss (Raw)": 2.043480157852173, "Pretrain/Step": 5805, "Pretrain/Step Time": 8.492591939866543} +{"Pretrain/Learning Rate": 4.075922338564525e-05, "Pretrain/Loss": 2.037229537963867, "Pretrain/Loss (Raw)": 2.0650031566619873, "Pretrain/Step": 5806, "Pretrain/Step Time": 8.495554717257619} +{"Pretrain/Learning Rate": 4.075592765436265e-05, "Pretrain/Loss": 2.0368475914001465, "Pretrain/Loss (Raw)": 2.1695785522460938, "Pretrain/Step": 5807, "Pretrain/Step Time": 8.496554279699922} +{"Pretrain/Learning Rate": 4.075263146876898e-05, "Pretrain/Loss": 2.0352840423583984, "Pretrain/Loss (Raw)": 1.70933198928833, "Pretrain/Step": 5808, "Pretrain/Step Time": 8.492000445723534} +{"Pretrain/Learning Rate": 4.074933482895928e-05, "Pretrain/Loss": 2.0345962047576904, "Pretrain/Loss (Raw)": 2.062225818634033, "Pretrain/Step": 5809, "Pretrain/Step Time": 8.493690373376012} +{"Pretrain/Learning Rate": 4.074603773502862e-05, "Pretrain/Loss": 2.0369150638580322, "Pretrain/Loss (Raw)": 2.1282801628112793, "Pretrain/Step": 5810, "Pretrain/Step Time": 8.497294120490551} +{"Pretrain/Learning Rate": 4.074274018707206e-05, "Pretrain/Loss": 2.038464069366455, "Pretrain/Loss (Raw)": 2.082486391067505, "Pretrain/Step": 5811, "Pretrain/Step Time": 8.497487243264914} +{"Pretrain/Learning Rate": 4.0739442185184685e-05, "Pretrain/Loss": 2.0389091968536377, "Pretrain/Loss (Raw)": 2.009082555770874, "Pretrain/Step": 5812, "Pretrain/Step Time": 8.496392672881484} +{"Pretrain/Learning Rate": 4.073614372946159e-05, "Pretrain/Loss": 2.0390727519989014, "Pretrain/Loss (Raw)": 2.146134853363037, "Pretrain/Step": 5813, "Pretrain/Step Time": 8.501220654696226} +{"Pretrain/Learning Rate": 4.073284481999788e-05, "Pretrain/Loss": 2.036978244781494, "Pretrain/Loss (Raw)": 2.115208864212036, "Pretrain/Step": 5814, "Pretrain/Step Time": 8.499690053984523} +{"Pretrain/Learning Rate": 4.0729545456888684e-05, "Pretrain/Loss": 2.036831855773926, "Pretrain/Loss (Raw)": 2.0100417137145996, "Pretrain/Step": 5815, "Pretrain/Step Time": 8.505803320556879} +{"Pretrain/Learning Rate": 4.072624564022914e-05, "Pretrain/Loss": 2.0370752811431885, "Pretrain/Loss (Raw)": 1.9465100765228271, "Pretrain/Step": 5816, "Pretrain/Step Time": 8.503072237595916} +{"Pretrain/Learning Rate": 4.072294537011438e-05, "Pretrain/Loss": 2.034183979034424, "Pretrain/Loss (Raw)": 1.789014458656311, "Pretrain/Step": 5817, "Pretrain/Step Time": 8.502854224294424} +{"Pretrain/Learning Rate": 4.071964464663958e-05, "Pretrain/Loss": 2.0368690490722656, "Pretrain/Loss (Raw)": 2.1961352825164795, "Pretrain/Step": 5818, "Pretrain/Step Time": 8.500587966293097} +{"Pretrain/Learning Rate": 4.0716343469899896e-05, "Pretrain/Loss": 2.036947727203369, "Pretrain/Loss (Raw)": 2.1790969371795654, "Pretrain/Step": 5819, "Pretrain/Step Time": 8.502596653997898} +{"Pretrain/Learning Rate": 4.071304183999054e-05, "Pretrain/Loss": 2.036949634552002, "Pretrain/Loss (Raw)": 2.0264432430267334, "Pretrain/Step": 5820, "Pretrain/Step Time": 8.507230097427964} +{"Pretrain/Learning Rate": 4.0709739757006695e-05, "Pretrain/Loss": 2.036364793777466, "Pretrain/Loss (Raw)": 2.0112950801849365, "Pretrain/Step": 5821, "Pretrain/Step Time": 8.500090824440122} +{"Pretrain/Learning Rate": 4.070643722104358e-05, "Pretrain/Loss": 2.0350449085235596, "Pretrain/Loss (Raw)": 1.7182201147079468, "Pretrain/Step": 5822, "Pretrain/Step Time": 8.50385357066989} +{"Pretrain/Learning Rate": 4.0703134232196416e-05, "Pretrain/Loss": 2.039170265197754, "Pretrain/Loss (Raw)": 2.252876043319702, "Pretrain/Step": 5823, "Pretrain/Step Time": 8.50552630238235} +{"Pretrain/Learning Rate": 4.0699830790560456e-05, "Pretrain/Loss": 2.0396311283111572, "Pretrain/Loss (Raw)": 2.1228199005126953, "Pretrain/Step": 5824, "Pretrain/Step Time": 8.503673700615764} +{"Pretrain/Learning Rate": 4.0696526896230935e-05, "Pretrain/Loss": 2.0406370162963867, "Pretrain/Loss (Raw)": 2.0981507301330566, "Pretrain/Step": 5825, "Pretrain/Step Time": 8.49888744018972} +{"Pretrain/Learning Rate": 4.069322254930312e-05, "Pretrain/Loss": 2.041224479675293, "Pretrain/Loss (Raw)": 1.9993948936462402, "Pretrain/Step": 5826, "Pretrain/Step Time": 8.503012515604496} +{"Pretrain/Learning Rate": 4.068991774987231e-05, "Pretrain/Loss": 2.041212797164917, "Pretrain/Loss (Raw)": 2.1513001918792725, "Pretrain/Step": 5827, "Pretrain/Step Time": 8.503809170797467} +{"Pretrain/Learning Rate": 4.0686612498033774e-05, "Pretrain/Loss": 2.0407841205596924, "Pretrain/Loss (Raw)": 1.9005353450775146, "Pretrain/Step": 5828, "Pretrain/Step Time": 8.505584809929132} +{"Pretrain/Learning Rate": 4.068330679388283e-05, "Pretrain/Loss": 2.0417518615722656, "Pretrain/Loss (Raw)": 2.3504414558410645, "Pretrain/Step": 5829, "Pretrain/Step Time": 8.500557592138648} +{"Pretrain/Learning Rate": 4.0680000637514784e-05, "Pretrain/Loss": 2.0432803630828857, "Pretrain/Loss (Raw)": 2.050719738006592, "Pretrain/Step": 5830, "Pretrain/Step Time": 8.504611222073436} +{"Pretrain/Learning Rate": 4.067669402902497e-05, "Pretrain/Loss": 2.0436904430389404, "Pretrain/Loss (Raw)": 2.157254457473755, "Pretrain/Step": 5831, "Pretrain/Step Time": 8.500911070033908} +{"Pretrain/Learning Rate": 4.067338696850875e-05, "Pretrain/Loss": 2.044987916946411, "Pretrain/Loss (Raw)": 2.204524517059326, "Pretrain/Step": 5832, "Pretrain/Step Time": 8.50397863984108} +{"Pretrain/Learning Rate": 4.067007945606146e-05, "Pretrain/Loss": 2.0448055267333984, "Pretrain/Loss (Raw)": 1.9267867803573608, "Pretrain/Step": 5833, "Pretrain/Step Time": 8.503960529342294} +{"Pretrain/Learning Rate": 4.0666771491778475e-05, "Pretrain/Loss": 2.0443668365478516, "Pretrain/Loss (Raw)": 2.0275914669036865, "Pretrain/Step": 5834, "Pretrain/Step Time": 8.505012905225158} +{"Pretrain/Learning Rate": 4.066346307575518e-05, "Pretrain/Loss": 2.0415916442871094, "Pretrain/Loss (Raw)": 2.1306586265563965, "Pretrain/Step": 5835, "Pretrain/Step Time": 8.502810753881931} +{"Pretrain/Learning Rate": 4.066015420808696e-05, "Pretrain/Loss": 2.041168451309204, "Pretrain/Loss (Raw)": 2.1273560523986816, "Pretrain/Step": 5836, "Pretrain/Step Time": 8.502601619809866} +{"Pretrain/Learning Rate": 4.065684488886924e-05, "Pretrain/Loss": 2.0423898696899414, "Pretrain/Loss (Raw)": 2.096693277359009, "Pretrain/Step": 5837, "Pretrain/Step Time": 8.504993807524443} +{"Pretrain/Learning Rate": 4.065353511819743e-05, "Pretrain/Loss": 2.049490451812744, "Pretrain/Loss (Raw)": 2.7257072925567627, "Pretrain/Step": 5838, "Pretrain/Step Time": 8.505069557577372} +{"Pretrain/Learning Rate": 4.0650224896166975e-05, "Pretrain/Loss": 2.047687530517578, "Pretrain/Loss (Raw)": 1.8397719860076904, "Pretrain/Step": 5839, "Pretrain/Step Time": 8.505773654207587} +{"Pretrain/Learning Rate": 4.0646914222873325e-05, "Pretrain/Loss": 2.0472757816314697, "Pretrain/Loss (Raw)": 2.019749402999878, "Pretrain/Step": 5840, "Pretrain/Step Time": 8.505863435566425} +{"Pretrain/Learning Rate": 4.064360309841192e-05, "Pretrain/Loss": 2.047726631164551, "Pretrain/Loss (Raw)": 2.0039806365966797, "Pretrain/Step": 5841, "Pretrain/Step Time": 8.507337292656302} +{"Pretrain/Learning Rate": 4.064029152287825e-05, "Pretrain/Loss": 2.047621250152588, "Pretrain/Loss (Raw)": 1.9876930713653564, "Pretrain/Step": 5842, "Pretrain/Step Time": 8.510311480611563} +{"Pretrain/Learning Rate": 4.0636979496367805e-05, "Pretrain/Loss": 2.0477871894836426, "Pretrain/Loss (Raw)": 2.0970163345336914, "Pretrain/Step": 5843, "Pretrain/Step Time": 8.512213410809636} +{"Pretrain/Learning Rate": 4.063366701897607e-05, "Pretrain/Loss": 2.0471372604370117, "Pretrain/Loss (Raw)": 2.0095746517181396, "Pretrain/Step": 5844, "Pretrain/Step Time": 8.512272015213966} +{"Pretrain/Learning Rate": 4.063035409079858e-05, "Pretrain/Loss": 2.0468897819519043, "Pretrain/Loss (Raw)": 1.9400523900985718, "Pretrain/Step": 5845, "Pretrain/Step Time": 8.510963978245854} +{"Pretrain/Learning Rate": 4.062704071193084e-05, "Pretrain/Loss": 2.0481467247009277, "Pretrain/Loss (Raw)": 2.013641834259033, "Pretrain/Step": 5846, "Pretrain/Step Time": 8.512305852025747} +{"Pretrain/Learning Rate": 4.062372688246841e-05, "Pretrain/Loss": 2.0468361377716064, "Pretrain/Loss (Raw)": 1.9666343927383423, "Pretrain/Step": 5847, "Pretrain/Step Time": 8.50871298275888} +{"Pretrain/Learning Rate": 4.062041260250682e-05, "Pretrain/Loss": 2.0501906871795654, "Pretrain/Loss (Raw)": 2.2080376148223877, "Pretrain/Step": 5848, "Pretrain/Step Time": 8.51072809100151} +{"Pretrain/Learning Rate": 4.061709787214164e-05, "Pretrain/Loss": 2.0489296913146973, "Pretrain/Loss (Raw)": 2.0789577960968018, "Pretrain/Step": 5849, "Pretrain/Step Time": 8.510135304182768} +{"Pretrain/Learning Rate": 4.061378269146846e-05, "Pretrain/Loss": 2.0509018898010254, "Pretrain/Loss (Raw)": 1.9515775442123413, "Pretrain/Step": 5850, "Pretrain/Step Time": 8.5095649138093} +{"Pretrain/Learning Rate": 4.0610467060582856e-05, "Pretrain/Loss": 2.0515060424804688, "Pretrain/Loss (Raw)": 2.1463778018951416, "Pretrain/Step": 5851, "Pretrain/Step Time": 8.507577938959002} +{"Pretrain/Learning Rate": 4.060715097958045e-05, "Pretrain/Loss": 2.052220344543457, "Pretrain/Loss (Raw)": 2.0449318885803223, "Pretrain/Step": 5852, "Pretrain/Step Time": 8.506244650110602} +{"Pretrain/Learning Rate": 4.060383444855683e-05, "Pretrain/Loss": 2.050306797027588, "Pretrain/Loss (Raw)": 1.981512188911438, "Pretrain/Step": 5853, "Pretrain/Step Time": 8.510710764676332} +{"Pretrain/Learning Rate": 4.0600517467607654e-05, "Pretrain/Loss": 2.049191474914551, "Pretrain/Loss (Raw)": 1.8555697202682495, "Pretrain/Step": 5854, "Pretrain/Step Time": 8.505641655996442} +{"Pretrain/Learning Rate": 4.059720003682856e-05, "Pretrain/Loss": 2.0506067276000977, "Pretrain/Loss (Raw)": 2.2048351764678955, "Pretrain/Step": 5855, "Pretrain/Step Time": 8.505190391093493} +{"Pretrain/Learning Rate": 4.0593882156315196e-05, "Pretrain/Loss": 2.050212860107422, "Pretrain/Loss (Raw)": 1.852146029472351, "Pretrain/Step": 5856, "Pretrain/Step Time": 8.504669656977057} +{"Pretrain/Learning Rate": 4.0590563826163224e-05, "Pretrain/Loss": 2.051363468170166, "Pretrain/Loss (Raw)": 2.271237850189209, "Pretrain/Step": 5857, "Pretrain/Step Time": 8.506758268922567} +{"Pretrain/Learning Rate": 4.058724504646834e-05, "Pretrain/Loss": 2.0509986877441406, "Pretrain/Loss (Raw)": 1.9441776275634766, "Pretrain/Step": 5858, "Pretrain/Step Time": 8.508073387667537} +{"Pretrain/Learning Rate": 4.058392581732623e-05, "Pretrain/Loss": 2.047097682952881, "Pretrain/Loss (Raw)": 1.9859288930892944, "Pretrain/Step": 5859, "Pretrain/Step Time": 8.502718798816204} +{"Pretrain/Learning Rate": 4.058060613883261e-05, "Pretrain/Loss": 2.0486388206481934, "Pretrain/Loss (Raw)": 2.1831138134002686, "Pretrain/Step": 5860, "Pretrain/Step Time": 8.503597225993872} +{"Pretrain/Learning Rate": 4.05772860110832e-05, "Pretrain/Loss": 2.047874689102173, "Pretrain/Loss (Raw)": 1.9789313077926636, "Pretrain/Step": 5861, "Pretrain/Step Time": 8.504887517541647} +{"Pretrain/Learning Rate": 4.057396543417372e-05, "Pretrain/Loss": 2.048128128051758, "Pretrain/Loss (Raw)": 2.1449711322784424, "Pretrain/Step": 5862, "Pretrain/Step Time": 8.510378289967775} +{"Pretrain/Learning Rate": 4.057064440819993e-05, "Pretrain/Loss": 2.04819917678833, "Pretrain/Loss (Raw)": 2.08587384223938, "Pretrain/Step": 5863, "Pretrain/Step Time": 8.508970445021987} +{"Pretrain/Learning Rate": 4.056732293325758e-05, "Pretrain/Loss": 2.0506062507629395, "Pretrain/Loss (Raw)": 2.400801658630371, "Pretrain/Step": 5864, "Pretrain/Step Time": 8.505415013059974} +{"Pretrain/Learning Rate": 4.0564001009442455e-05, "Pretrain/Loss": 2.051633596420288, "Pretrain/Loss (Raw)": 2.1205081939697266, "Pretrain/Step": 5865, "Pretrain/Step Time": 8.507564187049866} +{"Pretrain/Learning Rate": 4.056067863685033e-05, "Pretrain/Loss": 2.050666332244873, "Pretrain/Loss (Raw)": 1.8249268531799316, "Pretrain/Step": 5866, "Pretrain/Step Time": 8.50911652483046} +{"Pretrain/Learning Rate": 4.0557355815577006e-05, "Pretrain/Loss": 2.047447919845581, "Pretrain/Loss (Raw)": 2.185012102127075, "Pretrain/Step": 5867, "Pretrain/Step Time": 8.510885512456298} +{"Pretrain/Learning Rate": 4.055403254571829e-05, "Pretrain/Loss": 2.0487802028656006, "Pretrain/Loss (Raw)": 2.2088143825531006, "Pretrain/Step": 5868, "Pretrain/Step Time": 8.510352622717619} +{"Pretrain/Learning Rate": 4.055070882737002e-05, "Pretrain/Loss": 2.0515527725219727, "Pretrain/Loss (Raw)": 2.1739063262939453, "Pretrain/Step": 5869, "Pretrain/Step Time": 8.509685916826129} +{"Pretrain/Learning Rate": 4.054738466062802e-05, "Pretrain/Loss": 2.0499773025512695, "Pretrain/Loss (Raw)": 2.0979695320129395, "Pretrain/Step": 5870, "Pretrain/Step Time": 8.511941676959395} +{"Pretrain/Learning Rate": 4.054406004558814e-05, "Pretrain/Loss": 2.0495219230651855, "Pretrain/Loss (Raw)": 1.896563172340393, "Pretrain/Step": 5871, "Pretrain/Step Time": 8.505352836102247} +{"Pretrain/Learning Rate": 4.0540734982346246e-05, "Pretrain/Loss": 2.0461297035217285, "Pretrain/Loss (Raw)": 1.9355919361114502, "Pretrain/Step": 5872, "Pretrain/Step Time": 8.510173244401813} +{"Pretrain/Learning Rate": 4.0537409470998214e-05, "Pretrain/Loss": 2.043056011199951, "Pretrain/Loss (Raw)": 1.8167864084243774, "Pretrain/Step": 5873, "Pretrain/Step Time": 8.508723935112357} +{"Pretrain/Learning Rate": 4.0534083511639934e-05, "Pretrain/Loss": 2.0422310829162598, "Pretrain/Loss (Raw)": 1.9086469411849976, "Pretrain/Step": 5874, "Pretrain/Step Time": 8.505465734750032} +{"Pretrain/Learning Rate": 4.053075710436731e-05, "Pretrain/Loss": 2.040983200073242, "Pretrain/Loss (Raw)": 1.9031319618225098, "Pretrain/Step": 5875, "Pretrain/Step Time": 8.499077212065458} +{"Pretrain/Learning Rate": 4.052743024927625e-05, "Pretrain/Loss": 2.0419626235961914, "Pretrain/Loss (Raw)": 2.1545515060424805, "Pretrain/Step": 5876, "Pretrain/Step Time": 8.49988709948957} +{"Pretrain/Learning Rate": 4.052410294646268e-05, "Pretrain/Loss": 2.0430550575256348, "Pretrain/Loss (Raw)": 2.111428737640381, "Pretrain/Step": 5877, "Pretrain/Step Time": 8.500463236123323} +{"Pretrain/Learning Rate": 4.052077519602255e-05, "Pretrain/Loss": 2.043368101119995, "Pretrain/Loss (Raw)": 2.083066463470459, "Pretrain/Step": 5878, "Pretrain/Step Time": 8.502817291766405} +{"Pretrain/Learning Rate": 4.051744699805182e-05, "Pretrain/Loss": 2.0443460941314697, "Pretrain/Loss (Raw)": 2.1204886436462402, "Pretrain/Step": 5879, "Pretrain/Step Time": 8.503957441076636} +{"Pretrain/Learning Rate": 4.051411835264643e-05, "Pretrain/Loss": 2.0464649200439453, "Pretrain/Loss (Raw)": 2.215381622314453, "Pretrain/Step": 5880, "Pretrain/Step Time": 8.496919222176075} +{"Pretrain/Learning Rate": 4.0510789259902385e-05, "Pretrain/Loss": 2.0453763008117676, "Pretrain/Loss (Raw)": 1.909321904182434, "Pretrain/Step": 5881, "Pretrain/Step Time": 8.497336084023118} +{"Pretrain/Learning Rate": 4.050745971991565e-05, "Pretrain/Loss": 2.044595718383789, "Pretrain/Loss (Raw)": 2.0818960666656494, "Pretrain/Step": 5882, "Pretrain/Step Time": 8.496225103735924} +{"Pretrain/Learning Rate": 4.050412973278226e-05, "Pretrain/Loss": 2.0470480918884277, "Pretrain/Loss (Raw)": 2.1677916049957275, "Pretrain/Step": 5883, "Pretrain/Step Time": 8.49604706838727} +{"Pretrain/Learning Rate": 4.050079929859821e-05, "Pretrain/Loss": 2.0466246604919434, "Pretrain/Loss (Raw)": 1.987397313117981, "Pretrain/Step": 5884, "Pretrain/Step Time": 8.499627459794283} +{"Pretrain/Learning Rate": 4.0497468417459547e-05, "Pretrain/Loss": 2.045070171356201, "Pretrain/Loss (Raw)": 1.9277570247650146, "Pretrain/Step": 5885, "Pretrain/Step Time": 8.50027977488935} +{"Pretrain/Learning Rate": 4.04941370894623e-05, "Pretrain/Loss": 2.0451104640960693, "Pretrain/Loss (Raw)": 1.8128007650375366, "Pretrain/Step": 5886, "Pretrain/Step Time": 8.50054980814457} +{"Pretrain/Learning Rate": 4.049080531470254e-05, "Pretrain/Loss": 2.0486598014831543, "Pretrain/Loss (Raw)": 2.294484853744507, "Pretrain/Step": 5887, "Pretrain/Step Time": 8.504332037642598} +{"Pretrain/Learning Rate": 4.0487473093276326e-05, "Pretrain/Loss": 2.047804355621338, "Pretrain/Loss (Raw)": 1.9252409934997559, "Pretrain/Step": 5888, "Pretrain/Step Time": 8.505701499059796} +{"Pretrain/Learning Rate": 4.048414042527975e-05, "Pretrain/Loss": 2.0476434230804443, "Pretrain/Loss (Raw)": 2.1327316761016846, "Pretrain/Step": 5889, "Pretrain/Step Time": 8.508189659565687} +{"Pretrain/Learning Rate": 4.048080731080889e-05, "Pretrain/Loss": 2.048305034637451, "Pretrain/Loss (Raw)": 1.9526512622833252, "Pretrain/Step": 5890, "Pretrain/Step Time": 8.50913099013269} +{"Pretrain/Learning Rate": 4.0477473749959874e-05, "Pretrain/Loss": 2.051785469055176, "Pretrain/Loss (Raw)": 2.1687793731689453, "Pretrain/Step": 5891, "Pretrain/Step Time": 8.503738522529602} +{"Pretrain/Learning Rate": 4.047413974282881e-05, "Pretrain/Loss": 2.0535969734191895, "Pretrain/Loss (Raw)": 2.150944232940674, "Pretrain/Step": 5892, "Pretrain/Step Time": 8.505105219781399} +{"Pretrain/Learning Rate": 4.047080528951183e-05, "Pretrain/Loss": 2.054661750793457, "Pretrain/Loss (Raw)": 2.141508102416992, "Pretrain/Step": 5893, "Pretrain/Step Time": 8.504404284060001} +{"Pretrain/Learning Rate": 4.0467470390105086e-05, "Pretrain/Loss": 2.05379581451416, "Pretrain/Loss (Raw)": 2.0454342365264893, "Pretrain/Step": 5894, "Pretrain/Step Time": 8.504763647913933} +{"Pretrain/Learning Rate": 4.0464135044704746e-05, "Pretrain/Loss": 2.051319122314453, "Pretrain/Loss (Raw)": 1.9122593402862549, "Pretrain/Step": 5895, "Pretrain/Step Time": 8.503957128152251} +{"Pretrain/Learning Rate": 4.046079925340696e-05, "Pretrain/Loss": 2.0520148277282715, "Pretrain/Loss (Raw)": 2.185122013092041, "Pretrain/Step": 5896, "Pretrain/Step Time": 8.503561589866877} +{"Pretrain/Learning Rate": 4.045746301630794e-05, "Pretrain/Loss": 2.0524463653564453, "Pretrain/Loss (Raw)": 2.2090954780578613, "Pretrain/Step": 5897, "Pretrain/Step Time": 8.501283798366785} +{"Pretrain/Learning Rate": 4.045412633350386e-05, "Pretrain/Loss": 2.0530591011047363, "Pretrain/Loss (Raw)": 2.1026344299316406, "Pretrain/Step": 5898, "Pretrain/Step Time": 8.49880270846188} +{"Pretrain/Learning Rate": 4.045078920509094e-05, "Pretrain/Loss": 2.0516109466552734, "Pretrain/Loss (Raw)": 2.0283079147338867, "Pretrain/Step": 5899, "Pretrain/Step Time": 8.499436028301716} +{"Pretrain/Learning Rate": 4.0447451631165416e-05, "Pretrain/Loss": 2.0510621070861816, "Pretrain/Loss (Raw)": 1.9874393939971924, "Pretrain/Step": 5900, "Pretrain/Step Time": 8.501665623858571} +{"Pretrain/Learning Rate": 4.044411361182351e-05, "Pretrain/Loss": 2.0536692142486572, "Pretrain/Loss (Raw)": 2.2075910568237305, "Pretrain/Step": 5901, "Pretrain/Step Time": 8.500416573137045} +{"Pretrain/Learning Rate": 4.044077514716148e-05, "Pretrain/Loss": 2.050410747528076, "Pretrain/Loss (Raw)": 1.75199294090271, "Pretrain/Step": 5902, "Pretrain/Step Time": 8.500865690410137} +{"Pretrain/Learning Rate": 4.043743623727557e-05, "Pretrain/Loss": 2.050633430480957, "Pretrain/Loss (Raw)": 1.9871801137924194, "Pretrain/Step": 5903, "Pretrain/Step Time": 8.4972382504493} +{"Pretrain/Learning Rate": 4.0434096882262086e-05, "Pretrain/Loss": 2.051017999649048, "Pretrain/Loss (Raw)": 2.0419130325317383, "Pretrain/Step": 5904, "Pretrain/Step Time": 8.4964391682297} +{"Pretrain/Learning Rate": 4.043075708221729e-05, "Pretrain/Loss": 2.0494225025177, "Pretrain/Loss (Raw)": 1.93092942237854, "Pretrain/Step": 5905, "Pretrain/Step Time": 8.496026378124952} +{"Pretrain/Learning Rate": 4.042741683723749e-05, "Pretrain/Loss": 2.051579236984253, "Pretrain/Loss (Raw)": 2.23591947555542, "Pretrain/Step": 5906, "Pretrain/Step Time": 8.49930596910417} +{"Pretrain/Learning Rate": 4.0424076147418996e-05, "Pretrain/Loss": 2.0531015396118164, "Pretrain/Loss (Raw)": 2.2196168899536133, "Pretrain/Step": 5907, "Pretrain/Step Time": 8.501194586977363} +{"Pretrain/Learning Rate": 4.042073501285815e-05, "Pretrain/Loss": 2.0496387481689453, "Pretrain/Loss (Raw)": 1.841078281402588, "Pretrain/Step": 5908, "Pretrain/Step Time": 8.499880846589804} +{"Pretrain/Learning Rate": 4.0417393433651275e-05, "Pretrain/Loss": 2.0482006072998047, "Pretrain/Loss (Raw)": 1.9860645532608032, "Pretrain/Step": 5909, "Pretrain/Step Time": 8.495210709050298} +{"Pretrain/Learning Rate": 4.041405140989473e-05, "Pretrain/Loss": 2.0476348400115967, "Pretrain/Loss (Raw)": 1.980394959449768, "Pretrain/Step": 5910, "Pretrain/Step Time": 8.497831555083394} +{"Pretrain/Learning Rate": 4.0410708941684886e-05, "Pretrain/Loss": 2.0477051734924316, "Pretrain/Loss (Raw)": 2.087347984313965, "Pretrain/Step": 5911, "Pretrain/Step Time": 8.49495648033917} +{"Pretrain/Learning Rate": 4.04073660291181e-05, "Pretrain/Loss": 2.047299385070801, "Pretrain/Loss (Raw)": 1.9837007522583008, "Pretrain/Step": 5912, "Pretrain/Step Time": 8.493581736460328} +{"Pretrain/Learning Rate": 4.0404022672290784e-05, "Pretrain/Loss": 2.0440330505371094, "Pretrain/Loss (Raw)": 1.6519012451171875, "Pretrain/Step": 5913, "Pretrain/Step Time": 8.494489833712578} +{"Pretrain/Learning Rate": 4.040067887129934e-05, "Pretrain/Loss": 2.042929172515869, "Pretrain/Loss (Raw)": 2.051510810852051, "Pretrain/Step": 5914, "Pretrain/Step Time": 8.490562599152327} +{"Pretrain/Learning Rate": 4.039733462624016e-05, "Pretrain/Loss": 2.0426881313323975, "Pretrain/Loss (Raw)": 2.0527095794677734, "Pretrain/Step": 5915, "Pretrain/Step Time": 8.49673705548048} +{"Pretrain/Learning Rate": 4.039398993720971e-05, "Pretrain/Loss": 2.0423896312713623, "Pretrain/Loss (Raw)": 2.155888557434082, "Pretrain/Step": 5916, "Pretrain/Step Time": 8.493594640865922} +{"Pretrain/Learning Rate": 4.0390644804304404e-05, "Pretrain/Loss": 2.0427627563476562, "Pretrain/Loss (Raw)": 2.1435465812683105, "Pretrain/Step": 5917, "Pretrain/Step Time": 8.499599359929562} +{"Pretrain/Learning Rate": 4.038729922762069e-05, "Pretrain/Loss": 2.042503833770752, "Pretrain/Loss (Raw)": 1.8880653381347656, "Pretrain/Step": 5918, "Pretrain/Step Time": 8.496570769697428} +{"Pretrain/Learning Rate": 4.0383953207255074e-05, "Pretrain/Loss": 2.0442023277282715, "Pretrain/Loss (Raw)": 2.1730782985687256, "Pretrain/Step": 5919, "Pretrain/Step Time": 8.497447099536657} +{"Pretrain/Learning Rate": 4.038060674330399e-05, "Pretrain/Loss": 2.0442333221435547, "Pretrain/Loss (Raw)": 1.972155213356018, "Pretrain/Step": 5920, "Pretrain/Step Time": 8.499374402686954} +{"Pretrain/Learning Rate": 4.0377259835863976e-05, "Pretrain/Loss": 2.0406081676483154, "Pretrain/Loss (Raw)": 1.8550018072128296, "Pretrain/Step": 5921, "Pretrain/Step Time": 8.497211748734117} +{"Pretrain/Learning Rate": 4.03739124850315e-05, "Pretrain/Loss": 2.038703441619873, "Pretrain/Loss (Raw)": 1.8137714862823486, "Pretrain/Step": 5922, "Pretrain/Step Time": 8.498030947521329} +{"Pretrain/Learning Rate": 4.03705646909031e-05, "Pretrain/Loss": 2.039156436920166, "Pretrain/Loss (Raw)": 1.9016467332839966, "Pretrain/Step": 5923, "Pretrain/Step Time": 8.495680896565318} +{"Pretrain/Learning Rate": 4.03672164535753e-05, "Pretrain/Loss": 2.0381624698638916, "Pretrain/Loss (Raw)": 2.077643871307373, "Pretrain/Step": 5924, "Pretrain/Step Time": 8.497178373858333} +{"Pretrain/Learning Rate": 4.036386777314465e-05, "Pretrain/Loss": 2.0396132469177246, "Pretrain/Loss (Raw)": 2.02091908454895, "Pretrain/Step": 5925, "Pretrain/Step Time": 8.497491789981723} +{"Pretrain/Learning Rate": 4.03605186497077e-05, "Pretrain/Loss": 2.0433294773101807, "Pretrain/Loss (Raw)": 2.5231003761291504, "Pretrain/Step": 5926, "Pretrain/Step Time": 8.491013463586569} +{"Pretrain/Learning Rate": 4.035716908336102e-05, "Pretrain/Loss": 2.0421624183654785, "Pretrain/Loss (Raw)": 2.0025463104248047, "Pretrain/Step": 5927, "Pretrain/Step Time": 8.498097110539675} +{"Pretrain/Learning Rate": 4.03538190742012e-05, "Pretrain/Loss": 2.0428755283355713, "Pretrain/Loss (Raw)": 1.8835358619689941, "Pretrain/Step": 5928, "Pretrain/Step Time": 8.494498921558261} +{"Pretrain/Learning Rate": 4.035046862232484e-05, "Pretrain/Loss": 2.0417940616607666, "Pretrain/Loss (Raw)": 2.0361006259918213, "Pretrain/Step": 5929, "Pretrain/Step Time": 8.496762286871672} +{"Pretrain/Learning Rate": 4.034711772782853e-05, "Pretrain/Loss": 2.0468876361846924, "Pretrain/Loss (Raw)": 2.370697021484375, "Pretrain/Step": 5930, "Pretrain/Step Time": 8.492671409621835} +{"Pretrain/Learning Rate": 4.0343766390808905e-05, "Pretrain/Loss": 2.0474886894226074, "Pretrain/Loss (Raw)": 2.085345506668091, "Pretrain/Step": 5931, "Pretrain/Step Time": 8.495652360841632} +{"Pretrain/Learning Rate": 4.034041461136258e-05, "Pretrain/Loss": 2.0533225536346436, "Pretrain/Loss (Raw)": 2.1045498847961426, "Pretrain/Step": 5932, "Pretrain/Step Time": 8.498322932049632} +{"Pretrain/Learning Rate": 4.0337062389586224e-05, "Pretrain/Loss": 2.0557093620300293, "Pretrain/Loss (Raw)": 2.3489749431610107, "Pretrain/Step": 5933, "Pretrain/Step Time": 8.497208150103688} +{"Pretrain/Learning Rate": 4.033370972557649e-05, "Pretrain/Loss": 2.056459903717041, "Pretrain/Loss (Raw)": 2.161099910736084, "Pretrain/Step": 5934, "Pretrain/Step Time": 8.495583459734917} +{"Pretrain/Learning Rate": 4.033035661943003e-05, "Pretrain/Loss": 2.0561084747314453, "Pretrain/Loss (Raw)": 2.124600410461426, "Pretrain/Step": 5935, "Pretrain/Step Time": 8.502514652907848} +{"Pretrain/Learning Rate": 4.032700307124356e-05, "Pretrain/Loss": 2.0594255924224854, "Pretrain/Loss (Raw)": 2.133901357650757, "Pretrain/Step": 5936, "Pretrain/Step Time": 8.502265164628625} +{"Pretrain/Learning Rate": 4.0323649081113754e-05, "Pretrain/Loss": 2.0586695671081543, "Pretrain/Loss (Raw)": 1.9654695987701416, "Pretrain/Step": 5937, "Pretrain/Step Time": 8.50665314309299} +{"Pretrain/Learning Rate": 4.0320294649137324e-05, "Pretrain/Loss": 2.0558905601501465, "Pretrain/Loss (Raw)": 1.7725406885147095, "Pretrain/Step": 5938, "Pretrain/Step Time": 8.503346972167492} +{"Pretrain/Learning Rate": 4.0316939775411006e-05, "Pretrain/Loss": 2.0560131072998047, "Pretrain/Loss (Raw)": 2.0981976985931396, "Pretrain/Step": 5939, "Pretrain/Step Time": 8.503426378592849} +{"Pretrain/Learning Rate": 4.0313584460031525e-05, "Pretrain/Loss": 2.056288957595825, "Pretrain/Loss (Raw)": 2.04439640045166, "Pretrain/Step": 5940, "Pretrain/Step Time": 8.508155789226294} +{"Pretrain/Learning Rate": 4.031022870309563e-05, "Pretrain/Loss": 2.0548253059387207, "Pretrain/Loss (Raw)": 1.9587730169296265, "Pretrain/Step": 5941, "Pretrain/Step Time": 8.505968235433102} +{"Pretrain/Learning Rate": 4.030687250470009e-05, "Pretrain/Loss": 2.056210994720459, "Pretrain/Loss (Raw)": 2.292605400085449, "Pretrain/Step": 5942, "Pretrain/Step Time": 8.505803570151329} +{"Pretrain/Learning Rate": 4.030351586494166e-05, "Pretrain/Loss": 2.05499529838562, "Pretrain/Loss (Raw)": 1.8544081449508667, "Pretrain/Step": 5943, "Pretrain/Step Time": 8.503182651475072} +{"Pretrain/Learning Rate": 4.0300158783917144e-05, "Pretrain/Loss": 2.0565032958984375, "Pretrain/Loss (Raw)": 2.1395299434661865, "Pretrain/Step": 5944, "Pretrain/Step Time": 8.506380822509527} +{"Pretrain/Learning Rate": 4.029680126172334e-05, "Pretrain/Loss": 2.055856704711914, "Pretrain/Loss (Raw)": 1.7062664031982422, "Pretrain/Step": 5945, "Pretrain/Step Time": 8.506374765187502} +{"Pretrain/Learning Rate": 4.0293443298457054e-05, "Pretrain/Loss": 2.0569915771484375, "Pretrain/Loss (Raw)": 2.3413796424865723, "Pretrain/Step": 5946, "Pretrain/Step Time": 8.50538333132863} +{"Pretrain/Learning Rate": 4.029008489421511e-05, "Pretrain/Loss": 2.0554039478302, "Pretrain/Loss (Raw)": 1.9758814573287964, "Pretrain/Step": 5947, "Pretrain/Step Time": 8.506289368495345} +{"Pretrain/Learning Rate": 4.028672604909434e-05, "Pretrain/Loss": 2.0564346313476562, "Pretrain/Loss (Raw)": 2.1583809852600098, "Pretrain/Step": 5948, "Pretrain/Step Time": 8.506932403892279} +{"Pretrain/Learning Rate": 4.028336676319161e-05, "Pretrain/Loss": 2.0569050312042236, "Pretrain/Loss (Raw)": 2.071490526199341, "Pretrain/Step": 5949, "Pretrain/Step Time": 8.507011083886027} +{"Pretrain/Learning Rate": 4.028000703660377e-05, "Pretrain/Loss": 2.0580482482910156, "Pretrain/Loss (Raw)": 1.8645561933517456, "Pretrain/Step": 5950, "Pretrain/Step Time": 8.5073018129915} +{"Pretrain/Learning Rate": 4.027664686942769e-05, "Pretrain/Loss": 2.0560951232910156, "Pretrain/Loss (Raw)": 2.002894639968872, "Pretrain/Step": 5951, "Pretrain/Step Time": 8.506669487804174} +{"Pretrain/Learning Rate": 4.027328626176028e-05, "Pretrain/Loss": 2.0556399822235107, "Pretrain/Loss (Raw)": 2.0645432472229004, "Pretrain/Step": 5952, "Pretrain/Step Time": 8.509587718173862} +{"Pretrain/Learning Rate": 4.0269925213698424e-05, "Pretrain/Loss": 2.0563340187072754, "Pretrain/Loss (Raw)": 2.1870148181915283, "Pretrain/Step": 5953, "Pretrain/Step Time": 8.511197831481695} +{"Pretrain/Learning Rate": 4.0266563725339036e-05, "Pretrain/Loss": 2.0572972297668457, "Pretrain/Loss (Raw)": 2.122654914855957, "Pretrain/Step": 5954, "Pretrain/Step Time": 8.507175961509347} +{"Pretrain/Learning Rate": 4.0263201796779045e-05, "Pretrain/Loss": 2.055828332901001, "Pretrain/Loss (Raw)": 1.963280439376831, "Pretrain/Step": 5955, "Pretrain/Step Time": 8.504437014460564} +{"Pretrain/Learning Rate": 4.02598394281154e-05, "Pretrain/Loss": 2.05473256111145, "Pretrain/Loss (Raw)": 1.7602912187576294, "Pretrain/Step": 5956, "Pretrain/Step Time": 8.512038350105286} +{"Pretrain/Learning Rate": 4.025647661944503e-05, "Pretrain/Loss": 2.0475735664367676, "Pretrain/Loss (Raw)": 1.4340986013412476, "Pretrain/Step": 5957, "Pretrain/Step Time": 8.515137942507863} +{"Pretrain/Learning Rate": 4.025311337086492e-05, "Pretrain/Loss": 2.04779052734375, "Pretrain/Loss (Raw)": 2.078469753265381, "Pretrain/Step": 5958, "Pretrain/Step Time": 8.513886466622353} +{"Pretrain/Learning Rate": 4.024974968247204e-05, "Pretrain/Loss": 2.04715633392334, "Pretrain/Loss (Raw)": 2.076077461242676, "Pretrain/Step": 5959, "Pretrain/Step Time": 8.51480090431869} +{"Pretrain/Learning Rate": 4.024638555436337e-05, "Pretrain/Loss": 2.04490327835083, "Pretrain/Loss (Raw)": 1.91614830493927, "Pretrain/Step": 5960, "Pretrain/Step Time": 8.518594991415739} +{"Pretrain/Learning Rate": 4.0243020986635926e-05, "Pretrain/Loss": 2.047377109527588, "Pretrain/Loss (Raw)": 2.243443489074707, "Pretrain/Step": 5961, "Pretrain/Step Time": 8.518667783588171} +{"Pretrain/Learning Rate": 4.0239655979386715e-05, "Pretrain/Loss": 2.0499348640441895, "Pretrain/Loss (Raw)": 2.354961633682251, "Pretrain/Step": 5962, "Pretrain/Step Time": 8.51671401783824} +{"Pretrain/Learning Rate": 4.023629053271276e-05, "Pretrain/Loss": 2.0486459732055664, "Pretrain/Loss (Raw)": 1.9656835794448853, "Pretrain/Step": 5963, "Pretrain/Step Time": 8.518721403554082} +{"Pretrain/Learning Rate": 4.0232924646711124e-05, "Pretrain/Loss": 2.049976348876953, "Pretrain/Loss (Raw)": 2.297635078430176, "Pretrain/Step": 5964, "Pretrain/Step Time": 8.517782304435968} +{"Pretrain/Learning Rate": 4.0229558321478836e-05, "Pretrain/Loss": 2.048492431640625, "Pretrain/Loss (Raw)": 1.906752109527588, "Pretrain/Step": 5965, "Pretrain/Step Time": 8.514786308631301} +{"Pretrain/Learning Rate": 4.022619155711297e-05, "Pretrain/Loss": 2.044229507446289, "Pretrain/Loss (Raw)": 2.180091142654419, "Pretrain/Step": 5966, "Pretrain/Step Time": 8.5177738443017} +{"Pretrain/Learning Rate": 4.022282435371061e-05, "Pretrain/Loss": 2.0483007431030273, "Pretrain/Loss (Raw)": 2.360844612121582, "Pretrain/Step": 5967, "Pretrain/Step Time": 8.51468481309712} +{"Pretrain/Learning Rate": 4.021945671136883e-05, "Pretrain/Loss": 2.049854040145874, "Pretrain/Loss (Raw)": 2.218592882156372, "Pretrain/Step": 5968, "Pretrain/Step Time": 8.522157587110996} +{"Pretrain/Learning Rate": 4.021608863018475e-05, "Pretrain/Loss": 2.0516228675842285, "Pretrain/Loss (Raw)": 2.2304022312164307, "Pretrain/Step": 5969, "Pretrain/Step Time": 8.516537083312869} +{"Pretrain/Learning Rate": 4.0212720110255484e-05, "Pretrain/Loss": 2.0525569915771484, "Pretrain/Loss (Raw)": 2.1072628498077393, "Pretrain/Step": 5970, "Pretrain/Step Time": 8.513793168589473} +{"Pretrain/Learning Rate": 4.020935115167816e-05, "Pretrain/Loss": 2.0517733097076416, "Pretrain/Loss (Raw)": 1.9966856241226196, "Pretrain/Step": 5971, "Pretrain/Step Time": 8.510062711313367} +{"Pretrain/Learning Rate": 4.02059817545499e-05, "Pretrain/Loss": 2.0536553859710693, "Pretrain/Loss (Raw)": 2.250497579574585, "Pretrain/Step": 5972, "Pretrain/Step Time": 8.517424911260605} +{"Pretrain/Learning Rate": 4.0202611918967895e-05, "Pretrain/Loss": 2.0551836490631104, "Pretrain/Loss (Raw)": 2.1356592178344727, "Pretrain/Step": 5973, "Pretrain/Step Time": 8.520374400541186} +{"Pretrain/Learning Rate": 4.019924164502928e-05, "Pretrain/Loss": 2.0548505783081055, "Pretrain/Loss (Raw)": 1.9710183143615723, "Pretrain/Step": 5974, "Pretrain/Step Time": 8.516971834003925} +{"Pretrain/Learning Rate": 4.0195870932831256e-05, "Pretrain/Loss": 2.0555472373962402, "Pretrain/Loss (Raw)": 2.0557799339294434, "Pretrain/Step": 5975, "Pretrain/Step Time": 8.520017240196466} +{"Pretrain/Learning Rate": 4.019249978247101e-05, "Pretrain/Loss": 2.0549874305725098, "Pretrain/Loss (Raw)": 2.136399984359741, "Pretrain/Step": 5976, "Pretrain/Step Time": 8.520638592541218} +{"Pretrain/Learning Rate": 4.0189128194045735e-05, "Pretrain/Loss": 2.0536630153656006, "Pretrain/Loss (Raw)": 1.9094419479370117, "Pretrain/Step": 5977, "Pretrain/Step Time": 8.520948154851794} +{"Pretrain/Learning Rate": 4.018575616765265e-05, "Pretrain/Loss": 2.0565836429595947, "Pretrain/Loss (Raw)": 2.325388193130493, "Pretrain/Step": 5978, "Pretrain/Step Time": 8.521085387095809} +{"Pretrain/Learning Rate": 4.0182383703389004e-05, "Pretrain/Loss": 2.0557610988616943, "Pretrain/Loss (Raw)": 2.0411152839660645, "Pretrain/Step": 5979, "Pretrain/Step Time": 8.521301930770278} +{"Pretrain/Learning Rate": 4.0179010801352023e-05, "Pretrain/Loss": 2.05418062210083, "Pretrain/Loss (Raw)": 1.842631220817566, "Pretrain/Step": 5980, "Pretrain/Step Time": 8.519822776317596} +{"Pretrain/Learning Rate": 4.0175637461638957e-05, "Pretrain/Loss": 2.054617404937744, "Pretrain/Loss (Raw)": 2.0374128818511963, "Pretrain/Step": 5981, "Pretrain/Step Time": 8.515522696077824} +{"Pretrain/Learning Rate": 4.01722636843471e-05, "Pretrain/Loss": 2.0559372901916504, "Pretrain/Loss (Raw)": 2.0244975090026855, "Pretrain/Step": 5982, "Pretrain/Step Time": 8.511916313320398} +{"Pretrain/Learning Rate": 4.01688894695737e-05, "Pretrain/Loss": 2.053419589996338, "Pretrain/Loss (Raw)": 1.882583737373352, "Pretrain/Step": 5983, "Pretrain/Step Time": 8.521478947252035} +{"Pretrain/Learning Rate": 4.016551481741607e-05, "Pretrain/Loss": 2.0545363426208496, "Pretrain/Loss (Raw)": 1.9950902462005615, "Pretrain/Step": 5984, "Pretrain/Step Time": 8.521966585889459} +{"Pretrain/Learning Rate": 4.0162139727971516e-05, "Pretrain/Loss": 2.053317070007324, "Pretrain/Loss (Raw)": 2.115185260772705, "Pretrain/Step": 5985, "Pretrain/Step Time": 8.520270314067602} +{"Pretrain/Learning Rate": 4.015876420133735e-05, "Pretrain/Loss": 2.0534300804138184, "Pretrain/Loss (Raw)": 1.9586182832717896, "Pretrain/Step": 5986, "Pretrain/Step Time": 8.51640160754323} +{"Pretrain/Learning Rate": 4.0155388237610894e-05, "Pretrain/Loss": 2.054625988006592, "Pretrain/Loss (Raw)": 2.1390445232391357, "Pretrain/Step": 5987, "Pretrain/Step Time": 8.516409747302532} +{"Pretrain/Learning Rate": 4.015201183688951e-05, "Pretrain/Loss": 2.0532913208007812, "Pretrain/Loss (Raw)": 2.012256622314453, "Pretrain/Step": 5988, "Pretrain/Step Time": 8.521692555397749} +{"Pretrain/Learning Rate": 4.014863499927055e-05, "Pretrain/Loss": 2.0544307231903076, "Pretrain/Loss (Raw)": 2.1247718334198, "Pretrain/Step": 5989, "Pretrain/Step Time": 8.520648779347539} +{"Pretrain/Learning Rate": 4.014525772485137e-05, "Pretrain/Loss": 2.0600051879882812, "Pretrain/Loss (Raw)": 2.858513593673706, "Pretrain/Step": 5990, "Pretrain/Step Time": 8.517952870577574} +{"Pretrain/Learning Rate": 4.014188001372937e-05, "Pretrain/Loss": 2.0598080158233643, "Pretrain/Loss (Raw)": 2.06062388420105, "Pretrain/Step": 5991, "Pretrain/Step Time": 8.520638540387154} +{"Pretrain/Learning Rate": 4.013850186600193e-05, "Pretrain/Loss": 2.0590217113494873, "Pretrain/Loss (Raw)": 2.300153970718384, "Pretrain/Step": 5992, "Pretrain/Step Time": 8.518402948975563} +{"Pretrain/Learning Rate": 4.013512328176646e-05, "Pretrain/Loss": 2.060264825820923, "Pretrain/Loss (Raw)": 2.2796263694763184, "Pretrain/Step": 5993, "Pretrain/Step Time": 8.51947041042149} +{"Pretrain/Learning Rate": 4.013174426112038e-05, "Pretrain/Loss": 2.0603585243225098, "Pretrain/Loss (Raw)": 1.8368899822235107, "Pretrain/Step": 5994, "Pretrain/Step Time": 8.516889836639166} +{"Pretrain/Learning Rate": 4.012836480416112e-05, "Pretrain/Loss": 2.0601119995117188, "Pretrain/Loss (Raw)": 2.153475284576416, "Pretrain/Step": 5995, "Pretrain/Step Time": 8.51689643599093} +{"Pretrain/Learning Rate": 4.012498491098613e-05, "Pretrain/Loss": 2.058950424194336, "Pretrain/Loss (Raw)": 2.060153007507324, "Pretrain/Step": 5996, "Pretrain/Step Time": 8.518517138436437} +{"Pretrain/Learning Rate": 4.012160458169286e-05, "Pretrain/Loss": 2.058283805847168, "Pretrain/Loss (Raw)": 2.088555097579956, "Pretrain/Step": 5997, "Pretrain/Step Time": 8.514424864202738} +{"Pretrain/Learning Rate": 4.011822381637877e-05, "Pretrain/Loss": 2.061366081237793, "Pretrain/Loss (Raw)": 2.4925148487091064, "Pretrain/Step": 5998, "Pretrain/Step Time": 8.510666349902749} +{"Pretrain/Learning Rate": 4.011484261514137e-05, "Pretrain/Loss": 2.0635290145874023, "Pretrain/Loss (Raw)": 2.1734139919281006, "Pretrain/Step": 5999, "Pretrain/Step Time": 8.513320572674274} +{"Pretrain/Learning Rate": 4.0111460978078134e-05, "Pretrain/Loss": 2.063549041748047, "Pretrain/Loss (Raw)": 1.9381588697433472, "Pretrain/Step": 6000, "Pretrain/Step Time": 8.516789603978395} +{"Pretrain/Learning Rate": 4.010807890528657e-05, "Pretrain/Loss": 2.0649056434631348, "Pretrain/Loss (Raw)": 1.9904530048370361, "Pretrain/Step": 6001, "Pretrain/Step Time": 8.515165647491813} +{"Pretrain/Learning Rate": 4.0104696396864214e-05, "Pretrain/Loss": 2.06691575050354, "Pretrain/Loss (Raw)": 2.1659181118011475, "Pretrain/Step": 6002, "Pretrain/Step Time": 8.515719305723906} +{"Pretrain/Learning Rate": 4.0101313452908575e-05, "Pretrain/Loss": 2.0674924850463867, "Pretrain/Loss (Raw)": 1.976951241493225, "Pretrain/Step": 6003, "Pretrain/Step Time": 8.513973580673337} +{"Pretrain/Learning Rate": 4.009793007351721e-05, "Pretrain/Loss": 2.0658464431762695, "Pretrain/Loss (Raw)": 1.9438611268997192, "Pretrain/Step": 6004, "Pretrain/Step Time": 8.515889141708612} +{"Pretrain/Learning Rate": 4.009454625878767e-05, "Pretrain/Loss": 2.066720485687256, "Pretrain/Loss (Raw)": 2.2233266830444336, "Pretrain/Step": 6005, "Pretrain/Step Time": 8.521119482815266} +{"Pretrain/Learning Rate": 4.0091162008817534e-05, "Pretrain/Loss": 2.067430257797241, "Pretrain/Loss (Raw)": 2.173910617828369, "Pretrain/Step": 6006, "Pretrain/Step Time": 8.516410721465945} +{"Pretrain/Learning Rate": 4.008777732370438e-05, "Pretrain/Loss": 2.0664849281311035, "Pretrain/Loss (Raw)": 1.9994615316390991, "Pretrain/Step": 6007, "Pretrain/Step Time": 8.518636239692569} +{"Pretrain/Learning Rate": 4.00843922035458e-05, "Pretrain/Loss": 2.0657572746276855, "Pretrain/Loss (Raw)": 2.1222317218780518, "Pretrain/Step": 6008, "Pretrain/Step Time": 8.519408063963056} +{"Pretrain/Learning Rate": 4.008100664843941e-05, "Pretrain/Loss": 2.064105987548828, "Pretrain/Loss (Raw)": 1.6979782581329346, "Pretrain/Step": 6009, "Pretrain/Step Time": 8.520156562328339} +{"Pretrain/Learning Rate": 4.0077620658482816e-05, "Pretrain/Loss": 2.0647010803222656, "Pretrain/Loss (Raw)": 2.158043146133423, "Pretrain/Step": 6010, "Pretrain/Step Time": 8.52206351235509} +{"Pretrain/Learning Rate": 4.007423423377367e-05, "Pretrain/Loss": 2.0629048347473145, "Pretrain/Loss (Raw)": 1.9379041194915771, "Pretrain/Step": 6011, "Pretrain/Step Time": 8.520026601850986} +{"Pretrain/Learning Rate": 4.00708473744096e-05, "Pretrain/Loss": 2.0638959407806396, "Pretrain/Loss (Raw)": 2.1142380237579346, "Pretrain/Step": 6012, "Pretrain/Step Time": 8.514576213434339} +{"Pretrain/Learning Rate": 4.0067460080488275e-05, "Pretrain/Loss": 2.0656728744506836, "Pretrain/Loss (Raw)": 2.155189037322998, "Pretrain/Step": 6013, "Pretrain/Step Time": 8.514620954170823} +{"Pretrain/Learning Rate": 4.006407235210736e-05, "Pretrain/Loss": 2.069398880004883, "Pretrain/Loss (Raw)": 2.28975772857666, "Pretrain/Step": 6014, "Pretrain/Step Time": 8.515983568504453} +{"Pretrain/Learning Rate": 4.0060684189364526e-05, "Pretrain/Loss": 2.068125009536743, "Pretrain/Loss (Raw)": 2.13142991065979, "Pretrain/Step": 6015, "Pretrain/Step Time": 8.510512819513679} +{"Pretrain/Learning Rate": 4.0057295592357496e-05, "Pretrain/Loss": 2.069408416748047, "Pretrain/Loss (Raw)": 2.0894951820373535, "Pretrain/Step": 6016, "Pretrain/Step Time": 8.50760755315423} +{"Pretrain/Learning Rate": 4.0053906561183955e-05, "Pretrain/Loss": 2.068242073059082, "Pretrain/Loss (Raw)": 1.9834558963775635, "Pretrain/Step": 6017, "Pretrain/Step Time": 8.505473297089338} +{"Pretrain/Learning Rate": 4.005051709594164e-05, "Pretrain/Loss": 2.0684070587158203, "Pretrain/Loss (Raw)": 1.9737823009490967, "Pretrain/Step": 6018, "Pretrain/Step Time": 8.50395119190216} +{"Pretrain/Learning Rate": 4.004712719672826e-05, "Pretrain/Loss": 2.0678720474243164, "Pretrain/Loss (Raw)": 2.100287675857544, "Pretrain/Step": 6019, "Pretrain/Step Time": 8.506790678948164} +{"Pretrain/Learning Rate": 4.0043736863641586e-05, "Pretrain/Loss": 2.0667340755462646, "Pretrain/Loss (Raw)": 2.005286693572998, "Pretrain/Step": 6020, "Pretrain/Step Time": 8.50609253719449} +{"Pretrain/Learning Rate": 4.004034609677936e-05, "Pretrain/Loss": 2.0681285858154297, "Pretrain/Loss (Raw)": 2.3199923038482666, "Pretrain/Step": 6021, "Pretrain/Step Time": 8.505314162001014} +{"Pretrain/Learning Rate": 4.003695489623935e-05, "Pretrain/Loss": 2.0673742294311523, "Pretrain/Loss (Raw)": 1.9489120244979858, "Pretrain/Step": 6022, "Pretrain/Step Time": 8.512542568147182} +{"Pretrain/Learning Rate": 4.0033563262119354e-05, "Pretrain/Loss": 2.0682623386383057, "Pretrain/Loss (Raw)": 2.0259058475494385, "Pretrain/Step": 6023, "Pretrain/Step Time": 8.512961206957698} +{"Pretrain/Learning Rate": 4.003017119451716e-05, "Pretrain/Loss": 2.066624641418457, "Pretrain/Loss (Raw)": 1.9754945039749146, "Pretrain/Step": 6024, "Pretrain/Step Time": 8.512680118903518} +{"Pretrain/Learning Rate": 4.0026778693530575e-05, "Pretrain/Loss": 2.0662620067596436, "Pretrain/Loss (Raw)": 2.1626968383789062, "Pretrain/Step": 6025, "Pretrain/Step Time": 8.514199802652001} +{"Pretrain/Learning Rate": 4.0023385759257416e-05, "Pretrain/Loss": 2.0674307346343994, "Pretrain/Loss (Raw)": 2.25221848487854, "Pretrain/Step": 6026, "Pretrain/Step Time": 8.514991160482168} +{"Pretrain/Learning Rate": 4.001999239179552e-05, "Pretrain/Loss": 2.0671329498291016, "Pretrain/Loss (Raw)": 1.9901671409606934, "Pretrain/Step": 6027, "Pretrain/Step Time": 8.515946842730045} +{"Pretrain/Learning Rate": 4.001659859124274e-05, "Pretrain/Loss": 2.066931962966919, "Pretrain/Loss (Raw)": 1.9617271423339844, "Pretrain/Step": 6028, "Pretrain/Step Time": 8.515397068113089} +{"Pretrain/Learning Rate": 4.0013204357696914e-05, "Pretrain/Loss": 2.0650668144226074, "Pretrain/Loss (Raw)": 1.9688843488693237, "Pretrain/Step": 6029, "Pretrain/Step Time": 8.516826920211315} +{"Pretrain/Learning Rate": 4.000980969125593e-05, "Pretrain/Loss": 2.068568706512451, "Pretrain/Loss (Raw)": 2.2002081871032715, "Pretrain/Step": 6030, "Pretrain/Step Time": 8.516981232911348} +{"Pretrain/Learning Rate": 4.000641459201766e-05, "Pretrain/Loss": 2.0696535110473633, "Pretrain/Loss (Raw)": 2.1260225772857666, "Pretrain/Step": 6031, "Pretrain/Step Time": 8.515842381864786} +{"Pretrain/Learning Rate": 4.000301906008001e-05, "Pretrain/Loss": 2.0700035095214844, "Pretrain/Loss (Raw)": 2.0867466926574707, "Pretrain/Step": 6032, "Pretrain/Step Time": 8.5179278627038} +{"Pretrain/Learning Rate": 3.999962309554088e-05, "Pretrain/Loss": 2.0707201957702637, "Pretrain/Loss (Raw)": 2.022660255432129, "Pretrain/Step": 6033, "Pretrain/Step Time": 8.518854195252061} +{"Pretrain/Learning Rate": 3.999622669849819e-05, "Pretrain/Loss": 2.07230281829834, "Pretrain/Loss (Raw)": 2.438469886779785, "Pretrain/Step": 6034, "Pretrain/Step Time": 8.511114787310362} +{"Pretrain/Learning Rate": 3.999282986904988e-05, "Pretrain/Loss": 2.070742130279541, "Pretrain/Loss (Raw)": 2.019832134246826, "Pretrain/Step": 6035, "Pretrain/Step Time": 8.510725434869528} +{"Pretrain/Learning Rate": 3.9989432607293886e-05, "Pretrain/Loss": 2.074556589126587, "Pretrain/Loss (Raw)": 2.3293566703796387, "Pretrain/Step": 6036, "Pretrain/Step Time": 8.509535135701299} +{"Pretrain/Learning Rate": 3.998603491332817e-05, "Pretrain/Loss": 2.0761852264404297, "Pretrain/Loss (Raw)": 2.194523334503174, "Pretrain/Step": 6037, "Pretrain/Step Time": 8.513624204322696} +{"Pretrain/Learning Rate": 3.998263678725071e-05, "Pretrain/Loss": 2.0759332180023193, "Pretrain/Loss (Raw)": 1.948153018951416, "Pretrain/Step": 6038, "Pretrain/Step Time": 8.512604353949428} +{"Pretrain/Learning Rate": 3.997923822915946e-05, "Pretrain/Loss": 2.0766258239746094, "Pretrain/Loss (Raw)": 2.175971269607544, "Pretrain/Step": 6039, "Pretrain/Step Time": 8.51283205486834} +{"Pretrain/Learning Rate": 3.9975839239152446e-05, "Pretrain/Loss": 2.077531337738037, "Pretrain/Loss (Raw)": 2.0996532440185547, "Pretrain/Step": 6040, "Pretrain/Step Time": 8.517180733382702} +{"Pretrain/Learning Rate": 3.997243981732767e-05, "Pretrain/Loss": 2.0804431438446045, "Pretrain/Loss (Raw)": 2.0245823860168457, "Pretrain/Step": 6041, "Pretrain/Step Time": 8.519888488575816} +{"Pretrain/Learning Rate": 3.996903996378314e-05, "Pretrain/Loss": 2.0821685791015625, "Pretrain/Loss (Raw)": 2.272400379180908, "Pretrain/Step": 6042, "Pretrain/Step Time": 8.524074111133814} +{"Pretrain/Learning Rate": 3.99656396786169e-05, "Pretrain/Loss": 2.0812036991119385, "Pretrain/Loss (Raw)": 1.9291729927062988, "Pretrain/Step": 6043, "Pretrain/Step Time": 8.522259265184402} +{"Pretrain/Learning Rate": 3.996223896192699e-05, "Pretrain/Loss": 2.080198049545288, "Pretrain/Loss (Raw)": 2.027158260345459, "Pretrain/Step": 6044, "Pretrain/Step Time": 8.526460748165846} +{"Pretrain/Learning Rate": 3.9958837813811464e-05, "Pretrain/Loss": 2.0801570415496826, "Pretrain/Loss (Raw)": 2.1383190155029297, "Pretrain/Step": 6045, "Pretrain/Step Time": 8.520694950595498} +{"Pretrain/Learning Rate": 3.995543623436839e-05, "Pretrain/Loss": 2.0797266960144043, "Pretrain/Loss (Raw)": 1.8329788446426392, "Pretrain/Step": 6046, "Pretrain/Step Time": 8.522195791825652} +{"Pretrain/Learning Rate": 3.9952034223695864e-05, "Pretrain/Loss": 2.0785279273986816, "Pretrain/Loss (Raw)": 2.0196192264556885, "Pretrain/Step": 6047, "Pretrain/Step Time": 8.521159391850233} +{"Pretrain/Learning Rate": 3.994863178189197e-05, "Pretrain/Loss": 2.0827770233154297, "Pretrain/Loss (Raw)": 2.5160460472106934, "Pretrain/Step": 6048, "Pretrain/Step Time": 8.519843455404043} +{"Pretrain/Learning Rate": 3.9945228909054815e-05, "Pretrain/Loss": 2.0834715366363525, "Pretrain/Loss (Raw)": 1.9439079761505127, "Pretrain/Step": 6049, "Pretrain/Step Time": 8.521472135558724} +{"Pretrain/Learning Rate": 3.994182560528253e-05, "Pretrain/Loss": 2.086874485015869, "Pretrain/Loss (Raw)": 2.2493653297424316, "Pretrain/Step": 6050, "Pretrain/Step Time": 8.518920715898275} +{"Pretrain/Learning Rate": 3.993842187067322e-05, "Pretrain/Loss": 2.0869059562683105, "Pretrain/Loss (Raw)": 1.9056408405303955, "Pretrain/Step": 6051, "Pretrain/Step Time": 8.52184041403234} +{"Pretrain/Learning Rate": 3.993501770532505e-05, "Pretrain/Loss": 2.0855090618133545, "Pretrain/Loss (Raw)": 1.8988643884658813, "Pretrain/Step": 6052, "Pretrain/Step Time": 8.522067876532674} +{"Pretrain/Learning Rate": 3.993161310933618e-05, "Pretrain/Loss": 2.08528995513916, "Pretrain/Loss (Raw)": 1.9928821325302124, "Pretrain/Step": 6053, "Pretrain/Step Time": 8.519851041957736} +{"Pretrain/Learning Rate": 3.992820808280477e-05, "Pretrain/Loss": 2.081817626953125, "Pretrain/Loss (Raw)": 2.0786592960357666, "Pretrain/Step": 6054, "Pretrain/Step Time": 8.523966610431671} +{"Pretrain/Learning Rate": 3.9924802625829e-05, "Pretrain/Loss": 2.085134983062744, "Pretrain/Loss (Raw)": 2.4271302223205566, "Pretrain/Step": 6055, "Pretrain/Step Time": 8.517242282629013} +{"Pretrain/Learning Rate": 3.992139673850707e-05, "Pretrain/Loss": 2.084848403930664, "Pretrain/Loss (Raw)": 1.8468538522720337, "Pretrain/Step": 6056, "Pretrain/Step Time": 8.523544996976852} +{"Pretrain/Learning Rate": 3.991799042093718e-05, "Pretrain/Loss": 2.0850207805633545, "Pretrain/Loss (Raw)": 2.058170795440674, "Pretrain/Step": 6057, "Pretrain/Step Time": 8.523562481626868} +{"Pretrain/Learning Rate": 3.991458367321756e-05, "Pretrain/Loss": 2.080564498901367, "Pretrain/Loss (Raw)": 1.8002781867980957, "Pretrain/Step": 6058, "Pretrain/Step Time": 8.524632565677166} +{"Pretrain/Learning Rate": 3.9911176495446436e-05, "Pretrain/Loss": 2.079890251159668, "Pretrain/Loss (Raw)": 1.9990652799606323, "Pretrain/Step": 6059, "Pretrain/Step Time": 8.523717075586319} +{"Pretrain/Learning Rate": 3.990776888772204e-05, "Pretrain/Loss": 2.078644037246704, "Pretrain/Loss (Raw)": 1.945021152496338, "Pretrain/Step": 6060, "Pretrain/Step Time": 8.520792143419385} +{"Pretrain/Learning Rate": 3.990436085014264e-05, "Pretrain/Loss": 2.078157901763916, "Pretrain/Loss (Raw)": 2.286759853363037, "Pretrain/Step": 6061, "Pretrain/Step Time": 8.523086234927177} +{"Pretrain/Learning Rate": 3.990095238280651e-05, "Pretrain/Loss": 2.0787923336029053, "Pretrain/Loss (Raw)": 2.242323875427246, "Pretrain/Step": 6062, "Pretrain/Step Time": 8.517093293368816} +{"Pretrain/Learning Rate": 3.989754348581191e-05, "Pretrain/Loss": 2.0804712772369385, "Pretrain/Loss (Raw)": 2.3394858837127686, "Pretrain/Step": 6063, "Pretrain/Step Time": 8.513380102813244} +{"Pretrain/Learning Rate": 3.989413415925715e-05, "Pretrain/Loss": 2.080462694168091, "Pretrain/Loss (Raw)": 2.132802963256836, "Pretrain/Step": 6064, "Pretrain/Step Time": 8.51171095483005} +{"Pretrain/Learning Rate": 3.989072440324054e-05, "Pretrain/Loss": 2.081683397293091, "Pretrain/Loss (Raw)": 2.1217398643493652, "Pretrain/Step": 6065, "Pretrain/Step Time": 8.510639149695635} +{"Pretrain/Learning Rate": 3.9887314217860376e-05, "Pretrain/Loss": 2.083737373352051, "Pretrain/Loss (Raw)": 2.0354387760162354, "Pretrain/Step": 6066, "Pretrain/Step Time": 8.503890154883265} +{"Pretrain/Learning Rate": 3.988390360321501e-05, "Pretrain/Loss": 2.082592010498047, "Pretrain/Loss (Raw)": 1.9515959024429321, "Pretrain/Step": 6067, "Pretrain/Step Time": 8.504580985754728} +{"Pretrain/Learning Rate": 3.9880492559402775e-05, "Pretrain/Loss": 2.082225799560547, "Pretrain/Loss (Raw)": 1.9975353479385376, "Pretrain/Step": 6068, "Pretrain/Step Time": 8.502755217254162} +{"Pretrain/Learning Rate": 3.9877081086522016e-05, "Pretrain/Loss": 2.0831172466278076, "Pretrain/Loss (Raw)": 2.072852373123169, "Pretrain/Step": 6069, "Pretrain/Step Time": 8.500751150771976} +{"Pretrain/Learning Rate": 3.9873669184671125e-05, "Pretrain/Loss": 2.083897829055786, "Pretrain/Loss (Raw)": 2.392550468444824, "Pretrain/Step": 6070, "Pretrain/Step Time": 8.511239342391491} +{"Pretrain/Learning Rate": 3.987025685394846e-05, "Pretrain/Loss": 2.0852150917053223, "Pretrain/Loss (Raw)": 2.0229761600494385, "Pretrain/Step": 6071, "Pretrain/Step Time": 8.50959794037044} +{"Pretrain/Learning Rate": 3.986684409445243e-05, "Pretrain/Loss": 2.080228328704834, "Pretrain/Loss (Raw)": 1.501228928565979, "Pretrain/Step": 6072, "Pretrain/Step Time": 8.51392044313252} +{"Pretrain/Learning Rate": 3.986343090628143e-05, "Pretrain/Loss": 2.080573558807373, "Pretrain/Loss (Raw)": 1.7504781484603882, "Pretrain/Step": 6073, "Pretrain/Step Time": 8.510834388434887} +{"Pretrain/Learning Rate": 3.986001728953387e-05, "Pretrain/Loss": 2.0781288146972656, "Pretrain/Loss (Raw)": 2.0284383296966553, "Pretrain/Step": 6074, "Pretrain/Step Time": 8.514853673055768} +{"Pretrain/Learning Rate": 3.985660324430819e-05, "Pretrain/Loss": 2.0786924362182617, "Pretrain/Loss (Raw)": 2.048020124435425, "Pretrain/Step": 6075, "Pretrain/Step Time": 8.519135234877467} +{"Pretrain/Learning Rate": 3.985318877070283e-05, "Pretrain/Loss": 2.0768070220947266, "Pretrain/Loss (Raw)": 1.9170427322387695, "Pretrain/Step": 6076, "Pretrain/Step Time": 8.51200120896101} +{"Pretrain/Learning Rate": 3.984977386881624e-05, "Pretrain/Loss": 2.0762720108032227, "Pretrain/Loss (Raw)": 2.00301456451416, "Pretrain/Step": 6077, "Pretrain/Step Time": 8.514363566413522} +{"Pretrain/Learning Rate": 3.98463585387469e-05, "Pretrain/Loss": 2.0780467987060547, "Pretrain/Loss (Raw)": 2.091761350631714, "Pretrain/Step": 6078, "Pretrain/Step Time": 8.509668830782175} +{"Pretrain/Learning Rate": 3.984294278059326e-05, "Pretrain/Loss": 2.0779199600219727, "Pretrain/Loss (Raw)": 1.9866067171096802, "Pretrain/Step": 6079, "Pretrain/Step Time": 8.510267108678818} +{"Pretrain/Learning Rate": 3.983952659445385e-05, "Pretrain/Loss": 2.078960657119751, "Pretrain/Loss (Raw)": 2.197784185409546, "Pretrain/Step": 6080, "Pretrain/Step Time": 8.508387941867113} +{"Pretrain/Learning Rate": 3.983610998042713e-05, "Pretrain/Loss": 2.0781147480010986, "Pretrain/Loss (Raw)": 2.0787484645843506, "Pretrain/Step": 6081, "Pretrain/Step Time": 8.507273148745298} +{"Pretrain/Learning Rate": 3.983269293861165e-05, "Pretrain/Loss": 2.078963279724121, "Pretrain/Loss (Raw)": 2.2312428951263428, "Pretrain/Step": 6082, "Pretrain/Step Time": 8.505308821797371} +{"Pretrain/Learning Rate": 3.982927546910592e-05, "Pretrain/Loss": 2.0793251991271973, "Pretrain/Loss (Raw)": 2.0096123218536377, "Pretrain/Step": 6083, "Pretrain/Step Time": 8.510303802788258} +{"Pretrain/Learning Rate": 3.982585757200849e-05, "Pretrain/Loss": 2.0835537910461426, "Pretrain/Loss (Raw)": 2.301583766937256, "Pretrain/Step": 6084, "Pretrain/Step Time": 8.505255728960037} +{"Pretrain/Learning Rate": 3.982243924741791e-05, "Pretrain/Loss": 2.0874950885772705, "Pretrain/Loss (Raw)": 1.9385477304458618, "Pretrain/Step": 6085, "Pretrain/Step Time": 8.503832848742604} +{"Pretrain/Learning Rate": 3.9819020495432736e-05, "Pretrain/Loss": 2.0867815017700195, "Pretrain/Loss (Raw)": 1.9871675968170166, "Pretrain/Step": 6086, "Pretrain/Step Time": 8.5029504802078} +{"Pretrain/Learning Rate": 3.981560131615156e-05, "Pretrain/Loss": 2.087545871734619, "Pretrain/Loss (Raw)": 2.1738791465759277, "Pretrain/Step": 6087, "Pretrain/Step Time": 8.502406615763903} +{"Pretrain/Learning Rate": 3.9812181709672954e-05, "Pretrain/Loss": 2.0855722427368164, "Pretrain/Loss (Raw)": 1.6635525226593018, "Pretrain/Step": 6088, "Pretrain/Step Time": 8.505901258438826} +{"Pretrain/Learning Rate": 3.980876167609554e-05, "Pretrain/Loss": 2.0852699279785156, "Pretrain/Loss (Raw)": 2.2047231197357178, "Pretrain/Step": 6089, "Pretrain/Step Time": 8.505183083936572} +{"Pretrain/Learning Rate": 3.980534121551792e-05, "Pretrain/Loss": 2.0827348232269287, "Pretrain/Loss (Raw)": 2.0304830074310303, "Pretrain/Step": 6090, "Pretrain/Step Time": 8.503706987947226} +{"Pretrain/Learning Rate": 3.980192032803872e-05, "Pretrain/Loss": 2.085141658782959, "Pretrain/Loss (Raw)": 2.2737338542938232, "Pretrain/Step": 6091, "Pretrain/Step Time": 8.506278865039349} +{"Pretrain/Learning Rate": 3.979849901375659e-05, "Pretrain/Loss": 2.0826659202575684, "Pretrain/Loss (Raw)": 1.9807395935058594, "Pretrain/Step": 6092, "Pretrain/Step Time": 8.506504192948341} +{"Pretrain/Learning Rate": 3.979507727277017e-05, "Pretrain/Loss": 2.084014892578125, "Pretrain/Loss (Raw)": 2.079447031021118, "Pretrain/Step": 6093, "Pretrain/Step Time": 8.506283117458224} +{"Pretrain/Learning Rate": 3.9791655105178125e-05, "Pretrain/Loss": 2.082963466644287, "Pretrain/Loss (Raw)": 2.045506715774536, "Pretrain/Step": 6094, "Pretrain/Step Time": 8.503059662878513} +{"Pretrain/Learning Rate": 3.978823251107913e-05, "Pretrain/Loss": 2.080061912536621, "Pretrain/Loss (Raw)": 1.9894108772277832, "Pretrain/Step": 6095, "Pretrain/Step Time": 8.507441848516464} +{"Pretrain/Learning Rate": 3.978480949057188e-05, "Pretrain/Loss": 2.0782055854797363, "Pretrain/Loss (Raw)": 1.9809929132461548, "Pretrain/Step": 6096, "Pretrain/Step Time": 8.499409945681691} +{"Pretrain/Learning Rate": 3.9781386043755066e-05, "Pretrain/Loss": 2.077678918838501, "Pretrain/Loss (Raw)": 2.1630160808563232, "Pretrain/Step": 6097, "Pretrain/Step Time": 8.503258857876062} +{"Pretrain/Learning Rate": 3.977796217072741e-05, "Pretrain/Loss": 2.0772342681884766, "Pretrain/Loss (Raw)": 2.0503475666046143, "Pretrain/Step": 6098, "Pretrain/Step Time": 8.501856608316302} +{"Pretrain/Learning Rate": 3.977453787158763e-05, "Pretrain/Loss": 2.077683210372925, "Pretrain/Loss (Raw)": 2.0541419982910156, "Pretrain/Step": 6099, "Pretrain/Step Time": 8.503944415599108} +{"Pretrain/Learning Rate": 3.977111314643447e-05, "Pretrain/Loss": 2.0760676860809326, "Pretrain/Loss (Raw)": 2.043700695037842, "Pretrain/Step": 6100, "Pretrain/Step Time": 8.497789097949862} +{"Pretrain/Learning Rate": 3.976768799536667e-05, "Pretrain/Loss": 2.0756850242614746, "Pretrain/Loss (Raw)": 2.0866849422454834, "Pretrain/Step": 6101, "Pretrain/Step Time": 8.498067950829864} +{"Pretrain/Learning Rate": 3.9764262418483e-05, "Pretrain/Loss": 2.0761818885803223, "Pretrain/Loss (Raw)": 2.0346219539642334, "Pretrain/Step": 6102, "Pretrain/Step Time": 8.49950803257525} +{"Pretrain/Learning Rate": 3.976083641588223e-05, "Pretrain/Loss": 2.077180862426758, "Pretrain/Loss (Raw)": 2.1836462020874023, "Pretrain/Step": 6103, "Pretrain/Step Time": 8.499063346534967} +{"Pretrain/Learning Rate": 3.9757409987663155e-05, "Pretrain/Loss": 2.075870990753174, "Pretrain/Loss (Raw)": 1.9687215089797974, "Pretrain/Step": 6104, "Pretrain/Step Time": 8.505547123029828} +{"Pretrain/Learning Rate": 3.9753983133924555e-05, "Pretrain/Loss": 2.0772576332092285, "Pretrain/Loss (Raw)": 2.086972713470459, "Pretrain/Step": 6105, "Pretrain/Step Time": 8.503692474216223} +{"Pretrain/Learning Rate": 3.9750555854765256e-05, "Pretrain/Loss": 2.0743255615234375, "Pretrain/Loss (Raw)": 1.9500713348388672, "Pretrain/Step": 6106, "Pretrain/Step Time": 8.50537215732038} +{"Pretrain/Learning Rate": 3.974712815028408e-05, "Pretrain/Loss": 2.0719149112701416, "Pretrain/Loss (Raw)": 1.7325307130813599, "Pretrain/Step": 6107, "Pretrain/Step Time": 8.508640438318253} +{"Pretrain/Learning Rate": 3.974370002057986e-05, "Pretrain/Loss": 2.073974132537842, "Pretrain/Loss (Raw)": 2.1062183380126953, "Pretrain/Step": 6108, "Pretrain/Step Time": 8.511616514995694} +{"Pretrain/Learning Rate": 3.9740271465751444e-05, "Pretrain/Loss": 2.0746264457702637, "Pretrain/Loss (Raw)": 2.120891809463501, "Pretrain/Step": 6109, "Pretrain/Step Time": 8.509620847180486} +{"Pretrain/Learning Rate": 3.973684248589768e-05, "Pretrain/Loss": 2.0740678310394287, "Pretrain/Loss (Raw)": 1.9530147314071655, "Pretrain/Step": 6110, "Pretrain/Step Time": 8.513840528205037} +{"Pretrain/Learning Rate": 3.973341308111746e-05, "Pretrain/Loss": 2.07611346244812, "Pretrain/Loss (Raw)": 2.1444170475006104, "Pretrain/Step": 6111, "Pretrain/Step Time": 8.506001152098179} +{"Pretrain/Learning Rate": 3.972998325150967e-05, "Pretrain/Loss": 2.0760138034820557, "Pretrain/Loss (Raw)": 1.9823237657546997, "Pretrain/Step": 6112, "Pretrain/Step Time": 8.502168951556087} +{"Pretrain/Learning Rate": 3.9726552997173185e-05, "Pretrain/Loss": 2.0749635696411133, "Pretrain/Loss (Raw)": 1.9807848930358887, "Pretrain/Step": 6113, "Pretrain/Step Time": 8.50097823701799} +{"Pretrain/Learning Rate": 3.972312231820693e-05, "Pretrain/Loss": 2.0747551918029785, "Pretrain/Loss (Raw)": 1.9319292306900024, "Pretrain/Step": 6114, "Pretrain/Step Time": 8.504063941538334} +{"Pretrain/Learning Rate": 3.971969121470982e-05, "Pretrain/Loss": 2.072659492492676, "Pretrain/Loss (Raw)": 1.8707729578018188, "Pretrain/Step": 6115, "Pretrain/Step Time": 8.501441767439246} +{"Pretrain/Learning Rate": 3.971625968678079e-05, "Pretrain/Loss": 2.0734705924987793, "Pretrain/Loss (Raw)": 2.116088390350342, "Pretrain/Step": 6116, "Pretrain/Step Time": 8.498121902346611} +{"Pretrain/Learning Rate": 3.9712827734518794e-05, "Pretrain/Loss": 2.0722005367279053, "Pretrain/Loss (Raw)": 1.9622173309326172, "Pretrain/Step": 6117, "Pretrain/Step Time": 8.50067824870348} +{"Pretrain/Learning Rate": 3.970939535802277e-05, "Pretrain/Loss": 2.066911220550537, "Pretrain/Loss (Raw)": 2.1814827919006348, "Pretrain/Step": 6118, "Pretrain/Step Time": 8.501614734530449} +{"Pretrain/Learning Rate": 3.970596255739171e-05, "Pretrain/Loss": 2.0623414516448975, "Pretrain/Loss (Raw)": 1.4756754636764526, "Pretrain/Step": 6119, "Pretrain/Step Time": 8.502681739628315} +{"Pretrain/Learning Rate": 3.970252933272458e-05, "Pretrain/Loss": 2.0603151321411133, "Pretrain/Loss (Raw)": 2.0408098697662354, "Pretrain/Step": 6120, "Pretrain/Step Time": 8.508434964343905} +{"Pretrain/Learning Rate": 3.9699095684120384e-05, "Pretrain/Loss": 2.0568244457244873, "Pretrain/Loss (Raw)": 1.8328087329864502, "Pretrain/Step": 6121, "Pretrain/Step Time": 8.508763829246163} +{"Pretrain/Learning Rate": 3.969566161167813e-05, "Pretrain/Loss": 2.058845043182373, "Pretrain/Loss (Raw)": 2.0955350399017334, "Pretrain/Step": 6122, "Pretrain/Step Time": 8.508010698482394} +{"Pretrain/Learning Rate": 3.9692227115496825e-05, "Pretrain/Loss": 2.0576417446136475, "Pretrain/Loss (Raw)": 1.9994465112686157, "Pretrain/Step": 6123, "Pretrain/Step Time": 8.502997459843755} +{"Pretrain/Learning Rate": 3.968879219567552e-05, "Pretrain/Loss": 2.0579071044921875, "Pretrain/Loss (Raw)": 2.0941050052642822, "Pretrain/Step": 6124, "Pretrain/Step Time": 8.507257286459208} +{"Pretrain/Learning Rate": 3.968535685231324e-05, "Pretrain/Loss": 2.0567758083343506, "Pretrain/Loss (Raw)": 1.9437562227249146, "Pretrain/Step": 6125, "Pretrain/Step Time": 8.512454506009817} +{"Pretrain/Learning Rate": 3.968192108550904e-05, "Pretrain/Loss": 2.0521302223205566, "Pretrain/Loss (Raw)": 1.8978897333145142, "Pretrain/Step": 6126, "Pretrain/Step Time": 8.511120546609163} +{"Pretrain/Learning Rate": 3.9678484895362e-05, "Pretrain/Loss": 2.05059814453125, "Pretrain/Loss (Raw)": 1.9772874116897583, "Pretrain/Step": 6127, "Pretrain/Step Time": 8.512833880260587} +{"Pretrain/Learning Rate": 3.9675048281971203e-05, "Pretrain/Loss": 2.0513992309570312, "Pretrain/Loss (Raw)": 2.040677309036255, "Pretrain/Step": 6128, "Pretrain/Step Time": 8.509359823539853} +{"Pretrain/Learning Rate": 3.967161124543573e-05, "Pretrain/Loss": 2.0518455505371094, "Pretrain/Loss (Raw)": 2.047616720199585, "Pretrain/Step": 6129, "Pretrain/Step Time": 8.508595017716289} +{"Pretrain/Learning Rate": 3.966817378585469e-05, "Pretrain/Loss": 2.051879405975342, "Pretrain/Loss (Raw)": 2.1702656745910645, "Pretrain/Step": 6130, "Pretrain/Step Time": 8.506444364786148} +{"Pretrain/Learning Rate": 3.96647359033272e-05, "Pretrain/Loss": 2.0515053272247314, "Pretrain/Loss (Raw)": 1.929054617881775, "Pretrain/Step": 6131, "Pretrain/Step Time": 8.505955245345831} +{"Pretrain/Learning Rate": 3.966129759795238e-05, "Pretrain/Loss": 2.0524580478668213, "Pretrain/Loss (Raw)": 2.0657973289489746, "Pretrain/Step": 6132, "Pretrain/Step Time": 8.507659619674087} +{"Pretrain/Learning Rate": 3.965785886982939e-05, "Pretrain/Loss": 2.051485300064087, "Pretrain/Loss (Raw)": 2.09881854057312, "Pretrain/Step": 6133, "Pretrain/Step Time": 8.505206754431129} +{"Pretrain/Learning Rate": 3.9654419719057365e-05, "Pretrain/Loss": 2.0500640869140625, "Pretrain/Loss (Raw)": 1.9920107126235962, "Pretrain/Step": 6134, "Pretrain/Step Time": 8.505507567897439} +{"Pretrain/Learning Rate": 3.9650980145735484e-05, "Pretrain/Loss": 2.050718069076538, "Pretrain/Loss (Raw)": 2.0831661224365234, "Pretrain/Step": 6135, "Pretrain/Step Time": 8.505892289802432} +{"Pretrain/Learning Rate": 3.964754014996292e-05, "Pretrain/Loss": 2.050616502761841, "Pretrain/Loss (Raw)": 2.109224796295166, "Pretrain/Step": 6136, "Pretrain/Step Time": 8.50375691615045} +{"Pretrain/Learning Rate": 3.964409973183886e-05, "Pretrain/Loss": 2.053849697113037, "Pretrain/Loss (Raw)": 2.1118099689483643, "Pretrain/Step": 6137, "Pretrain/Step Time": 8.507741559296846} +{"Pretrain/Learning Rate": 3.96406588914625e-05, "Pretrain/Loss": 2.0520505905151367, "Pretrain/Loss (Raw)": 1.9277737140655518, "Pretrain/Step": 6138, "Pretrain/Step Time": 8.508835030719638} +{"Pretrain/Learning Rate": 3.963721762893307e-05, "Pretrain/Loss": 2.053938150405884, "Pretrain/Loss (Raw)": 2.1795125007629395, "Pretrain/Step": 6139, "Pretrain/Step Time": 8.511063052341342} +{"Pretrain/Learning Rate": 3.963377594434978e-05, "Pretrain/Loss": 2.0532493591308594, "Pretrain/Loss (Raw)": 2.0260581970214844, "Pretrain/Step": 6140, "Pretrain/Step Time": 8.509919852018356} +{"Pretrain/Learning Rate": 3.963033383781189e-05, "Pretrain/Loss": 2.057223081588745, "Pretrain/Loss (Raw)": 2.663834810256958, "Pretrain/Step": 6141, "Pretrain/Step Time": 8.511824386194348} +{"Pretrain/Learning Rate": 3.962689130941863e-05, "Pretrain/Loss": 2.0554747581481934, "Pretrain/Loss (Raw)": 2.065964937210083, "Pretrain/Step": 6142, "Pretrain/Step Time": 8.50895743072033} +{"Pretrain/Learning Rate": 3.9623448359269264e-05, "Pretrain/Loss": 2.056715488433838, "Pretrain/Loss (Raw)": 2.2902865409851074, "Pretrain/Step": 6143, "Pretrain/Step Time": 8.511012328788638} +{"Pretrain/Learning Rate": 3.962000498746309e-05, "Pretrain/Loss": 2.057579755783081, "Pretrain/Loss (Raw)": 2.2000882625579834, "Pretrain/Step": 6144, "Pretrain/Step Time": 8.511493461206555} +{"Pretrain/Learning Rate": 3.9616561194099365e-05, "Pretrain/Loss": 2.058332681655884, "Pretrain/Loss (Raw)": 2.0798277854919434, "Pretrain/Step": 6145, "Pretrain/Step Time": 8.513635093346238} +{"Pretrain/Learning Rate": 3.961311697927741e-05, "Pretrain/Loss": 2.0584373474121094, "Pretrain/Loss (Raw)": 1.9871641397476196, "Pretrain/Step": 6146, "Pretrain/Step Time": 8.51347829401493} +{"Pretrain/Learning Rate": 3.960967234309652e-05, "Pretrain/Loss": 2.0575571060180664, "Pretrain/Loss (Raw)": 1.9876539707183838, "Pretrain/Step": 6147, "Pretrain/Step Time": 8.510071989148855} +{"Pretrain/Learning Rate": 3.9606227285656035e-05, "Pretrain/Loss": 2.058544635772705, "Pretrain/Loss (Raw)": 2.131645441055298, "Pretrain/Step": 6148, "Pretrain/Step Time": 8.505745202302933} +{"Pretrain/Learning Rate": 3.960278180705528e-05, "Pretrain/Loss": 2.0604798793792725, "Pretrain/Loss (Raw)": 2.5677356719970703, "Pretrain/Step": 6149, "Pretrain/Step Time": 8.510125571861863} +{"Pretrain/Learning Rate": 3.95993359073936e-05, "Pretrain/Loss": 2.061253309249878, "Pretrain/Loss (Raw)": 2.0479021072387695, "Pretrain/Step": 6150, "Pretrain/Step Time": 8.50423095561564} +{"Pretrain/Learning Rate": 3.959588958677036e-05, "Pretrain/Loss": 2.062612295150757, "Pretrain/Loss (Raw)": 2.1998820304870605, "Pretrain/Step": 6151, "Pretrain/Step Time": 8.499722376465797} +{"Pretrain/Learning Rate": 3.959244284528495e-05, "Pretrain/Loss": 2.063541889190674, "Pretrain/Loss (Raw)": 2.0944392681121826, "Pretrain/Step": 6152, "Pretrain/Step Time": 8.501914031803608} +{"Pretrain/Learning Rate": 3.958899568303672e-05, "Pretrain/Loss": 2.0616135597229004, "Pretrain/Loss (Raw)": 1.9158782958984375, "Pretrain/Step": 6153, "Pretrain/Step Time": 8.507194543257356} +{"Pretrain/Learning Rate": 3.958554810012509e-05, "Pretrain/Loss": 2.058734893798828, "Pretrain/Loss (Raw)": 1.8837748765945435, "Pretrain/Step": 6154, "Pretrain/Step Time": 8.509091032668948} +{"Pretrain/Learning Rate": 3.958210009664946e-05, "Pretrain/Loss": 2.0593042373657227, "Pretrain/Loss (Raw)": 2.0630204677581787, "Pretrain/Step": 6155, "Pretrain/Step Time": 8.506644655019045} +{"Pretrain/Learning Rate": 3.9578651672709264e-05, "Pretrain/Loss": 2.060127019882202, "Pretrain/Loss (Raw)": 2.0670487880706787, "Pretrain/Step": 6156, "Pretrain/Step Time": 8.506259262561798} +{"Pretrain/Learning Rate": 3.957520282840392e-05, "Pretrain/Loss": 2.0600149631500244, "Pretrain/Loss (Raw)": 1.9545360803604126, "Pretrain/Step": 6157, "Pretrain/Step Time": 8.510317040607333} +{"Pretrain/Learning Rate": 3.957175356383287e-05, "Pretrain/Loss": 2.0579190254211426, "Pretrain/Loss (Raw)": 1.9319088459014893, "Pretrain/Step": 6158, "Pretrain/Step Time": 8.509042797610164} +{"Pretrain/Learning Rate": 3.9568303879095584e-05, "Pretrain/Loss": 2.0578677654266357, "Pretrain/Loss (Raw)": 2.119502067565918, "Pretrain/Step": 6159, "Pretrain/Step Time": 8.513727739453316} +{"Pretrain/Learning Rate": 3.956485377429152e-05, "Pretrain/Loss": 2.058352470397949, "Pretrain/Loss (Raw)": 2.148799419403076, "Pretrain/Step": 6160, "Pretrain/Step Time": 8.510138850659132} +{"Pretrain/Learning Rate": 3.956140324952017e-05, "Pretrain/Loss": 2.0582191944122314, "Pretrain/Loss (Raw)": 2.00557017326355, "Pretrain/Step": 6161, "Pretrain/Step Time": 8.510070310905576} +{"Pretrain/Learning Rate": 3.9557952304881024e-05, "Pretrain/Loss": 2.0542001724243164, "Pretrain/Loss (Raw)": 1.924041509628296, "Pretrain/Step": 6162, "Pretrain/Step Time": 8.513542292639613} +{"Pretrain/Learning Rate": 3.9554500940473586e-05, "Pretrain/Loss": 2.053884267807007, "Pretrain/Loss (Raw)": 1.9794095754623413, "Pretrain/Step": 6163, "Pretrain/Step Time": 8.513537159189582} +{"Pretrain/Learning Rate": 3.955104915639737e-05, "Pretrain/Loss": 2.050563097000122, "Pretrain/Loss (Raw)": 1.9042181968688965, "Pretrain/Step": 6164, "Pretrain/Step Time": 8.511415122076869} +{"Pretrain/Learning Rate": 3.954759695275191e-05, "Pretrain/Loss": 2.049574136734009, "Pretrain/Loss (Raw)": 2.0679619312286377, "Pretrain/Step": 6165, "Pretrain/Step Time": 8.507778506726027} +{"Pretrain/Learning Rate": 3.954414432963674e-05, "Pretrain/Loss": 2.050353765487671, "Pretrain/Loss (Raw)": 2.047938823699951, "Pretrain/Step": 6166, "Pretrain/Step Time": 8.511524222791195} +{"Pretrain/Learning Rate": 3.954069128715144e-05, "Pretrain/Loss": 2.0499985218048096, "Pretrain/Loss (Raw)": 2.1305153369903564, "Pretrain/Step": 6167, "Pretrain/Step Time": 8.510503444820642} +{"Pretrain/Learning Rate": 3.9537237825395544e-05, "Pretrain/Loss": 2.0506887435913086, "Pretrain/Loss (Raw)": 2.1879992485046387, "Pretrain/Step": 6168, "Pretrain/Step Time": 8.513404179364443} +{"Pretrain/Learning Rate": 3.953378394446864e-05, "Pretrain/Loss": 2.049283981323242, "Pretrain/Loss (Raw)": 1.8447636365890503, "Pretrain/Step": 6169, "Pretrain/Step Time": 8.512797646224499} +{"Pretrain/Learning Rate": 3.953032964447033e-05, "Pretrain/Loss": 2.0490775108337402, "Pretrain/Loss (Raw)": 2.2459588050842285, "Pretrain/Step": 6170, "Pretrain/Step Time": 8.51608643680811} +{"Pretrain/Learning Rate": 3.952687492550021e-05, "Pretrain/Loss": 2.0505964756011963, "Pretrain/Loss (Raw)": 2.123608350753784, "Pretrain/Step": 6171, "Pretrain/Step Time": 8.512227788567543} +{"Pretrain/Learning Rate": 3.952341978765788e-05, "Pretrain/Loss": 2.0523219108581543, "Pretrain/Loss (Raw)": 2.2480177879333496, "Pretrain/Step": 6172, "Pretrain/Step Time": 8.508023969829082} +{"Pretrain/Learning Rate": 3.951996423104299e-05, "Pretrain/Loss": 2.0523416996002197, "Pretrain/Loss (Raw)": 2.1408371925354004, "Pretrain/Step": 6173, "Pretrain/Step Time": 8.515141613781452} +{"Pretrain/Learning Rate": 3.951650825575516e-05, "Pretrain/Loss": 2.0543766021728516, "Pretrain/Loss (Raw)": 2.0934536457061768, "Pretrain/Step": 6174, "Pretrain/Step Time": 8.510687913745642} +{"Pretrain/Learning Rate": 3.951305186189406e-05, "Pretrain/Loss": 2.05470609664917, "Pretrain/Loss (Raw)": 2.061798572540283, "Pretrain/Step": 6175, "Pretrain/Step Time": 8.510194260627031} +{"Pretrain/Learning Rate": 3.950959504955933e-05, "Pretrain/Loss": 2.051736354827881, "Pretrain/Loss (Raw)": 2.1359102725982666, "Pretrain/Step": 6176, "Pretrain/Step Time": 8.509751487523317} +{"Pretrain/Learning Rate": 3.9506137818850656e-05, "Pretrain/Loss": 2.0527400970458984, "Pretrain/Loss (Raw)": 2.0723772048950195, "Pretrain/Step": 6177, "Pretrain/Step Time": 8.50674294307828} +{"Pretrain/Learning Rate": 3.950268016986772e-05, "Pretrain/Loss": 2.0497958660125732, "Pretrain/Loss (Raw)": 1.8725380897521973, "Pretrain/Step": 6178, "Pretrain/Step Time": 8.50631164945662} +{"Pretrain/Learning Rate": 3.9499222102710236e-05, "Pretrain/Loss": 2.0506703853607178, "Pretrain/Loss (Raw)": 2.017564058303833, "Pretrain/Step": 6179, "Pretrain/Step Time": 8.504276731982827} +{"Pretrain/Learning Rate": 3.94957636174779e-05, "Pretrain/Loss": 2.05198335647583, "Pretrain/Loss (Raw)": 2.0669376850128174, "Pretrain/Step": 6180, "Pretrain/Step Time": 8.504052218049765} +{"Pretrain/Learning Rate": 3.949230471427043e-05, "Pretrain/Loss": 2.054091453552246, "Pretrain/Loss (Raw)": 2.262716054916382, "Pretrain/Step": 6181, "Pretrain/Step Time": 8.505563393235207} +{"Pretrain/Learning Rate": 3.948884539318758e-05, "Pretrain/Loss": 2.0514230728149414, "Pretrain/Loss (Raw)": 1.7371068000793457, "Pretrain/Step": 6182, "Pretrain/Step Time": 8.507442900910974} +{"Pretrain/Learning Rate": 3.948538565432909e-05, "Pretrain/Loss": 2.0474119186401367, "Pretrain/Loss (Raw)": 1.9136877059936523, "Pretrain/Step": 6183, "Pretrain/Step Time": 8.509566467255354} +{"Pretrain/Learning Rate": 3.948192549779471e-05, "Pretrain/Loss": 2.0499649047851562, "Pretrain/Loss (Raw)": 2.1736464500427246, "Pretrain/Step": 6184, "Pretrain/Step Time": 8.505696460604668} +{"Pretrain/Learning Rate": 3.9478464923684225e-05, "Pretrain/Loss": 2.0497701168060303, "Pretrain/Loss (Raw)": 2.03324031829834, "Pretrain/Step": 6185, "Pretrain/Step Time": 8.50666382536292} +{"Pretrain/Learning Rate": 3.9475003932097395e-05, "Pretrain/Loss": 2.0525474548339844, "Pretrain/Loss (Raw)": 2.1557910442352295, "Pretrain/Step": 6186, "Pretrain/Step Time": 8.506695101037621} +{"Pretrain/Learning Rate": 3.9471542523134045e-05, "Pretrain/Loss": 2.056008815765381, "Pretrain/Loss (Raw)": 2.4421095848083496, "Pretrain/Step": 6187, "Pretrain/Step Time": 8.508685635402799} +{"Pretrain/Learning Rate": 3.946808069689396e-05, "Pretrain/Loss": 2.0575242042541504, "Pretrain/Loss (Raw)": 2.1389739513397217, "Pretrain/Step": 6188, "Pretrain/Step Time": 8.505579926073551} +{"Pretrain/Learning Rate": 3.9464618453476975e-05, "Pretrain/Loss": 2.0545594692230225, "Pretrain/Loss (Raw)": 1.9072730541229248, "Pretrain/Step": 6189, "Pretrain/Step Time": 8.50590269640088} +{"Pretrain/Learning Rate": 3.9461155792982905e-05, "Pretrain/Loss": 2.0543923377990723, "Pretrain/Loss (Raw)": 2.2209436893463135, "Pretrain/Step": 6190, "Pretrain/Step Time": 8.511406490579247} +{"Pretrain/Learning Rate": 3.9457692715511605e-05, "Pretrain/Loss": 2.051907777786255, "Pretrain/Loss (Raw)": 2.021467447280884, "Pretrain/Step": 6191, "Pretrain/Step Time": 8.50628737732768} +{"Pretrain/Learning Rate": 3.945422922116293e-05, "Pretrain/Loss": 2.0500712394714355, "Pretrain/Loss (Raw)": 1.8977341651916504, "Pretrain/Step": 6192, "Pretrain/Step Time": 8.512802323326468} +{"Pretrain/Learning Rate": 3.945076531003674e-05, "Pretrain/Loss": 2.048752784729004, "Pretrain/Loss (Raw)": 1.9529551267623901, "Pretrain/Step": 6193, "Pretrain/Step Time": 8.507728641852736} +{"Pretrain/Learning Rate": 3.944730098223293e-05, "Pretrain/Loss": 2.0498809814453125, "Pretrain/Loss (Raw)": 2.179844856262207, "Pretrain/Step": 6194, "Pretrain/Step Time": 8.506474159657955} +{"Pretrain/Learning Rate": 3.944383623785137e-05, "Pretrain/Loss": 2.0512564182281494, "Pretrain/Loss (Raw)": 2.1276559829711914, "Pretrain/Step": 6195, "Pretrain/Step Time": 8.510413071140647} +{"Pretrain/Learning Rate": 3.944037107699198e-05, "Pretrain/Loss": 2.050861358642578, "Pretrain/Loss (Raw)": 1.9469910860061646, "Pretrain/Step": 6196, "Pretrain/Step Time": 8.507049048319459} +{"Pretrain/Learning Rate": 3.9436905499754666e-05, "Pretrain/Loss": 2.0501718521118164, "Pretrain/Loss (Raw)": 1.9846036434173584, "Pretrain/Step": 6197, "Pretrain/Step Time": 8.505240527912974} +{"Pretrain/Learning Rate": 3.943343950623936e-05, "Pretrain/Loss": 2.0472640991210938, "Pretrain/Loss (Raw)": 2.0203258991241455, "Pretrain/Step": 6198, "Pretrain/Step Time": 8.498568935319781} +{"Pretrain/Learning Rate": 3.9429973096546e-05, "Pretrain/Loss": 2.048004627227783, "Pretrain/Loss (Raw)": 2.117790699005127, "Pretrain/Step": 6199, "Pretrain/Step Time": 8.503058096393943} +{"Pretrain/Learning Rate": 3.942650627077454e-05, "Pretrain/Loss": 2.052048683166504, "Pretrain/Loss (Raw)": 2.0188722610473633, "Pretrain/Step": 6200, "Pretrain/Step Time": 8.49375942721963} +{"Pretrain/Learning Rate": 3.9423039029024944e-05, "Pretrain/Loss": 2.053985595703125, "Pretrain/Loss (Raw)": 1.9983724355697632, "Pretrain/Step": 6201, "Pretrain/Step Time": 8.497530553489923} +{"Pretrain/Learning Rate": 3.9419571371397186e-05, "Pretrain/Loss": 2.0548999309539795, "Pretrain/Loss (Raw)": 2.1454825401306152, "Pretrain/Step": 6202, "Pretrain/Step Time": 8.50146048516035} +{"Pretrain/Learning Rate": 3.9416103297991244e-05, "Pretrain/Loss": 2.053083896636963, "Pretrain/Loss (Raw)": 1.815575361251831, "Pretrain/Step": 6203, "Pretrain/Step Time": 8.499967304989696} +{"Pretrain/Learning Rate": 3.9412634808907136e-05, "Pretrain/Loss": 2.05393648147583, "Pretrain/Loss (Raw)": 2.026153564453125, "Pretrain/Step": 6204, "Pretrain/Step Time": 8.501042906194925} +{"Pretrain/Learning Rate": 3.940916590424486e-05, "Pretrain/Loss": 2.056722640991211, "Pretrain/Loss (Raw)": 2.359670877456665, "Pretrain/Step": 6205, "Pretrain/Step Time": 8.50038093701005} +{"Pretrain/Learning Rate": 3.940569658410444e-05, "Pretrain/Loss": 2.054755926132202, "Pretrain/Loss (Raw)": 1.8399920463562012, "Pretrain/Step": 6206, "Pretrain/Step Time": 8.503516174852848} +{"Pretrain/Learning Rate": 3.940222684858592e-05, "Pretrain/Loss": 2.05489182472229, "Pretrain/Loss (Raw)": 2.0040297508239746, "Pretrain/Step": 6207, "Pretrain/Step Time": 8.504178911447525} +{"Pretrain/Learning Rate": 3.939875669778933e-05, "Pretrain/Loss": 2.054269313812256, "Pretrain/Loss (Raw)": 2.118108034133911, "Pretrain/Step": 6208, "Pretrain/Step Time": 8.507060335949063} +{"Pretrain/Learning Rate": 3.939528613181476e-05, "Pretrain/Loss": 2.0511622428894043, "Pretrain/Loss (Raw)": 1.6810222864151, "Pretrain/Step": 6209, "Pretrain/Step Time": 8.506372166797519} +{"Pretrain/Learning Rate": 3.939181515076225e-05, "Pretrain/Loss": 2.0497331619262695, "Pretrain/Loss (Raw)": 2.048335075378418, "Pretrain/Step": 6210, "Pretrain/Step Time": 8.505548002198339} +{"Pretrain/Learning Rate": 3.938834375473189e-05, "Pretrain/Loss": 2.053846836090088, "Pretrain/Loss (Raw)": 2.5361483097076416, "Pretrain/Step": 6211, "Pretrain/Step Time": 8.501834498718381} +{"Pretrain/Learning Rate": 3.938487194382379e-05, "Pretrain/Loss": 2.054257392883301, "Pretrain/Loss (Raw)": 2.3541157245635986, "Pretrain/Step": 6212, "Pretrain/Step Time": 8.499752646312118} +{"Pretrain/Learning Rate": 3.9381399718138046e-05, "Pretrain/Loss": 2.055755853652954, "Pretrain/Loss (Raw)": 2.130368947982788, "Pretrain/Step": 6213, "Pretrain/Step Time": 8.499051794409752} +{"Pretrain/Learning Rate": 3.937792707777478e-05, "Pretrain/Loss": 2.0561509132385254, "Pretrain/Loss (Raw)": 2.037705421447754, "Pretrain/Step": 6214, "Pretrain/Step Time": 8.49971835501492} +{"Pretrain/Learning Rate": 3.9374454022834126e-05, "Pretrain/Loss": 2.0575947761535645, "Pretrain/Loss (Raw)": 2.3587088584899902, "Pretrain/Step": 6215, "Pretrain/Step Time": 8.501736681908369} +{"Pretrain/Learning Rate": 3.937098055341621e-05, "Pretrain/Loss": 2.060725212097168, "Pretrain/Loss (Raw)": 2.064265727996826, "Pretrain/Step": 6216, "Pretrain/Step Time": 8.49138874001801} +{"Pretrain/Learning Rate": 3.936750666962122e-05, "Pretrain/Loss": 2.060974597930908, "Pretrain/Loss (Raw)": 2.236623764038086, "Pretrain/Step": 6217, "Pretrain/Step Time": 8.494254248216748} +{"Pretrain/Learning Rate": 3.9364032371549293e-05, "Pretrain/Loss": 2.0603549480438232, "Pretrain/Loss (Raw)": 1.951189637184143, "Pretrain/Step": 6218, "Pretrain/Step Time": 8.500225450843573} +{"Pretrain/Learning Rate": 3.9360557659300617e-05, "Pretrain/Loss": 2.05890154838562, "Pretrain/Loss (Raw)": 2.087712287902832, "Pretrain/Step": 6219, "Pretrain/Step Time": 8.50352367758751} +{"Pretrain/Learning Rate": 3.9357082532975384e-05, "Pretrain/Loss": 2.0533227920532227, "Pretrain/Loss (Raw)": 1.2666363716125488, "Pretrain/Step": 6220, "Pretrain/Step Time": 8.505719054490328} +{"Pretrain/Learning Rate": 3.935360699267381e-05, "Pretrain/Loss": 2.053694725036621, "Pretrain/Loss (Raw)": 2.1270530223846436, "Pretrain/Step": 6221, "Pretrain/Step Time": 8.505224041640759} +{"Pretrain/Learning Rate": 3.935013103849609e-05, "Pretrain/Loss": 2.0540270805358887, "Pretrain/Loss (Raw)": 2.08805513381958, "Pretrain/Step": 6222, "Pretrain/Step Time": 8.504748230800033} +{"Pretrain/Learning Rate": 3.9346654670542446e-05, "Pretrain/Loss": 2.055209159851074, "Pretrain/Loss (Raw)": 2.1407201290130615, "Pretrain/Step": 6223, "Pretrain/Step Time": 8.504110615700483} +{"Pretrain/Learning Rate": 3.934317788891314e-05, "Pretrain/Loss": 2.0571978092193604, "Pretrain/Loss (Raw)": 2.235539197921753, "Pretrain/Step": 6224, "Pretrain/Step Time": 8.506536712870002} +{"Pretrain/Learning Rate": 3.93397006937084e-05, "Pretrain/Loss": 2.0552756786346436, "Pretrain/Loss (Raw)": 1.9169795513153076, "Pretrain/Step": 6225, "Pretrain/Step Time": 8.503622956573963} +{"Pretrain/Learning Rate": 3.933622308502851e-05, "Pretrain/Loss": 2.0552735328674316, "Pretrain/Loss (Raw)": 2.0500919818878174, "Pretrain/Step": 6226, "Pretrain/Step Time": 8.50330532900989} +{"Pretrain/Learning Rate": 3.933274506297373e-05, "Pretrain/Loss": 2.0561885833740234, "Pretrain/Loss (Raw)": 2.171245813369751, "Pretrain/Step": 6227, "Pretrain/Step Time": 8.502828147262335} +{"Pretrain/Learning Rate": 3.9329266627644356e-05, "Pretrain/Loss": 2.0551576614379883, "Pretrain/Loss (Raw)": 1.911767840385437, "Pretrain/Step": 6228, "Pretrain/Step Time": 8.501717932522297} +{"Pretrain/Learning Rate": 3.9325787779140675e-05, "Pretrain/Loss": 2.0541582107543945, "Pretrain/Loss (Raw)": 1.9587208032608032, "Pretrain/Step": 6229, "Pretrain/Step Time": 8.5012979041785} +{"Pretrain/Learning Rate": 3.9322308517563006e-05, "Pretrain/Loss": 2.0547871589660645, "Pretrain/Loss (Raw)": 2.115114212036133, "Pretrain/Step": 6230, "Pretrain/Step Time": 8.49843555688858} +{"Pretrain/Learning Rate": 3.9318828843011665e-05, "Pretrain/Loss": 2.054790496826172, "Pretrain/Loss (Raw)": 2.1840832233428955, "Pretrain/Step": 6231, "Pretrain/Step Time": 8.499408988282084} +{"Pretrain/Learning Rate": 3.931534875558699e-05, "Pretrain/Loss": 2.05436372756958, "Pretrain/Loss (Raw)": 1.9140819311141968, "Pretrain/Step": 6232, "Pretrain/Step Time": 8.497282704338431} +{"Pretrain/Learning Rate": 3.9311868255389315e-05, "Pretrain/Loss": 2.054849624633789, "Pretrain/Loss (Raw)": 2.1491830348968506, "Pretrain/Step": 6233, "Pretrain/Step Time": 8.498057315126061} +{"Pretrain/Learning Rate": 3.9308387342519025e-05, "Pretrain/Loss": 2.0560905933380127, "Pretrain/Loss (Raw)": 2.1089227199554443, "Pretrain/Step": 6234, "Pretrain/Step Time": 8.497944502159953} +{"Pretrain/Learning Rate": 3.930490601707646e-05, "Pretrain/Loss": 2.056774854660034, "Pretrain/Loss (Raw)": 1.8201279640197754, "Pretrain/Step": 6235, "Pretrain/Step Time": 8.501305429264903} +{"Pretrain/Learning Rate": 3.9301424279162024e-05, "Pretrain/Loss": 2.0567617416381836, "Pretrain/Loss (Raw)": 2.1045315265655518, "Pretrain/Step": 6236, "Pretrain/Step Time": 8.502392433583736} +{"Pretrain/Learning Rate": 3.9297942128876094e-05, "Pretrain/Loss": 2.056839942932129, "Pretrain/Loss (Raw)": 2.1308984756469727, "Pretrain/Step": 6237, "Pretrain/Step Time": 8.50343700684607} +{"Pretrain/Learning Rate": 3.9294459566319075e-05, "Pretrain/Loss": 2.0570473670959473, "Pretrain/Loss (Raw)": 1.9795805215835571, "Pretrain/Step": 6238, "Pretrain/Step Time": 8.499614896252751} +{"Pretrain/Learning Rate": 3.929097659159141e-05, "Pretrain/Loss": 2.0535027980804443, "Pretrain/Loss (Raw)": 1.6906965970993042, "Pretrain/Step": 6239, "Pretrain/Step Time": 8.501152582466602} +{"Pretrain/Learning Rate": 3.928749320479349e-05, "Pretrain/Loss": 2.05263090133667, "Pretrain/Loss (Raw)": 1.8707165718078613, "Pretrain/Step": 6240, "Pretrain/Step Time": 8.507367998361588} +{"Pretrain/Learning Rate": 3.928400940602578e-05, "Pretrain/Loss": 2.0539443492889404, "Pretrain/Loss (Raw)": 2.148918867111206, "Pretrain/Step": 6241, "Pretrain/Step Time": 8.502875657752156} +{"Pretrain/Learning Rate": 3.928052519538874e-05, "Pretrain/Loss": 2.0527212619781494, "Pretrain/Loss (Raw)": 1.7753527164459229, "Pretrain/Step": 6242, "Pretrain/Step Time": 8.50477109104395} +{"Pretrain/Learning Rate": 3.9277040572982816e-05, "Pretrain/Loss": 2.0530881881713867, "Pretrain/Loss (Raw)": 1.9177377223968506, "Pretrain/Step": 6243, "Pretrain/Step Time": 8.50511560589075} +{"Pretrain/Learning Rate": 3.927355553890849e-05, "Pretrain/Loss": 2.051403284072876, "Pretrain/Loss (Raw)": 1.9004380702972412, "Pretrain/Step": 6244, "Pretrain/Step Time": 8.502870861440897} +{"Pretrain/Learning Rate": 3.9270070093266256e-05, "Pretrain/Loss": 2.0520143508911133, "Pretrain/Loss (Raw)": 2.0404279232025146, "Pretrain/Step": 6245, "Pretrain/Step Time": 8.50246879644692} +{"Pretrain/Learning Rate": 3.9266584236156605e-05, "Pretrain/Loss": 2.048336982727051, "Pretrain/Loss (Raw)": 1.710771918296814, "Pretrain/Step": 6246, "Pretrain/Step Time": 8.49730614386499} +{"Pretrain/Learning Rate": 3.9263097967680063e-05, "Pretrain/Loss": 2.0520987510681152, "Pretrain/Loss (Raw)": 1.9571785926818848, "Pretrain/Step": 6247, "Pretrain/Step Time": 8.497951965779066} +{"Pretrain/Learning Rate": 3.925961128793714e-05, "Pretrain/Loss": 2.05233097076416, "Pretrain/Loss (Raw)": 2.0705318450927734, "Pretrain/Step": 6248, "Pretrain/Step Time": 8.498660599812865} +{"Pretrain/Learning Rate": 3.925612419702838e-05, "Pretrain/Loss": 2.052309989929199, "Pretrain/Loss (Raw)": 1.830150842666626, "Pretrain/Step": 6249, "Pretrain/Step Time": 8.498556390404701} +{"Pretrain/Learning Rate": 3.925263669505432e-05, "Pretrain/Loss": 2.0541110038757324, "Pretrain/Loss (Raw)": 2.326036214828491, "Pretrain/Step": 6250, "Pretrain/Step Time": 8.497678756713867} +{"Pretrain/Learning Rate": 3.9249148782115544e-05, "Pretrain/Loss": 2.054749011993408, "Pretrain/Loss (Raw)": 2.0811238288879395, "Pretrain/Step": 6251, "Pretrain/Step Time": 8.504133244976401} +{"Pretrain/Learning Rate": 3.9245660458312594e-05, "Pretrain/Loss": 2.0551538467407227, "Pretrain/Loss (Raw)": 2.1459169387817383, "Pretrain/Step": 6252, "Pretrain/Step Time": 8.496740717440844} +{"Pretrain/Learning Rate": 3.924217172374607e-05, "Pretrain/Loss": 2.055100917816162, "Pretrain/Loss (Raw)": 1.9370043277740479, "Pretrain/Step": 6253, "Pretrain/Step Time": 8.495427699759603} +{"Pretrain/Learning Rate": 3.923868257851657e-05, "Pretrain/Loss": 2.0555996894836426, "Pretrain/Loss (Raw)": 1.9617486000061035, "Pretrain/Step": 6254, "Pretrain/Step Time": 8.494080422446132} +{"Pretrain/Learning Rate": 3.9235193022724695e-05, "Pretrain/Loss": 2.0564181804656982, "Pretrain/Loss (Raw)": 2.082026243209839, "Pretrain/Step": 6255, "Pretrain/Step Time": 8.492589734494686} +{"Pretrain/Learning Rate": 3.923170305647106e-05, "Pretrain/Loss": 2.056424617767334, "Pretrain/Loss (Raw)": 2.041517496109009, "Pretrain/Step": 6256, "Pretrain/Step Time": 8.495132926851511} +{"Pretrain/Learning Rate": 3.92282126798563e-05, "Pretrain/Loss": 2.0552849769592285, "Pretrain/Loss (Raw)": 1.9017254114151, "Pretrain/Step": 6257, "Pretrain/Step Time": 8.49788067303598} +{"Pretrain/Learning Rate": 3.9224721892981064e-05, "Pretrain/Loss": 2.0526275634765625, "Pretrain/Loss (Raw)": 1.8301258087158203, "Pretrain/Step": 6258, "Pretrain/Step Time": 8.49592767097056} +{"Pretrain/Learning Rate": 3.922123069594599e-05, "Pretrain/Loss": 2.0517961978912354, "Pretrain/Loss (Raw)": 1.822628140449524, "Pretrain/Step": 6259, "Pretrain/Step Time": 8.499449765309691} +{"Pretrain/Learning Rate": 3.9217739088851766e-05, "Pretrain/Loss": 2.053490161895752, "Pretrain/Loss (Raw)": 2.2826409339904785, "Pretrain/Step": 6260, "Pretrain/Step Time": 8.493670534342527} +{"Pretrain/Learning Rate": 3.921424707179905e-05, "Pretrain/Loss": 2.0532660484313965, "Pretrain/Loss (Raw)": 2.0701189041137695, "Pretrain/Step": 6261, "Pretrain/Step Time": 8.493420897051692} +{"Pretrain/Learning Rate": 3.921075464488855e-05, "Pretrain/Loss": 2.0545434951782227, "Pretrain/Loss (Raw)": 2.1555066108703613, "Pretrain/Step": 6262, "Pretrain/Step Time": 8.49393955618143} +{"Pretrain/Learning Rate": 3.920726180822094e-05, "Pretrain/Loss": 2.0536820888519287, "Pretrain/Loss (Raw)": 1.9729253053665161, "Pretrain/Step": 6263, "Pretrain/Step Time": 8.492278322577477} +{"Pretrain/Learning Rate": 3.920376856189696e-05, "Pretrain/Loss": 2.0529212951660156, "Pretrain/Loss (Raw)": 2.011819839477539, "Pretrain/Step": 6264, "Pretrain/Step Time": 8.49515289440751} +{"Pretrain/Learning Rate": 3.9200274906017334e-05, "Pretrain/Loss": 2.051119327545166, "Pretrain/Loss (Raw)": 1.8812079429626465, "Pretrain/Step": 6265, "Pretrain/Step Time": 8.49118148162961} +{"Pretrain/Learning Rate": 3.9196780840682784e-05, "Pretrain/Loss": 2.05185604095459, "Pretrain/Loss (Raw)": 2.0220589637756348, "Pretrain/Step": 6266, "Pretrain/Step Time": 8.48873762972653} +{"Pretrain/Learning Rate": 3.919328636599407e-05, "Pretrain/Loss": 2.052183151245117, "Pretrain/Loss (Raw)": 2.221391439437866, "Pretrain/Step": 6267, "Pretrain/Step Time": 8.491703193634748} +{"Pretrain/Learning Rate": 3.918979148205194e-05, "Pretrain/Loss": 2.052543878555298, "Pretrain/Loss (Raw)": 2.0722227096557617, "Pretrain/Step": 6268, "Pretrain/Step Time": 8.495478712022305} +{"Pretrain/Learning Rate": 3.9186296188957184e-05, "Pretrain/Loss": 2.048027515411377, "Pretrain/Loss (Raw)": 2.0857510566711426, "Pretrain/Step": 6269, "Pretrain/Step Time": 8.492990527302027} +{"Pretrain/Learning Rate": 3.9182800486810584e-05, "Pretrain/Loss": 2.0490260124206543, "Pretrain/Loss (Raw)": 2.193737268447876, "Pretrain/Step": 6270, "Pretrain/Step Time": 8.491606777533889} +{"Pretrain/Learning Rate": 3.917930437571292e-05, "Pretrain/Loss": 2.047248125076294, "Pretrain/Loss (Raw)": 2.0627245903015137, "Pretrain/Step": 6271, "Pretrain/Step Time": 8.486498484387994} +{"Pretrain/Learning Rate": 3.9175807855765014e-05, "Pretrain/Loss": 2.045440673828125, "Pretrain/Loss (Raw)": 1.9687323570251465, "Pretrain/Step": 6272, "Pretrain/Step Time": 8.48848195001483} +{"Pretrain/Learning Rate": 3.917231092706768e-05, "Pretrain/Loss": 2.044576644897461, "Pretrain/Loss (Raw)": 1.969234585762024, "Pretrain/Step": 6273, "Pretrain/Step Time": 8.490923451259732} +{"Pretrain/Learning Rate": 3.916881358972175e-05, "Pretrain/Loss": 2.045112133026123, "Pretrain/Loss (Raw)": 2.0557096004486084, "Pretrain/Step": 6274, "Pretrain/Step Time": 8.497011931613088} +{"Pretrain/Learning Rate": 3.9165315843828076e-05, "Pretrain/Loss": 2.045506238937378, "Pretrain/Loss (Raw)": 2.0381057262420654, "Pretrain/Step": 6275, "Pretrain/Step Time": 8.495642811059952} +{"Pretrain/Learning Rate": 3.9161817689487504e-05, "Pretrain/Loss": 2.0444412231445312, "Pretrain/Loss (Raw)": 1.9952903985977173, "Pretrain/Step": 6276, "Pretrain/Step Time": 8.496371949091554} +{"Pretrain/Learning Rate": 3.91583191268009e-05, "Pretrain/Loss": 2.0414204597473145, "Pretrain/Loss (Raw)": 2.1811118125915527, "Pretrain/Step": 6277, "Pretrain/Step Time": 8.49335115775466} +{"Pretrain/Learning Rate": 3.915482015586914e-05, "Pretrain/Loss": 2.0396814346313477, "Pretrain/Loss (Raw)": 1.825287103652954, "Pretrain/Step": 6278, "Pretrain/Step Time": 8.492081420496106} +{"Pretrain/Learning Rate": 3.915132077679312e-05, "Pretrain/Loss": 2.038628101348877, "Pretrain/Loss (Raw)": 2.065089464187622, "Pretrain/Step": 6279, "Pretrain/Step Time": 8.494089599698782} +{"Pretrain/Learning Rate": 3.914782098967374e-05, "Pretrain/Loss": 2.038764476776123, "Pretrain/Loss (Raw)": 2.1118884086608887, "Pretrain/Step": 6280, "Pretrain/Step Time": 8.495478343218565} +{"Pretrain/Learning Rate": 3.914432079461193e-05, "Pretrain/Loss": 2.0394301414489746, "Pretrain/Loss (Raw)": 2.0010769367218018, "Pretrain/Step": 6281, "Pretrain/Step Time": 8.49052251316607} +{"Pretrain/Learning Rate": 3.9140820191708585e-05, "Pretrain/Loss": 2.0416955947875977, "Pretrain/Loss (Raw)": 2.17375111579895, "Pretrain/Step": 6282, "Pretrain/Step Time": 8.49039987847209} +{"Pretrain/Learning Rate": 3.9137319181064664e-05, "Pretrain/Loss": 2.041755199432373, "Pretrain/Loss (Raw)": 2.0706636905670166, "Pretrain/Step": 6283, "Pretrain/Step Time": 8.492726407945156} +{"Pretrain/Learning Rate": 3.913381776278111e-05, "Pretrain/Loss": 2.0416247844696045, "Pretrain/Loss (Raw)": 2.0503549575805664, "Pretrain/Step": 6284, "Pretrain/Step Time": 8.493320759385824} +{"Pretrain/Learning Rate": 3.9130315936958886e-05, "Pretrain/Loss": 2.042452573776245, "Pretrain/Loss (Raw)": 2.0604944229125977, "Pretrain/Step": 6285, "Pretrain/Step Time": 8.490086954087019} +{"Pretrain/Learning Rate": 3.912681370369896e-05, "Pretrain/Loss": 2.0422616004943848, "Pretrain/Loss (Raw)": 1.9074389934539795, "Pretrain/Step": 6286, "Pretrain/Step Time": 8.490046733990312} +{"Pretrain/Learning Rate": 3.9123311063102324e-05, "Pretrain/Loss": 2.0427815914154053, "Pretrain/Loss (Raw)": 2.186055898666382, "Pretrain/Step": 6287, "Pretrain/Step Time": 8.48522099852562} +{"Pretrain/Learning Rate": 3.9119808015269964e-05, "Pretrain/Loss": 2.0420889854431152, "Pretrain/Loss (Raw)": 2.0601625442504883, "Pretrain/Step": 6288, "Pretrain/Step Time": 8.487308220937848} +{"Pretrain/Learning Rate": 3.9116304560302904e-05, "Pretrain/Loss": 2.042717218399048, "Pretrain/Loss (Raw)": 2.085981607437134, "Pretrain/Step": 6289, "Pretrain/Step Time": 8.490360476076603} +{"Pretrain/Learning Rate": 3.911280069830214e-05, "Pretrain/Loss": 2.0444793701171875, "Pretrain/Loss (Raw)": 2.1496100425720215, "Pretrain/Step": 6290, "Pretrain/Step Time": 8.492471262812614} +{"Pretrain/Learning Rate": 3.910929642936872e-05, "Pretrain/Loss": 2.0422511100769043, "Pretrain/Loss (Raw)": 1.6941630840301514, "Pretrain/Step": 6291, "Pretrain/Step Time": 8.492958474904299} +{"Pretrain/Learning Rate": 3.910579175360369e-05, "Pretrain/Loss": 2.0458765029907227, "Pretrain/Loss (Raw)": 2.368292808532715, "Pretrain/Step": 6292, "Pretrain/Step Time": 8.49240461550653} +{"Pretrain/Learning Rate": 3.91022866711081e-05, "Pretrain/Loss": 2.0451598167419434, "Pretrain/Loss (Raw)": 1.9762287139892578, "Pretrain/Step": 6293, "Pretrain/Step Time": 8.49412533827126} +{"Pretrain/Learning Rate": 3.909878118198301e-05, "Pretrain/Loss": 2.043994903564453, "Pretrain/Loss (Raw)": 1.8988099098205566, "Pretrain/Step": 6294, "Pretrain/Step Time": 8.490796884521842} +{"Pretrain/Learning Rate": 3.909527528632951e-05, "Pretrain/Loss": 2.0426454544067383, "Pretrain/Loss (Raw)": 1.9577858448028564, "Pretrain/Step": 6295, "Pretrain/Step Time": 8.49248786456883} +{"Pretrain/Learning Rate": 3.9091768984248676e-05, "Pretrain/Loss": 2.0419554710388184, "Pretrain/Loss (Raw)": 2.099708080291748, "Pretrain/Step": 6296, "Pretrain/Step Time": 8.485422359779477} +{"Pretrain/Learning Rate": 3.908826227584162e-05, "Pretrain/Loss": 2.0436196327209473, "Pretrain/Loss (Raw)": 2.057748317718506, "Pretrain/Step": 6297, "Pretrain/Step Time": 8.485241200774908} +{"Pretrain/Learning Rate": 3.908475516120945e-05, "Pretrain/Loss": 2.041940689086914, "Pretrain/Loss (Raw)": 2.031088352203369, "Pretrain/Step": 6298, "Pretrain/Step Time": 8.48117402754724} +{"Pretrain/Learning Rate": 3.90812476404533e-05, "Pretrain/Loss": 2.0425024032592773, "Pretrain/Loss (Raw)": 2.1954598426818848, "Pretrain/Step": 6299, "Pretrain/Step Time": 8.486620595678687} +{"Pretrain/Learning Rate": 3.90777397136743e-05, "Pretrain/Loss": 2.044130563735962, "Pretrain/Loss (Raw)": 2.4564597606658936, "Pretrain/Step": 6300, "Pretrain/Step Time": 8.488999377936125} +{"Pretrain/Learning Rate": 3.907423138097359e-05, "Pretrain/Loss": 2.043164014816284, "Pretrain/Loss (Raw)": 2.0171213150024414, "Pretrain/Step": 6301, "Pretrain/Step Time": 8.48590013384819} +{"Pretrain/Learning Rate": 3.907072264245235e-05, "Pretrain/Loss": 2.043090581893921, "Pretrain/Loss (Raw)": 2.084052801132202, "Pretrain/Step": 6302, "Pretrain/Step Time": 8.4864348359406} +{"Pretrain/Learning Rate": 3.906721349821174e-05, "Pretrain/Loss": 2.042963981628418, "Pretrain/Loss (Raw)": 2.04555606842041, "Pretrain/Step": 6303, "Pretrain/Step Time": 8.491029566153884} +{"Pretrain/Learning Rate": 3.9063703948352946e-05, "Pretrain/Loss": 2.0416617393493652, "Pretrain/Loss (Raw)": 1.9692414999008179, "Pretrain/Step": 6304, "Pretrain/Step Time": 8.489826178178191} +{"Pretrain/Learning Rate": 3.9060193992977154e-05, "Pretrain/Loss": 2.0420522689819336, "Pretrain/Loss (Raw)": 2.122380495071411, "Pretrain/Step": 6305, "Pretrain/Step Time": 8.496991513296962} +{"Pretrain/Learning Rate": 3.905668363218559e-05, "Pretrain/Loss": 2.040955066680908, "Pretrain/Loss (Raw)": 1.7320799827575684, "Pretrain/Step": 6306, "Pretrain/Step Time": 8.498119128867984} +{"Pretrain/Learning Rate": 3.905317286607946e-05, "Pretrain/Loss": 2.0416417121887207, "Pretrain/Loss (Raw)": 2.10544490814209, "Pretrain/Step": 6307, "Pretrain/Step Time": 8.50166436471045} +{"Pretrain/Learning Rate": 3.904966169476e-05, "Pretrain/Loss": 2.042337417602539, "Pretrain/Loss (Raw)": 2.156022071838379, "Pretrain/Step": 6308, "Pretrain/Step Time": 8.499193500727415} +{"Pretrain/Learning Rate": 3.9046150118328445e-05, "Pretrain/Loss": 2.0398812294006348, "Pretrain/Loss (Raw)": 1.9483166933059692, "Pretrain/Step": 6309, "Pretrain/Step Time": 8.497514935210347} +{"Pretrain/Learning Rate": 3.9042638136886056e-05, "Pretrain/Loss": 2.0430397987365723, "Pretrain/Loss (Raw)": 2.14138126373291, "Pretrain/Step": 6310, "Pretrain/Step Time": 8.494673682376742} +{"Pretrain/Learning Rate": 3.9039125750534094e-05, "Pretrain/Loss": 2.043034553527832, "Pretrain/Loss (Raw)": 1.9130107164382935, "Pretrain/Step": 6311, "Pretrain/Step Time": 8.497469639405608} +{"Pretrain/Learning Rate": 3.903561295937384e-05, "Pretrain/Loss": 2.041926860809326, "Pretrain/Loss (Raw)": 2.0318737030029297, "Pretrain/Step": 6312, "Pretrain/Step Time": 8.496978346258402} +{"Pretrain/Learning Rate": 3.903209976350658e-05, "Pretrain/Loss": 2.043087959289551, "Pretrain/Loss (Raw)": 2.181868076324463, "Pretrain/Step": 6313, "Pretrain/Step Time": 8.49800574220717} +{"Pretrain/Learning Rate": 3.902858616303362e-05, "Pretrain/Loss": 2.041775703430176, "Pretrain/Loss (Raw)": 1.9878273010253906, "Pretrain/Step": 6314, "Pretrain/Step Time": 8.501139899715781} +{"Pretrain/Learning Rate": 3.902507215805625e-05, "Pretrain/Loss": 2.0401806831359863, "Pretrain/Loss (Raw)": 2.2379367351531982, "Pretrain/Step": 6315, "Pretrain/Step Time": 8.49942478723824} +{"Pretrain/Learning Rate": 3.902155774867583e-05, "Pretrain/Loss": 2.039095878601074, "Pretrain/Loss (Raw)": 2.0001206398010254, "Pretrain/Step": 6316, "Pretrain/Step Time": 8.501675140112638} +{"Pretrain/Learning Rate": 3.901804293499367e-05, "Pretrain/Loss": 2.0402071475982666, "Pretrain/Loss (Raw)": 2.049525499343872, "Pretrain/Step": 6317, "Pretrain/Step Time": 8.502488400787115} +{"Pretrain/Learning Rate": 3.901452771711113e-05, "Pretrain/Loss": 2.0380959510803223, "Pretrain/Loss (Raw)": 1.9506982564926147, "Pretrain/Step": 6318, "Pretrain/Step Time": 8.502909449860454} +{"Pretrain/Learning Rate": 3.901101209512955e-05, "Pretrain/Loss": 2.0375008583068848, "Pretrain/Loss (Raw)": 1.9452729225158691, "Pretrain/Step": 6319, "Pretrain/Step Time": 8.50479793176055} +{"Pretrain/Learning Rate": 3.9007496069150324e-05, "Pretrain/Loss": 2.038912296295166, "Pretrain/Loss (Raw)": 2.0784072875976562, "Pretrain/Step": 6320, "Pretrain/Step Time": 8.498724233359098} +{"Pretrain/Learning Rate": 3.9003979639274824e-05, "Pretrain/Loss": 2.0355348587036133, "Pretrain/Loss (Raw)": 1.5206422805786133, "Pretrain/Step": 6321, "Pretrain/Step Time": 8.503001518547535} +{"Pretrain/Learning Rate": 3.9000462805604433e-05, "Pretrain/Loss": 2.033818483352661, "Pretrain/Loss (Raw)": 1.9601621627807617, "Pretrain/Step": 6322, "Pretrain/Step Time": 8.504632132127881} +{"Pretrain/Learning Rate": 3.899694556824057e-05, "Pretrain/Loss": 2.034069061279297, "Pretrain/Loss (Raw)": 2.1597342491149902, "Pretrain/Step": 6323, "Pretrain/Step Time": 8.50262001901865} +{"Pretrain/Learning Rate": 3.8993427927284656e-05, "Pretrain/Loss": 2.0344390869140625, "Pretrain/Loss (Raw)": 1.9943430423736572, "Pretrain/Step": 6324, "Pretrain/Step Time": 8.502275001257658} +{"Pretrain/Learning Rate": 3.89899098828381e-05, "Pretrain/Loss": 2.035151481628418, "Pretrain/Loss (Raw)": 2.07578182220459, "Pretrain/Step": 6325, "Pretrain/Step Time": 8.504065597429872} +{"Pretrain/Learning Rate": 3.8986391435002375e-05, "Pretrain/Loss": 2.036468029022217, "Pretrain/Loss (Raw)": 2.18886661529541, "Pretrain/Step": 6326, "Pretrain/Step Time": 8.503861432895064} +{"Pretrain/Learning Rate": 3.898287258387889e-05, "Pretrain/Loss": 2.033163547515869, "Pretrain/Loss (Raw)": 1.6948031187057495, "Pretrain/Step": 6327, "Pretrain/Step Time": 8.50460303388536} +{"Pretrain/Learning Rate": 3.897935332956915e-05, "Pretrain/Loss": 2.030428409576416, "Pretrain/Loss (Raw)": 1.6687967777252197, "Pretrain/Step": 6328, "Pretrain/Step Time": 8.506039118394256} +{"Pretrain/Learning Rate": 3.89758336721746e-05, "Pretrain/Loss": 2.031141757965088, "Pretrain/Loss (Raw)": 2.0896663665771484, "Pretrain/Step": 6329, "Pretrain/Step Time": 8.503402950242162} +{"Pretrain/Learning Rate": 3.897231361179674e-05, "Pretrain/Loss": 2.0323333740234375, "Pretrain/Loss (Raw)": 2.2980287075042725, "Pretrain/Step": 6330, "Pretrain/Step Time": 8.497615732252598} +{"Pretrain/Learning Rate": 3.896879314853707e-05, "Pretrain/Loss": 2.033586025238037, "Pretrain/Loss (Raw)": 1.9758819341659546, "Pretrain/Step": 6331, "Pretrain/Step Time": 8.495257871225476} +{"Pretrain/Learning Rate": 3.8965272282497104e-05, "Pretrain/Loss": 2.0327887535095215, "Pretrain/Loss (Raw)": 1.9240940809249878, "Pretrain/Step": 6332, "Pretrain/Step Time": 8.498721929267049} +{"Pretrain/Learning Rate": 3.896175101377834e-05, "Pretrain/Loss": 2.030467987060547, "Pretrain/Loss (Raw)": 2.062624931335449, "Pretrain/Step": 6333, "Pretrain/Step Time": 8.500465583056211} +{"Pretrain/Learning Rate": 3.895822934248234e-05, "Pretrain/Loss": 2.031035900115967, "Pretrain/Loss (Raw)": 1.9126896858215332, "Pretrain/Step": 6334, "Pretrain/Step Time": 8.495914133265615} +{"Pretrain/Learning Rate": 3.895470726871063e-05, "Pretrain/Loss": 2.0320935249328613, "Pretrain/Loss (Raw)": 2.139441967010498, "Pretrain/Step": 6335, "Pretrain/Step Time": 8.494999827817082} +{"Pretrain/Learning Rate": 3.8951184792564775e-05, "Pretrain/Loss": 2.029606819152832, "Pretrain/Loss (Raw)": 1.7997814416885376, "Pretrain/Step": 6336, "Pretrain/Step Time": 8.493030697107315} +{"Pretrain/Learning Rate": 3.894766191414634e-05, "Pretrain/Loss": 2.0326061248779297, "Pretrain/Loss (Raw)": 2.064906120300293, "Pretrain/Step": 6337, "Pretrain/Step Time": 8.49628685042262} +{"Pretrain/Learning Rate": 3.894413863355692e-05, "Pretrain/Loss": 2.0316104888916016, "Pretrain/Loss (Raw)": 1.920946717262268, "Pretrain/Step": 6338, "Pretrain/Step Time": 8.500571362674236} +{"Pretrain/Learning Rate": 3.8940614950898075e-05, "Pretrain/Loss": 2.02762770652771, "Pretrain/Loss (Raw)": 2.0263359546661377, "Pretrain/Step": 6339, "Pretrain/Step Time": 8.501654403284192} +{"Pretrain/Learning Rate": 3.893709086627143e-05, "Pretrain/Loss": 2.0259294509887695, "Pretrain/Loss (Raw)": 2.136725902557373, "Pretrain/Step": 6340, "Pretrain/Step Time": 8.501108571887016} +{"Pretrain/Learning Rate": 3.8933566379778596e-05, "Pretrain/Loss": 2.0234341621398926, "Pretrain/Loss (Raw)": 1.810984492301941, "Pretrain/Step": 6341, "Pretrain/Step Time": 8.506432140246034} +{"Pretrain/Learning Rate": 3.89300414915212e-05, "Pretrain/Loss": 2.0251455307006836, "Pretrain/Loss (Raw)": 2.2567782402038574, "Pretrain/Step": 6342, "Pretrain/Step Time": 8.50545465759933} +{"Pretrain/Learning Rate": 3.892651620160088e-05, "Pretrain/Loss": 2.0226683616638184, "Pretrain/Loss (Raw)": 2.0416157245635986, "Pretrain/Step": 6343, "Pretrain/Step Time": 8.504586631432176} +{"Pretrain/Learning Rate": 3.892299051011927e-05, "Pretrain/Loss": 2.023794651031494, "Pretrain/Loss (Raw)": 2.208397388458252, "Pretrain/Step": 6344, "Pretrain/Step Time": 8.514561586081982} +{"Pretrain/Learning Rate": 3.891946441717806e-05, "Pretrain/Loss": 2.020982265472412, "Pretrain/Loss (Raw)": 1.8766517639160156, "Pretrain/Step": 6345, "Pretrain/Step Time": 8.510409967973828} +{"Pretrain/Learning Rate": 3.89159379228789e-05, "Pretrain/Loss": 2.021388053894043, "Pretrain/Loss (Raw)": 2.0031473636627197, "Pretrain/Step": 6346, "Pretrain/Step Time": 8.509623559191823} +{"Pretrain/Learning Rate": 3.891241102732348e-05, "Pretrain/Loss": 2.0209882259368896, "Pretrain/Loss (Raw)": 2.0365190505981445, "Pretrain/Step": 6347, "Pretrain/Step Time": 8.50203761830926} +{"Pretrain/Learning Rate": 3.890888373061349e-05, "Pretrain/Loss": 2.0280098915100098, "Pretrain/Loss (Raw)": 2.165426731109619, "Pretrain/Step": 6348, "Pretrain/Step Time": 8.500244237482548} +{"Pretrain/Learning Rate": 3.890535603285065e-05, "Pretrain/Loss": 2.0310776233673096, "Pretrain/Loss (Raw)": 2.519710063934326, "Pretrain/Step": 6349, "Pretrain/Step Time": 8.501688174903393} +{"Pretrain/Learning Rate": 3.890182793413667e-05, "Pretrain/Loss": 2.0309362411499023, "Pretrain/Loss (Raw)": 2.0699830055236816, "Pretrain/Step": 6350, "Pretrain/Step Time": 8.505743738263845} +{"Pretrain/Learning Rate": 3.889829943457328e-05, "Pretrain/Loss": 2.031053066253662, "Pretrain/Loss (Raw)": 2.1556758880615234, "Pretrain/Step": 6351, "Pretrain/Step Time": 8.50155588798225} +{"Pretrain/Learning Rate": 3.889477053426222e-05, "Pretrain/Loss": 2.0271716117858887, "Pretrain/Loss (Raw)": 1.7386678457260132, "Pretrain/Step": 6352, "Pretrain/Step Time": 8.504749100655317} +{"Pretrain/Learning Rate": 3.8891241233305254e-05, "Pretrain/Loss": 2.027113199234009, "Pretrain/Loss (Raw)": 1.9095144271850586, "Pretrain/Step": 6353, "Pretrain/Step Time": 8.504026988521218} +{"Pretrain/Learning Rate": 3.888771153180414e-05, "Pretrain/Loss": 2.028563976287842, "Pretrain/Loss (Raw)": 2.2358012199401855, "Pretrain/Step": 6354, "Pretrain/Step Time": 8.50981312058866} +{"Pretrain/Learning Rate": 3.8884181429860646e-05, "Pretrain/Loss": 2.028261661529541, "Pretrain/Loss (Raw)": 2.1325559616088867, "Pretrain/Step": 6355, "Pretrain/Step Time": 8.507893832400441} +{"Pretrain/Learning Rate": 3.888065092757658e-05, "Pretrain/Loss": 2.0290942192077637, "Pretrain/Loss (Raw)": 2.01831316947937, "Pretrain/Step": 6356, "Pretrain/Step Time": 8.510706078261137} +{"Pretrain/Learning Rate": 3.887712002505371e-05, "Pretrain/Loss": 2.030823230743408, "Pretrain/Loss (Raw)": 2.180036783218384, "Pretrain/Step": 6357, "Pretrain/Step Time": 8.508329834789038} +{"Pretrain/Learning Rate": 3.8873588722393886e-05, "Pretrain/Loss": 2.0298638343811035, "Pretrain/Loss (Raw)": 1.9923312664031982, "Pretrain/Step": 6358, "Pretrain/Step Time": 8.510821895673871} +{"Pretrain/Learning Rate": 3.8870057019698905e-05, "Pretrain/Loss": 2.0294008255004883, "Pretrain/Loss (Raw)": 2.1248130798339844, "Pretrain/Step": 6359, "Pretrain/Step Time": 8.508866196498275} +{"Pretrain/Learning Rate": 3.886652491707061e-05, "Pretrain/Loss": 2.028747081756592, "Pretrain/Loss (Raw)": 1.8304179906845093, "Pretrain/Step": 6360, "Pretrain/Step Time": 8.504253713414073} +{"Pretrain/Learning Rate": 3.886299241461084e-05, "Pretrain/Loss": 2.026553153991699, "Pretrain/Loss (Raw)": 1.8683401346206665, "Pretrain/Step": 6361, "Pretrain/Step Time": 8.503480024635792} +{"Pretrain/Learning Rate": 3.8859459512421456e-05, "Pretrain/Loss": 2.0258498191833496, "Pretrain/Loss (Raw)": 2.0188982486724854, "Pretrain/Step": 6362, "Pretrain/Step Time": 8.502248890697956} +{"Pretrain/Learning Rate": 3.8855926210604334e-05, "Pretrain/Loss": 2.0289788246154785, "Pretrain/Loss (Raw)": 2.2206227779388428, "Pretrain/Step": 6363, "Pretrain/Step Time": 8.496715854853392} +{"Pretrain/Learning Rate": 3.885239250926134e-05, "Pretrain/Loss": 2.026824951171875, "Pretrain/Loss (Raw)": 1.8288707733154297, "Pretrain/Step": 6364, "Pretrain/Step Time": 8.49426194280386} +{"Pretrain/Learning Rate": 3.884885840849437e-05, "Pretrain/Loss": 2.024721622467041, "Pretrain/Loss (Raw)": 1.8616472482681274, "Pretrain/Step": 6365, "Pretrain/Step Time": 8.497708562761545} +{"Pretrain/Learning Rate": 3.884532390840534e-05, "Pretrain/Loss": 2.0254547595977783, "Pretrain/Loss (Raw)": 2.0734241008758545, "Pretrain/Step": 6366, "Pretrain/Step Time": 8.50074227899313} +{"Pretrain/Learning Rate": 3.884178900909615e-05, "Pretrain/Loss": 2.0290045738220215, "Pretrain/Loss (Raw)": 2.1450748443603516, "Pretrain/Step": 6367, "Pretrain/Step Time": 8.500673854723573} +{"Pretrain/Learning Rate": 3.8838253710668736e-05, "Pretrain/Loss": 2.0302486419677734, "Pretrain/Loss (Raw)": 2.0299670696258545, "Pretrain/Step": 6368, "Pretrain/Step Time": 8.495426654815674} +{"Pretrain/Learning Rate": 3.883471801322503e-05, "Pretrain/Loss": 2.0288543701171875, "Pretrain/Loss (Raw)": 1.9704374074935913, "Pretrain/Step": 6369, "Pretrain/Step Time": 8.500423345714808} +{"Pretrain/Learning Rate": 3.883118191686698e-05, "Pretrain/Loss": 2.030757427215576, "Pretrain/Loss (Raw)": 2.018942356109619, "Pretrain/Step": 6370, "Pretrain/Step Time": 8.495855191722512} +{"Pretrain/Learning Rate": 3.8827645421696556e-05, "Pretrain/Loss": 2.029909372329712, "Pretrain/Loss (Raw)": 1.8091944456100464, "Pretrain/Step": 6371, "Pretrain/Step Time": 8.502757670357823} +{"Pretrain/Learning Rate": 3.8824108527815715e-05, "Pretrain/Loss": 2.0307910442352295, "Pretrain/Loss (Raw)": 2.0132997035980225, "Pretrain/Step": 6372, "Pretrain/Step Time": 8.502783613279462} +{"Pretrain/Learning Rate": 3.882057123532646e-05, "Pretrain/Loss": 2.0298404693603516, "Pretrain/Loss (Raw)": 1.9187721014022827, "Pretrain/Step": 6373, "Pretrain/Step Time": 8.503179728984833} +{"Pretrain/Learning Rate": 3.881703354433077e-05, "Pretrain/Loss": 2.032428741455078, "Pretrain/Loss (Raw)": 2.042029857635498, "Pretrain/Step": 6374, "Pretrain/Step Time": 8.505419412627816} +{"Pretrain/Learning Rate": 3.881349545493066e-05, "Pretrain/Loss": 2.032231330871582, "Pretrain/Loss (Raw)": 1.9319366216659546, "Pretrain/Step": 6375, "Pretrain/Step Time": 8.502847397699952} +{"Pretrain/Learning Rate": 3.8809956967228145e-05, "Pretrain/Loss": 2.0317301750183105, "Pretrain/Loss (Raw)": 2.0063834190368652, "Pretrain/Step": 6376, "Pretrain/Step Time": 8.498968610540032} +{"Pretrain/Learning Rate": 3.880641808132526e-05, "Pretrain/Loss": 2.0322489738464355, "Pretrain/Loss (Raw)": 1.8965375423431396, "Pretrain/Step": 6377, "Pretrain/Step Time": 8.497531678527594} +{"Pretrain/Learning Rate": 3.880287879732404e-05, "Pretrain/Loss": 2.0296802520751953, "Pretrain/Loss (Raw)": 1.997260332107544, "Pretrain/Step": 6378, "Pretrain/Step Time": 8.50035168044269} +{"Pretrain/Learning Rate": 3.879933911532654e-05, "Pretrain/Loss": 2.0294861793518066, "Pretrain/Loss (Raw)": 2.0562784671783447, "Pretrain/Step": 6379, "Pretrain/Step Time": 8.49557737633586} +{"Pretrain/Learning Rate": 3.879579903543482e-05, "Pretrain/Loss": 2.0274505615234375, "Pretrain/Loss (Raw)": 1.885374903678894, "Pretrain/Step": 6380, "Pretrain/Step Time": 8.498799113556743} +{"Pretrain/Learning Rate": 3.879225855775097e-05, "Pretrain/Loss": 2.0273385047912598, "Pretrain/Loss (Raw)": 1.922633409500122, "Pretrain/Step": 6381, "Pretrain/Step Time": 8.495268743485212} +{"Pretrain/Learning Rate": 3.8788717682377064e-05, "Pretrain/Loss": 2.0269367694854736, "Pretrain/Loss (Raw)": 1.9103401899337769, "Pretrain/Step": 6382, "Pretrain/Step Time": 8.498855886980891} +{"Pretrain/Learning Rate": 3.8785176409415195e-05, "Pretrain/Loss": 2.0253872871398926, "Pretrain/Loss (Raw)": 1.8836793899536133, "Pretrain/Step": 6383, "Pretrain/Step Time": 8.498880952596664} +{"Pretrain/Learning Rate": 3.8781634738967496e-05, "Pretrain/Loss": 2.024855613708496, "Pretrain/Loss (Raw)": 1.9734591245651245, "Pretrain/Step": 6384, "Pretrain/Step Time": 8.49694937095046} +{"Pretrain/Learning Rate": 3.8778092671136065e-05, "Pretrain/Loss": 2.025266647338867, "Pretrain/Loss (Raw)": 1.9543490409851074, "Pretrain/Step": 6385, "Pretrain/Step Time": 8.494923459365964} +{"Pretrain/Learning Rate": 3.877455020602305e-05, "Pretrain/Loss": 2.0289459228515625, "Pretrain/Loss (Raw)": 2.301079273223877, "Pretrain/Step": 6386, "Pretrain/Step Time": 8.50043181143701} +{"Pretrain/Learning Rate": 3.877100734373058e-05, "Pretrain/Loss": 2.030637741088867, "Pretrain/Loss (Raw)": 2.039153814315796, "Pretrain/Step": 6387, "Pretrain/Step Time": 8.500866958871484} +{"Pretrain/Learning Rate": 3.8767464084360835e-05, "Pretrain/Loss": 2.0292229652404785, "Pretrain/Loss (Raw)": 2.101594924926758, "Pretrain/Step": 6388, "Pretrain/Step Time": 8.50031889602542} +{"Pretrain/Learning Rate": 3.8763920428015965e-05, "Pretrain/Loss": 2.0283989906311035, "Pretrain/Loss (Raw)": 1.9646039009094238, "Pretrain/Step": 6389, "Pretrain/Step Time": 8.502539543434978} +{"Pretrain/Learning Rate": 3.8760376374798144e-05, "Pretrain/Loss": 2.027207374572754, "Pretrain/Loss (Raw)": 2.0029945373535156, "Pretrain/Step": 6390, "Pretrain/Step Time": 8.500864742323756} +{"Pretrain/Learning Rate": 3.875683192480958e-05, "Pretrain/Loss": 2.0250158309936523, "Pretrain/Loss (Raw)": 1.6924265623092651, "Pretrain/Step": 6391, "Pretrain/Step Time": 8.50377525947988} +{"Pretrain/Learning Rate": 3.875328707815246e-05, "Pretrain/Loss": 2.026031017303467, "Pretrain/Loss (Raw)": 2.1417477130889893, "Pretrain/Step": 6392, "Pretrain/Step Time": 8.503249119967222} +{"Pretrain/Learning Rate": 3.874974183492901e-05, "Pretrain/Loss": 2.0305416584014893, "Pretrain/Loss (Raw)": 2.4585626125335693, "Pretrain/Step": 6393, "Pretrain/Step Time": 8.504871908575296} +{"Pretrain/Learning Rate": 3.8746196195241434e-05, "Pretrain/Loss": 2.032367467880249, "Pretrain/Loss (Raw)": 2.255772590637207, "Pretrain/Step": 6394, "Pretrain/Step Time": 8.50432856567204} +{"Pretrain/Learning Rate": 3.8742650159191996e-05, "Pretrain/Loss": 2.0302271842956543, "Pretrain/Loss (Raw)": 1.9474176168441772, "Pretrain/Step": 6395, "Pretrain/Step Time": 8.505007795989513} +{"Pretrain/Learning Rate": 3.873910372688292e-05, "Pretrain/Loss": 2.0303945541381836, "Pretrain/Loss (Raw)": 2.0936810970306396, "Pretrain/Step": 6396, "Pretrain/Step Time": 8.502051018178463} +{"Pretrain/Learning Rate": 3.8735556898416475e-05, "Pretrain/Loss": 2.0287270545959473, "Pretrain/Loss (Raw)": 1.8722718954086304, "Pretrain/Step": 6397, "Pretrain/Step Time": 8.503629731014371} +{"Pretrain/Learning Rate": 3.873200967389493e-05, "Pretrain/Loss": 2.028035879135132, "Pretrain/Loss (Raw)": 2.1053054332733154, "Pretrain/Step": 6398, "Pretrain/Step Time": 8.507510045543313} +{"Pretrain/Learning Rate": 3.872846205342057e-05, "Pretrain/Loss": 2.030642032623291, "Pretrain/Loss (Raw)": 2.3962769508361816, "Pretrain/Step": 6399, "Pretrain/Step Time": 8.508848400786519} +{"Pretrain/Learning Rate": 3.8724914037095677e-05, "Pretrain/Loss": 2.0311741828918457, "Pretrain/Loss (Raw)": 2.0368614196777344, "Pretrain/Step": 6400, "Pretrain/Step Time": 8.506079176440835} +{"Pretrain/Learning Rate": 3.8721365625022565e-05, "Pretrain/Loss": 2.030588388442993, "Pretrain/Loss (Raw)": 1.8942545652389526, "Pretrain/Step": 6401, "Pretrain/Step Time": 8.49965349957347} +{"Pretrain/Learning Rate": 3.8717816817303555e-05, "Pretrain/Loss": 2.030585289001465, "Pretrain/Loss (Raw)": 2.0553205013275146, "Pretrain/Step": 6402, "Pretrain/Step Time": 8.499508103355765} +{"Pretrain/Learning Rate": 3.871426761404096e-05, "Pretrain/Loss": 2.029139518737793, "Pretrain/Loss (Raw)": 1.8530104160308838, "Pretrain/Step": 6403, "Pretrain/Step Time": 8.502447193488479} +{"Pretrain/Learning Rate": 3.8710718015337135e-05, "Pretrain/Loss": 2.0294792652130127, "Pretrain/Loss (Raw)": 2.0388119220733643, "Pretrain/Step": 6404, "Pretrain/Step Time": 8.501361144706607} +{"Pretrain/Learning Rate": 3.87071680212944e-05, "Pretrain/Loss": 2.028282642364502, "Pretrain/Loss (Raw)": 2.0279181003570557, "Pretrain/Step": 6405, "Pretrain/Step Time": 8.503490572795272} +{"Pretrain/Learning Rate": 3.8703617632015165e-05, "Pretrain/Loss": 2.030744791030884, "Pretrain/Loss (Raw)": 2.1404712200164795, "Pretrain/Step": 6406, "Pretrain/Step Time": 8.504398226737976} +{"Pretrain/Learning Rate": 3.870006684760176e-05, "Pretrain/Loss": 2.030438184738159, "Pretrain/Loss (Raw)": 2.0258278846740723, "Pretrain/Step": 6407, "Pretrain/Step Time": 8.503514535725117} +{"Pretrain/Learning Rate": 3.8696515668156596e-05, "Pretrain/Loss": 2.0292654037475586, "Pretrain/Loss (Raw)": 1.9617871046066284, "Pretrain/Step": 6408, "Pretrain/Step Time": 8.503328509628773} +{"Pretrain/Learning Rate": 3.869296409378205e-05, "Pretrain/Loss": 2.0293936729431152, "Pretrain/Loss (Raw)": 2.017472267150879, "Pretrain/Step": 6409, "Pretrain/Step Time": 8.50751705467701} +{"Pretrain/Learning Rate": 3.868941212458054e-05, "Pretrain/Loss": 2.0279223918914795, "Pretrain/Loss (Raw)": 1.9854459762573242, "Pretrain/Step": 6410, "Pretrain/Step Time": 8.506500957533717} +{"Pretrain/Learning Rate": 3.8685859760654475e-05, "Pretrain/Loss": 2.027026653289795, "Pretrain/Loss (Raw)": 1.9560036659240723, "Pretrain/Step": 6411, "Pretrain/Step Time": 8.503683865070343} +{"Pretrain/Learning Rate": 3.86823070021063e-05, "Pretrain/Loss": 2.025637149810791, "Pretrain/Loss (Raw)": 1.8725266456604004, "Pretrain/Step": 6412, "Pretrain/Step Time": 8.501676799729466} +{"Pretrain/Learning Rate": 3.867875384903845e-05, "Pretrain/Loss": 2.0253262519836426, "Pretrain/Loss (Raw)": 2.020678758621216, "Pretrain/Step": 6413, "Pretrain/Step Time": 8.498246589675546} +{"Pretrain/Learning Rate": 3.8675200301553364e-05, "Pretrain/Loss": 2.027559995651245, "Pretrain/Loss (Raw)": 2.1933510303497314, "Pretrain/Step": 6414, "Pretrain/Step Time": 8.498749883845448} +{"Pretrain/Learning Rate": 3.8671646359753524e-05, "Pretrain/Loss": 2.0260047912597656, "Pretrain/Loss (Raw)": 1.9870012998580933, "Pretrain/Step": 6415, "Pretrain/Step Time": 8.50101351365447} +{"Pretrain/Learning Rate": 3.866809202374141e-05, "Pretrain/Loss": 2.0262532234191895, "Pretrain/Loss (Raw)": 2.091951370239258, "Pretrain/Step": 6416, "Pretrain/Step Time": 8.504349909722805} +{"Pretrain/Learning Rate": 3.866453729361948e-05, "Pretrain/Loss": 2.0259881019592285, "Pretrain/Loss (Raw)": 2.0520436763763428, "Pretrain/Step": 6417, "Pretrain/Step Time": 8.503096260130405} +{"Pretrain/Learning Rate": 3.8660982169490255e-05, "Pretrain/Loss": 2.0251917839050293, "Pretrain/Loss (Raw)": 2.0477025508880615, "Pretrain/Step": 6418, "Pretrain/Step Time": 8.499523470178246} +{"Pretrain/Learning Rate": 3.865742665145625e-05, "Pretrain/Loss": 2.028007984161377, "Pretrain/Loss (Raw)": 2.0546369552612305, "Pretrain/Step": 6419, "Pretrain/Step Time": 8.502093624323606} +{"Pretrain/Learning Rate": 3.8653870739619965e-05, "Pretrain/Loss": 2.023463010787964, "Pretrain/Loss (Raw)": 1.7865225076675415, "Pretrain/Step": 6420, "Pretrain/Step Time": 8.500811103731394} +{"Pretrain/Learning Rate": 3.8650314434083945e-05, "Pretrain/Loss": 2.0235228538513184, "Pretrain/Loss (Raw)": 1.9838958978652954, "Pretrain/Step": 6421, "Pretrain/Step Time": 8.502088310196996} +{"Pretrain/Learning Rate": 3.8646757734950735e-05, "Pretrain/Loss": 2.0244977474212646, "Pretrain/Loss (Raw)": 2.023592710494995, "Pretrain/Step": 6422, "Pretrain/Step Time": 8.500832168385386} +{"Pretrain/Learning Rate": 3.8643200642322875e-05, "Pretrain/Loss": 2.025010585784912, "Pretrain/Loss (Raw)": 2.0234456062316895, "Pretrain/Step": 6423, "Pretrain/Step Time": 8.50133103132248} +{"Pretrain/Learning Rate": 3.863964315630295e-05, "Pretrain/Loss": 2.0242815017700195, "Pretrain/Loss (Raw)": 2.006375789642334, "Pretrain/Step": 6424, "Pretrain/Step Time": 8.499667454510927} +{"Pretrain/Learning Rate": 3.8636085276993536e-05, "Pretrain/Loss": 2.0232796669006348, "Pretrain/Loss (Raw)": 1.9294861555099487, "Pretrain/Step": 6425, "Pretrain/Step Time": 8.505156828090549} +{"Pretrain/Learning Rate": 3.863252700449721e-05, "Pretrain/Loss": 2.023287057876587, "Pretrain/Loss (Raw)": 2.0320346355438232, "Pretrain/Step": 6426, "Pretrain/Step Time": 8.507902609184384} +{"Pretrain/Learning Rate": 3.862896833891657e-05, "Pretrain/Loss": 2.0235862731933594, "Pretrain/Loss (Raw)": 2.2337539196014404, "Pretrain/Step": 6427, "Pretrain/Step Time": 8.506183398887515} +{"Pretrain/Learning Rate": 3.862540928035425e-05, "Pretrain/Loss": 2.02093505859375, "Pretrain/Loss (Raw)": 2.1171207427978516, "Pretrain/Step": 6428, "Pretrain/Step Time": 8.507987886667252} +{"Pretrain/Learning Rate": 3.862184982891285e-05, "Pretrain/Loss": 2.021218776702881, "Pretrain/Loss (Raw)": 2.0534603595733643, "Pretrain/Step": 6429, "Pretrain/Step Time": 8.505234131589532} +{"Pretrain/Learning Rate": 3.861828998469501e-05, "Pretrain/Loss": 2.0201895236968994, "Pretrain/Loss (Raw)": 1.9522749185562134, "Pretrain/Step": 6430, "Pretrain/Step Time": 8.505995746701956} +{"Pretrain/Learning Rate": 3.861472974780339e-05, "Pretrain/Loss": 2.018876075744629, "Pretrain/Loss (Raw)": 1.87746000289917, "Pretrain/Step": 6431, "Pretrain/Step Time": 8.504682816565037} +{"Pretrain/Learning Rate": 3.861116911834063e-05, "Pretrain/Loss": 2.02002215385437, "Pretrain/Loss (Raw)": 2.115955352783203, "Pretrain/Step": 6432, "Pretrain/Step Time": 8.503835640847683} +{"Pretrain/Learning Rate": 3.86076080964094e-05, "Pretrain/Loss": 2.0189971923828125, "Pretrain/Loss (Raw)": 1.9911409616470337, "Pretrain/Step": 6433, "Pretrain/Step Time": 8.500510653480887} +{"Pretrain/Learning Rate": 3.8604046682112384e-05, "Pretrain/Loss": 2.018338441848755, "Pretrain/Loss (Raw)": 1.647789716720581, "Pretrain/Step": 6434, "Pretrain/Step Time": 8.502702558413148} +{"Pretrain/Learning Rate": 3.8600484875552276e-05, "Pretrain/Loss": 2.018847942352295, "Pretrain/Loss (Raw)": 2.1706430912017822, "Pretrain/Step": 6435, "Pretrain/Step Time": 8.497150108218193} +{"Pretrain/Learning Rate": 3.859692267683177e-05, "Pretrain/Loss": 2.018202781677246, "Pretrain/Loss (Raw)": 2.0734522342681885, "Pretrain/Step": 6436, "Pretrain/Step Time": 8.50072323717177} +{"Pretrain/Learning Rate": 3.859336008605359e-05, "Pretrain/Loss": 2.019230842590332, "Pretrain/Loss (Raw)": 2.079878330230713, "Pretrain/Step": 6437, "Pretrain/Step Time": 8.505970345810056} +{"Pretrain/Learning Rate": 3.8589797103320455e-05, "Pretrain/Loss": 2.0191009044647217, "Pretrain/Loss (Raw)": 2.12477970123291, "Pretrain/Step": 6438, "Pretrain/Step Time": 8.503782453015447} +{"Pretrain/Learning Rate": 3.8586233728735096e-05, "Pretrain/Loss": 2.019313335418701, "Pretrain/Loss (Raw)": 1.9402250051498413, "Pretrain/Step": 6439, "Pretrain/Step Time": 8.499380828812718} +{"Pretrain/Learning Rate": 3.8582669962400265e-05, "Pretrain/Loss": 2.017534017562866, "Pretrain/Loss (Raw)": 1.8041146993637085, "Pretrain/Step": 6440, "Pretrain/Step Time": 8.502149134874344} +{"Pretrain/Learning Rate": 3.857910580441872e-05, "Pretrain/Loss": 2.0209555625915527, "Pretrain/Loss (Raw)": 2.6197991371154785, "Pretrain/Step": 6441, "Pretrain/Step Time": 8.497035467997193} +{"Pretrain/Learning Rate": 3.857554125489323e-05, "Pretrain/Loss": 2.0212974548339844, "Pretrain/Loss (Raw)": 2.031585931777954, "Pretrain/Step": 6442, "Pretrain/Step Time": 8.497264705598354} +{"Pretrain/Learning Rate": 3.857197631392658e-05, "Pretrain/Loss": 2.02005672454834, "Pretrain/Loss (Raw)": 2.079127788543701, "Pretrain/Step": 6443, "Pretrain/Step Time": 8.500511534512043} +{"Pretrain/Learning Rate": 3.8568410981621565e-05, "Pretrain/Loss": 2.01975679397583, "Pretrain/Loss (Raw)": 1.9617338180541992, "Pretrain/Step": 6444, "Pretrain/Step Time": 8.498989578336477} +{"Pretrain/Learning Rate": 3.856484525808098e-05, "Pretrain/Loss": 2.0195350646972656, "Pretrain/Loss (Raw)": 2.0211639404296875, "Pretrain/Step": 6445, "Pretrain/Step Time": 8.49747496470809} +{"Pretrain/Learning Rate": 3.856127914340765e-05, "Pretrain/Loss": 2.019357681274414, "Pretrain/Loss (Raw)": 1.9279718399047852, "Pretrain/Step": 6446, "Pretrain/Step Time": 8.495499022305012} +{"Pretrain/Learning Rate": 3.855771263770439e-05, "Pretrain/Loss": 2.0185906887054443, "Pretrain/Loss (Raw)": 1.8471081256866455, "Pretrain/Step": 6447, "Pretrain/Step Time": 8.495574686676264} +{"Pretrain/Learning Rate": 3.8554145741074046e-05, "Pretrain/Loss": 2.019179582595825, "Pretrain/Loss (Raw)": 2.1537976264953613, "Pretrain/Step": 6448, "Pretrain/Step Time": 8.49751896969974} +{"Pretrain/Learning Rate": 3.8550578453619465e-05, "Pretrain/Loss": 2.0223898887634277, "Pretrain/Loss (Raw)": 1.9315224885940552, "Pretrain/Step": 6449, "Pretrain/Step Time": 8.494272209703922} +{"Pretrain/Learning Rate": 3.85470107754435e-05, "Pretrain/Loss": 2.02376389503479, "Pretrain/Loss (Raw)": 2.1360511779785156, "Pretrain/Step": 6450, "Pretrain/Step Time": 8.494883069768548} +{"Pretrain/Learning Rate": 3.854344270664904e-05, "Pretrain/Loss": 2.0234732627868652, "Pretrain/Loss (Raw)": 2.1225199699401855, "Pretrain/Step": 6451, "Pretrain/Step Time": 8.493449606001377} +{"Pretrain/Learning Rate": 3.8539874247338956e-05, "Pretrain/Loss": 2.02341365814209, "Pretrain/Loss (Raw)": 1.9867186546325684, "Pretrain/Step": 6452, "Pretrain/Step Time": 8.498124647885561} +{"Pretrain/Learning Rate": 3.853630539761614e-05, "Pretrain/Loss": 2.0219838619232178, "Pretrain/Loss (Raw)": 1.8927719593048096, "Pretrain/Step": 6453, "Pretrain/Step Time": 8.49912722967565} +{"Pretrain/Learning Rate": 3.8532736157583497e-05, "Pretrain/Loss": 2.0211853981018066, "Pretrain/Loss (Raw)": 2.086665391921997, "Pretrain/Step": 6454, "Pretrain/Step Time": 8.498871916905046} +{"Pretrain/Learning Rate": 3.8529166527343954e-05, "Pretrain/Loss": 2.0241544246673584, "Pretrain/Loss (Raw)": 2.0748491287231445, "Pretrain/Step": 6455, "Pretrain/Step Time": 8.492024946957827} +{"Pretrain/Learning Rate": 3.8525596507000425e-05, "Pretrain/Loss": 2.025299310684204, "Pretrain/Loss (Raw)": 1.8153272867202759, "Pretrain/Step": 6456, "Pretrain/Step Time": 8.493604520335793} +{"Pretrain/Learning Rate": 3.852202609665586e-05, "Pretrain/Loss": 2.0254712104797363, "Pretrain/Loss (Raw)": 2.1116693019866943, "Pretrain/Step": 6457, "Pretrain/Step Time": 8.494999652728438} +{"Pretrain/Learning Rate": 3.8518455296413194e-05, "Pretrain/Loss": 2.0218191146850586, "Pretrain/Loss (Raw)": 1.8305648565292358, "Pretrain/Step": 6458, "Pretrain/Step Time": 8.495235100388527} +{"Pretrain/Learning Rate": 3.8514884106375414e-05, "Pretrain/Loss": 2.021005630493164, "Pretrain/Loss (Raw)": 1.871740698814392, "Pretrain/Step": 6459, "Pretrain/Step Time": 8.49532557465136} +{"Pretrain/Learning Rate": 3.851131252664547e-05, "Pretrain/Loss": 2.021514415740967, "Pretrain/Loss (Raw)": 1.9892369508743286, "Pretrain/Step": 6460, "Pretrain/Step Time": 8.490830063819885} +{"Pretrain/Learning Rate": 3.8507740557326354e-05, "Pretrain/Loss": 2.0208563804626465, "Pretrain/Loss (Raw)": 1.9784184694290161, "Pretrain/Step": 6461, "Pretrain/Step Time": 8.488513892516494} +{"Pretrain/Learning Rate": 3.8504168198521066e-05, "Pretrain/Loss": 2.022122383117676, "Pretrain/Loss (Raw)": 2.07474684715271, "Pretrain/Step": 6462, "Pretrain/Step Time": 8.4922686368227} +{"Pretrain/Learning Rate": 3.850059545033261e-05, "Pretrain/Loss": 2.022073268890381, "Pretrain/Loss (Raw)": 2.133119821548462, "Pretrain/Step": 6463, "Pretrain/Step Time": 8.492983059957623} +{"Pretrain/Learning Rate": 3.8497022312863994e-05, "Pretrain/Loss": 2.0245227813720703, "Pretrain/Loss (Raw)": 2.113325834274292, "Pretrain/Step": 6464, "Pretrain/Step Time": 8.489837922155857} +{"Pretrain/Learning Rate": 3.8493448786218256e-05, "Pretrain/Loss": 2.024064302444458, "Pretrain/Loss (Raw)": 2.00620436668396, "Pretrain/Step": 6465, "Pretrain/Step Time": 8.493766400963068} +{"Pretrain/Learning Rate": 3.848987487049843e-05, "Pretrain/Loss": 2.025073528289795, "Pretrain/Loss (Raw)": 2.0501346588134766, "Pretrain/Step": 6466, "Pretrain/Step Time": 8.48949054069817} +{"Pretrain/Learning Rate": 3.8486300565807585e-05, "Pretrain/Loss": 2.0248429775238037, "Pretrain/Loss (Raw)": 1.9968371391296387, "Pretrain/Step": 6467, "Pretrain/Step Time": 8.492688251659274} +{"Pretrain/Learning Rate": 3.848272587224876e-05, "Pretrain/Loss": 2.0256805419921875, "Pretrain/Loss (Raw)": 2.2439262866973877, "Pretrain/Step": 6468, "Pretrain/Step Time": 8.495217218995094} +{"Pretrain/Learning Rate": 3.847915078992504e-05, "Pretrain/Loss": 2.0256381034851074, "Pretrain/Loss (Raw)": 1.805551290512085, "Pretrain/Step": 6469, "Pretrain/Step Time": 8.493191616609693} +{"Pretrain/Learning Rate": 3.8475575318939516e-05, "Pretrain/Loss": 2.024028778076172, "Pretrain/Loss (Raw)": 2.0507748126983643, "Pretrain/Step": 6470, "Pretrain/Step Time": 8.493919052183628} +{"Pretrain/Learning Rate": 3.847199945939527e-05, "Pretrain/Loss": 2.0237011909484863, "Pretrain/Loss (Raw)": 1.999691128730774, "Pretrain/Step": 6471, "Pretrain/Step Time": 8.492616068571806} +{"Pretrain/Learning Rate": 3.8468423211395424e-05, "Pretrain/Loss": 2.021909475326538, "Pretrain/Loss (Raw)": 1.979057788848877, "Pretrain/Step": 6472, "Pretrain/Step Time": 8.491515016183257} +{"Pretrain/Learning Rate": 3.846484657504308e-05, "Pretrain/Loss": 2.0242083072662354, "Pretrain/Loss (Raw)": 2.170917510986328, "Pretrain/Step": 6473, "Pretrain/Step Time": 8.491424884647131} +{"Pretrain/Learning Rate": 3.8461269550441385e-05, "Pretrain/Loss": 2.024578332901001, "Pretrain/Loss (Raw)": 2.050499677658081, "Pretrain/Step": 6474, "Pretrain/Step Time": 8.491267485544086} +{"Pretrain/Learning Rate": 3.845769213769347e-05, "Pretrain/Loss": 2.02315354347229, "Pretrain/Loss (Raw)": 1.85415518283844, "Pretrain/Step": 6475, "Pretrain/Step Time": 8.49159155972302} +{"Pretrain/Learning Rate": 3.845411433690248e-05, "Pretrain/Loss": 2.0224380493164062, "Pretrain/Loss (Raw)": 2.073819160461426, "Pretrain/Step": 6476, "Pretrain/Step Time": 8.494244141504169} +{"Pretrain/Learning Rate": 3.845053614817161e-05, "Pretrain/Loss": 2.0184550285339355, "Pretrain/Loss (Raw)": 2.009901285171509, "Pretrain/Step": 6477, "Pretrain/Step Time": 8.49127759411931} +{"Pretrain/Learning Rate": 3.844695757160399e-05, "Pretrain/Loss": 2.0201339721679688, "Pretrain/Loss (Raw)": 2.284874200820923, "Pretrain/Step": 6478, "Pretrain/Step Time": 8.489474451169372} +{"Pretrain/Learning Rate": 3.8443378607302835e-05, "Pretrain/Loss": 2.0180978775024414, "Pretrain/Loss (Raw)": 1.8950691223144531, "Pretrain/Step": 6479, "Pretrain/Step Time": 8.49034514464438} +{"Pretrain/Learning Rate": 3.843979925537135e-05, "Pretrain/Loss": 2.0196821689605713, "Pretrain/Loss (Raw)": 1.9414583444595337, "Pretrain/Step": 6480, "Pretrain/Step Time": 8.487481992691755} +{"Pretrain/Learning Rate": 3.8436219515912706e-05, "Pretrain/Loss": 2.020284652709961, "Pretrain/Loss (Raw)": 1.9866143465042114, "Pretrain/Step": 6481, "Pretrain/Step Time": 8.48966863937676} +{"Pretrain/Learning Rate": 3.843263938903015e-05, "Pretrain/Loss": 2.0190269947052, "Pretrain/Loss (Raw)": 2.0748276710510254, "Pretrain/Step": 6482, "Pretrain/Step Time": 8.485060164704919} +{"Pretrain/Learning Rate": 3.84290588748269e-05, "Pretrain/Loss": 2.0175323486328125, "Pretrain/Loss (Raw)": 1.9412754774093628, "Pretrain/Step": 6483, "Pretrain/Step Time": 8.485298184677958} +{"Pretrain/Learning Rate": 3.842547797340623e-05, "Pretrain/Loss": 2.017345905303955, "Pretrain/Loss (Raw)": 1.9944229125976562, "Pretrain/Step": 6484, "Pretrain/Step Time": 8.482686962932348} +{"Pretrain/Learning Rate": 3.8421896684871344e-05, "Pretrain/Loss": 2.0157470703125, "Pretrain/Loss (Raw)": 1.9753905534744263, "Pretrain/Step": 6485, "Pretrain/Step Time": 8.485146982595325} +{"Pretrain/Learning Rate": 3.841831500932553e-05, "Pretrain/Loss": 2.0165505409240723, "Pretrain/Loss (Raw)": 2.095198154449463, "Pretrain/Step": 6486, "Pretrain/Step Time": 8.48425216972828} +{"Pretrain/Learning Rate": 3.841473294687207e-05, "Pretrain/Loss": 2.014404773712158, "Pretrain/Loss (Raw)": 1.850127935409546, "Pretrain/Step": 6487, "Pretrain/Step Time": 8.487118175253272} +{"Pretrain/Learning Rate": 3.841115049761424e-05, "Pretrain/Loss": 2.016869068145752, "Pretrain/Loss (Raw)": 2.1458740234375, "Pretrain/Step": 6488, "Pretrain/Step Time": 8.485220421105623} +{"Pretrain/Learning Rate": 3.840756766165534e-05, "Pretrain/Loss": 2.0194272994995117, "Pretrain/Loss (Raw)": 2.1957733631134033, "Pretrain/Step": 6489, "Pretrain/Step Time": 8.484743557870388} +{"Pretrain/Learning Rate": 3.840398443909867e-05, "Pretrain/Loss": 2.0198192596435547, "Pretrain/Loss (Raw)": 2.0690858364105225, "Pretrain/Step": 6490, "Pretrain/Step Time": 8.48760055936873} +{"Pretrain/Learning Rate": 3.8400400830047564e-05, "Pretrain/Loss": 2.0178823471069336, "Pretrain/Loss (Raw)": 1.9726860523223877, "Pretrain/Step": 6491, "Pretrain/Step Time": 8.489680891856551} +{"Pretrain/Learning Rate": 3.8396816834605356e-05, "Pretrain/Loss": 2.0202207565307617, "Pretrain/Loss (Raw)": 2.128190755844116, "Pretrain/Step": 6492, "Pretrain/Step Time": 8.488003466278315} +{"Pretrain/Learning Rate": 3.839323245287536e-05, "Pretrain/Loss": 2.0215044021606445, "Pretrain/Loss (Raw)": 2.025942802429199, "Pretrain/Step": 6493, "Pretrain/Step Time": 8.490251641720533} +{"Pretrain/Learning Rate": 3.838964768496097e-05, "Pretrain/Loss": 2.0199785232543945, "Pretrain/Loss (Raw)": 1.8781057596206665, "Pretrain/Step": 6494, "Pretrain/Step Time": 8.48657876253128} +{"Pretrain/Learning Rate": 3.838606253096551e-05, "Pretrain/Loss": 2.018214464187622, "Pretrain/Loss (Raw)": 1.9192848205566406, "Pretrain/Step": 6495, "Pretrain/Step Time": 8.485529555007815} +{"Pretrain/Learning Rate": 3.838247699099238e-05, "Pretrain/Loss": 2.0179543495178223, "Pretrain/Loss (Raw)": 1.9966768026351929, "Pretrain/Step": 6496, "Pretrain/Step Time": 8.486100429669023} +{"Pretrain/Learning Rate": 3.837889106514496e-05, "Pretrain/Loss": 2.0173583030700684, "Pretrain/Loss (Raw)": 1.8941410779953003, "Pretrain/Step": 6497, "Pretrain/Step Time": 8.483292950317264} +{"Pretrain/Learning Rate": 3.8375304753526645e-05, "Pretrain/Loss": 2.016529083251953, "Pretrain/Loss (Raw)": 1.9127779006958008, "Pretrain/Step": 6498, "Pretrain/Step Time": 8.483115131035447} +{"Pretrain/Learning Rate": 3.837171805624085e-05, "Pretrain/Loss": 2.0181026458740234, "Pretrain/Loss (Raw)": 2.010646104812622, "Pretrain/Step": 6499, "Pretrain/Step Time": 8.47795457392931} +{"Pretrain/Learning Rate": 3.836813097339099e-05, "Pretrain/Loss": 2.01706600189209, "Pretrain/Loss (Raw)": 1.8805946111679077, "Pretrain/Step": 6500, "Pretrain/Step Time": 8.480682356283069} +{"Pretrain/Learning Rate": 3.8364543505080494e-05, "Pretrain/Loss": 2.0200858116149902, "Pretrain/Loss (Raw)": 2.305314779281616, "Pretrain/Step": 6501, "Pretrain/Step Time": 8.475755808874965} +{"Pretrain/Learning Rate": 3.8360955651412814e-05, "Pretrain/Loss": 2.021697521209717, "Pretrain/Loss (Raw)": 2.2483208179473877, "Pretrain/Step": 6502, "Pretrain/Step Time": 8.477331692352891} +{"Pretrain/Learning Rate": 3.8357367412491394e-05, "Pretrain/Loss": 2.022874116897583, "Pretrain/Loss (Raw)": 2.082547187805176, "Pretrain/Step": 6503, "Pretrain/Step Time": 8.476939000189304} +{"Pretrain/Learning Rate": 3.83537787884197e-05, "Pretrain/Loss": 2.0222220420837402, "Pretrain/Loss (Raw)": 1.9229161739349365, "Pretrain/Step": 6504, "Pretrain/Step Time": 8.476345736533403} +{"Pretrain/Learning Rate": 3.8350189779301205e-05, "Pretrain/Loss": 2.0228052139282227, "Pretrain/Loss (Raw)": 1.9711716175079346, "Pretrain/Step": 6505, "Pretrain/Step Time": 8.477687239646912} +{"Pretrain/Learning Rate": 3.8346600385239403e-05, "Pretrain/Loss": 2.022552967071533, "Pretrain/Loss (Raw)": 1.9649932384490967, "Pretrain/Step": 6506, "Pretrain/Step Time": 8.47948664240539} +{"Pretrain/Learning Rate": 3.8343010606337784e-05, "Pretrain/Loss": 2.0218052864074707, "Pretrain/Loss (Raw)": 1.9605528116226196, "Pretrain/Step": 6507, "Pretrain/Step Time": 8.47947565279901} +{"Pretrain/Learning Rate": 3.833942044269987e-05, "Pretrain/Loss": 2.0211195945739746, "Pretrain/Loss (Raw)": 1.7976019382476807, "Pretrain/Step": 6508, "Pretrain/Step Time": 8.478898257017136} +{"Pretrain/Learning Rate": 3.833582989442916e-05, "Pretrain/Loss": 2.020810842514038, "Pretrain/Loss (Raw)": 1.8831194639205933, "Pretrain/Step": 6509, "Pretrain/Step Time": 8.483263419941068} +{"Pretrain/Learning Rate": 3.833223896162921e-05, "Pretrain/Loss": 2.0224053859710693, "Pretrain/Loss (Raw)": 2.114445686340332, "Pretrain/Step": 6510, "Pretrain/Step Time": 8.483773892745376} +{"Pretrain/Learning Rate": 3.832864764440353e-05, "Pretrain/Loss": 2.024428129196167, "Pretrain/Loss (Raw)": 2.1425907611846924, "Pretrain/Step": 6511, "Pretrain/Step Time": 8.48129622079432} +{"Pretrain/Learning Rate": 3.8325055942855705e-05, "Pretrain/Loss": 2.02528715133667, "Pretrain/Loss (Raw)": 2.083439588546753, "Pretrain/Step": 6512, "Pretrain/Step Time": 8.479719398543239} +{"Pretrain/Learning Rate": 3.8321463857089276e-05, "Pretrain/Loss": 2.026681423187256, "Pretrain/Loss (Raw)": 2.1327826976776123, "Pretrain/Step": 6513, "Pretrain/Step Time": 8.477399120107293} +{"Pretrain/Learning Rate": 3.831787138720783e-05, "Pretrain/Loss": 2.025628089904785, "Pretrain/Loss (Raw)": 2.1662590503692627, "Pretrain/Step": 6514, "Pretrain/Step Time": 8.4767444152385} +{"Pretrain/Learning Rate": 3.831427853331496e-05, "Pretrain/Loss": 2.025489568710327, "Pretrain/Loss (Raw)": 2.021409034729004, "Pretrain/Step": 6515, "Pretrain/Step Time": 8.47862677462399} +{"Pretrain/Learning Rate": 3.831068529551425e-05, "Pretrain/Loss": 2.0245091915130615, "Pretrain/Loss (Raw)": 1.9761117696762085, "Pretrain/Step": 6516, "Pretrain/Step Time": 8.481363516300917} +{"Pretrain/Learning Rate": 3.8307091673909306e-05, "Pretrain/Loss": 2.0255913734436035, "Pretrain/Loss (Raw)": 2.103118419647217, "Pretrain/Step": 6517, "Pretrain/Step Time": 8.476409105584025} +{"Pretrain/Learning Rate": 3.830349766860376e-05, "Pretrain/Loss": 2.02543306350708, "Pretrain/Loss (Raw)": 1.982743263244629, "Pretrain/Step": 6518, "Pretrain/Step Time": 8.479169592261314} +{"Pretrain/Learning Rate": 3.8299903279701234e-05, "Pretrain/Loss": 2.0289125442504883, "Pretrain/Loss (Raw)": 2.1377933025360107, "Pretrain/Step": 6519, "Pretrain/Step Time": 8.477455496788025} +{"Pretrain/Learning Rate": 3.8296308507305376e-05, "Pretrain/Loss": 2.0286340713500977, "Pretrain/Loss (Raw)": 2.1061289310455322, "Pretrain/Step": 6520, "Pretrain/Step Time": 8.472280537709594} +{"Pretrain/Learning Rate": 3.829271335151984e-05, "Pretrain/Loss": 2.024385929107666, "Pretrain/Loss (Raw)": 1.9147700071334839, "Pretrain/Step": 6521, "Pretrain/Step Time": 8.471299782395363} +{"Pretrain/Learning Rate": 3.8289117812448286e-05, "Pretrain/Loss": 2.020951747894287, "Pretrain/Loss (Raw)": 1.8162057399749756, "Pretrain/Step": 6522, "Pretrain/Step Time": 8.478288481011987} +{"Pretrain/Learning Rate": 3.8285521890194374e-05, "Pretrain/Loss": 2.020822048187256, "Pretrain/Loss (Raw)": 1.930815577507019, "Pretrain/Step": 6523, "Pretrain/Step Time": 8.475819984450936} +{"Pretrain/Learning Rate": 3.828192558486181e-05, "Pretrain/Loss": 2.0199382305145264, "Pretrain/Loss (Raw)": 1.9805513620376587, "Pretrain/Step": 6524, "Pretrain/Step Time": 8.476370627060533} +{"Pretrain/Learning Rate": 3.827832889655428e-05, "Pretrain/Loss": 2.020472526550293, "Pretrain/Loss (Raw)": 1.940666913986206, "Pretrain/Step": 6525, "Pretrain/Step Time": 8.475639706477523} +{"Pretrain/Learning Rate": 3.8274731825375514e-05, "Pretrain/Loss": 2.020399332046509, "Pretrain/Loss (Raw)": 2.095945119857788, "Pretrain/Step": 6526, "Pretrain/Step Time": 8.474127942696214} +{"Pretrain/Learning Rate": 3.82711343714292e-05, "Pretrain/Loss": 2.018982410430908, "Pretrain/Loss (Raw)": 2.2149219512939453, "Pretrain/Step": 6527, "Pretrain/Step Time": 8.472566977143288} +{"Pretrain/Learning Rate": 3.826753653481909e-05, "Pretrain/Loss": 2.0197620391845703, "Pretrain/Loss (Raw)": 2.136626720428467, "Pretrain/Step": 6528, "Pretrain/Step Time": 8.472009846940637} +{"Pretrain/Learning Rate": 3.82639383156489e-05, "Pretrain/Loss": 2.018902540206909, "Pretrain/Loss (Raw)": 1.7842557430267334, "Pretrain/Step": 6529, "Pretrain/Step Time": 8.476498758420348} +{"Pretrain/Learning Rate": 3.826033971402242e-05, "Pretrain/Loss": 2.0207719802856445, "Pretrain/Loss (Raw)": 2.294607400894165, "Pretrain/Step": 6530, "Pretrain/Step Time": 8.470297465100884} +{"Pretrain/Learning Rate": 3.8256740730043384e-05, "Pretrain/Loss": 2.021536350250244, "Pretrain/Loss (Raw)": 1.9508564472198486, "Pretrain/Step": 6531, "Pretrain/Step Time": 8.472019454464316} +{"Pretrain/Learning Rate": 3.825314136381557e-05, "Pretrain/Loss": 2.020437002182007, "Pretrain/Loss (Raw)": 1.8980798721313477, "Pretrain/Step": 6532, "Pretrain/Step Time": 8.472085397690535} +{"Pretrain/Learning Rate": 3.8249541615442775e-05, "Pretrain/Loss": 2.023016929626465, "Pretrain/Loss (Raw)": 2.3581786155700684, "Pretrain/Step": 6533, "Pretrain/Step Time": 8.475485637784004} +{"Pretrain/Learning Rate": 3.8245941485028784e-05, "Pretrain/Loss": 2.022921323776245, "Pretrain/Loss (Raw)": 2.128208637237549, "Pretrain/Step": 6534, "Pretrain/Step Time": 8.476722998544574} +{"Pretrain/Learning Rate": 3.824234097267741e-05, "Pretrain/Loss": 2.021428108215332, "Pretrain/Loss (Raw)": 1.8346844911575317, "Pretrain/Step": 6535, "Pretrain/Step Time": 8.473317999392748} +{"Pretrain/Learning Rate": 3.8238740078492476e-05, "Pretrain/Loss": 2.0214691162109375, "Pretrain/Loss (Raw)": 1.9670244455337524, "Pretrain/Step": 6536, "Pretrain/Step Time": 8.476181328296661} +{"Pretrain/Learning Rate": 3.823513880257779e-05, "Pretrain/Loss": 2.0208935737609863, "Pretrain/Loss (Raw)": 1.9438410997390747, "Pretrain/Step": 6537, "Pretrain/Step Time": 8.477958222851157} +{"Pretrain/Learning Rate": 3.823153714503721e-05, "Pretrain/Loss": 2.0205318927764893, "Pretrain/Loss (Raw)": 1.9391448497772217, "Pretrain/Step": 6538, "Pretrain/Step Time": 8.477492474019527} +{"Pretrain/Learning Rate": 3.8227935105974585e-05, "Pretrain/Loss": 2.0217106342315674, "Pretrain/Loss (Raw)": 2.1068668365478516, "Pretrain/Step": 6539, "Pretrain/Step Time": 8.477955128997564} +{"Pretrain/Learning Rate": 3.822433268549378e-05, "Pretrain/Loss": 2.0231704711914062, "Pretrain/Loss (Raw)": 2.0593714714050293, "Pretrain/Step": 6540, "Pretrain/Step Time": 8.476291393861175} +{"Pretrain/Learning Rate": 3.822072988369867e-05, "Pretrain/Loss": 2.023502826690674, "Pretrain/Loss (Raw)": 2.063277244567871, "Pretrain/Step": 6541, "Pretrain/Step Time": 8.478682953864336} +{"Pretrain/Learning Rate": 3.8217126700693126e-05, "Pretrain/Loss": 2.020672082901001, "Pretrain/Loss (Raw)": 1.830987572669983, "Pretrain/Step": 6542, "Pretrain/Step Time": 8.478577576577663} +{"Pretrain/Learning Rate": 3.821352313658105e-05, "Pretrain/Loss": 2.019771099090576, "Pretrain/Loss (Raw)": 1.8716880083084106, "Pretrain/Step": 6543, "Pretrain/Step Time": 8.474085252732038} +{"Pretrain/Learning Rate": 3.820991919146635e-05, "Pretrain/Loss": 2.019235134124756, "Pretrain/Loss (Raw)": 2.023322820663452, "Pretrain/Step": 6544, "Pretrain/Step Time": 8.473927797749639} +{"Pretrain/Learning Rate": 3.8206314865452945e-05, "Pretrain/Loss": 2.0206069946289062, "Pretrain/Loss (Raw)": 2.2276339530944824, "Pretrain/Step": 6545, "Pretrain/Step Time": 8.47381592541933} +{"Pretrain/Learning Rate": 3.820271015864476e-05, "Pretrain/Loss": 2.0203092098236084, "Pretrain/Loss (Raw)": 2.0096046924591064, "Pretrain/Step": 6546, "Pretrain/Step Time": 8.47405525483191} +{"Pretrain/Learning Rate": 3.819910507114574e-05, "Pretrain/Loss": 2.0209991931915283, "Pretrain/Loss (Raw)": 2.1429386138916016, "Pretrain/Step": 6547, "Pretrain/Step Time": 8.47220521606505} +{"Pretrain/Learning Rate": 3.819549960305982e-05, "Pretrain/Loss": 2.020965576171875, "Pretrain/Loss (Raw)": 1.7822563648223877, "Pretrain/Step": 6548, "Pretrain/Step Time": 8.479319911450148} +{"Pretrain/Learning Rate": 3.8191893754490976e-05, "Pretrain/Loss": 2.021252155303955, "Pretrain/Loss (Raw)": 2.020548105239868, "Pretrain/Step": 6549, "Pretrain/Step Time": 8.477173311635852} +{"Pretrain/Learning Rate": 3.818828752554318e-05, "Pretrain/Loss": 2.0204858779907227, "Pretrain/Loss (Raw)": 1.9255133867263794, "Pretrain/Step": 6550, "Pretrain/Step Time": 8.478241728618741} +{"Pretrain/Learning Rate": 3.81846809163204e-05, "Pretrain/Loss": 2.021554946899414, "Pretrain/Loss (Raw)": 2.1602983474731445, "Pretrain/Step": 6551, "Pretrain/Step Time": 8.484296221286058} +{"Pretrain/Learning Rate": 3.8181073926926645e-05, "Pretrain/Loss": 2.020693302154541, "Pretrain/Loss (Raw)": 1.896093487739563, "Pretrain/Step": 6552, "Pretrain/Step Time": 8.489202599972486} +{"Pretrain/Learning Rate": 3.817746655746591e-05, "Pretrain/Loss": 2.021883487701416, "Pretrain/Loss (Raw)": 2.081817865371704, "Pretrain/Step": 6553, "Pretrain/Step Time": 8.486531678587198} +{"Pretrain/Learning Rate": 3.817385880804223e-05, "Pretrain/Loss": 2.0210704803466797, "Pretrain/Loss (Raw)": 1.927950143814087, "Pretrain/Step": 6554, "Pretrain/Step Time": 8.483688116073608} +{"Pretrain/Learning Rate": 3.817025067875961e-05, "Pretrain/Loss": 2.0195932388305664, "Pretrain/Loss (Raw)": 2.044670581817627, "Pretrain/Step": 6555, "Pretrain/Step Time": 8.480055144056678} +{"Pretrain/Learning Rate": 3.8166642169722095e-05, "Pretrain/Loss": 2.0179896354675293, "Pretrain/Loss (Raw)": 1.9118826389312744, "Pretrain/Step": 6556, "Pretrain/Step Time": 8.477753093466163} +{"Pretrain/Learning Rate": 3.816303328103374e-05, "Pretrain/Loss": 2.018998384475708, "Pretrain/Loss (Raw)": 2.1825754642486572, "Pretrain/Step": 6557, "Pretrain/Step Time": 8.482364853844047} +{"Pretrain/Learning Rate": 3.815942401279859e-05, "Pretrain/Loss": 2.01914644241333, "Pretrain/Loss (Raw)": 1.9712207317352295, "Pretrain/Step": 6558, "Pretrain/Step Time": 8.48329335078597} +{"Pretrain/Learning Rate": 3.815581436512073e-05, "Pretrain/Loss": 2.022017240524292, "Pretrain/Loss (Raw)": 2.2449305057525635, "Pretrain/Step": 6559, "Pretrain/Step Time": 8.47982944175601} +{"Pretrain/Learning Rate": 3.815220433810424e-05, "Pretrain/Loss": 2.021627426147461, "Pretrain/Loss (Raw)": 2.0660300254821777, "Pretrain/Step": 6560, "Pretrain/Step Time": 8.481666181236506} +{"Pretrain/Learning Rate": 3.814859393185321e-05, "Pretrain/Loss": 2.0221662521362305, "Pretrain/Loss (Raw)": 2.060117483139038, "Pretrain/Step": 6561, "Pretrain/Step Time": 8.478411758318543} +{"Pretrain/Learning Rate": 3.8144983146471744e-05, "Pretrain/Loss": 2.024277687072754, "Pretrain/Loss (Raw)": 1.9180704355239868, "Pretrain/Step": 6562, "Pretrain/Step Time": 8.478656977415085} +{"Pretrain/Learning Rate": 3.814137198206396e-05, "Pretrain/Loss": 2.024210214614868, "Pretrain/Loss (Raw)": 2.1619889736175537, "Pretrain/Step": 6563, "Pretrain/Step Time": 8.485413614660501} +{"Pretrain/Learning Rate": 3.813776043873397e-05, "Pretrain/Loss": 2.0239193439483643, "Pretrain/Loss (Raw)": 2.0362470149993896, "Pretrain/Step": 6564, "Pretrain/Step Time": 8.483565742149949} +{"Pretrain/Learning Rate": 3.813414851658592e-05, "Pretrain/Loss": 2.022819995880127, "Pretrain/Loss (Raw)": 1.9391698837280273, "Pretrain/Step": 6565, "Pretrain/Step Time": 8.47828458994627} +{"Pretrain/Learning Rate": 3.813053621572395e-05, "Pretrain/Loss": 2.02197265625, "Pretrain/Loss (Raw)": 2.0162899494171143, "Pretrain/Step": 6566, "Pretrain/Step Time": 8.48352207802236} +{"Pretrain/Learning Rate": 3.8126923536252234e-05, "Pretrain/Loss": 2.024384021759033, "Pretrain/Loss (Raw)": 2.248884439468384, "Pretrain/Step": 6567, "Pretrain/Step Time": 8.480357630178332} +{"Pretrain/Learning Rate": 3.812331047827494e-05, "Pretrain/Loss": 2.027538776397705, "Pretrain/Loss (Raw)": 2.207927703857422, "Pretrain/Step": 6568, "Pretrain/Step Time": 8.482904475182295} +{"Pretrain/Learning Rate": 3.811969704189623e-05, "Pretrain/Loss": 2.024580478668213, "Pretrain/Loss (Raw)": 2.2411234378814697, "Pretrain/Step": 6569, "Pretrain/Step Time": 8.48597002774477} +{"Pretrain/Learning Rate": 3.81160832272203e-05, "Pretrain/Loss": 2.024130344390869, "Pretrain/Loss (Raw)": 1.9739954471588135, "Pretrain/Step": 6570, "Pretrain/Step Time": 8.481270536780357} +{"Pretrain/Learning Rate": 3.811246903435136e-05, "Pretrain/Loss": 2.0250649452209473, "Pretrain/Loss (Raw)": 2.1987576484680176, "Pretrain/Step": 6571, "Pretrain/Step Time": 8.480581665411592} +{"Pretrain/Learning Rate": 3.810885446339362e-05, "Pretrain/Loss": 2.02612566947937, "Pretrain/Loss (Raw)": 2.0974857807159424, "Pretrain/Step": 6572, "Pretrain/Step Time": 8.484029745683074} +{"Pretrain/Learning Rate": 3.8105239514451304e-05, "Pretrain/Loss": 2.02518367767334, "Pretrain/Loss (Raw)": 1.9006236791610718, "Pretrain/Step": 6573, "Pretrain/Step Time": 8.48216538131237} +{"Pretrain/Learning Rate": 3.810162418762864e-05, "Pretrain/Loss": 2.0256409645080566, "Pretrain/Loss (Raw)": 1.9864693880081177, "Pretrain/Step": 6574, "Pretrain/Step Time": 8.48215975239873} +{"Pretrain/Learning Rate": 3.809800848302988e-05, "Pretrain/Loss": 2.0274524688720703, "Pretrain/Loss (Raw)": 2.0789997577667236, "Pretrain/Step": 6575, "Pretrain/Step Time": 8.485546745359898} +{"Pretrain/Learning Rate": 3.8094392400759284e-05, "Pretrain/Loss": 2.027942180633545, "Pretrain/Loss (Raw)": 2.2164697647094727, "Pretrain/Step": 6576, "Pretrain/Step Time": 8.486626755446196} +{"Pretrain/Learning Rate": 3.809077594092111e-05, "Pretrain/Loss": 2.0305185317993164, "Pretrain/Loss (Raw)": 2.2612926959991455, "Pretrain/Step": 6577, "Pretrain/Step Time": 8.485442847013474} +{"Pretrain/Learning Rate": 3.808715910361964e-05, "Pretrain/Loss": 2.0285420417785645, "Pretrain/Loss (Raw)": 1.8830726146697998, "Pretrain/Step": 6578, "Pretrain/Step Time": 8.493141427636147} +{"Pretrain/Learning Rate": 3.808354188895917e-05, "Pretrain/Loss": 2.0287985801696777, "Pretrain/Loss (Raw)": 2.155339479446411, "Pretrain/Step": 6579, "Pretrain/Step Time": 8.49136739037931} +{"Pretrain/Learning Rate": 3.8079924297043985e-05, "Pretrain/Loss": 2.029391288757324, "Pretrain/Loss (Raw)": 2.062574863433838, "Pretrain/Step": 6580, "Pretrain/Step Time": 8.488217666745186} +{"Pretrain/Learning Rate": 3.8076306327978404e-05, "Pretrain/Loss": 2.029528856277466, "Pretrain/Loss (Raw)": 1.9103924036026, "Pretrain/Step": 6581, "Pretrain/Step Time": 8.490094425156713} +{"Pretrain/Learning Rate": 3.807268798186675e-05, "Pretrain/Loss": 2.0299949645996094, "Pretrain/Loss (Raw)": 2.1463332176208496, "Pretrain/Step": 6582, "Pretrain/Step Time": 8.48773997835815} +{"Pretrain/Learning Rate": 3.806906925881335e-05, "Pretrain/Loss": 2.027449131011963, "Pretrain/Loss (Raw)": 1.7490023374557495, "Pretrain/Step": 6583, "Pretrain/Step Time": 8.492720915004611} +{"Pretrain/Learning Rate": 3.806545015892256e-05, "Pretrain/Loss": 2.0295140743255615, "Pretrain/Loss (Raw)": 2.0796122550964355, "Pretrain/Step": 6584, "Pretrain/Step Time": 8.491762759163976} +{"Pretrain/Learning Rate": 3.806183068229872e-05, "Pretrain/Loss": 2.0291190147399902, "Pretrain/Loss (Raw)": 2.0610883235931396, "Pretrain/Step": 6585, "Pretrain/Step Time": 8.49119644984603} +{"Pretrain/Learning Rate": 3.80582108290462e-05, "Pretrain/Loss": 2.029268264770508, "Pretrain/Loss (Raw)": 1.8497109413146973, "Pretrain/Step": 6586, "Pretrain/Step Time": 8.489281836897135} +{"Pretrain/Learning Rate": 3.805459059926937e-05, "Pretrain/Loss": 2.0316286087036133, "Pretrain/Loss (Raw)": 2.173837184906006, "Pretrain/Step": 6587, "Pretrain/Step Time": 8.491283863782883} +{"Pretrain/Learning Rate": 3.8050969993072636e-05, "Pretrain/Loss": 2.031776189804077, "Pretrain/Loss (Raw)": 2.008127450942993, "Pretrain/Step": 6588, "Pretrain/Step Time": 8.493705565109849} +{"Pretrain/Learning Rate": 3.804734901056037e-05, "Pretrain/Loss": 2.033069372177124, "Pretrain/Loss (Raw)": 2.1439521312713623, "Pretrain/Step": 6589, "Pretrain/Step Time": 8.492672497406602} +{"Pretrain/Learning Rate": 3.8043727651837e-05, "Pretrain/Loss": 2.0327558517456055, "Pretrain/Loss (Raw)": 2.0346033573150635, "Pretrain/Step": 6590, "Pretrain/Step Time": 8.490613607689738} +{"Pretrain/Learning Rate": 3.804010591700694e-05, "Pretrain/Loss": 2.0322341918945312, "Pretrain/Loss (Raw)": 2.0663788318634033, "Pretrain/Step": 6591, "Pretrain/Step Time": 8.49098170362413} +{"Pretrain/Learning Rate": 3.803648380617461e-05, "Pretrain/Loss": 2.0317282676696777, "Pretrain/Loss (Raw)": 2.0485336780548096, "Pretrain/Step": 6592, "Pretrain/Step Time": 8.491405550390482} +{"Pretrain/Learning Rate": 3.803286131944447e-05, "Pretrain/Loss": 2.0319881439208984, "Pretrain/Loss (Raw)": 2.03947377204895, "Pretrain/Step": 6593, "Pretrain/Step Time": 8.484987117350101} +{"Pretrain/Learning Rate": 3.8029238456920955e-05, "Pretrain/Loss": 2.033839225769043, "Pretrain/Loss (Raw)": 2.2870922088623047, "Pretrain/Step": 6594, "Pretrain/Step Time": 8.491748690605164} +{"Pretrain/Learning Rate": 3.802561521870854e-05, "Pretrain/Loss": 2.033750057220459, "Pretrain/Loss (Raw)": 1.985447645187378, "Pretrain/Step": 6595, "Pretrain/Step Time": 8.488104116171598} +{"Pretrain/Learning Rate": 3.802199160491169e-05, "Pretrain/Loss": 2.0319089889526367, "Pretrain/Loss (Raw)": 2.008225679397583, "Pretrain/Step": 6596, "Pretrain/Step Time": 8.486378019675612} +{"Pretrain/Learning Rate": 3.801836761563489e-05, "Pretrain/Loss": 2.0334062576293945, "Pretrain/Loss (Raw)": 1.9971933364868164, "Pretrain/Step": 6597, "Pretrain/Step Time": 8.483416676521301} +{"Pretrain/Learning Rate": 3.801474325098263e-05, "Pretrain/Loss": 2.0354185104370117, "Pretrain/Loss (Raw)": 2.3083789348602295, "Pretrain/Step": 6598, "Pretrain/Step Time": 8.484823131933808} +{"Pretrain/Learning Rate": 3.801111851105944e-05, "Pretrain/Loss": 2.0334701538085938, "Pretrain/Loss (Raw)": 1.7503068447113037, "Pretrain/Step": 6599, "Pretrain/Step Time": 8.48332498781383} +{"Pretrain/Learning Rate": 3.800749339596981e-05, "Pretrain/Loss": 2.032794713973999, "Pretrain/Loss (Raw)": 1.8925848007202148, "Pretrain/Step": 6600, "Pretrain/Step Time": 8.482007479295135} +{"Pretrain/Learning Rate": 3.800386790581828e-05, "Pretrain/Loss": 2.032869338989258, "Pretrain/Loss (Raw)": 2.1804497241973877, "Pretrain/Step": 6601, "Pretrain/Step Time": 8.485865607857704} +{"Pretrain/Learning Rate": 3.8000242040709377e-05, "Pretrain/Loss": 2.0342206954956055, "Pretrain/Loss (Raw)": 2.223477363586426, "Pretrain/Step": 6602, "Pretrain/Step Time": 8.482364851981401} +{"Pretrain/Learning Rate": 3.799661580074767e-05, "Pretrain/Loss": 2.036660671234131, "Pretrain/Loss (Raw)": 2.166506052017212, "Pretrain/Step": 6603, "Pretrain/Step Time": 8.483002986758947} +{"Pretrain/Learning Rate": 3.7992989186037705e-05, "Pretrain/Loss": 2.0354814529418945, "Pretrain/Loss (Raw)": 1.9228503704071045, "Pretrain/Step": 6604, "Pretrain/Step Time": 8.47965188138187} +{"Pretrain/Learning Rate": 3.798936219668406e-05, "Pretrain/Loss": 2.035165786743164, "Pretrain/Loss (Raw)": 1.969502568244934, "Pretrain/Step": 6605, "Pretrain/Step Time": 8.480892768129706} +{"Pretrain/Learning Rate": 3.7985734832791305e-05, "Pretrain/Loss": 2.0327224731445312, "Pretrain/Loss (Raw)": 1.972106695175171, "Pretrain/Step": 6606, "Pretrain/Step Time": 8.482100930064917} +{"Pretrain/Learning Rate": 3.798210709446405e-05, "Pretrain/Loss": 2.0315749645233154, "Pretrain/Loss (Raw)": 1.748221516609192, "Pretrain/Step": 6607, "Pretrain/Step Time": 8.480834752321243} +{"Pretrain/Learning Rate": 3.797847898180689e-05, "Pretrain/Loss": 2.0331506729125977, "Pretrain/Loss (Raw)": 2.143141269683838, "Pretrain/Step": 6608, "Pretrain/Step Time": 8.479202177375555} +{"Pretrain/Learning Rate": 3.7974850494924425e-05, "Pretrain/Loss": 2.0349528789520264, "Pretrain/Loss (Raw)": 2.2172625064849854, "Pretrain/Step": 6609, "Pretrain/Step Time": 8.479915793985128} +{"Pretrain/Learning Rate": 3.7971221633921305e-05, "Pretrain/Loss": 2.0352253913879395, "Pretrain/Loss (Raw)": 2.1097466945648193, "Pretrain/Step": 6610, "Pretrain/Step Time": 8.48110993206501} +{"Pretrain/Learning Rate": 3.796759239890214e-05, "Pretrain/Loss": 2.0370266437530518, "Pretrain/Loss (Raw)": 2.1718287467956543, "Pretrain/Step": 6611, "Pretrain/Step Time": 8.484360378235579} +{"Pretrain/Learning Rate": 3.79639627899716e-05, "Pretrain/Loss": 2.0383553504943848, "Pretrain/Loss (Raw)": 2.164468288421631, "Pretrain/Step": 6612, "Pretrain/Step Time": 8.483137687668204} +{"Pretrain/Learning Rate": 3.796033280723433e-05, "Pretrain/Loss": 2.0403952598571777, "Pretrain/Loss (Raw)": 2.2364978790283203, "Pretrain/Step": 6613, "Pretrain/Step Time": 8.483620129525661} +{"Pretrain/Learning Rate": 3.7956702450794994e-05, "Pretrain/Loss": 2.042240619659424, "Pretrain/Loss (Raw)": 2.3314218521118164, "Pretrain/Step": 6614, "Pretrain/Step Time": 8.485336845740676} +{"Pretrain/Learning Rate": 3.795307172075828e-05, "Pretrain/Loss": 2.0428824424743652, "Pretrain/Loss (Raw)": 1.9322901964187622, "Pretrain/Step": 6615, "Pretrain/Step Time": 8.480458891019225} +{"Pretrain/Learning Rate": 3.794944061722888e-05, "Pretrain/Loss": 2.041236400604248, "Pretrain/Loss (Raw)": 1.9351913928985596, "Pretrain/Step": 6616, "Pretrain/Step Time": 8.485183328390121} +{"Pretrain/Learning Rate": 3.7945809140311485e-05, "Pretrain/Loss": 2.038796901702881, "Pretrain/Loss (Raw)": 1.8834850788116455, "Pretrain/Step": 6617, "Pretrain/Step Time": 8.489114355295897} +{"Pretrain/Learning Rate": 3.794217729011081e-05, "Pretrain/Loss": 2.039480686187744, "Pretrain/Loss (Raw)": 2.1566476821899414, "Pretrain/Step": 6618, "Pretrain/Step Time": 8.483523478731513} +{"Pretrain/Learning Rate": 3.793854506673157e-05, "Pretrain/Loss": 2.0429985523223877, "Pretrain/Loss (Raw)": 2.4229629039764404, "Pretrain/Step": 6619, "Pretrain/Step Time": 8.4819161221385} +{"Pretrain/Learning Rate": 3.7934912470278514e-05, "Pretrain/Loss": 2.042623519897461, "Pretrain/Loss (Raw)": 2.0802037715911865, "Pretrain/Step": 6620, "Pretrain/Step Time": 8.48337708413601} +{"Pretrain/Learning Rate": 3.793127950085638e-05, "Pretrain/Loss": 2.043527603149414, "Pretrain/Loss (Raw)": 2.1416425704956055, "Pretrain/Step": 6621, "Pretrain/Step Time": 8.47771724872291} +{"Pretrain/Learning Rate": 3.79276461585699e-05, "Pretrain/Loss": 2.0433311462402344, "Pretrain/Loss (Raw)": 1.8529618978500366, "Pretrain/Step": 6622, "Pretrain/Step Time": 8.481170466169715} +{"Pretrain/Learning Rate": 3.7924012443523864e-05, "Pretrain/Loss": 2.0445094108581543, "Pretrain/Loss (Raw)": 2.0701024532318115, "Pretrain/Step": 6623, "Pretrain/Step Time": 8.479647593572736} +{"Pretrain/Learning Rate": 3.792037835582304e-05, "Pretrain/Loss": 2.044222354888916, "Pretrain/Loss (Raw)": 1.959930419921875, "Pretrain/Step": 6624, "Pretrain/Step Time": 8.47931069880724} +{"Pretrain/Learning Rate": 3.791674389557222e-05, "Pretrain/Loss": 2.0463709831237793, "Pretrain/Loss (Raw)": 2.169137716293335, "Pretrain/Step": 6625, "Pretrain/Step Time": 8.485070198774338} +{"Pretrain/Learning Rate": 3.79131090628762e-05, "Pretrain/Loss": 2.04738187789917, "Pretrain/Loss (Raw)": 2.0421924591064453, "Pretrain/Step": 6626, "Pretrain/Step Time": 8.484995940700173} +{"Pretrain/Learning Rate": 3.790947385783976e-05, "Pretrain/Loss": 2.0486855506896973, "Pretrain/Loss (Raw)": 2.177518844604492, "Pretrain/Step": 6627, "Pretrain/Step Time": 8.488190446048975} +{"Pretrain/Learning Rate": 3.790583828056776e-05, "Pretrain/Loss": 2.0492610931396484, "Pretrain/Loss (Raw)": 1.954264521598816, "Pretrain/Step": 6628, "Pretrain/Step Time": 8.488409761339426} +{"Pretrain/Learning Rate": 3.7902202331165e-05, "Pretrain/Loss": 2.0471062660217285, "Pretrain/Loss (Raw)": 2.029513120651245, "Pretrain/Step": 6629, "Pretrain/Step Time": 8.488486181944609} +{"Pretrain/Learning Rate": 3.789856600973635e-05, "Pretrain/Loss": 2.045153856277466, "Pretrain/Loss (Raw)": 1.9984068870544434, "Pretrain/Step": 6630, "Pretrain/Step Time": 8.487279025837779} +{"Pretrain/Learning Rate": 3.789492931638663e-05, "Pretrain/Loss": 2.043407917022705, "Pretrain/Loss (Raw)": 1.8590755462646484, "Pretrain/Step": 6631, "Pretrain/Step Time": 8.488673724234104} +{"Pretrain/Learning Rate": 3.789129225122071e-05, "Pretrain/Loss": 2.0468411445617676, "Pretrain/Loss (Raw)": 2.3623602390289307, "Pretrain/Step": 6632, "Pretrain/Step Time": 8.490566182881594} +{"Pretrain/Learning Rate": 3.788765481434347e-05, "Pretrain/Loss": 2.0454883575439453, "Pretrain/Loss (Raw)": 1.7979929447174072, "Pretrain/Step": 6633, "Pretrain/Step Time": 8.496736131608486} +{"Pretrain/Learning Rate": 3.7884017005859786e-05, "Pretrain/Loss": 2.0452914237976074, "Pretrain/Loss (Raw)": 1.9398250579833984, "Pretrain/Step": 6634, "Pretrain/Step Time": 8.495858043432236} +{"Pretrain/Learning Rate": 3.7880378825874556e-05, "Pretrain/Loss": 2.0472517013549805, "Pretrain/Loss (Raw)": 2.211451292037964, "Pretrain/Step": 6635, "Pretrain/Step Time": 8.494346300140023} +{"Pretrain/Learning Rate": 3.787674027449269e-05, "Pretrain/Loss": 2.0496044158935547, "Pretrain/Loss (Raw)": 2.098754405975342, "Pretrain/Step": 6636, "Pretrain/Step Time": 8.49564235843718} +{"Pretrain/Learning Rate": 3.787310135181908e-05, "Pretrain/Loss": 2.0517191886901855, "Pretrain/Loss (Raw)": 2.153796672821045, "Pretrain/Step": 6637, "Pretrain/Step Time": 8.494083994999528} +{"Pretrain/Learning Rate": 3.786946205795868e-05, "Pretrain/Loss": 2.051760673522949, "Pretrain/Loss (Raw)": 2.1197516918182373, "Pretrain/Step": 6638, "Pretrain/Step Time": 8.490620514377952} +{"Pretrain/Learning Rate": 3.7865822393016416e-05, "Pretrain/Loss": 2.051323175430298, "Pretrain/Loss (Raw)": 2.086603879928589, "Pretrain/Step": 6639, "Pretrain/Step Time": 8.494859294965863} +{"Pretrain/Learning Rate": 3.786218235709722e-05, "Pretrain/Loss": 2.0512266159057617, "Pretrain/Loss (Raw)": 2.0710721015930176, "Pretrain/Step": 6640, "Pretrain/Step Time": 8.496107753366232} +{"Pretrain/Learning Rate": 3.785854195030607e-05, "Pretrain/Loss": 2.0494918823242188, "Pretrain/Loss (Raw)": 1.9107249975204468, "Pretrain/Step": 6641, "Pretrain/Step Time": 8.501370130106807} +{"Pretrain/Learning Rate": 3.7854901172747936e-05, "Pretrain/Loss": 2.0492000579833984, "Pretrain/Loss (Raw)": 2.1289215087890625, "Pretrain/Step": 6642, "Pretrain/Step Time": 8.49966410920024} +{"Pretrain/Learning Rate": 3.785126002452778e-05, "Pretrain/Loss": 2.0484089851379395, "Pretrain/Loss (Raw)": 1.9201581478118896, "Pretrain/Step": 6643, "Pretrain/Step Time": 8.496499435976148} +{"Pretrain/Learning Rate": 3.7847618505750595e-05, "Pretrain/Loss": 2.048659563064575, "Pretrain/Loss (Raw)": 2.008192777633667, "Pretrain/Step": 6644, "Pretrain/Step Time": 8.49957224726677} +{"Pretrain/Learning Rate": 3.7843976616521394e-05, "Pretrain/Loss": 2.0481057167053223, "Pretrain/Loss (Raw)": 2.0322084426879883, "Pretrain/Step": 6645, "Pretrain/Step Time": 8.502517646178603} +{"Pretrain/Learning Rate": 3.7840334356945183e-05, "Pretrain/Loss": 2.048983097076416, "Pretrain/Loss (Raw)": 2.095062732696533, "Pretrain/Step": 6646, "Pretrain/Step Time": 8.501344060525298} +{"Pretrain/Learning Rate": 3.783669172712698e-05, "Pretrain/Loss": 2.0480873584747314, "Pretrain/Loss (Raw)": 2.0231311321258545, "Pretrain/Step": 6647, "Pretrain/Step Time": 8.502542512491345} +{"Pretrain/Learning Rate": 3.783304872717183e-05, "Pretrain/Loss": 2.045584201812744, "Pretrain/Loss (Raw)": 1.7857310771942139, "Pretrain/Step": 6648, "Pretrain/Step Time": 8.505225909873843} +{"Pretrain/Learning Rate": 3.7829405357184755e-05, "Pretrain/Loss": 2.0466737747192383, "Pretrain/Loss (Raw)": 2.0542221069335938, "Pretrain/Step": 6649, "Pretrain/Step Time": 8.50531317293644} +{"Pretrain/Learning Rate": 3.782576161727083e-05, "Pretrain/Loss": 2.047395706176758, "Pretrain/Loss (Raw)": 1.9086339473724365, "Pretrain/Step": 6650, "Pretrain/Step Time": 8.499403273686767} +{"Pretrain/Learning Rate": 3.78221175075351e-05, "Pretrain/Loss": 2.0474889278411865, "Pretrain/Loss (Raw)": 1.942745566368103, "Pretrain/Step": 6651, "Pretrain/Step Time": 8.501008054241538} +{"Pretrain/Learning Rate": 3.781847302808265e-05, "Pretrain/Loss": 2.0480031967163086, "Pretrain/Loss (Raw)": 2.0463662147521973, "Pretrain/Step": 6652, "Pretrain/Step Time": 8.500863954424858} +{"Pretrain/Learning Rate": 3.781482817901858e-05, "Pretrain/Loss": 2.0491223335266113, "Pretrain/Loss (Raw)": 2.083907127380371, "Pretrain/Step": 6653, "Pretrain/Step Time": 8.50014566630125} +{"Pretrain/Learning Rate": 3.781118296044796e-05, "Pretrain/Loss": 2.048104763031006, "Pretrain/Loss (Raw)": 1.9656914472579956, "Pretrain/Step": 6654, "Pretrain/Step Time": 8.499936101958156} +{"Pretrain/Learning Rate": 3.7807537372475916e-05, "Pretrain/Loss": 2.045457363128662, "Pretrain/Loss (Raw)": 1.8760879039764404, "Pretrain/Step": 6655, "Pretrain/Step Time": 8.502468798309565} +{"Pretrain/Learning Rate": 3.780389141520756e-05, "Pretrain/Loss": 2.0453505516052246, "Pretrain/Loss (Raw)": 2.122934103012085, "Pretrain/Step": 6656, "Pretrain/Step Time": 8.50657314620912} +{"Pretrain/Learning Rate": 3.780024508874802e-05, "Pretrain/Loss": 2.047354221343994, "Pretrain/Loss (Raw)": 2.0407216548919678, "Pretrain/Step": 6657, "Pretrain/Step Time": 8.503699073567986} +{"Pretrain/Learning Rate": 3.779659839320244e-05, "Pretrain/Loss": 2.0462918281555176, "Pretrain/Loss (Raw)": 2.158637523651123, "Pretrain/Step": 6658, "Pretrain/Step Time": 8.509543601423502} +{"Pretrain/Learning Rate": 3.7792951328675965e-05, "Pretrain/Loss": 2.047879219055176, "Pretrain/Loss (Raw)": 2.154015064239502, "Pretrain/Step": 6659, "Pretrain/Step Time": 8.507234930992126} +{"Pretrain/Learning Rate": 3.778930389527375e-05, "Pretrain/Loss": 2.0508151054382324, "Pretrain/Loss (Raw)": 2.2739248275756836, "Pretrain/Step": 6660, "Pretrain/Step Time": 8.507522692903876} +{"Pretrain/Learning Rate": 3.778565609310098e-05, "Pretrain/Loss": 2.0485541820526123, "Pretrain/Loss (Raw)": 2.06872820854187, "Pretrain/Step": 6661, "Pretrain/Step Time": 8.506055826321244} +{"Pretrain/Learning Rate": 3.7782007922262827e-05, "Pretrain/Loss": 2.046966075897217, "Pretrain/Loss (Raw)": 1.9249510765075684, "Pretrain/Step": 6662, "Pretrain/Step Time": 8.504027165472507} +{"Pretrain/Learning Rate": 3.7778359382864495e-05, "Pretrain/Loss": 2.0475847721099854, "Pretrain/Loss (Raw)": 1.913864016532898, "Pretrain/Step": 6663, "Pretrain/Step Time": 8.508016273379326} +{"Pretrain/Learning Rate": 3.777471047501117e-05, "Pretrain/Loss": 2.0492148399353027, "Pretrain/Loss (Raw)": 2.1756999492645264, "Pretrain/Step": 6664, "Pretrain/Step Time": 8.502809749916196} +{"Pretrain/Learning Rate": 3.777106119880808e-05, "Pretrain/Loss": 2.049973249435425, "Pretrain/Loss (Raw)": 2.0409176349639893, "Pretrain/Step": 6665, "Pretrain/Step Time": 8.49464163556695} +{"Pretrain/Learning Rate": 3.7767411554360435e-05, "Pretrain/Loss": 2.0549538135528564, "Pretrain/Loss (Raw)": 2.57664155960083, "Pretrain/Step": 6666, "Pretrain/Step Time": 8.499560540542006} +{"Pretrain/Learning Rate": 3.776376154177348e-05, "Pretrain/Loss": 2.0549628734588623, "Pretrain/Loss (Raw)": 2.1080150604248047, "Pretrain/Step": 6667, "Pretrain/Step Time": 8.49910331144929} +{"Pretrain/Learning Rate": 3.7760111161152465e-05, "Pretrain/Loss": 2.0562446117401123, "Pretrain/Loss (Raw)": 2.223461627960205, "Pretrain/Step": 6668, "Pretrain/Step Time": 8.500726100057364} +{"Pretrain/Learning Rate": 3.775646041260264e-05, "Pretrain/Loss": 2.0545969009399414, "Pretrain/Loss (Raw)": 1.85233736038208, "Pretrain/Step": 6669, "Pretrain/Step Time": 8.501513130962849} +{"Pretrain/Learning Rate": 3.7752809296229255e-05, "Pretrain/Loss": 2.057030200958252, "Pretrain/Loss (Raw)": 2.1424479484558105, "Pretrain/Step": 6670, "Pretrain/Step Time": 8.500787563621998} +{"Pretrain/Learning Rate": 3.774915781213762e-05, "Pretrain/Loss": 2.058525562286377, "Pretrain/Loss (Raw)": 2.063124656677246, "Pretrain/Step": 6671, "Pretrain/Step Time": 8.508185185492039} +{"Pretrain/Learning Rate": 3.7745505960433e-05, "Pretrain/Loss": 2.058312177658081, "Pretrain/Loss (Raw)": 1.9959962368011475, "Pretrain/Step": 6672, "Pretrain/Step Time": 8.504638187587261} +{"Pretrain/Learning Rate": 3.7741853741220714e-05, "Pretrain/Loss": 2.0556774139404297, "Pretrain/Loss (Raw)": 1.8903725147247314, "Pretrain/Step": 6673, "Pretrain/Step Time": 8.502161970362067} +{"Pretrain/Learning Rate": 3.7738201154606044e-05, "Pretrain/Loss": 2.0565457344055176, "Pretrain/Loss (Raw)": 2.120789051055908, "Pretrain/Step": 6674, "Pretrain/Step Time": 8.50486259534955} +{"Pretrain/Learning Rate": 3.773454820069433e-05, "Pretrain/Loss": 2.0557069778442383, "Pretrain/Loss (Raw)": 2.0355334281921387, "Pretrain/Step": 6675, "Pretrain/Step Time": 8.504999356344342} +{"Pretrain/Learning Rate": 3.7730894879590886e-05, "Pretrain/Loss": 2.0575857162475586, "Pretrain/Loss (Raw)": 2.022752046585083, "Pretrain/Step": 6676, "Pretrain/Step Time": 8.499740172177553} +{"Pretrain/Learning Rate": 3.772724119140107e-05, "Pretrain/Loss": 2.057546615600586, "Pretrain/Loss (Raw)": 2.0155115127563477, "Pretrain/Step": 6677, "Pretrain/Step Time": 8.503774048760533} +{"Pretrain/Learning Rate": 3.772358713623023e-05, "Pretrain/Loss": 2.0570144653320312, "Pretrain/Loss (Raw)": 1.8574024438858032, "Pretrain/Step": 6678, "Pretrain/Step Time": 8.50398937240243} +{"Pretrain/Learning Rate": 3.771993271418372e-05, "Pretrain/Loss": 2.058544158935547, "Pretrain/Loss (Raw)": 2.3560988903045654, "Pretrain/Step": 6679, "Pretrain/Step Time": 8.498510539531708} +{"Pretrain/Learning Rate": 3.7716277925366914e-05, "Pretrain/Loss": 2.0599284172058105, "Pretrain/Loss (Raw)": 2.073289155960083, "Pretrain/Step": 6680, "Pretrain/Step Time": 8.49526629038155} +{"Pretrain/Learning Rate": 3.771262276988521e-05, "Pretrain/Loss": 2.059776544570923, "Pretrain/Loss (Raw)": 2.0623939037323, "Pretrain/Step": 6681, "Pretrain/Step Time": 8.493001924827695} +{"Pretrain/Learning Rate": 3.770896724784398e-05, "Pretrain/Loss": 2.061485528945923, "Pretrain/Loss (Raw)": 2.146697998046875, "Pretrain/Step": 6682, "Pretrain/Step Time": 8.493836814537644} +{"Pretrain/Learning Rate": 3.7705311359348635e-05, "Pretrain/Loss": 2.06234073638916, "Pretrain/Loss (Raw)": 2.1541171073913574, "Pretrain/Step": 6683, "Pretrain/Step Time": 8.495174502953887} +{"Pretrain/Learning Rate": 3.770165510450461e-05, "Pretrain/Loss": 2.0623064041137695, "Pretrain/Loss (Raw)": 1.9075007438659668, "Pretrain/Step": 6684, "Pretrain/Step Time": 8.495802210643888} +{"Pretrain/Learning Rate": 3.769799848341731e-05, "Pretrain/Loss": 2.0598812103271484, "Pretrain/Loss (Raw)": 1.8721669912338257, "Pretrain/Step": 6685, "Pretrain/Step Time": 8.491787610575557} +{"Pretrain/Learning Rate": 3.7694341496192166e-05, "Pretrain/Loss": 2.0592875480651855, "Pretrain/Loss (Raw)": 1.895208716392517, "Pretrain/Step": 6686, "Pretrain/Step Time": 8.493789864704013} +{"Pretrain/Learning Rate": 3.769068414293463e-05, "Pretrain/Loss": 2.0566046237945557, "Pretrain/Loss (Raw)": 1.901519775390625, "Pretrain/Step": 6687, "Pretrain/Step Time": 8.492150513455272} +{"Pretrain/Learning Rate": 3.768702642375017e-05, "Pretrain/Loss": 2.0534844398498535, "Pretrain/Loss (Raw)": 1.6666415929794312, "Pretrain/Step": 6688, "Pretrain/Step Time": 8.49266748689115} +{"Pretrain/Learning Rate": 3.768336833874425e-05, "Pretrain/Loss": 2.051868438720703, "Pretrain/Loss (Raw)": 1.8532873392105103, "Pretrain/Step": 6689, "Pretrain/Step Time": 8.495017614215612} +{"Pretrain/Learning Rate": 3.767970988802235e-05, "Pretrain/Loss": 2.0536928176879883, "Pretrain/Loss (Raw)": 2.1515958309173584, "Pretrain/Step": 6690, "Pretrain/Step Time": 8.495707528665662} +{"Pretrain/Learning Rate": 3.7676051071689944e-05, "Pretrain/Loss": 2.0537467002868652, "Pretrain/Loss (Raw)": 2.1688876152038574, "Pretrain/Step": 6691, "Pretrain/Step Time": 8.495018064975739} +{"Pretrain/Learning Rate": 3.767239188985254e-05, "Pretrain/Loss": 2.055205821990967, "Pretrain/Loss (Raw)": 2.222993850708008, "Pretrain/Step": 6692, "Pretrain/Step Time": 8.492566766217351} +{"Pretrain/Learning Rate": 3.7668732342615654e-05, "Pretrain/Loss": 2.056408405303955, "Pretrain/Loss (Raw)": 2.0931005477905273, "Pretrain/Step": 6693, "Pretrain/Step Time": 8.49519537575543} +{"Pretrain/Learning Rate": 3.7665072430084804e-05, "Pretrain/Loss": 2.0562820434570312, "Pretrain/Loss (Raw)": 2.000147819519043, "Pretrain/Step": 6694, "Pretrain/Step Time": 8.493524242192507} +{"Pretrain/Learning Rate": 3.766141215236552e-05, "Pretrain/Loss": 2.05434513092041, "Pretrain/Loss (Raw)": 2.0009243488311768, "Pretrain/Step": 6695, "Pretrain/Step Time": 8.499282833188772} +{"Pretrain/Learning Rate": 3.7657751509563335e-05, "Pretrain/Loss": 2.054279088973999, "Pretrain/Loss (Raw)": 2.199486017227173, "Pretrain/Step": 6696, "Pretrain/Step Time": 8.491831803694367} +{"Pretrain/Learning Rate": 3.765409050178381e-05, "Pretrain/Loss": 2.0530483722686768, "Pretrain/Loss (Raw)": 2.0835859775543213, "Pretrain/Step": 6697, "Pretrain/Step Time": 8.493288638070226} +{"Pretrain/Learning Rate": 3.7650429129132504e-05, "Pretrain/Loss": 2.053492784500122, "Pretrain/Loss (Raw)": 2.0308871269226074, "Pretrain/Step": 6698, "Pretrain/Step Time": 8.4974568746984} +{"Pretrain/Learning Rate": 3.7646767391715e-05, "Pretrain/Loss": 2.052739143371582, "Pretrain/Loss (Raw)": 2.102280378341675, "Pretrain/Step": 6699, "Pretrain/Step Time": 8.493726525455713} +{"Pretrain/Learning Rate": 3.764310528963687e-05, "Pretrain/Loss": 2.0526347160339355, "Pretrain/Loss (Raw)": 2.08412504196167, "Pretrain/Step": 6700, "Pretrain/Step Time": 8.495805138722062} +{"Pretrain/Learning Rate": 3.763944282300371e-05, "Pretrain/Loss": 2.055509090423584, "Pretrain/Loss (Raw)": 2.2685375213623047, "Pretrain/Step": 6701, "Pretrain/Step Time": 8.495925407856703} +{"Pretrain/Learning Rate": 3.763577999192113e-05, "Pretrain/Loss": 2.0549118518829346, "Pretrain/Loss (Raw)": 1.9100371599197388, "Pretrain/Step": 6702, "Pretrain/Step Time": 8.493799466639757} +{"Pretrain/Learning Rate": 3.763211679649473e-05, "Pretrain/Loss": 2.053337812423706, "Pretrain/Loss (Raw)": 1.8775197267532349, "Pretrain/Step": 6703, "Pretrain/Step Time": 8.494020096957684} +{"Pretrain/Learning Rate": 3.762845323683016e-05, "Pretrain/Loss": 2.051511764526367, "Pretrain/Loss (Raw)": 1.9827587604522705, "Pretrain/Step": 6704, "Pretrain/Step Time": 8.490270314738154} +{"Pretrain/Learning Rate": 3.762478931303304e-05, "Pretrain/Loss": 2.049795627593994, "Pretrain/Loss (Raw)": 2.0415780544281006, "Pretrain/Step": 6705, "Pretrain/Step Time": 8.494392905384302} +{"Pretrain/Learning Rate": 3.762112502520902e-05, "Pretrain/Loss": 2.0498998165130615, "Pretrain/Loss (Raw)": 1.8964426517486572, "Pretrain/Step": 6706, "Pretrain/Step Time": 8.487820541486144} +{"Pretrain/Learning Rate": 3.761746037346375e-05, "Pretrain/Loss": 2.049029588699341, "Pretrain/Loss (Raw)": 2.043945074081421, "Pretrain/Step": 6707, "Pretrain/Step Time": 8.494412399828434} +{"Pretrain/Learning Rate": 3.761379535790291e-05, "Pretrain/Loss": 2.0496573448181152, "Pretrain/Loss (Raw)": 2.142927885055542, "Pretrain/Step": 6708, "Pretrain/Step Time": 8.492696957662702} +{"Pretrain/Learning Rate": 3.761012997863218e-05, "Pretrain/Loss": 2.0518240928649902, "Pretrain/Loss (Raw)": 2.1877474784851074, "Pretrain/Step": 6709, "Pretrain/Step Time": 8.493341211229563} +{"Pretrain/Learning Rate": 3.760646423575724e-05, "Pretrain/Loss": 2.050921678543091, "Pretrain/Loss (Raw)": 2.030825138092041, "Pretrain/Step": 6710, "Pretrain/Step Time": 8.497173126786947} +{"Pretrain/Learning Rate": 3.760279812938379e-05, "Pretrain/Loss": 2.055306911468506, "Pretrain/Loss (Raw)": 2.310307025909424, "Pretrain/Step": 6711, "Pretrain/Step Time": 8.493787325918674} +{"Pretrain/Learning Rate": 3.759913165961753e-05, "Pretrain/Loss": 2.0554280281066895, "Pretrain/Loss (Raw)": 2.0950803756713867, "Pretrain/Step": 6712, "Pretrain/Step Time": 8.494330246001482} +{"Pretrain/Learning Rate": 3.75954648265642e-05, "Pretrain/Loss": 2.056009531021118, "Pretrain/Loss (Raw)": 2.1355535984039307, "Pretrain/Step": 6713, "Pretrain/Step Time": 8.496410159394145} +{"Pretrain/Learning Rate": 3.7591797630329515e-05, "Pretrain/Loss": 2.058131456375122, "Pretrain/Loss (Raw)": 2.121309757232666, "Pretrain/Step": 6714, "Pretrain/Step Time": 8.497092206031084} +{"Pretrain/Learning Rate": 3.758813007101922e-05, "Pretrain/Loss": 2.056516408920288, "Pretrain/Loss (Raw)": 1.9671247005462646, "Pretrain/Step": 6715, "Pretrain/Step Time": 8.493668207898736} +{"Pretrain/Learning Rate": 3.758446214873909e-05, "Pretrain/Loss": 2.0566563606262207, "Pretrain/Loss (Raw)": 2.0260491371154785, "Pretrain/Step": 6716, "Pretrain/Step Time": 8.494756359606981} +{"Pretrain/Learning Rate": 3.7580793863594846e-05, "Pretrain/Loss": 2.057302474975586, "Pretrain/Loss (Raw)": 2.2266294956207275, "Pretrain/Step": 6717, "Pretrain/Step Time": 8.498131647706032} +{"Pretrain/Learning Rate": 3.7577125215692276e-05, "Pretrain/Loss": 2.0594544410705566, "Pretrain/Loss (Raw)": 2.3100693225860596, "Pretrain/Step": 6718, "Pretrain/Step Time": 8.496645212173462} +{"Pretrain/Learning Rate": 3.757345620513718e-05, "Pretrain/Loss": 2.0593137741088867, "Pretrain/Loss (Raw)": 2.048379898071289, "Pretrain/Step": 6719, "Pretrain/Step Time": 8.496385753154755} +{"Pretrain/Learning Rate": 3.756978683203532e-05, "Pretrain/Loss": 2.0586624145507812, "Pretrain/Loss (Raw)": 1.9651507139205933, "Pretrain/Step": 6720, "Pretrain/Step Time": 8.495778677985072} +{"Pretrain/Learning Rate": 3.7566117096492536e-05, "Pretrain/Loss": 2.059650421142578, "Pretrain/Loss (Raw)": 2.1659045219421387, "Pretrain/Step": 6721, "Pretrain/Step Time": 8.495512176305056} +{"Pretrain/Learning Rate": 3.756244699861462e-05, "Pretrain/Loss": 2.0578482151031494, "Pretrain/Loss (Raw)": 2.0564401149749756, "Pretrain/Step": 6722, "Pretrain/Step Time": 8.492474844679236} +{"Pretrain/Learning Rate": 3.75587765385074e-05, "Pretrain/Loss": 2.057314872741699, "Pretrain/Loss (Raw)": 1.917158603668213, "Pretrain/Step": 6723, "Pretrain/Step Time": 8.494721829891205} +{"Pretrain/Learning Rate": 3.7555105716276704e-05, "Pretrain/Loss": 2.057745933532715, "Pretrain/Loss (Raw)": 2.0634171962738037, "Pretrain/Step": 6724, "Pretrain/Step Time": 8.495561938732862} +{"Pretrain/Learning Rate": 3.7551434532028395e-05, "Pretrain/Loss": 2.0563817024230957, "Pretrain/Loss (Raw)": 1.8225607872009277, "Pretrain/Step": 6725, "Pretrain/Step Time": 8.49939908273518} +{"Pretrain/Learning Rate": 3.754776298586832e-05, "Pretrain/Loss": 2.0540990829467773, "Pretrain/Loss (Raw)": 2.0162155628204346, "Pretrain/Step": 6726, "Pretrain/Step Time": 8.495867818593979} +{"Pretrain/Learning Rate": 3.754409107790234e-05, "Pretrain/Loss": 2.0549416542053223, "Pretrain/Loss (Raw)": 1.8581737279891968, "Pretrain/Step": 6727, "Pretrain/Step Time": 8.498909030109644} +{"Pretrain/Learning Rate": 3.754041880823633e-05, "Pretrain/Loss": 2.0569305419921875, "Pretrain/Loss (Raw)": 2.147153615951538, "Pretrain/Step": 6728, "Pretrain/Step Time": 8.493386989459395} +{"Pretrain/Learning Rate": 3.75367461769762e-05, "Pretrain/Loss": 2.054279327392578, "Pretrain/Loss (Raw)": 1.8410990238189697, "Pretrain/Step": 6729, "Pretrain/Step Time": 8.493950480595231} +{"Pretrain/Learning Rate": 3.753307318422782e-05, "Pretrain/Loss": 2.0540103912353516, "Pretrain/Loss (Raw)": 2.189056396484375, "Pretrain/Step": 6730, "Pretrain/Step Time": 8.49736064299941} +{"Pretrain/Learning Rate": 3.752939983009712e-05, "Pretrain/Loss": 2.0533370971679688, "Pretrain/Loss (Raw)": 2.0803112983703613, "Pretrain/Step": 6731, "Pretrain/Step Time": 8.497413352131844} +{"Pretrain/Learning Rate": 3.7525726114690006e-05, "Pretrain/Loss": 2.053880214691162, "Pretrain/Loss (Raw)": 1.992384910583496, "Pretrain/Step": 6732, "Pretrain/Step Time": 8.49850358068943} +{"Pretrain/Learning Rate": 3.7522052038112396e-05, "Pretrain/Loss": 2.054807424545288, "Pretrain/Loss (Raw)": 2.0881640911102295, "Pretrain/Step": 6733, "Pretrain/Step Time": 8.496332040056586} +{"Pretrain/Learning Rate": 3.7518377600470256e-05, "Pretrain/Loss": 2.054434061050415, "Pretrain/Loss (Raw)": 1.9243125915527344, "Pretrain/Step": 6734, "Pretrain/Step Time": 8.496281007304788} +{"Pretrain/Learning Rate": 3.751470280186952e-05, "Pretrain/Loss": 2.0574841499328613, "Pretrain/Loss (Raw)": 2.138627767562866, "Pretrain/Step": 6735, "Pretrain/Step Time": 8.497955568134785} +{"Pretrain/Learning Rate": 3.7511027642416155e-05, "Pretrain/Loss": 2.0571036338806152, "Pretrain/Loss (Raw)": 2.094433069229126, "Pretrain/Step": 6736, "Pretrain/Step Time": 8.49646839313209} +{"Pretrain/Learning Rate": 3.750735212221612e-05, "Pretrain/Loss": 2.0564441680908203, "Pretrain/Loss (Raw)": 2.1328701972961426, "Pretrain/Step": 6737, "Pretrain/Step Time": 8.493652550503612} +{"Pretrain/Learning Rate": 3.750367624137541e-05, "Pretrain/Loss": 2.0556282997131348, "Pretrain/Loss (Raw)": 2.005323648452759, "Pretrain/Step": 6738, "Pretrain/Step Time": 8.49110497161746} +{"Pretrain/Learning Rate": 3.7500000000000003e-05, "Pretrain/Loss": 2.054368019104004, "Pretrain/Loss (Raw)": 2.010514259338379, "Pretrain/Step": 6739, "Pretrain/Step Time": 8.492678510025144} +{"Pretrain/Learning Rate": 3.749632339819591e-05, "Pretrain/Loss": 2.0520830154418945, "Pretrain/Loss (Raw)": 1.8719791173934937, "Pretrain/Step": 6740, "Pretrain/Step Time": 8.49467994645238} +{"Pretrain/Learning Rate": 3.749264643606914e-05, "Pretrain/Loss": 2.0489020347595215, "Pretrain/Loss (Raw)": 1.8293499946594238, "Pretrain/Step": 6741, "Pretrain/Step Time": 8.498382221907377} +{"Pretrain/Learning Rate": 3.748896911372572e-05, "Pretrain/Loss": 2.046144485473633, "Pretrain/Loss (Raw)": 1.978416085243225, "Pretrain/Step": 6742, "Pretrain/Step Time": 8.495152605697513} +{"Pretrain/Learning Rate": 3.7485291431271684e-05, "Pretrain/Loss": 2.0475597381591797, "Pretrain/Loss (Raw)": 2.1134402751922607, "Pretrain/Step": 6743, "Pretrain/Step Time": 8.496876373887062} +{"Pretrain/Learning Rate": 3.748161338881307e-05, "Pretrain/Loss": 2.0475847721099854, "Pretrain/Loss (Raw)": 1.9384084939956665, "Pretrain/Step": 6744, "Pretrain/Step Time": 8.495240798220038} +{"Pretrain/Learning Rate": 3.747793498645593e-05, "Pretrain/Loss": 2.0479583740234375, "Pretrain/Loss (Raw)": 1.9313215017318726, "Pretrain/Step": 6745, "Pretrain/Step Time": 8.491255750879645} +{"Pretrain/Learning Rate": 3.7474256224306326e-05, "Pretrain/Loss": 2.0452518463134766, "Pretrain/Loss (Raw)": 1.81022047996521, "Pretrain/Step": 6746, "Pretrain/Step Time": 8.496052782982588} +{"Pretrain/Learning Rate": 3.7470577102470336e-05, "Pretrain/Loss": 2.0414700508117676, "Pretrain/Loss (Raw)": 1.9388707876205444, "Pretrain/Step": 6747, "Pretrain/Step Time": 8.495814625173807} +{"Pretrain/Learning Rate": 3.746689762105407e-05, "Pretrain/Loss": 2.0400681495666504, "Pretrain/Loss (Raw)": 1.9007858037948608, "Pretrain/Step": 6748, "Pretrain/Step Time": 8.49524873495102} +{"Pretrain/Learning Rate": 3.7463217780163576e-05, "Pretrain/Loss": 2.038785457611084, "Pretrain/Loss (Raw)": 1.977458119392395, "Pretrain/Step": 6749, "Pretrain/Step Time": 8.497608534991741} +{"Pretrain/Learning Rate": 3.7459537579904984e-05, "Pretrain/Loss": 2.0401017665863037, "Pretrain/Loss (Raw)": 2.0214359760284424, "Pretrain/Step": 6750, "Pretrain/Step Time": 8.496561331674457} +{"Pretrain/Learning Rate": 3.7455857020384414e-05, "Pretrain/Loss": 2.040287494659424, "Pretrain/Loss (Raw)": 2.09389066696167, "Pretrain/Step": 6751, "Pretrain/Step Time": 8.499261377379298} +{"Pretrain/Learning Rate": 3.7452176101707984e-05, "Pretrain/Loss": 2.0416693687438965, "Pretrain/Loss (Raw)": 2.1367926597595215, "Pretrain/Step": 6752, "Pretrain/Step Time": 8.499518385156989} +{"Pretrain/Learning Rate": 3.744849482398185e-05, "Pretrain/Loss": 2.0407028198242188, "Pretrain/Loss (Raw)": 2.0454089641571045, "Pretrain/Step": 6753, "Pretrain/Step Time": 8.493900524452329} +{"Pretrain/Learning Rate": 3.744481318731213e-05, "Pretrain/Loss": 2.04064679145813, "Pretrain/Loss (Raw)": 2.0350427627563477, "Pretrain/Step": 6754, "Pretrain/Step Time": 8.494768898934126} +{"Pretrain/Learning Rate": 3.7441131191804995e-05, "Pretrain/Loss": 2.042360305786133, "Pretrain/Loss (Raw)": 2.396820068359375, "Pretrain/Step": 6755, "Pretrain/Step Time": 8.49139291420579} +{"Pretrain/Learning Rate": 3.7437448837566615e-05, "Pretrain/Loss": 2.0418787002563477, "Pretrain/Loss (Raw)": 1.8926347494125366, "Pretrain/Step": 6756, "Pretrain/Step Time": 8.496465183794498} +{"Pretrain/Learning Rate": 3.743376612470316e-05, "Pretrain/Loss": 2.04001522064209, "Pretrain/Loss (Raw)": 1.7909960746765137, "Pretrain/Step": 6757, "Pretrain/Step Time": 8.498980458825827} +{"Pretrain/Learning Rate": 3.743008305332084e-05, "Pretrain/Loss": 2.0408496856689453, "Pretrain/Loss (Raw)": 2.1052064895629883, "Pretrain/Step": 6758, "Pretrain/Step Time": 8.496739035472274} +{"Pretrain/Learning Rate": 3.742639962352582e-05, "Pretrain/Loss": 2.042375087738037, "Pretrain/Loss (Raw)": 2.05431866645813, "Pretrain/Step": 6759, "Pretrain/Step Time": 8.49547016993165} +{"Pretrain/Learning Rate": 3.742271583542433e-05, "Pretrain/Loss": 2.0388643741607666, "Pretrain/Loss (Raw)": 1.9129937887191772, "Pretrain/Step": 6760, "Pretrain/Step Time": 8.4947503618896} +{"Pretrain/Learning Rate": 3.7419031689122594e-05, "Pretrain/Loss": 2.038912057876587, "Pretrain/Loss (Raw)": 1.8041105270385742, "Pretrain/Step": 6761, "Pretrain/Step Time": 8.486956100910902} +{"Pretrain/Learning Rate": 3.741534718472682e-05, "Pretrain/Loss": 2.0411906242370605, "Pretrain/Loss (Raw)": 2.2314653396606445, "Pretrain/Step": 6762, "Pretrain/Step Time": 8.487957207486033} +{"Pretrain/Learning Rate": 3.741166232234328e-05, "Pretrain/Loss": 2.0396344661712646, "Pretrain/Loss (Raw)": 2.012279510498047, "Pretrain/Step": 6763, "Pretrain/Step Time": 8.48949215747416} +{"Pretrain/Learning Rate": 3.74079771020782e-05, "Pretrain/Loss": 2.0392045974731445, "Pretrain/Loss (Raw)": 2.0437278747558594, "Pretrain/Step": 6764, "Pretrain/Step Time": 8.490376265719533} +{"Pretrain/Learning Rate": 3.740429152403785e-05, "Pretrain/Loss": 2.037510633468628, "Pretrain/Loss (Raw)": 1.936972737312317, "Pretrain/Step": 6765, "Pretrain/Step Time": 8.493582144379616} +{"Pretrain/Learning Rate": 3.740060558832849e-05, "Pretrain/Loss": 2.0363993644714355, "Pretrain/Loss (Raw)": 1.9774969816207886, "Pretrain/Step": 6766, "Pretrain/Step Time": 8.49300779774785} +{"Pretrain/Learning Rate": 3.739691929505641e-05, "Pretrain/Loss": 2.036463499069214, "Pretrain/Loss (Raw)": 2.0948195457458496, "Pretrain/Step": 6767, "Pretrain/Step Time": 8.489447761327028} +{"Pretrain/Learning Rate": 3.7393232644327914e-05, "Pretrain/Loss": 2.0362682342529297, "Pretrain/Loss (Raw)": 2.04606556892395, "Pretrain/Step": 6768, "Pretrain/Step Time": 8.495440924540162} +{"Pretrain/Learning Rate": 3.738954563624928e-05, "Pretrain/Loss": 2.0346834659576416, "Pretrain/Loss (Raw)": 1.7078857421875, "Pretrain/Step": 6769, "Pretrain/Step Time": 8.49328131787479} +{"Pretrain/Learning Rate": 3.738585827092683e-05, "Pretrain/Loss": 2.032620429992676, "Pretrain/Loss (Raw)": 1.8648309707641602, "Pretrain/Step": 6770, "Pretrain/Step Time": 8.49078170210123} +{"Pretrain/Learning Rate": 3.738217054846689e-05, "Pretrain/Loss": 2.0366666316986084, "Pretrain/Loss (Raw)": 2.438103675842285, "Pretrain/Step": 6771, "Pretrain/Step Time": 8.491877956315875} +{"Pretrain/Learning Rate": 3.7378482468975796e-05, "Pretrain/Loss": 2.03548526763916, "Pretrain/Loss (Raw)": 1.8569527864456177, "Pretrain/Step": 6772, "Pretrain/Step Time": 8.492064613848925} +{"Pretrain/Learning Rate": 3.737479403255989e-05, "Pretrain/Loss": 2.036440372467041, "Pretrain/Loss (Raw)": 2.1544675827026367, "Pretrain/Step": 6773, "Pretrain/Step Time": 8.491506973281503} +{"Pretrain/Learning Rate": 3.737110523932551e-05, "Pretrain/Loss": 2.035670280456543, "Pretrain/Loss (Raw)": 1.996497631072998, "Pretrain/Step": 6774, "Pretrain/Step Time": 8.490429043769836} +{"Pretrain/Learning Rate": 3.7367416089379047e-05, "Pretrain/Loss": 2.035031795501709, "Pretrain/Loss (Raw)": 1.9414247274398804, "Pretrain/Step": 6775, "Pretrain/Step Time": 8.490976924076676} +{"Pretrain/Learning Rate": 3.7363726582826844e-05, "Pretrain/Loss": 2.0375800132751465, "Pretrain/Loss (Raw)": 2.111877202987671, "Pretrain/Step": 6776, "Pretrain/Step Time": 8.491278314962983} +{"Pretrain/Learning Rate": 3.736003671977531e-05, "Pretrain/Loss": 2.0371506214141846, "Pretrain/Loss (Raw)": 1.999274730682373, "Pretrain/Step": 6777, "Pretrain/Step Time": 8.491924742236733} +{"Pretrain/Learning Rate": 3.735634650033082e-05, "Pretrain/Loss": 2.039273500442505, "Pretrain/Loss (Raw)": 2.1803500652313232, "Pretrain/Step": 6778, "Pretrain/Step Time": 8.489674923941493} +{"Pretrain/Learning Rate": 3.73526559245998e-05, "Pretrain/Loss": 2.0383780002593994, "Pretrain/Loss (Raw)": 1.8281344175338745, "Pretrain/Step": 6779, "Pretrain/Step Time": 8.485746851190925} +{"Pretrain/Learning Rate": 3.734896499268866e-05, "Pretrain/Loss": 2.038418769836426, "Pretrain/Loss (Raw)": 2.051602602005005, "Pretrain/Step": 6780, "Pretrain/Step Time": 8.490704003721476} +{"Pretrain/Learning Rate": 3.73452737047038e-05, "Pretrain/Loss": 2.037951946258545, "Pretrain/Loss (Raw)": 2.024127244949341, "Pretrain/Step": 6781, "Pretrain/Step Time": 8.492665460333228} +{"Pretrain/Learning Rate": 3.734158206075169e-05, "Pretrain/Loss": 2.0386388301849365, "Pretrain/Loss (Raw)": 2.0536019802093506, "Pretrain/Step": 6782, "Pretrain/Step Time": 8.489721307531} +{"Pretrain/Learning Rate": 3.7337890060938755e-05, "Pretrain/Loss": 2.0408883094787598, "Pretrain/Loss (Raw)": 2.164010524749756, "Pretrain/Step": 6783, "Pretrain/Step Time": 8.489120731130242} +{"Pretrain/Learning Rate": 3.733419770537147e-05, "Pretrain/Loss": 2.0403342247009277, "Pretrain/Loss (Raw)": 2.052032232284546, "Pretrain/Step": 6784, "Pretrain/Step Time": 8.490745954215527} +{"Pretrain/Learning Rate": 3.733050499415628e-05, "Pretrain/Loss": 2.040661334991455, "Pretrain/Loss (Raw)": 2.082585573196411, "Pretrain/Step": 6785, "Pretrain/Step Time": 8.489830251783133} +{"Pretrain/Learning Rate": 3.7326811927399664e-05, "Pretrain/Loss": 2.039707899093628, "Pretrain/Loss (Raw)": 2.0366013050079346, "Pretrain/Step": 6786, "Pretrain/Step Time": 8.48187737353146} +{"Pretrain/Learning Rate": 3.7323118505208123e-05, "Pretrain/Loss": 2.0409369468688965, "Pretrain/Loss (Raw)": 2.3113605976104736, "Pretrain/Step": 6787, "Pretrain/Step Time": 8.484443306922913} +{"Pretrain/Learning Rate": 3.7319424727688146e-05, "Pretrain/Loss": 2.0400333404541016, "Pretrain/Loss (Raw)": 2.158240556716919, "Pretrain/Step": 6788, "Pretrain/Step Time": 8.484326904639602} +{"Pretrain/Learning Rate": 3.731573059494624e-05, "Pretrain/Loss": 2.041496992111206, "Pretrain/Loss (Raw)": 2.256058692932129, "Pretrain/Step": 6789, "Pretrain/Step Time": 8.483522027730942} +{"Pretrain/Learning Rate": 3.7312036107088935e-05, "Pretrain/Loss": 2.043285846710205, "Pretrain/Loss (Raw)": 2.153934955596924, "Pretrain/Step": 6790, "Pretrain/Step Time": 8.485819218680263} +{"Pretrain/Learning Rate": 3.7308341264222735e-05, "Pretrain/Loss": 2.0455288887023926, "Pretrain/Loss (Raw)": 2.2009851932525635, "Pretrain/Step": 6791, "Pretrain/Step Time": 8.484410548582673} +{"Pretrain/Learning Rate": 3.7304646066454195e-05, "Pretrain/Loss": 2.0435292720794678, "Pretrain/Loss (Raw)": 1.919749140739441, "Pretrain/Step": 6792, "Pretrain/Step Time": 8.485941033810377} +{"Pretrain/Learning Rate": 3.730095051388986e-05, "Pretrain/Loss": 2.0440988540649414, "Pretrain/Loss (Raw)": 2.1138288974761963, "Pretrain/Step": 6793, "Pretrain/Step Time": 8.487224334850907} +{"Pretrain/Learning Rate": 3.729725460663629e-05, "Pretrain/Loss": 2.0389981269836426, "Pretrain/Loss (Raw)": 1.9237135648727417, "Pretrain/Step": 6794, "Pretrain/Step Time": 8.48253477923572} +{"Pretrain/Learning Rate": 3.729355834480006e-05, "Pretrain/Loss": 2.0373849868774414, "Pretrain/Loss (Raw)": 1.901561975479126, "Pretrain/Step": 6795, "Pretrain/Step Time": 8.484570503234863} +{"Pretrain/Learning Rate": 3.728986172848773e-05, "Pretrain/Loss": 2.0353970527648926, "Pretrain/Loss (Raw)": 1.9690018892288208, "Pretrain/Step": 6796, "Pretrain/Step Time": 8.480712024495006} +{"Pretrain/Learning Rate": 3.7286164757805904e-05, "Pretrain/Loss": 2.035536050796509, "Pretrain/Loss (Raw)": 1.870123267173767, "Pretrain/Step": 6797, "Pretrain/Step Time": 8.485795391723514} +{"Pretrain/Learning Rate": 3.728246743286118e-05, "Pretrain/Loss": 2.0323281288146973, "Pretrain/Loss (Raw)": 1.7318392992019653, "Pretrain/Step": 6798, "Pretrain/Step Time": 8.488877048715949} +{"Pretrain/Learning Rate": 3.727876975376016e-05, "Pretrain/Loss": 2.032106399536133, "Pretrain/Loss (Raw)": 2.0347254276275635, "Pretrain/Step": 6799, "Pretrain/Step Time": 8.482807341963053} +{"Pretrain/Learning Rate": 3.727507172060948e-05, "Pretrain/Loss": 2.0315258502960205, "Pretrain/Loss (Raw)": 1.9216961860656738, "Pretrain/Step": 6800, "Pretrain/Step Time": 8.484640277922153} +{"Pretrain/Learning Rate": 3.727137333351576e-05, "Pretrain/Loss": 2.0341649055480957, "Pretrain/Loss (Raw)": 2.2281835079193115, "Pretrain/Step": 6801, "Pretrain/Step Time": 8.484842993319035} +{"Pretrain/Learning Rate": 3.726767459258563e-05, "Pretrain/Loss": 2.0357675552368164, "Pretrain/Loss (Raw)": 2.325900077819824, "Pretrain/Step": 6802, "Pretrain/Step Time": 8.486731326207519} +{"Pretrain/Learning Rate": 3.7263975497925756e-05, "Pretrain/Loss": 2.03519868850708, "Pretrain/Loss (Raw)": 1.9627254009246826, "Pretrain/Step": 6803, "Pretrain/Step Time": 8.488673210144043} +{"Pretrain/Learning Rate": 3.726027604964279e-05, "Pretrain/Loss": 2.0343832969665527, "Pretrain/Loss (Raw)": 1.9183745384216309, "Pretrain/Step": 6804, "Pretrain/Step Time": 8.489366997033358} +{"Pretrain/Learning Rate": 3.7256576247843425e-05, "Pretrain/Loss": 2.034400701522827, "Pretrain/Loss (Raw)": 2.0177650451660156, "Pretrain/Step": 6805, "Pretrain/Step Time": 8.483502706512809} +{"Pretrain/Learning Rate": 3.7252876092634306e-05, "Pretrain/Loss": 2.036785364151001, "Pretrain/Loss (Raw)": 2.1626408100128174, "Pretrain/Step": 6806, "Pretrain/Step Time": 8.486309232190251} +{"Pretrain/Learning Rate": 3.724917558412215e-05, "Pretrain/Loss": 2.0332322120666504, "Pretrain/Loss (Raw)": 1.901313066482544, "Pretrain/Step": 6807, "Pretrain/Step Time": 8.487246399745345} +{"Pretrain/Learning Rate": 3.724547472241365e-05, "Pretrain/Loss": 2.0312464237213135, "Pretrain/Loss (Raw)": 1.8190808296203613, "Pretrain/Step": 6808, "Pretrain/Step Time": 8.483909467235208} +{"Pretrain/Learning Rate": 3.7241773507615515e-05, "Pretrain/Loss": 2.028445243835449, "Pretrain/Loss (Raw)": 1.7038551568984985, "Pretrain/Step": 6809, "Pretrain/Step Time": 8.489913506433368} +{"Pretrain/Learning Rate": 3.723807193983447e-05, "Pretrain/Loss": 2.028831958770752, "Pretrain/Loss (Raw)": 2.196162462234497, "Pretrain/Step": 6810, "Pretrain/Step Time": 8.487515177577734} +{"Pretrain/Learning Rate": 3.7234370019177255e-05, "Pretrain/Loss": 2.0282318592071533, "Pretrain/Loss (Raw)": 2.0773308277130127, "Pretrain/Step": 6811, "Pretrain/Step Time": 8.488585095852613} +{"Pretrain/Learning Rate": 3.72306677457506e-05, "Pretrain/Loss": 2.0308265686035156, "Pretrain/Loss (Raw)": 2.239619255065918, "Pretrain/Step": 6812, "Pretrain/Step Time": 8.488254332914948} +{"Pretrain/Learning Rate": 3.7226965119661265e-05, "Pretrain/Loss": 2.0320961475372314, "Pretrain/Loss (Raw)": 2.034665822982788, "Pretrain/Step": 6813, "Pretrain/Step Time": 8.48943491652608} +{"Pretrain/Learning Rate": 3.722326214101601e-05, "Pretrain/Loss": 2.0334558486938477, "Pretrain/Loss (Raw)": 2.0692496299743652, "Pretrain/Step": 6814, "Pretrain/Step Time": 8.488376909866929} +{"Pretrain/Learning Rate": 3.7219558809921605e-05, "Pretrain/Loss": 2.0336594581604004, "Pretrain/Loss (Raw)": 1.927593469619751, "Pretrain/Step": 6815, "Pretrain/Step Time": 8.488200901076198} +{"Pretrain/Learning Rate": 3.721585512648484e-05, "Pretrain/Loss": 2.0359463691711426, "Pretrain/Loss (Raw)": 1.9593379497528076, "Pretrain/Step": 6816, "Pretrain/Step Time": 8.491907043382525} +{"Pretrain/Learning Rate": 3.721215109081251e-05, "Pretrain/Loss": 2.037464141845703, "Pretrain/Loss (Raw)": 2.0476014614105225, "Pretrain/Step": 6817, "Pretrain/Step Time": 8.489110823720694} +{"Pretrain/Learning Rate": 3.720844670301141e-05, "Pretrain/Loss": 2.0377883911132812, "Pretrain/Loss (Raw)": 2.193061590194702, "Pretrain/Step": 6818, "Pretrain/Step Time": 8.483656695112586} +{"Pretrain/Learning Rate": 3.720474196318835e-05, "Pretrain/Loss": 2.035348892211914, "Pretrain/Loss (Raw)": 1.85664963722229, "Pretrain/Step": 6819, "Pretrain/Step Time": 8.48189838975668} +{"Pretrain/Learning Rate": 3.720103687145016e-05, "Pretrain/Loss": 2.0335779190063477, "Pretrain/Loss (Raw)": 1.9962928295135498, "Pretrain/Step": 6820, "Pretrain/Step Time": 8.488811178132892} +{"Pretrain/Learning Rate": 3.719733142790367e-05, "Pretrain/Loss": 2.033297061920166, "Pretrain/Loss (Raw)": 2.057166337966919, "Pretrain/Step": 6821, "Pretrain/Step Time": 8.485506732016802} +{"Pretrain/Learning Rate": 3.719362563265573e-05, "Pretrain/Loss": 2.0344529151916504, "Pretrain/Loss (Raw)": 2.148123264312744, "Pretrain/Step": 6822, "Pretrain/Step Time": 8.487522665411234} +{"Pretrain/Learning Rate": 3.71899194858132e-05, "Pretrain/Loss": 2.0348734855651855, "Pretrain/Loss (Raw)": 2.05474591255188, "Pretrain/Step": 6823, "Pretrain/Step Time": 8.4871532227844} +{"Pretrain/Learning Rate": 3.7186212987482915e-05, "Pretrain/Loss": 2.033459424972534, "Pretrain/Loss (Raw)": 2.0184547901153564, "Pretrain/Step": 6824, "Pretrain/Step Time": 8.490175761282444} +{"Pretrain/Learning Rate": 3.718250613777178e-05, "Pretrain/Loss": 2.0322957038879395, "Pretrain/Loss (Raw)": 1.934647560119629, "Pretrain/Step": 6825, "Pretrain/Step Time": 8.487231750041246} +{"Pretrain/Learning Rate": 3.717879893678667e-05, "Pretrain/Loss": 2.0315756797790527, "Pretrain/Loss (Raw)": 1.9387458562850952, "Pretrain/Step": 6826, "Pretrain/Step Time": 8.481978058815002} +{"Pretrain/Learning Rate": 3.717509138463448e-05, "Pretrain/Loss": 2.0320382118225098, "Pretrain/Loss (Raw)": 2.161461591720581, "Pretrain/Step": 6827, "Pretrain/Step Time": 8.483447359874845} +{"Pretrain/Learning Rate": 3.717138348142211e-05, "Pretrain/Loss": 2.0317869186401367, "Pretrain/Loss (Raw)": 2.05195689201355, "Pretrain/Step": 6828, "Pretrain/Step Time": 8.483369084075093} +{"Pretrain/Learning Rate": 3.716767522725648e-05, "Pretrain/Loss": 2.029067277908325, "Pretrain/Loss (Raw)": 1.9204267263412476, "Pretrain/Step": 6829, "Pretrain/Step Time": 8.485050735995173} +{"Pretrain/Learning Rate": 3.71639666222445e-05, "Pretrain/Loss": 2.0307674407958984, "Pretrain/Loss (Raw)": 2.1276447772979736, "Pretrain/Step": 6830, "Pretrain/Step Time": 8.486692104488611} +{"Pretrain/Learning Rate": 3.716025766649313e-05, "Pretrain/Loss": 2.028764247894287, "Pretrain/Loss (Raw)": 1.6211200952529907, "Pretrain/Step": 6831, "Pretrain/Step Time": 8.485326893627644} +{"Pretrain/Learning Rate": 3.71565483601093e-05, "Pretrain/Loss": 2.0296471118927, "Pretrain/Loss (Raw)": 2.095766067504883, "Pretrain/Step": 6832, "Pretrain/Step Time": 8.48878981359303} +{"Pretrain/Learning Rate": 3.715283870319997e-05, "Pretrain/Loss": 2.0309906005859375, "Pretrain/Loss (Raw)": 2.21356463432312, "Pretrain/Step": 6833, "Pretrain/Step Time": 8.489641729742289} +{"Pretrain/Learning Rate": 3.71491286958721e-05, "Pretrain/Loss": 2.0316901206970215, "Pretrain/Loss (Raw)": 1.9859519004821777, "Pretrain/Step": 6834, "Pretrain/Step Time": 8.486856101080775} +{"Pretrain/Learning Rate": 3.714541833823267e-05, "Pretrain/Loss": 2.031008005142212, "Pretrain/Loss (Raw)": 1.9566491842269897, "Pretrain/Step": 6835, "Pretrain/Step Time": 8.486628724262118} +{"Pretrain/Learning Rate": 3.714170763038866e-05, "Pretrain/Loss": 2.0306098461151123, "Pretrain/Loss (Raw)": 2.0919480323791504, "Pretrain/Step": 6836, "Pretrain/Step Time": 8.49171063862741} +{"Pretrain/Learning Rate": 3.7137996572447077e-05, "Pretrain/Loss": 2.025210380554199, "Pretrain/Loss (Raw)": 1.4966474771499634, "Pretrain/Step": 6837, "Pretrain/Step Time": 8.48692568950355} +{"Pretrain/Learning Rate": 3.713428516451491e-05, "Pretrain/Loss": 2.024078369140625, "Pretrain/Loss (Raw)": 1.8859299421310425, "Pretrain/Step": 6838, "Pretrain/Step Time": 8.487881796434522} +{"Pretrain/Learning Rate": 3.7130573406699196e-05, "Pretrain/Loss": 2.0229339599609375, "Pretrain/Loss (Raw)": 2.1638026237487793, "Pretrain/Step": 6839, "Pretrain/Step Time": 8.48584234714508} +{"Pretrain/Learning Rate": 3.712686129910694e-05, "Pretrain/Loss": 2.0233659744262695, "Pretrain/Loss (Raw)": 2.1503987312316895, "Pretrain/Step": 6840, "Pretrain/Step Time": 8.487405577674508} +{"Pretrain/Learning Rate": 3.712314884184519e-05, "Pretrain/Loss": 2.023897647857666, "Pretrain/Loss (Raw)": 2.203577756881714, "Pretrain/Step": 6841, "Pretrain/Step Time": 8.486988691613078} +{"Pretrain/Learning Rate": 3.711943603502099e-05, "Pretrain/Loss": 2.02229905128479, "Pretrain/Loss (Raw)": 1.9167134761810303, "Pretrain/Step": 6842, "Pretrain/Step Time": 8.486085494980216} +{"Pretrain/Learning Rate": 3.7115722878741397e-05, "Pretrain/Loss": 2.023649215698242, "Pretrain/Loss (Raw)": 2.1399245262145996, "Pretrain/Step": 6843, "Pretrain/Step Time": 8.482800886034966} +{"Pretrain/Learning Rate": 3.711200937311348e-05, "Pretrain/Loss": 2.023988723754883, "Pretrain/Loss (Raw)": 2.0695078372955322, "Pretrain/Step": 6844, "Pretrain/Step Time": 8.486393004655838} +{"Pretrain/Learning Rate": 3.71082955182443e-05, "Pretrain/Loss": 2.0228705406188965, "Pretrain/Loss (Raw)": 2.0835120677948, "Pretrain/Step": 6845, "Pretrain/Step Time": 8.484347511082888} +{"Pretrain/Learning Rate": 3.710458131424096e-05, "Pretrain/Loss": 2.0194945335388184, "Pretrain/Loss (Raw)": 1.8779631853103638, "Pretrain/Step": 6846, "Pretrain/Step Time": 8.487799456343055} +{"Pretrain/Learning Rate": 3.710086676121055e-05, "Pretrain/Loss": 2.0191330909729004, "Pretrain/Loss (Raw)": 2.0020854473114014, "Pretrain/Step": 6847, "Pretrain/Step Time": 8.485586822032928} +{"Pretrain/Learning Rate": 3.709715185926018e-05, "Pretrain/Loss": 2.0184903144836426, "Pretrain/Loss (Raw)": 1.882891297340393, "Pretrain/Step": 6848, "Pretrain/Step Time": 8.490173675119877} +{"Pretrain/Learning Rate": 3.709343660849697e-05, "Pretrain/Loss": 2.016045331954956, "Pretrain/Loss (Raw)": 1.8529484272003174, "Pretrain/Step": 6849, "Pretrain/Step Time": 8.494758699089289} +{"Pretrain/Learning Rate": 3.7089721009028025e-05, "Pretrain/Loss": 2.0165629386901855, "Pretrain/Loss (Raw)": 2.1226999759674072, "Pretrain/Step": 6850, "Pretrain/Step Time": 8.489188795909286} +{"Pretrain/Learning Rate": 3.708600506096051e-05, "Pretrain/Loss": 2.017608880996704, "Pretrain/Loss (Raw)": 2.0510284900665283, "Pretrain/Step": 6851, "Pretrain/Step Time": 8.487956685945392} +{"Pretrain/Learning Rate": 3.708228876440155e-05, "Pretrain/Loss": 2.0173263549804688, "Pretrain/Loss (Raw)": 2.0272281169891357, "Pretrain/Step": 6852, "Pretrain/Step Time": 8.490833410993218} +{"Pretrain/Learning Rate": 3.707857211945832e-05, "Pretrain/Loss": 2.0191071033477783, "Pretrain/Loss (Raw)": 2.0505166053771973, "Pretrain/Step": 6853, "Pretrain/Step Time": 8.492590468376875} +{"Pretrain/Learning Rate": 3.707485512623798e-05, "Pretrain/Loss": 2.0199637413024902, "Pretrain/Loss (Raw)": 2.125868797302246, "Pretrain/Step": 6854, "Pretrain/Step Time": 8.495977396145463} +{"Pretrain/Learning Rate": 3.707113778484769e-05, "Pretrain/Loss": 2.021576404571533, "Pretrain/Loss (Raw)": 2.0645899772644043, "Pretrain/Step": 6855, "Pretrain/Step Time": 8.494349788874388} +{"Pretrain/Learning Rate": 3.7067420095394665e-05, "Pretrain/Loss": 2.020725727081299, "Pretrain/Loss (Raw)": 2.0382745265960693, "Pretrain/Step": 6856, "Pretrain/Step Time": 8.495569840073586} +{"Pretrain/Learning Rate": 3.706370205798608e-05, "Pretrain/Loss": 2.022691249847412, "Pretrain/Loss (Raw)": 2.0926642417907715, "Pretrain/Step": 6857, "Pretrain/Step Time": 8.490575248375535} +{"Pretrain/Learning Rate": 3.705998367272916e-05, "Pretrain/Loss": 2.0215492248535156, "Pretrain/Loss (Raw)": 2.0428969860076904, "Pretrain/Step": 6858, "Pretrain/Step Time": 8.492317786440253} +{"Pretrain/Learning Rate": 3.705626493973111e-05, "Pretrain/Loss": 2.022087574005127, "Pretrain/Loss (Raw)": 2.1492271423339844, "Pretrain/Step": 6859, "Pretrain/Step Time": 8.489877358078957} +{"Pretrain/Learning Rate": 3.705254585909915e-05, "Pretrain/Loss": 2.0218329429626465, "Pretrain/Loss (Raw)": 1.9597728252410889, "Pretrain/Step": 6860, "Pretrain/Step Time": 8.491104958578944} +{"Pretrain/Learning Rate": 3.7048826430940536e-05, "Pretrain/Loss": 2.020979404449463, "Pretrain/Loss (Raw)": 1.9789294004440308, "Pretrain/Step": 6861, "Pretrain/Step Time": 8.491478018462658} +{"Pretrain/Learning Rate": 3.70451066553625e-05, "Pretrain/Loss": 2.0223193168640137, "Pretrain/Loss (Raw)": 2.0958023071289062, "Pretrain/Step": 6862, "Pretrain/Step Time": 8.488746432587504} +{"Pretrain/Learning Rate": 3.704138653247231e-05, "Pretrain/Loss": 2.0217843055725098, "Pretrain/Loss (Raw)": 2.0701847076416016, "Pretrain/Step": 6863, "Pretrain/Step Time": 8.487521104514599} +{"Pretrain/Learning Rate": 3.703766606237723e-05, "Pretrain/Loss": 2.021254539489746, "Pretrain/Loss (Raw)": 2.0265979766845703, "Pretrain/Step": 6864, "Pretrain/Step Time": 8.492797626182437} +{"Pretrain/Learning Rate": 3.703394524518452e-05, "Pretrain/Loss": 2.020254135131836, "Pretrain/Loss (Raw)": 2.004821300506592, "Pretrain/Step": 6865, "Pretrain/Step Time": 8.494836702942848} +{"Pretrain/Learning Rate": 3.70302240810015e-05, "Pretrain/Loss": 2.0195538997650146, "Pretrain/Loss (Raw)": 1.9157087802886963, "Pretrain/Step": 6866, "Pretrain/Step Time": 8.495922148227692} +{"Pretrain/Learning Rate": 3.702650256993544e-05, "Pretrain/Loss": 2.020263671875, "Pretrain/Loss (Raw)": 2.1013479232788086, "Pretrain/Step": 6867, "Pretrain/Step Time": 8.492673309519887} +{"Pretrain/Learning Rate": 3.702278071209366e-05, "Pretrain/Loss": 2.023672580718994, "Pretrain/Loss (Raw)": 2.308318614959717, "Pretrain/Step": 6868, "Pretrain/Step Time": 8.4905038587749} +{"Pretrain/Learning Rate": 3.701905850758347e-05, "Pretrain/Loss": 2.0246543884277344, "Pretrain/Loss (Raw)": 1.9550176858901978, "Pretrain/Step": 6869, "Pretrain/Step Time": 8.486284252256155} +{"Pretrain/Learning Rate": 3.701533595651221e-05, "Pretrain/Loss": 2.024259328842163, "Pretrain/Loss (Raw)": 1.9278507232666016, "Pretrain/Step": 6870, "Pretrain/Step Time": 8.491641707718372} +{"Pretrain/Learning Rate": 3.701161305898719e-05, "Pretrain/Loss": 2.0224528312683105, "Pretrain/Loss (Raw)": 1.8821943998336792, "Pretrain/Step": 6871, "Pretrain/Step Time": 8.491592291742563} +{"Pretrain/Learning Rate": 3.7007889815115796e-05, "Pretrain/Loss": 2.022552251815796, "Pretrain/Loss (Raw)": 1.9511675834655762, "Pretrain/Step": 6872, "Pretrain/Step Time": 8.48824929818511} +{"Pretrain/Learning Rate": 3.700416622500535e-05, "Pretrain/Loss": 2.02319073677063, "Pretrain/Loss (Raw)": 2.01303768157959, "Pretrain/Step": 6873, "Pretrain/Step Time": 8.492739820852876} +{"Pretrain/Learning Rate": 3.7000442288763236e-05, "Pretrain/Loss": 2.0253396034240723, "Pretrain/Loss (Raw)": 2.0852560997009277, "Pretrain/Step": 6874, "Pretrain/Step Time": 8.489751422777772} +{"Pretrain/Learning Rate": 3.699671800649683e-05, "Pretrain/Loss": 2.026823043823242, "Pretrain/Loss (Raw)": 2.1287691593170166, "Pretrain/Step": 6875, "Pretrain/Step Time": 8.492814309895039} +{"Pretrain/Learning Rate": 3.6992993378313514e-05, "Pretrain/Loss": 2.0282421112060547, "Pretrain/Loss (Raw)": 2.0824148654937744, "Pretrain/Step": 6876, "Pretrain/Step Time": 8.492002710700035} +{"Pretrain/Learning Rate": 3.6989268404320695e-05, "Pretrain/Loss": 2.0314345359802246, "Pretrain/Loss (Raw)": 2.3860909938812256, "Pretrain/Step": 6877, "Pretrain/Step Time": 8.492316087707877} +{"Pretrain/Learning Rate": 3.6985543084625765e-05, "Pretrain/Loss": 2.030914783477783, "Pretrain/Loss (Raw)": 1.954890251159668, "Pretrain/Step": 6878, "Pretrain/Step Time": 8.491644505411386} +{"Pretrain/Learning Rate": 3.6981817419336155e-05, "Pretrain/Loss": 2.0305514335632324, "Pretrain/Loss (Raw)": 2.047389268875122, "Pretrain/Step": 6879, "Pretrain/Step Time": 8.489867351949215} +{"Pretrain/Learning Rate": 3.697809140855929e-05, "Pretrain/Loss": 2.0349819660186768, "Pretrain/Loss (Raw)": 2.7039172649383545, "Pretrain/Step": 6880, "Pretrain/Step Time": 8.491846453398466} +{"Pretrain/Learning Rate": 3.69743650524026e-05, "Pretrain/Loss": 2.036098003387451, "Pretrain/Loss (Raw)": 2.1882712841033936, "Pretrain/Step": 6881, "Pretrain/Step Time": 8.49406036734581} +{"Pretrain/Learning Rate": 3.6970638350973535e-05, "Pretrain/Loss": 2.0355820655822754, "Pretrain/Loss (Raw)": 1.9689805507659912, "Pretrain/Step": 6882, "Pretrain/Step Time": 8.495402438566089} +{"Pretrain/Learning Rate": 3.6966911304379545e-05, "Pretrain/Loss": 2.0327813625335693, "Pretrain/Loss (Raw)": 2.0383427143096924, "Pretrain/Step": 6883, "Pretrain/Step Time": 8.497276239097118} +{"Pretrain/Learning Rate": 3.696318391272812e-05, "Pretrain/Loss": 2.0355753898620605, "Pretrain/Loss (Raw)": 2.2502925395965576, "Pretrain/Step": 6884, "Pretrain/Step Time": 8.49273861758411} +{"Pretrain/Learning Rate": 3.695945617612671e-05, "Pretrain/Loss": 2.0366475582122803, "Pretrain/Loss (Raw)": 1.9282045364379883, "Pretrain/Step": 6885, "Pretrain/Step Time": 8.49356590397656} +{"Pretrain/Learning Rate": 3.6955728094682806e-05, "Pretrain/Loss": 2.0364320278167725, "Pretrain/Loss (Raw)": 2.0776195526123047, "Pretrain/Step": 6886, "Pretrain/Step Time": 8.495924811810255} +{"Pretrain/Learning Rate": 3.695199966850392e-05, "Pretrain/Loss": 2.0347018241882324, "Pretrain/Loss (Raw)": 1.832849383354187, "Pretrain/Step": 6887, "Pretrain/Step Time": 8.496825456619263} +{"Pretrain/Learning Rate": 3.694827089769754e-05, "Pretrain/Loss": 2.0354866981506348, "Pretrain/Loss (Raw)": 2.0134809017181396, "Pretrain/Step": 6888, "Pretrain/Step Time": 8.495525874197483} +{"Pretrain/Learning Rate": 3.69445417823712e-05, "Pretrain/Loss": 2.036350965499878, "Pretrain/Loss (Raw)": 1.9147303104400635, "Pretrain/Step": 6889, "Pretrain/Step Time": 8.498820897191763} +{"Pretrain/Learning Rate": 3.694081232263242e-05, "Pretrain/Loss": 2.0335841178894043, "Pretrain/Loss (Raw)": 1.8772779703140259, "Pretrain/Step": 6890, "Pretrain/Step Time": 8.495519131422043} +{"Pretrain/Learning Rate": 3.6937082518588725e-05, "Pretrain/Loss": 2.034247875213623, "Pretrain/Loss (Raw)": 2.0972352027893066, "Pretrain/Step": 6891, "Pretrain/Step Time": 8.499040694907308} +{"Pretrain/Learning Rate": 3.693335237034768e-05, "Pretrain/Loss": 2.0314767360687256, "Pretrain/Loss (Raw)": 1.6890519857406616, "Pretrain/Step": 6892, "Pretrain/Step Time": 8.495087698101997} +{"Pretrain/Learning Rate": 3.692962187801683e-05, "Pretrain/Loss": 2.0325169563293457, "Pretrain/Loss (Raw)": 2.070108652114868, "Pretrain/Step": 6893, "Pretrain/Step Time": 8.490414457395673} +{"Pretrain/Learning Rate": 3.6925891041703735e-05, "Pretrain/Loss": 2.0317554473876953, "Pretrain/Loss (Raw)": 1.8800201416015625, "Pretrain/Step": 6894, "Pretrain/Step Time": 8.4898318964988} +{"Pretrain/Learning Rate": 3.692215986151599e-05, "Pretrain/Loss": 2.0292255878448486, "Pretrain/Loss (Raw)": 1.770997405052185, "Pretrain/Step": 6895, "Pretrain/Step Time": 8.493374489247799} +{"Pretrain/Learning Rate": 3.691842833756116e-05, "Pretrain/Loss": 2.0294837951660156, "Pretrain/Loss (Raw)": 2.0791447162628174, "Pretrain/Step": 6896, "Pretrain/Step Time": 8.485953969880939} +{"Pretrain/Learning Rate": 3.691469646994686e-05, "Pretrain/Loss": 2.029609203338623, "Pretrain/Loss (Raw)": 1.7239055633544922, "Pretrain/Step": 6897, "Pretrain/Step Time": 8.48936777189374} +{"Pretrain/Learning Rate": 3.6910964258780676e-05, "Pretrain/Loss": 2.030195474624634, "Pretrain/Loss (Raw)": 1.9398730993270874, "Pretrain/Step": 6898, "Pretrain/Step Time": 8.491330793127418} +{"Pretrain/Learning Rate": 3.690723170417024e-05, "Pretrain/Loss": 2.02760910987854, "Pretrain/Loss (Raw)": 2.10705304145813, "Pretrain/Step": 6899, "Pretrain/Step Time": 8.490314742550254} +{"Pretrain/Learning Rate": 3.6903498806223175e-05, "Pretrain/Loss": 2.028853178024292, "Pretrain/Loss (Raw)": 2.016223192214966, "Pretrain/Step": 6900, "Pretrain/Step Time": 8.486204842105508} +{"Pretrain/Learning Rate": 3.689976556504712e-05, "Pretrain/Loss": 2.026766777038574, "Pretrain/Loss (Raw)": 1.8873836994171143, "Pretrain/Step": 6901, "Pretrain/Step Time": 8.487340781837702} +{"Pretrain/Learning Rate": 3.68960319807497e-05, "Pretrain/Loss": 2.026477813720703, "Pretrain/Loss (Raw)": 1.9595321416854858, "Pretrain/Step": 6902, "Pretrain/Step Time": 8.48823225684464} +{"Pretrain/Learning Rate": 3.6892298053438584e-05, "Pretrain/Loss": 2.0275630950927734, "Pretrain/Loss (Raw)": 2.080324411392212, "Pretrain/Step": 6903, "Pretrain/Step Time": 8.483908876776695} +{"Pretrain/Learning Rate": 3.688856378322144e-05, "Pretrain/Loss": 2.027414321899414, "Pretrain/Loss (Raw)": 2.092832565307617, "Pretrain/Step": 6904, "Pretrain/Step Time": 8.481532296165824} +{"Pretrain/Learning Rate": 3.688482917020594e-05, "Pretrain/Loss": 2.0258729457855225, "Pretrain/Loss (Raw)": 1.8019827604293823, "Pretrain/Step": 6905, "Pretrain/Step Time": 8.480932872742414} +{"Pretrain/Learning Rate": 3.6881094214499776e-05, "Pretrain/Loss": 2.024826765060425, "Pretrain/Loss (Raw)": 2.046445846557617, "Pretrain/Step": 6906, "Pretrain/Step Time": 8.48590692318976} +{"Pretrain/Learning Rate": 3.687735891621063e-05, "Pretrain/Loss": 2.0260941982269287, "Pretrain/Loss (Raw)": 1.9903615713119507, "Pretrain/Step": 6907, "Pretrain/Step Time": 8.48812586069107} +{"Pretrain/Learning Rate": 3.687362327544621e-05, "Pretrain/Loss": 2.025373697280884, "Pretrain/Loss (Raw)": 1.9593826532363892, "Pretrain/Step": 6908, "Pretrain/Step Time": 8.486244754865766} +{"Pretrain/Learning Rate": 3.6869887292314237e-05, "Pretrain/Loss": 2.024953603744507, "Pretrain/Loss (Raw)": 1.970352053642273, "Pretrain/Step": 6909, "Pretrain/Step Time": 8.483660290017724} +{"Pretrain/Learning Rate": 3.686615096692243e-05, "Pretrain/Loss": 2.024383544921875, "Pretrain/Loss (Raw)": 1.9806455373764038, "Pretrain/Step": 6910, "Pretrain/Step Time": 8.486911531537771} +{"Pretrain/Learning Rate": 3.686241429937853e-05, "Pretrain/Loss": 2.0232162475585938, "Pretrain/Loss (Raw)": 2.0145890712738037, "Pretrain/Step": 6911, "Pretrain/Step Time": 8.484730020165443} +{"Pretrain/Learning Rate": 3.685867728979027e-05, "Pretrain/Loss": 2.0221686363220215, "Pretrain/Loss (Raw)": 1.9179472923278809, "Pretrain/Step": 6912, "Pretrain/Step Time": 8.483385058119893} +{"Pretrain/Learning Rate": 3.6854939938265414e-05, "Pretrain/Loss": 2.021099090576172, "Pretrain/Loss (Raw)": 1.945684790611267, "Pretrain/Step": 6913, "Pretrain/Step Time": 8.483509860932827} +{"Pretrain/Learning Rate": 3.685120224491172e-05, "Pretrain/Loss": 2.0200822353363037, "Pretrain/Loss (Raw)": 1.9064239263534546, "Pretrain/Step": 6914, "Pretrain/Step Time": 8.49418362416327} +{"Pretrain/Learning Rate": 3.684746420983696e-05, "Pretrain/Loss": 2.017533779144287, "Pretrain/Loss (Raw)": 1.9851627349853516, "Pretrain/Step": 6915, "Pretrain/Step Time": 8.490419279783964} +{"Pretrain/Learning Rate": 3.684372583314893e-05, "Pretrain/Loss": 2.018285036087036, "Pretrain/Loss (Raw)": 2.2544145584106445, "Pretrain/Step": 6916, "Pretrain/Step Time": 8.491528533399105} +{"Pretrain/Learning Rate": 3.683998711495541e-05, "Pretrain/Loss": 2.0154824256896973, "Pretrain/Loss (Raw)": 1.8973100185394287, "Pretrain/Step": 6917, "Pretrain/Step Time": 8.492109429091215} +{"Pretrain/Learning Rate": 3.683624805536421e-05, "Pretrain/Loss": 2.0150840282440186, "Pretrain/Loss (Raw)": 2.102944850921631, "Pretrain/Step": 6918, "Pretrain/Step Time": 8.490749571472406} +{"Pretrain/Learning Rate": 3.683250865448314e-05, "Pretrain/Loss": 2.012645959854126, "Pretrain/Loss (Raw)": 1.8889245986938477, "Pretrain/Step": 6919, "Pretrain/Step Time": 8.491655968129635} +{"Pretrain/Learning Rate": 3.682876891242002e-05, "Pretrain/Loss": 2.013239860534668, "Pretrain/Loss (Raw)": 1.9957380294799805, "Pretrain/Step": 6920, "Pretrain/Step Time": 8.490674279630184} +{"Pretrain/Learning Rate": 3.682502882928269e-05, "Pretrain/Loss": 2.013603687286377, "Pretrain/Loss (Raw)": 2.1604230403900146, "Pretrain/Step": 6921, "Pretrain/Step Time": 8.490787081420422} +{"Pretrain/Learning Rate": 3.6821288405179e-05, "Pretrain/Loss": 2.0159740447998047, "Pretrain/Loss (Raw)": 2.2271196842193604, "Pretrain/Step": 6922, "Pretrain/Step Time": 8.496377632021904} +{"Pretrain/Learning Rate": 3.6817547640216775e-05, "Pretrain/Loss": 2.016709804534912, "Pretrain/Loss (Raw)": 1.9957337379455566, "Pretrain/Step": 6923, "Pretrain/Step Time": 8.491867607459426} +{"Pretrain/Learning Rate": 3.681380653450391e-05, "Pretrain/Loss": 2.0169408321380615, "Pretrain/Loss (Raw)": 1.9985744953155518, "Pretrain/Step": 6924, "Pretrain/Step Time": 8.497487537562847} +{"Pretrain/Learning Rate": 3.681006508814825e-05, "Pretrain/Loss": 2.01855206489563, "Pretrain/Loss (Raw)": 2.0763540267944336, "Pretrain/Step": 6925, "Pretrain/Step Time": 8.488213127478957} +{"Pretrain/Learning Rate": 3.680632330125769e-05, "Pretrain/Loss": 2.0190253257751465, "Pretrain/Loss (Raw)": 1.7924177646636963, "Pretrain/Step": 6926, "Pretrain/Step Time": 8.494538065046072} +{"Pretrain/Learning Rate": 3.6802581173940134e-05, "Pretrain/Loss": 2.0205726623535156, "Pretrain/Loss (Raw)": 2.2327818870544434, "Pretrain/Step": 6927, "Pretrain/Step Time": 8.496691623702645} +{"Pretrain/Learning Rate": 3.679883870630346e-05, "Pretrain/Loss": 2.0218305587768555, "Pretrain/Loss (Raw)": 2.082707405090332, "Pretrain/Step": 6928, "Pretrain/Step Time": 8.493073521181941} +{"Pretrain/Learning Rate": 3.679509589845558e-05, "Pretrain/Loss": 2.021515369415283, "Pretrain/Loss (Raw)": 2.187838077545166, "Pretrain/Step": 6929, "Pretrain/Step Time": 8.493737848475575} +{"Pretrain/Learning Rate": 3.679135275050444e-05, "Pretrain/Loss": 2.0179872512817383, "Pretrain/Loss (Raw)": 1.874314785003662, "Pretrain/Step": 6930, "Pretrain/Step Time": 8.48967837356031} +{"Pretrain/Learning Rate": 3.678760926255795e-05, "Pretrain/Loss": 2.0187525749206543, "Pretrain/Loss (Raw)": 2.0606579780578613, "Pretrain/Step": 6931, "Pretrain/Step Time": 8.489862244576216} +{"Pretrain/Learning Rate": 3.6783865434724064e-05, "Pretrain/Loss": 2.019329071044922, "Pretrain/Loss (Raw)": 1.9921859502792358, "Pretrain/Step": 6932, "Pretrain/Step Time": 8.49522584863007} +{"Pretrain/Learning Rate": 3.678012126711071e-05, "Pretrain/Loss": 2.019558906555176, "Pretrain/Loss (Raw)": 2.047193765640259, "Pretrain/Step": 6933, "Pretrain/Step Time": 8.499981850385666} +{"Pretrain/Learning Rate": 3.6776376759825874e-05, "Pretrain/Loss": 2.019136667251587, "Pretrain/Loss (Raw)": 2.1085665225982666, "Pretrain/Step": 6934, "Pretrain/Step Time": 8.4964335039258} +{"Pretrain/Learning Rate": 3.677263191297751e-05, "Pretrain/Loss": 2.019505739212036, "Pretrain/Loss (Raw)": 1.9485727548599243, "Pretrain/Step": 6935, "Pretrain/Step Time": 8.494393162429333} +{"Pretrain/Learning Rate": 3.676888672667361e-05, "Pretrain/Loss": 2.0208606719970703, "Pretrain/Loss (Raw)": 1.9925190210342407, "Pretrain/Step": 6936, "Pretrain/Step Time": 8.498945781961083} +{"Pretrain/Learning Rate": 3.676514120102216e-05, "Pretrain/Loss": 2.022935390472412, "Pretrain/Loss (Raw)": 1.9694095849990845, "Pretrain/Step": 6937, "Pretrain/Step Time": 8.494345352053642} +{"Pretrain/Learning Rate": 3.676139533613116e-05, "Pretrain/Loss": 2.0183517932891846, "Pretrain/Loss (Raw)": 1.6094540357589722, "Pretrain/Step": 6938, "Pretrain/Step Time": 8.495544781908393} +{"Pretrain/Learning Rate": 3.67576491321086e-05, "Pretrain/Loss": 2.0192508697509766, "Pretrain/Loss (Raw)": 2.192405939102173, "Pretrain/Step": 6939, "Pretrain/Step Time": 8.499483896419406} +{"Pretrain/Learning Rate": 3.675390258906253e-05, "Pretrain/Loss": 2.0176644325256348, "Pretrain/Loss (Raw)": 2.0365610122680664, "Pretrain/Step": 6940, "Pretrain/Step Time": 8.49524856545031} +{"Pretrain/Learning Rate": 3.675015570710095e-05, "Pretrain/Loss": 2.017943859100342, "Pretrain/Loss (Raw)": 2.070451021194458, "Pretrain/Step": 6941, "Pretrain/Step Time": 8.498286629095674} +{"Pretrain/Learning Rate": 3.674640848633193e-05, "Pretrain/Loss": 2.016714096069336, "Pretrain/Loss (Raw)": 1.9118345975875854, "Pretrain/Step": 6942, "Pretrain/Step Time": 8.496442062780261} +{"Pretrain/Learning Rate": 3.6742660926863506e-05, "Pretrain/Loss": 2.016594648361206, "Pretrain/Loss (Raw)": 1.9123157262802124, "Pretrain/Step": 6943, "Pretrain/Step Time": 8.500662136822939} +{"Pretrain/Learning Rate": 3.673891302880372e-05, "Pretrain/Loss": 2.0169389247894287, "Pretrain/Loss (Raw)": 2.0033929347991943, "Pretrain/Step": 6944, "Pretrain/Step Time": 8.495434802025557} +{"Pretrain/Learning Rate": 3.6735164792260654e-05, "Pretrain/Loss": 2.0173275470733643, "Pretrain/Loss (Raw)": 2.097349166870117, "Pretrain/Step": 6945, "Pretrain/Step Time": 8.495522521436214} +{"Pretrain/Learning Rate": 3.673141621734238e-05, "Pretrain/Loss": 2.0162177085876465, "Pretrain/Loss (Raw)": 2.0509979724884033, "Pretrain/Step": 6946, "Pretrain/Step Time": 8.499394612386823} +{"Pretrain/Learning Rate": 3.6727667304156996e-05, "Pretrain/Loss": 2.0171310901641846, "Pretrain/Loss (Raw)": 1.9735554456710815, "Pretrain/Step": 6947, "Pretrain/Step Time": 8.494984969496727} +{"Pretrain/Learning Rate": 3.6723918052812584e-05, "Pretrain/Loss": 2.018004894256592, "Pretrain/Loss (Raw)": 2.108123302459717, "Pretrain/Step": 6948, "Pretrain/Step Time": 8.491485623642802} +{"Pretrain/Learning Rate": 3.672016846341727e-05, "Pretrain/Loss": 2.0189356803894043, "Pretrain/Loss (Raw)": 2.17634916305542, "Pretrain/Step": 6949, "Pretrain/Step Time": 8.493853833526373} +{"Pretrain/Learning Rate": 3.671641853607916e-05, "Pretrain/Loss": 2.0177788734436035, "Pretrain/Loss (Raw)": 2.00004243850708, "Pretrain/Step": 6950, "Pretrain/Step Time": 8.496990192681551} +{"Pretrain/Learning Rate": 3.6712668270906376e-05, "Pretrain/Loss": 2.0175156593322754, "Pretrain/Loss (Raw)": 2.021040678024292, "Pretrain/Step": 6951, "Pretrain/Step Time": 8.493173774331808} +{"Pretrain/Learning Rate": 3.670891766800706e-05, "Pretrain/Loss": 2.0181736946105957, "Pretrain/Loss (Raw)": 2.1027071475982666, "Pretrain/Step": 6952, "Pretrain/Step Time": 8.493150973692536} +{"Pretrain/Learning Rate": 3.6705166727489354e-05, "Pretrain/Loss": 2.0190024375915527, "Pretrain/Loss (Raw)": 2.040698766708374, "Pretrain/Step": 6953, "Pretrain/Step Time": 8.492563482373953} +{"Pretrain/Learning Rate": 3.6701415449461427e-05, "Pretrain/Loss": 2.0198373794555664, "Pretrain/Loss (Raw)": 2.0456326007843018, "Pretrain/Step": 6954, "Pretrain/Step Time": 8.499122396111488} +{"Pretrain/Learning Rate": 3.669766383403142e-05, "Pretrain/Loss": 2.0166079998016357, "Pretrain/Loss (Raw)": 1.7480801343917847, "Pretrain/Step": 6955, "Pretrain/Step Time": 8.501166332513094} +{"Pretrain/Learning Rate": 3.669391188130754e-05, "Pretrain/Loss": 2.017148494720459, "Pretrain/Loss (Raw)": 2.1211540699005127, "Pretrain/Step": 6956, "Pretrain/Step Time": 8.496415229514241} +{"Pretrain/Learning Rate": 3.669015959139794e-05, "Pretrain/Loss": 2.0184555053710938, "Pretrain/Loss (Raw)": 2.0877249240875244, "Pretrain/Step": 6957, "Pretrain/Step Time": 8.497420454397798} +{"Pretrain/Learning Rate": 3.6686406964410834e-05, "Pretrain/Loss": 2.016385555267334, "Pretrain/Loss (Raw)": 1.8626843690872192, "Pretrain/Step": 6958, "Pretrain/Step Time": 8.49855569936335} +{"Pretrain/Learning Rate": 3.668265400045443e-05, "Pretrain/Loss": 2.019324779510498, "Pretrain/Loss (Raw)": 1.9973376989364624, "Pretrain/Step": 6959, "Pretrain/Step Time": 8.500590544193983} +{"Pretrain/Learning Rate": 3.667890069963693e-05, "Pretrain/Loss": 2.0173604488372803, "Pretrain/Loss (Raw)": 1.84433913230896, "Pretrain/Step": 6960, "Pretrain/Step Time": 8.49537375755608} +{"Pretrain/Learning Rate": 3.667514706206655e-05, "Pretrain/Loss": 2.0153253078460693, "Pretrain/Loss (Raw)": 1.953079342842102, "Pretrain/Step": 6961, "Pretrain/Step Time": 8.493780184537172} +{"Pretrain/Learning Rate": 3.6671393087851544e-05, "Pretrain/Loss": 2.0146186351776123, "Pretrain/Loss (Raw)": 1.895470142364502, "Pretrain/Step": 6962, "Pretrain/Step Time": 8.499795937910676} +{"Pretrain/Learning Rate": 3.6667638777100144e-05, "Pretrain/Loss": 2.0162181854248047, "Pretrain/Loss (Raw)": 2.161386013031006, "Pretrain/Step": 6963, "Pretrain/Step Time": 8.493486724793911} +{"Pretrain/Learning Rate": 3.666388412992061e-05, "Pretrain/Loss": 2.0147578716278076, "Pretrain/Loss (Raw)": 1.9050499200820923, "Pretrain/Step": 6964, "Pretrain/Step Time": 8.49373683705926} +{"Pretrain/Learning Rate": 3.6660129146421196e-05, "Pretrain/Loss": 2.021066188812256, "Pretrain/Loss (Raw)": 2.3041176795959473, "Pretrain/Step": 6965, "Pretrain/Step Time": 8.49601175636053} +{"Pretrain/Learning Rate": 3.665637382671018e-05, "Pretrain/Loss": 2.0248875617980957, "Pretrain/Loss (Raw)": 2.375087022781372, "Pretrain/Step": 6966, "Pretrain/Step Time": 8.490645540878177} +{"Pretrain/Learning Rate": 3.6652618170895834e-05, "Pretrain/Loss": 2.0250768661499023, "Pretrain/Loss (Raw)": 2.1879944801330566, "Pretrain/Step": 6967, "Pretrain/Step Time": 8.495915874838829} +{"Pretrain/Learning Rate": 3.6648862179086465e-05, "Pretrain/Loss": 2.0251431465148926, "Pretrain/Loss (Raw)": 2.1588871479034424, "Pretrain/Step": 6968, "Pretrain/Step Time": 8.492188470438123} +{"Pretrain/Learning Rate": 3.664510585139037e-05, "Pretrain/Loss": 2.0247561931610107, "Pretrain/Loss (Raw)": 2.1540496349334717, "Pretrain/Step": 6969, "Pretrain/Step Time": 8.490524156019092} +{"Pretrain/Learning Rate": 3.664134918791584e-05, "Pretrain/Loss": 2.0259461402893066, "Pretrain/Loss (Raw)": 2.0690078735351562, "Pretrain/Step": 6970, "Pretrain/Step Time": 8.490316964685917} +{"Pretrain/Learning Rate": 3.663759218877123e-05, "Pretrain/Loss": 2.026726722717285, "Pretrain/Loss (Raw)": 2.239854335784912, "Pretrain/Step": 6971, "Pretrain/Step Time": 8.498395742848516} +{"Pretrain/Learning Rate": 3.6633834854064847e-05, "Pretrain/Loss": 2.0271847248077393, "Pretrain/Loss (Raw)": 2.1281423568725586, "Pretrain/Step": 6972, "Pretrain/Step Time": 8.492078147828579} +{"Pretrain/Learning Rate": 3.663007718390504e-05, "Pretrain/Loss": 2.028001308441162, "Pretrain/Loss (Raw)": 2.18804931640625, "Pretrain/Step": 6973, "Pretrain/Step Time": 8.490606617182493} +{"Pretrain/Learning Rate": 3.662631917840015e-05, "Pretrain/Loss": 2.0297813415527344, "Pretrain/Loss (Raw)": 2.105808973312378, "Pretrain/Step": 6974, "Pretrain/Step Time": 8.490167506039143} +{"Pretrain/Learning Rate": 3.662256083765855e-05, "Pretrain/Loss": 2.0294947624206543, "Pretrain/Loss (Raw)": 1.9653819799423218, "Pretrain/Step": 6975, "Pretrain/Step Time": 8.494783883914351} +{"Pretrain/Learning Rate": 3.66188021617886e-05, "Pretrain/Loss": 2.0306806564331055, "Pretrain/Loss (Raw)": 2.034701108932495, "Pretrain/Step": 6976, "Pretrain/Step Time": 8.491648500785232} +{"Pretrain/Learning Rate": 3.6615043150898674e-05, "Pretrain/Loss": 2.034719944000244, "Pretrain/Loss (Raw)": 2.3699610233306885, "Pretrain/Step": 6977, "Pretrain/Step Time": 8.487588012591004} +{"Pretrain/Learning Rate": 3.661128380509717e-05, "Pretrain/Loss": 2.038332462310791, "Pretrain/Loss (Raw)": 2.58508563041687, "Pretrain/Step": 6978, "Pretrain/Step Time": 8.491454798728228} +{"Pretrain/Learning Rate": 3.660752412449249e-05, "Pretrain/Loss": 2.037517547607422, "Pretrain/Loss (Raw)": 1.9467226266860962, "Pretrain/Step": 6979, "Pretrain/Step Time": 8.48971077054739} +{"Pretrain/Learning Rate": 3.660376410919303e-05, "Pretrain/Loss": 2.0366296768188477, "Pretrain/Loss (Raw)": 1.913576602935791, "Pretrain/Step": 6980, "Pretrain/Step Time": 8.488284301012754} +{"Pretrain/Learning Rate": 3.660000375930721e-05, "Pretrain/Loss": 2.0345044136047363, "Pretrain/Loss (Raw)": 1.778485655784607, "Pretrain/Step": 6981, "Pretrain/Step Time": 8.488283028826118} +{"Pretrain/Learning Rate": 3.659624307494346e-05, "Pretrain/Loss": 2.0324041843414307, "Pretrain/Loss (Raw)": 1.8570574522018433, "Pretrain/Step": 6982, "Pretrain/Step Time": 8.485759660601616} +{"Pretrain/Learning Rate": 3.6592482056210214e-05, "Pretrain/Loss": 2.032064199447632, "Pretrain/Loss (Raw)": 2.021071434020996, "Pretrain/Step": 6983, "Pretrain/Step Time": 8.486911162734032} +{"Pretrain/Learning Rate": 3.658872070321592e-05, "Pretrain/Loss": 2.033993721008301, "Pretrain/Loss (Raw)": 2.2852659225463867, "Pretrain/Step": 6984, "Pretrain/Step Time": 8.486449228599668} +{"Pretrain/Learning Rate": 3.6584959016069046e-05, "Pretrain/Loss": 2.0361595153808594, "Pretrain/Loss (Raw)": 2.369851589202881, "Pretrain/Step": 6985, "Pretrain/Step Time": 8.488568117842078} +{"Pretrain/Learning Rate": 3.658119699487803e-05, "Pretrain/Loss": 2.033613443374634, "Pretrain/Loss (Raw)": 1.7170124053955078, "Pretrain/Step": 6986, "Pretrain/Step Time": 8.487077984958887} +{"Pretrain/Learning Rate": 3.6577434639751374e-05, "Pretrain/Loss": 2.0342857837677, "Pretrain/Loss (Raw)": 2.2352826595306396, "Pretrain/Step": 6987, "Pretrain/Step Time": 8.490447092801332} +{"Pretrain/Learning Rate": 3.6573671950797545e-05, "Pretrain/Loss": 2.0354950428009033, "Pretrain/Loss (Raw)": 2.114565849304199, "Pretrain/Step": 6988, "Pretrain/Step Time": 8.489528730511665} +{"Pretrain/Learning Rate": 3.656990892812504e-05, "Pretrain/Loss": 2.034025192260742, "Pretrain/Loss (Raw)": 1.7908036708831787, "Pretrain/Step": 6989, "Pretrain/Step Time": 8.4903663713485} +{"Pretrain/Learning Rate": 3.656614557184238e-05, "Pretrain/Loss": 2.0332260131835938, "Pretrain/Loss (Raw)": 1.9934782981872559, "Pretrain/Step": 6990, "Pretrain/Step Time": 8.495152724906802} +{"Pretrain/Learning Rate": 3.656238188205805e-05, "Pretrain/Loss": 2.0345091819763184, "Pretrain/Loss (Raw)": 2.234436511993408, "Pretrain/Step": 6991, "Pretrain/Step Time": 8.49479492008686} +{"Pretrain/Learning Rate": 3.6558617858880606e-05, "Pretrain/Loss": 2.0334973335266113, "Pretrain/Loss (Raw)": 1.8970993757247925, "Pretrain/Step": 6992, "Pretrain/Step Time": 8.490431353449821} +{"Pretrain/Learning Rate": 3.655485350241855e-05, "Pretrain/Loss": 2.0343570709228516, "Pretrain/Loss (Raw)": 2.114851474761963, "Pretrain/Step": 6993, "Pretrain/Step Time": 8.491704665124416} +{"Pretrain/Learning Rate": 3.655108881278045e-05, "Pretrain/Loss": 2.036396026611328, "Pretrain/Loss (Raw)": 2.1766791343688965, "Pretrain/Step": 6994, "Pretrain/Step Time": 8.490139717236161} +{"Pretrain/Learning Rate": 3.654732379007484e-05, "Pretrain/Loss": 2.0358176231384277, "Pretrain/Loss (Raw)": 2.0273213386535645, "Pretrain/Step": 6995, "Pretrain/Step Time": 8.49137268960476} +{"Pretrain/Learning Rate": 3.65435584344103e-05, "Pretrain/Loss": 2.0333056449890137, "Pretrain/Loss (Raw)": 1.98679518699646, "Pretrain/Step": 6996, "Pretrain/Step Time": 8.495067464187741} +{"Pretrain/Learning Rate": 3.6539792745895374e-05, "Pretrain/Loss": 2.034141778945923, "Pretrain/Loss (Raw)": 2.0620548725128174, "Pretrain/Step": 6997, "Pretrain/Step Time": 8.495795659720898} +{"Pretrain/Learning Rate": 3.653602672463867e-05, "Pretrain/Loss": 2.0349233150482178, "Pretrain/Loss (Raw)": 2.0278749465942383, "Pretrain/Step": 6998, "Pretrain/Step Time": 8.495060635730624} +{"Pretrain/Learning Rate": 3.653226037074876e-05, "Pretrain/Loss": 2.035911798477173, "Pretrain/Loss (Raw)": 2.008718252182007, "Pretrain/Step": 6999, "Pretrain/Step Time": 8.493102809414268} +{"Pretrain/Learning Rate": 3.652849368433425e-05, "Pretrain/Loss": 2.036093235015869, "Pretrain/Loss (Raw)": 1.9743890762329102, "Pretrain/Step": 7000, "Pretrain/Step Time": 8.497908154502511} +{"Pretrain/Learning Rate": 3.652472666550377e-05, "Pretrain/Loss": 2.0346832275390625, "Pretrain/Loss (Raw)": 1.832580327987671, "Pretrain/Step": 7001, "Pretrain/Step Time": 8.49463452771306} +{"Pretrain/Learning Rate": 3.65209593143659e-05, "Pretrain/Loss": 2.032886028289795, "Pretrain/Loss (Raw)": 1.8551816940307617, "Pretrain/Step": 7002, "Pretrain/Step Time": 8.496789989992976} +{"Pretrain/Learning Rate": 3.65171916310293e-05, "Pretrain/Loss": 2.0323691368103027, "Pretrain/Loss (Raw)": 2.062596321105957, "Pretrain/Step": 7003, "Pretrain/Step Time": 8.491812773048878} +{"Pretrain/Learning Rate": 3.65134236156026e-05, "Pretrain/Loss": 2.031909942626953, "Pretrain/Loss (Raw)": 2.0236899852752686, "Pretrain/Step": 7004, "Pretrain/Step Time": 8.49195895344019} +{"Pretrain/Learning Rate": 3.650965526819444e-05, "Pretrain/Loss": 2.0298895835876465, "Pretrain/Loss (Raw)": 2.1274571418762207, "Pretrain/Step": 7005, "Pretrain/Step Time": 8.492927549406886} +{"Pretrain/Learning Rate": 3.6505886588913494e-05, "Pretrain/Loss": 2.0296034812927246, "Pretrain/Loss (Raw)": 1.9182772636413574, "Pretrain/Step": 7006, "Pretrain/Step Time": 8.492340870201588} +{"Pretrain/Learning Rate": 3.650211757786841e-05, "Pretrain/Loss": 2.0302977561950684, "Pretrain/Loss (Raw)": 2.136244535446167, "Pretrain/Step": 7007, "Pretrain/Step Time": 8.494523564353585} +{"Pretrain/Learning Rate": 3.6498348235167877e-05, "Pretrain/Loss": 2.0246880054473877, "Pretrain/Loss (Raw)": 1.985885739326477, "Pretrain/Step": 7008, "Pretrain/Step Time": 8.492809997871518} +{"Pretrain/Learning Rate": 3.649457856092058e-05, "Pretrain/Loss": 2.021775722503662, "Pretrain/Loss (Raw)": 1.815514326095581, "Pretrain/Step": 7009, "Pretrain/Step Time": 8.490739298984408} +{"Pretrain/Learning Rate": 3.6490808555235215e-05, "Pretrain/Loss": 2.0207509994506836, "Pretrain/Loss (Raw)": 1.8377983570098877, "Pretrain/Step": 7010, "Pretrain/Step Time": 8.489265376701951} +{"Pretrain/Learning Rate": 3.6487038218220484e-05, "Pretrain/Loss": 2.0199599266052246, "Pretrain/Loss (Raw)": 1.9370852708816528, "Pretrain/Step": 7011, "Pretrain/Step Time": 8.489858547225595} +{"Pretrain/Learning Rate": 3.64832675499851e-05, "Pretrain/Loss": 2.0170199871063232, "Pretrain/Loss (Raw)": 1.8739769458770752, "Pretrain/Step": 7012, "Pretrain/Step Time": 8.488674288615584} +{"Pretrain/Learning Rate": 3.6479496550637794e-05, "Pretrain/Loss": 2.017576217651367, "Pretrain/Loss (Raw)": 1.9994195699691772, "Pretrain/Step": 7013, "Pretrain/Step Time": 8.487797187641263} +{"Pretrain/Learning Rate": 3.64757252202873e-05, "Pretrain/Loss": 2.0173513889312744, "Pretrain/Loss (Raw)": 2.0488293170928955, "Pretrain/Step": 7014, "Pretrain/Step Time": 8.490049283951521} +{"Pretrain/Learning Rate": 3.647195355904235e-05, "Pretrain/Loss": 2.0128369331359863, "Pretrain/Loss (Raw)": 1.2549797296524048, "Pretrain/Step": 7015, "Pretrain/Step Time": 8.488784108310938} +{"Pretrain/Learning Rate": 3.6468181567011714e-05, "Pretrain/Loss": 2.012876033782959, "Pretrain/Loss (Raw)": 2.018476724624634, "Pretrain/Step": 7016, "Pretrain/Step Time": 8.490455212071538} +{"Pretrain/Learning Rate": 3.646440924430416e-05, "Pretrain/Loss": 2.014280319213867, "Pretrain/Loss (Raw)": 2.0945117473602295, "Pretrain/Step": 7017, "Pretrain/Step Time": 8.48581923916936} +{"Pretrain/Learning Rate": 3.6460636591028426e-05, "Pretrain/Loss": 2.014976739883423, "Pretrain/Loss (Raw)": 1.9664061069488525, "Pretrain/Step": 7018, "Pretrain/Step Time": 8.490944361314178} +{"Pretrain/Learning Rate": 3.6456863607293314e-05, "Pretrain/Loss": 2.0137906074523926, "Pretrain/Loss (Raw)": 1.945407509803772, "Pretrain/Step": 7019, "Pretrain/Step Time": 8.485747635364532} +{"Pretrain/Learning Rate": 3.645309029320763e-05, "Pretrain/Loss": 2.0166914463043213, "Pretrain/Loss (Raw)": 2.0603652000427246, "Pretrain/Step": 7020, "Pretrain/Step Time": 8.49019137583673} +{"Pretrain/Learning Rate": 3.6449316648880154e-05, "Pretrain/Loss": 2.018984079360962, "Pretrain/Loss (Raw)": 2.363572835922241, "Pretrain/Step": 7021, "Pretrain/Step Time": 8.495131688192487} +{"Pretrain/Learning Rate": 3.644554267441971e-05, "Pretrain/Loss": 2.020908832550049, "Pretrain/Loss (Raw)": 2.126366138458252, "Pretrain/Step": 7022, "Pretrain/Step Time": 8.499907182529569} +{"Pretrain/Learning Rate": 3.644176836993511e-05, "Pretrain/Loss": 2.0231142044067383, "Pretrain/Loss (Raw)": 2.0533299446105957, "Pretrain/Step": 7023, "Pretrain/Step Time": 8.496588418260217} +{"Pretrain/Learning Rate": 3.643799373553518e-05, "Pretrain/Loss": 2.022956371307373, "Pretrain/Loss (Raw)": 2.058922529220581, "Pretrain/Step": 7024, "Pretrain/Step Time": 8.493278270587325} +{"Pretrain/Learning Rate": 3.643421877132877e-05, "Pretrain/Loss": 2.027021884918213, "Pretrain/Loss (Raw)": 2.244291305541992, "Pretrain/Step": 7025, "Pretrain/Step Time": 8.489614609628916} +{"Pretrain/Learning Rate": 3.6430443477424714e-05, "Pretrain/Loss": 2.030019998550415, "Pretrain/Loss (Raw)": 2.323621988296509, "Pretrain/Step": 7026, "Pretrain/Step Time": 8.487270060926676} +{"Pretrain/Learning Rate": 3.6426667853931886e-05, "Pretrain/Loss": 2.030782699584961, "Pretrain/Loss (Raw)": 2.2046737670898438, "Pretrain/Step": 7027, "Pretrain/Step Time": 8.487097632139921} +{"Pretrain/Learning Rate": 3.6422891900959146e-05, "Pretrain/Loss": 2.0309371948242188, "Pretrain/Loss (Raw)": 2.035991907119751, "Pretrain/Step": 7028, "Pretrain/Step Time": 8.49033404700458} +{"Pretrain/Learning Rate": 3.641911561861536e-05, "Pretrain/Loss": 2.0322625637054443, "Pretrain/Loss (Raw)": 2.0570411682128906, "Pretrain/Step": 7029, "Pretrain/Step Time": 8.489492487162352} +{"Pretrain/Learning Rate": 3.641533900700944e-05, "Pretrain/Loss": 2.03149676322937, "Pretrain/Loss (Raw)": 1.8615156412124634, "Pretrain/Step": 7030, "Pretrain/Step Time": 8.49317391961813} +{"Pretrain/Learning Rate": 3.641156206625025e-05, "Pretrain/Loss": 2.0319323539733887, "Pretrain/Loss (Raw)": 2.1360933780670166, "Pretrain/Step": 7031, "Pretrain/Step Time": 8.49381204508245} +{"Pretrain/Learning Rate": 3.640778479644673e-05, "Pretrain/Loss": 2.033111095428467, "Pretrain/Loss (Raw)": 2.2436740398406982, "Pretrain/Step": 7032, "Pretrain/Step Time": 8.49429482780397} +{"Pretrain/Learning Rate": 3.640400719770777e-05, "Pretrain/Loss": 2.034482955932617, "Pretrain/Loss (Raw)": 1.977595329284668, "Pretrain/Step": 7033, "Pretrain/Step Time": 8.497596116736531} +{"Pretrain/Learning Rate": 3.64002292701423e-05, "Pretrain/Loss": 2.0331473350524902, "Pretrain/Loss (Raw)": 1.875480055809021, "Pretrain/Step": 7034, "Pretrain/Step Time": 8.499368507415056} +{"Pretrain/Learning Rate": 3.639645101385926e-05, "Pretrain/Loss": 2.033372163772583, "Pretrain/Loss (Raw)": 2.019146203994751, "Pretrain/Step": 7035, "Pretrain/Step Time": 8.495133874937892} +{"Pretrain/Learning Rate": 3.6392672428967576e-05, "Pretrain/Loss": 2.0329575538635254, "Pretrain/Loss (Raw)": 1.906308889389038, "Pretrain/Step": 7036, "Pretrain/Step Time": 8.49132445640862} +{"Pretrain/Learning Rate": 3.638889351557623e-05, "Pretrain/Loss": 2.0348410606384277, "Pretrain/Loss (Raw)": 2.2114481925964355, "Pretrain/Step": 7037, "Pretrain/Step Time": 8.496117098256946} +{"Pretrain/Learning Rate": 3.638511427379416e-05, "Pretrain/Loss": 2.036299705505371, "Pretrain/Loss (Raw)": 2.167367458343506, "Pretrain/Step": 7038, "Pretrain/Step Time": 8.494451159611344} +{"Pretrain/Learning Rate": 3.6381334703730344e-05, "Pretrain/Loss": 2.035191535949707, "Pretrain/Loss (Raw)": 1.8727364540100098, "Pretrain/Step": 7039, "Pretrain/Step Time": 8.494067251682281} +{"Pretrain/Learning Rate": 3.637755480549377e-05, "Pretrain/Loss": 2.0372531414031982, "Pretrain/Loss (Raw)": 2.181816339492798, "Pretrain/Step": 7040, "Pretrain/Step Time": 8.495702132582664} +{"Pretrain/Learning Rate": 3.637377457919342e-05, "Pretrain/Loss": 2.0356428623199463, "Pretrain/Loss (Raw)": 1.7395823001861572, "Pretrain/Step": 7041, "Pretrain/Step Time": 8.494542270898819} +{"Pretrain/Learning Rate": 3.6369994024938306e-05, "Pretrain/Loss": 2.0356087684631348, "Pretrain/Loss (Raw)": 1.9020402431488037, "Pretrain/Step": 7042, "Pretrain/Step Time": 8.485908417031169} +{"Pretrain/Learning Rate": 3.636621314283742e-05, "Pretrain/Loss": 2.0365376472473145, "Pretrain/Loss (Raw)": 2.10406756401062, "Pretrain/Step": 7043, "Pretrain/Step Time": 8.490470873191953} +{"Pretrain/Learning Rate": 3.63624319329998e-05, "Pretrain/Loss": 2.035449504852295, "Pretrain/Loss (Raw)": 2.1151227951049805, "Pretrain/Step": 7044, "Pretrain/Step Time": 8.492716830223799} +{"Pretrain/Learning Rate": 3.6358650395534454e-05, "Pretrain/Loss": 2.0376973152160645, "Pretrain/Loss (Raw)": 2.185049295425415, "Pretrain/Step": 7045, "Pretrain/Step Time": 8.493452481925488} +{"Pretrain/Learning Rate": 3.6354868530550436e-05, "Pretrain/Loss": 2.0372314453125, "Pretrain/Loss (Raw)": 2.0432913303375244, "Pretrain/Step": 7046, "Pretrain/Step Time": 8.491262670606375} +{"Pretrain/Learning Rate": 3.635108633815679e-05, "Pretrain/Loss": 2.039000988006592, "Pretrain/Loss (Raw)": 2.1154532432556152, "Pretrain/Step": 7047, "Pretrain/Step Time": 8.493084335699677} +{"Pretrain/Learning Rate": 3.634730381846257e-05, "Pretrain/Loss": 2.0390028953552246, "Pretrain/Loss (Raw)": 1.9959570169448853, "Pretrain/Step": 7048, "Pretrain/Step Time": 8.493610765784979} +{"Pretrain/Learning Rate": 3.6343520971576847e-05, "Pretrain/Loss": 2.0378026962280273, "Pretrain/Loss (Raw)": 2.0068259239196777, "Pretrain/Step": 7049, "Pretrain/Step Time": 8.499745901674032} +{"Pretrain/Learning Rate": 3.633973779760869e-05, "Pretrain/Loss": 2.036534547805786, "Pretrain/Loss (Raw)": 2.064772844314575, "Pretrain/Step": 7050, "Pretrain/Step Time": 8.494835134595633} +{"Pretrain/Learning Rate": 3.633595429666719e-05, "Pretrain/Loss": 2.037191867828369, "Pretrain/Loss (Raw)": 2.0798943042755127, "Pretrain/Step": 7051, "Pretrain/Step Time": 8.495765751227736} +{"Pretrain/Learning Rate": 3.6332170468861436e-05, "Pretrain/Loss": 2.038752555847168, "Pretrain/Loss (Raw)": 2.19834041595459, "Pretrain/Step": 7052, "Pretrain/Step Time": 8.494468634948134} +{"Pretrain/Learning Rate": 3.632838631430054e-05, "Pretrain/Loss": 2.039097785949707, "Pretrain/Loss (Raw)": 2.120525360107422, "Pretrain/Step": 7053, "Pretrain/Step Time": 8.499031180515885} +{"Pretrain/Learning Rate": 3.632460183309361e-05, "Pretrain/Loss": 2.0417261123657227, "Pretrain/Loss (Raw)": 2.1288533210754395, "Pretrain/Step": 7054, "Pretrain/Step Time": 8.491884239017963} +{"Pretrain/Learning Rate": 3.6320817025349764e-05, "Pretrain/Loss": 2.039957284927368, "Pretrain/Loss (Raw)": 2.0063629150390625, "Pretrain/Step": 7055, "Pretrain/Step Time": 8.492938904091716} +{"Pretrain/Learning Rate": 3.6317031891178146e-05, "Pretrain/Loss": 2.039578914642334, "Pretrain/Loss (Raw)": 2.0342822074890137, "Pretrain/Step": 7056, "Pretrain/Step Time": 8.493833784013987} +{"Pretrain/Learning Rate": 3.6313246430687884e-05, "Pretrain/Loss": 2.037644386291504, "Pretrain/Loss (Raw)": 1.940220594406128, "Pretrain/Step": 7057, "Pretrain/Step Time": 8.491732640191913} +{"Pretrain/Learning Rate": 3.6309460643988144e-05, "Pretrain/Loss": 2.040235996246338, "Pretrain/Loss (Raw)": 2.206040859222412, "Pretrain/Step": 7058, "Pretrain/Step Time": 8.494566217064857} +{"Pretrain/Learning Rate": 3.630567453118808e-05, "Pretrain/Loss": 2.0405325889587402, "Pretrain/Loss (Raw)": 2.0986220836639404, "Pretrain/Step": 7059, "Pretrain/Step Time": 8.48969162069261} +{"Pretrain/Learning Rate": 3.6301888092396854e-05, "Pretrain/Loss": 2.0408735275268555, "Pretrain/Loss (Raw)": 2.035813331604004, "Pretrain/Step": 7060, "Pretrain/Step Time": 8.48439434543252} +{"Pretrain/Learning Rate": 3.629810132772365e-05, "Pretrain/Loss": 2.041292190551758, "Pretrain/Loss (Raw)": 2.1007933616638184, "Pretrain/Step": 7061, "Pretrain/Step Time": 8.480368562042713} +{"Pretrain/Learning Rate": 3.6294314237277667e-05, "Pretrain/Loss": 2.039534091949463, "Pretrain/Loss (Raw)": 1.8835043907165527, "Pretrain/Step": 7062, "Pretrain/Step Time": 8.484538218006492} +{"Pretrain/Learning Rate": 3.629052682116808e-05, "Pretrain/Loss": 2.043518543243408, "Pretrain/Loss (Raw)": 2.4586315155029297, "Pretrain/Step": 7063, "Pretrain/Step Time": 8.482853196561337} +{"Pretrain/Learning Rate": 3.628673907950413e-05, "Pretrain/Loss": 2.040590763092041, "Pretrain/Loss (Raw)": 1.6177430152893066, "Pretrain/Step": 7064, "Pretrain/Step Time": 8.48557610809803} +{"Pretrain/Learning Rate": 3.628295101239501e-05, "Pretrain/Loss": 2.0415902137756348, "Pretrain/Loss (Raw)": 2.09735107421875, "Pretrain/Step": 7065, "Pretrain/Step Time": 8.4823387414217} +{"Pretrain/Learning Rate": 3.627916261994995e-05, "Pretrain/Loss": 2.044166088104248, "Pretrain/Loss (Raw)": 1.9391471147537231, "Pretrain/Step": 7066, "Pretrain/Step Time": 8.486573055386543} +{"Pretrain/Learning Rate": 3.6275373902278186e-05, "Pretrain/Loss": 2.0464224815368652, "Pretrain/Loss (Raw)": 2.481210231781006, "Pretrain/Step": 7067, "Pretrain/Step Time": 8.48082995787263} +{"Pretrain/Learning Rate": 3.627158485948896e-05, "Pretrain/Loss": 2.046463966369629, "Pretrain/Loss (Raw)": 2.041874647140503, "Pretrain/Step": 7068, "Pretrain/Step Time": 8.482090039178729} +{"Pretrain/Learning Rate": 3.6267795491691545e-05, "Pretrain/Loss": 2.046236991882324, "Pretrain/Loss (Raw)": 2.041419506072998, "Pretrain/Step": 7069, "Pretrain/Step Time": 8.478701891377568} +{"Pretrain/Learning Rate": 3.626400579899518e-05, "Pretrain/Loss": 2.049832820892334, "Pretrain/Loss (Raw)": 2.372084856033325, "Pretrain/Step": 7070, "Pretrain/Step Time": 8.481470564380288} +{"Pretrain/Learning Rate": 3.626021578150915e-05, "Pretrain/Loss": 2.0517728328704834, "Pretrain/Loss (Raw)": 2.1606459617614746, "Pretrain/Step": 7071, "Pretrain/Step Time": 8.479916706681252} +{"Pretrain/Learning Rate": 3.625642543934273e-05, "Pretrain/Loss": 2.0540599822998047, "Pretrain/Loss (Raw)": 2.2961437702178955, "Pretrain/Step": 7072, "Pretrain/Step Time": 8.484374122694135} +{"Pretrain/Learning Rate": 3.6252634772605225e-05, "Pretrain/Loss": 2.0548038482666016, "Pretrain/Loss (Raw)": 2.1925759315490723, "Pretrain/Step": 7073, "Pretrain/Step Time": 8.484751937910914} +{"Pretrain/Learning Rate": 3.624884378140593e-05, "Pretrain/Loss": 2.056506633758545, "Pretrain/Loss (Raw)": 2.268929958343506, "Pretrain/Step": 7074, "Pretrain/Step Time": 8.481502786278725} +{"Pretrain/Learning Rate": 3.624505246585416e-05, "Pretrain/Loss": 2.05781888961792, "Pretrain/Loss (Raw)": 2.141540050506592, "Pretrain/Step": 7075, "Pretrain/Step Time": 8.484370436519384} +{"Pretrain/Learning Rate": 3.624126082605922e-05, "Pretrain/Loss": 2.056825637817383, "Pretrain/Loss (Raw)": 1.9809751510620117, "Pretrain/Step": 7076, "Pretrain/Step Time": 8.482914324849844} +{"Pretrain/Learning Rate": 3.623746886213044e-05, "Pretrain/Loss": 2.053236722946167, "Pretrain/Loss (Raw)": 1.7169668674468994, "Pretrain/Step": 7077, "Pretrain/Step Time": 8.486351434141397} +{"Pretrain/Learning Rate": 3.623367657417718e-05, "Pretrain/Loss": 2.052464485168457, "Pretrain/Loss (Raw)": 1.9012130498886108, "Pretrain/Step": 7078, "Pretrain/Step Time": 8.478187814354897} +{"Pretrain/Learning Rate": 3.622988396230877e-05, "Pretrain/Loss": 2.052415370941162, "Pretrain/Loss (Raw)": 2.0147838592529297, "Pretrain/Step": 7079, "Pretrain/Step Time": 8.486613102257252} +{"Pretrain/Learning Rate": 3.6226091026634576e-05, "Pretrain/Loss": 2.0527284145355225, "Pretrain/Loss (Raw)": 2.14273738861084, "Pretrain/Step": 7080, "Pretrain/Step Time": 8.485241368412971} +{"Pretrain/Learning Rate": 3.622229776726396e-05, "Pretrain/Loss": 2.0516629219055176, "Pretrain/Loss (Raw)": 1.9043406248092651, "Pretrain/Step": 7081, "Pretrain/Step Time": 8.484227595850825} +{"Pretrain/Learning Rate": 3.6218504184306295e-05, "Pretrain/Loss": 2.051325559616089, "Pretrain/Loss (Raw)": 2.002439022064209, "Pretrain/Step": 7082, "Pretrain/Step Time": 8.481619549915195} +{"Pretrain/Learning Rate": 3.621471027787097e-05, "Pretrain/Loss": 2.0547056198120117, "Pretrain/Loss (Raw)": 2.180701732635498, "Pretrain/Step": 7083, "Pretrain/Step Time": 8.476887702941895} +{"Pretrain/Learning Rate": 3.621091604806739e-05, "Pretrain/Loss": 2.0532162189483643, "Pretrain/Loss (Raw)": 1.930531620979309, "Pretrain/Step": 7084, "Pretrain/Step Time": 8.486527053639293} +{"Pretrain/Learning Rate": 3.6207121495004935e-05, "Pretrain/Loss": 2.050675868988037, "Pretrain/Loss (Raw)": 1.762547254562378, "Pretrain/Step": 7085, "Pretrain/Step Time": 8.484556376934052} +{"Pretrain/Learning Rate": 3.6203326618793046e-05, "Pretrain/Loss": 2.05206036567688, "Pretrain/Loss (Raw)": 2.0399069786071777, "Pretrain/Step": 7086, "Pretrain/Step Time": 8.483330205082893} +{"Pretrain/Learning Rate": 3.619953141954113e-05, "Pretrain/Loss": 2.051942825317383, "Pretrain/Loss (Raw)": 1.9822943210601807, "Pretrain/Step": 7087, "Pretrain/Step Time": 8.48322725482285} +{"Pretrain/Learning Rate": 3.6195735897358616e-05, "Pretrain/Loss": 2.053995132446289, "Pretrain/Loss (Raw)": 2.1070406436920166, "Pretrain/Step": 7088, "Pretrain/Step Time": 8.488229881972075} +{"Pretrain/Learning Rate": 3.619194005235494e-05, "Pretrain/Loss": 2.0531985759735107, "Pretrain/Loss (Raw)": 1.851117730140686, "Pretrain/Step": 7089, "Pretrain/Step Time": 8.48764762096107} +{"Pretrain/Learning Rate": 3.6188143884639575e-05, "Pretrain/Loss": 2.0534939765930176, "Pretrain/Loss (Raw)": 1.933255672454834, "Pretrain/Step": 7090, "Pretrain/Step Time": 8.482065403833985} +{"Pretrain/Learning Rate": 3.618434739432197e-05, "Pretrain/Loss": 2.053907871246338, "Pretrain/Loss (Raw)": 2.214378833770752, "Pretrain/Step": 7091, "Pretrain/Step Time": 8.486128157004714} +{"Pretrain/Learning Rate": 3.6180550581511585e-05, "Pretrain/Loss": 2.0560812950134277, "Pretrain/Loss (Raw)": 2.183260917663574, "Pretrain/Step": 7092, "Pretrain/Step Time": 8.484861679375172} +{"Pretrain/Learning Rate": 3.617675344631791e-05, "Pretrain/Loss": 2.0541207790374756, "Pretrain/Loss (Raw)": 2.0531654357910156, "Pretrain/Step": 7093, "Pretrain/Step Time": 8.483420141041279} +{"Pretrain/Learning Rate": 3.6172955988850424e-05, "Pretrain/Loss": 2.052504539489746, "Pretrain/Loss (Raw)": 2.1681969165802, "Pretrain/Step": 7094, "Pretrain/Step Time": 8.48769653774798} +{"Pretrain/Learning Rate": 3.616915820921863e-05, "Pretrain/Loss": 2.051912307739258, "Pretrain/Loss (Raw)": 2.112187147140503, "Pretrain/Step": 7095, "Pretrain/Step Time": 8.484086753800511} +{"Pretrain/Learning Rate": 3.616536010753204e-05, "Pretrain/Loss": 2.0522947311401367, "Pretrain/Loss (Raw)": 2.2078640460968018, "Pretrain/Step": 7096, "Pretrain/Step Time": 8.485527919605374} +{"Pretrain/Learning Rate": 3.616156168390016e-05, "Pretrain/Loss": 2.0488829612731934, "Pretrain/Loss (Raw)": 1.7173200845718384, "Pretrain/Step": 7097, "Pretrain/Step Time": 8.489396484568715} +{"Pretrain/Learning Rate": 3.615776293843251e-05, "Pretrain/Loss": 2.0470597743988037, "Pretrain/Loss (Raw)": 1.835644245147705, "Pretrain/Step": 7098, "Pretrain/Step Time": 8.49257729947567} +{"Pretrain/Learning Rate": 3.615396387123864e-05, "Pretrain/Loss": 2.0451576709747314, "Pretrain/Loss (Raw)": 1.9963972568511963, "Pretrain/Step": 7099, "Pretrain/Step Time": 8.484583685174584} +{"Pretrain/Learning Rate": 3.6150164482428076e-05, "Pretrain/Loss": 2.04516339302063, "Pretrain/Loss (Raw)": 2.128894329071045, "Pretrain/Step": 7100, "Pretrain/Step Time": 8.48912363871932} +{"Pretrain/Learning Rate": 3.614636477211039e-05, "Pretrain/Loss": 2.04470157623291, "Pretrain/Loss (Raw)": 2.1289377212524414, "Pretrain/Step": 7101, "Pretrain/Step Time": 8.489281250163913} +{"Pretrain/Learning Rate": 3.614256474039512e-05, "Pretrain/Loss": 2.044767379760742, "Pretrain/Loss (Raw)": 2.1142075061798096, "Pretrain/Step": 7102, "Pretrain/Step Time": 8.490295542404056} +{"Pretrain/Learning Rate": 3.613876438739186e-05, "Pretrain/Loss": 2.044557571411133, "Pretrain/Loss (Raw)": 1.9385120868682861, "Pretrain/Step": 7103, "Pretrain/Step Time": 8.485157137736678} +{"Pretrain/Learning Rate": 3.613496371321018e-05, "Pretrain/Loss": 2.0448079109191895, "Pretrain/Loss (Raw)": 2.066782236099243, "Pretrain/Step": 7104, "Pretrain/Step Time": 8.486753793433309} +{"Pretrain/Learning Rate": 3.613116271795967e-05, "Pretrain/Loss": 2.0403945446014404, "Pretrain/Loss (Raw)": 1.8050220012664795, "Pretrain/Step": 7105, "Pretrain/Step Time": 8.488578768447042} +{"Pretrain/Learning Rate": 3.612736140174993e-05, "Pretrain/Loss": 2.034557819366455, "Pretrain/Loss (Raw)": 1.8379673957824707, "Pretrain/Step": 7106, "Pretrain/Step Time": 8.488303733989596} +{"Pretrain/Learning Rate": 3.612355976469057e-05, "Pretrain/Loss": 2.035473346710205, "Pretrain/Loss (Raw)": 2.063944101333618, "Pretrain/Step": 7107, "Pretrain/Step Time": 8.490599812939763} +{"Pretrain/Learning Rate": 3.6119757806891204e-05, "Pretrain/Loss": 2.035102128982544, "Pretrain/Loss (Raw)": 1.866057276725769, "Pretrain/Step": 7108, "Pretrain/Step Time": 8.49010681733489} +{"Pretrain/Learning Rate": 3.611595552846146e-05, "Pretrain/Loss": 2.034867763519287, "Pretrain/Loss (Raw)": 1.7484742403030396, "Pretrain/Step": 7109, "Pretrain/Step Time": 8.483801690861583} +{"Pretrain/Learning Rate": 3.611215292951097e-05, "Pretrain/Loss": 2.037116050720215, "Pretrain/Loss (Raw)": 2.1448614597320557, "Pretrain/Step": 7110, "Pretrain/Step Time": 8.486912000924349} +{"Pretrain/Learning Rate": 3.61083500101494e-05, "Pretrain/Loss": 2.0383124351501465, "Pretrain/Loss (Raw)": 2.1741878986358643, "Pretrain/Step": 7111, "Pretrain/Step Time": 8.490641944110394} +{"Pretrain/Learning Rate": 3.6104546770486375e-05, "Pretrain/Loss": 2.037290096282959, "Pretrain/Loss (Raw)": 2.1544089317321777, "Pretrain/Step": 7112, "Pretrain/Step Time": 8.493525998666883} +{"Pretrain/Learning Rate": 3.610074321063158e-05, "Pretrain/Loss": 2.0342698097229004, "Pretrain/Loss (Raw)": 1.9832640886306763, "Pretrain/Step": 7113, "Pretrain/Step Time": 8.492402097210288} +{"Pretrain/Learning Rate": 3.609693933069467e-05, "Pretrain/Loss": 2.0379228591918945, "Pretrain/Loss (Raw)": 2.1845791339874268, "Pretrain/Step": 7114, "Pretrain/Step Time": 8.490631978958845} +{"Pretrain/Learning Rate": 3.609313513078534e-05, "Pretrain/Loss": 2.036076068878174, "Pretrain/Loss (Raw)": 1.998920202255249, "Pretrain/Step": 7115, "Pretrain/Step Time": 8.490493409335613} +{"Pretrain/Learning Rate": 3.6089330611013284e-05, "Pretrain/Loss": 2.0325846672058105, "Pretrain/Loss (Raw)": 1.6676584482192993, "Pretrain/Step": 7116, "Pretrain/Step Time": 8.489298064261675} +{"Pretrain/Learning Rate": 3.6085525771488187e-05, "Pretrain/Loss": 2.034846305847168, "Pretrain/Loss (Raw)": 2.0803117752075195, "Pretrain/Step": 7117, "Pretrain/Step Time": 8.490846449509263} +{"Pretrain/Learning Rate": 3.608172061231978e-05, "Pretrain/Loss": 2.0353822708129883, "Pretrain/Loss (Raw)": 2.0620510578155518, "Pretrain/Step": 7118, "Pretrain/Step Time": 8.489294728264213} +{"Pretrain/Learning Rate": 3.607791513361777e-05, "Pretrain/Loss": 2.0334815979003906, "Pretrain/Loss (Raw)": 1.9911773204803467, "Pretrain/Step": 7119, "Pretrain/Step Time": 8.489020306617022} +{"Pretrain/Learning Rate": 3.607410933549188e-05, "Pretrain/Loss": 2.033766269683838, "Pretrain/Loss (Raw)": 1.9335389137268066, "Pretrain/Step": 7120, "Pretrain/Step Time": 8.487251494079828} +{"Pretrain/Learning Rate": 3.607030321805186e-05, "Pretrain/Loss": 2.033276081085205, "Pretrain/Loss (Raw)": 2.052076578140259, "Pretrain/Step": 7121, "Pretrain/Step Time": 8.487530201673508} +{"Pretrain/Learning Rate": 3.6066496781407443e-05, "Pretrain/Loss": 2.0328352451324463, "Pretrain/Loss (Raw)": 2.12026047706604, "Pretrain/Step": 7122, "Pretrain/Step Time": 8.48864029161632} +{"Pretrain/Learning Rate": 3.606269002566841e-05, "Pretrain/Loss": 2.0316720008850098, "Pretrain/Loss (Raw)": 1.8784254789352417, "Pretrain/Step": 7123, "Pretrain/Step Time": 8.488433681428432} +{"Pretrain/Learning Rate": 3.605888295094449e-05, "Pretrain/Loss": 2.0315446853637695, "Pretrain/Loss (Raw)": 1.9705002307891846, "Pretrain/Step": 7124, "Pretrain/Step Time": 8.483930237591267} +{"Pretrain/Learning Rate": 3.605507555734549e-05, "Pretrain/Loss": 2.030978202819824, "Pretrain/Loss (Raw)": 1.9895269870758057, "Pretrain/Step": 7125, "Pretrain/Step Time": 8.482923885807395} +{"Pretrain/Learning Rate": 3.6051267844981164e-05, "Pretrain/Loss": 2.030623435974121, "Pretrain/Loss (Raw)": 1.9824990034103394, "Pretrain/Step": 7126, "Pretrain/Step Time": 8.478974021971226} +{"Pretrain/Learning Rate": 3.604745981396132e-05, "Pretrain/Loss": 2.027604103088379, "Pretrain/Loss (Raw)": 1.6222304105758667, "Pretrain/Step": 7127, "Pretrain/Step Time": 8.483416268602014} +{"Pretrain/Learning Rate": 3.604365146439578e-05, "Pretrain/Loss": 2.026693105697632, "Pretrain/Loss (Raw)": 1.8577876091003418, "Pretrain/Step": 7128, "Pretrain/Step Time": 8.483034925535321} +{"Pretrain/Learning Rate": 3.6039842796394324e-05, "Pretrain/Loss": 2.028240442276001, "Pretrain/Loss (Raw)": 2.0306236743927, "Pretrain/Step": 7129, "Pretrain/Step Time": 8.484298953786492} +{"Pretrain/Learning Rate": 3.6036033810066785e-05, "Pretrain/Loss": 2.0288727283477783, "Pretrain/Loss (Raw)": 1.9361263513565063, "Pretrain/Step": 7130, "Pretrain/Step Time": 8.481288300827146} +{"Pretrain/Learning Rate": 3.603222450552299e-05, "Pretrain/Loss": 2.0277583599090576, "Pretrain/Loss (Raw)": 1.9199618101119995, "Pretrain/Step": 7131, "Pretrain/Step Time": 8.479948030784726} +{"Pretrain/Learning Rate": 3.6028414882872775e-05, "Pretrain/Loss": 2.0266265869140625, "Pretrain/Loss (Raw)": 1.8788365125656128, "Pretrain/Step": 7132, "Pretrain/Step Time": 8.48633111640811} +{"Pretrain/Learning Rate": 3.6024604942226005e-05, "Pretrain/Loss": 2.0263049602508545, "Pretrain/Loss (Raw)": 2.086272954940796, "Pretrain/Step": 7133, "Pretrain/Step Time": 8.483809933066368} +{"Pretrain/Learning Rate": 3.6020794683692506e-05, "Pretrain/Loss": 2.027679920196533, "Pretrain/Loss (Raw)": 2.0942559242248535, "Pretrain/Step": 7134, "Pretrain/Step Time": 8.487068694084883} +{"Pretrain/Learning Rate": 3.601698410738217e-05, "Pretrain/Loss": 2.0268452167510986, "Pretrain/Loss (Raw)": 2.029423236846924, "Pretrain/Step": 7135, "Pretrain/Step Time": 8.486425809562206} +{"Pretrain/Learning Rate": 3.601317321340486e-05, "Pretrain/Loss": 2.027292251586914, "Pretrain/Loss (Raw)": 2.043092727661133, "Pretrain/Step": 7136, "Pretrain/Step Time": 8.48649457655847} +{"Pretrain/Learning Rate": 3.600936200187047e-05, "Pretrain/Loss": 2.0318925380706787, "Pretrain/Loss (Raw)": 2.4043614864349365, "Pretrain/Step": 7137, "Pretrain/Step Time": 8.48516196012497} +{"Pretrain/Learning Rate": 3.600555047288888e-05, "Pretrain/Loss": 2.0338878631591797, "Pretrain/Loss (Raw)": 2.093168020248413, "Pretrain/Step": 7138, "Pretrain/Step Time": 8.485608393326402} +{"Pretrain/Learning Rate": 3.6001738626570005e-05, "Pretrain/Loss": 2.0348381996154785, "Pretrain/Loss (Raw)": 2.058772325515747, "Pretrain/Step": 7139, "Pretrain/Step Time": 8.48377831466496} +{"Pretrain/Learning Rate": 3.599792646302376e-05, "Pretrain/Loss": 2.036799430847168, "Pretrain/Loss (Raw)": 2.125011682510376, "Pretrain/Step": 7140, "Pretrain/Step Time": 8.48345229960978} +{"Pretrain/Learning Rate": 3.5994113982360044e-05, "Pretrain/Loss": 2.03861141204834, "Pretrain/Loss (Raw)": 2.231360673904419, "Pretrain/Step": 7141, "Pretrain/Step Time": 8.480117103084922} +{"Pretrain/Learning Rate": 3.599030118468881e-05, "Pretrain/Loss": 2.037442922592163, "Pretrain/Loss (Raw)": 1.8992472887039185, "Pretrain/Step": 7142, "Pretrain/Step Time": 8.480806414037943} +{"Pretrain/Learning Rate": 3.598648807011999e-05, "Pretrain/Loss": 2.0433602333068848, "Pretrain/Loss (Raw)": 2.012385606765747, "Pretrain/Step": 7143, "Pretrain/Step Time": 8.483343413099647} +{"Pretrain/Learning Rate": 3.598267463876352e-05, "Pretrain/Loss": 2.043250799179077, "Pretrain/Loss (Raw)": 2.004481077194214, "Pretrain/Step": 7144, "Pretrain/Step Time": 8.48547220788896} +{"Pretrain/Learning Rate": 3.5978860890729384e-05, "Pretrain/Loss": 2.0422134399414062, "Pretrain/Loss (Raw)": 1.9617127180099487, "Pretrain/Step": 7145, "Pretrain/Step Time": 8.486413581296802} +{"Pretrain/Learning Rate": 3.597504682612753e-05, "Pretrain/Loss": 2.043630599975586, "Pretrain/Loss (Raw)": 2.1478123664855957, "Pretrain/Step": 7146, "Pretrain/Step Time": 8.48142128251493} +{"Pretrain/Learning Rate": 3.597123244506793e-05, "Pretrain/Loss": 2.042670726776123, "Pretrain/Loss (Raw)": 1.8225690126419067, "Pretrain/Step": 7147, "Pretrain/Step Time": 8.48525132983923} +{"Pretrain/Learning Rate": 3.5967417747660584e-05, "Pretrain/Loss": 2.041811466217041, "Pretrain/Loss (Raw)": 1.9503512382507324, "Pretrain/Step": 7148, "Pretrain/Step Time": 8.482252433896065} +{"Pretrain/Learning Rate": 3.596360273401548e-05, "Pretrain/Loss": 2.037466049194336, "Pretrain/Loss (Raw)": 1.8073800802230835, "Pretrain/Step": 7149, "Pretrain/Step Time": 8.480651369318366} +{"Pretrain/Learning Rate": 3.595978740424262e-05, "Pretrain/Loss": 2.0364303588867188, "Pretrain/Loss (Raw)": 1.9937769174575806, "Pretrain/Step": 7150, "Pretrain/Step Time": 8.479234034195542} +{"Pretrain/Learning Rate": 3.595597175845201e-05, "Pretrain/Loss": 2.03489351272583, "Pretrain/Loss (Raw)": 1.8566193580627441, "Pretrain/Step": 7151, "Pretrain/Step Time": 8.483033897355199} +{"Pretrain/Learning Rate": 3.5952155796753676e-05, "Pretrain/Loss": 2.0339298248291016, "Pretrain/Loss (Raw)": 1.9355542659759521, "Pretrain/Step": 7152, "Pretrain/Step Time": 8.486416364088655} +{"Pretrain/Learning Rate": 3.594833951925766e-05, "Pretrain/Loss": 2.032895088195801, "Pretrain/Loss (Raw)": 2.1118717193603516, "Pretrain/Step": 7153, "Pretrain/Step Time": 8.483827577903867} +{"Pretrain/Learning Rate": 3.5944522926073984e-05, "Pretrain/Loss": 2.02805233001709, "Pretrain/Loss (Raw)": 1.7037231922149658, "Pretrain/Step": 7154, "Pretrain/Step Time": 8.489285480231047} +{"Pretrain/Learning Rate": 3.594070601731272e-05, "Pretrain/Loss": 2.02701473236084, "Pretrain/Loss (Raw)": 2.0718705654144287, "Pretrain/Step": 7155, "Pretrain/Step Time": 8.490062829107046} +{"Pretrain/Learning Rate": 3.593688879308389e-05, "Pretrain/Loss": 2.026613712310791, "Pretrain/Loss (Raw)": 1.9846829175949097, "Pretrain/Step": 7156, "Pretrain/Step Time": 8.488190615549684} +{"Pretrain/Learning Rate": 3.59330712534976e-05, "Pretrain/Loss": 2.0270166397094727, "Pretrain/Loss (Raw)": 2.1086266040802, "Pretrain/Step": 7157, "Pretrain/Step Time": 8.485530896112323} +{"Pretrain/Learning Rate": 3.592925339866389e-05, "Pretrain/Loss": 2.027449131011963, "Pretrain/Loss (Raw)": 1.916874885559082, "Pretrain/Step": 7158, "Pretrain/Step Time": 8.484101751819253} +{"Pretrain/Learning Rate": 3.5925435228692874e-05, "Pretrain/Loss": 2.025554656982422, "Pretrain/Loss (Raw)": 1.8935798406600952, "Pretrain/Step": 7159, "Pretrain/Step Time": 8.482978366315365} +{"Pretrain/Learning Rate": 3.592161674369464e-05, "Pretrain/Loss": 2.0254592895507812, "Pretrain/Loss (Raw)": 2.231463670730591, "Pretrain/Step": 7160, "Pretrain/Step Time": 8.482928643003106} +{"Pretrain/Learning Rate": 3.591779794377928e-05, "Pretrain/Loss": 2.025367498397827, "Pretrain/Loss (Raw)": 1.9658350944519043, "Pretrain/Step": 7161, "Pretrain/Step Time": 8.481923623010516} +{"Pretrain/Learning Rate": 3.5913978829056904e-05, "Pretrain/Loss": 2.027562379837036, "Pretrain/Loss (Raw)": 2.1564385890960693, "Pretrain/Step": 7162, "Pretrain/Step Time": 8.479755379259586} +{"Pretrain/Learning Rate": 3.591015939963764e-05, "Pretrain/Loss": 2.028491258621216, "Pretrain/Loss (Raw)": 2.1380398273468018, "Pretrain/Step": 7163, "Pretrain/Step Time": 8.48048147186637} +{"Pretrain/Learning Rate": 3.5906339655631635e-05, "Pretrain/Loss": 2.030334949493408, "Pretrain/Loss (Raw)": 2.1423110961914062, "Pretrain/Step": 7164, "Pretrain/Step Time": 8.484223922714591} +{"Pretrain/Learning Rate": 3.5902519597149015e-05, "Pretrain/Loss": 2.0290560722351074, "Pretrain/Loss (Raw)": 2.0477347373962402, "Pretrain/Step": 7165, "Pretrain/Step Time": 8.480119356885552} +{"Pretrain/Learning Rate": 3.589869922429993e-05, "Pretrain/Loss": 2.0271155834198, "Pretrain/Loss (Raw)": 1.9189969301223755, "Pretrain/Step": 7166, "Pretrain/Step Time": 8.483419880270958} +{"Pretrain/Learning Rate": 3.589487853719452e-05, "Pretrain/Loss": 2.0286264419555664, "Pretrain/Loss (Raw)": 2.066110134124756, "Pretrain/Step": 7167, "Pretrain/Step Time": 8.483604710549116} +{"Pretrain/Learning Rate": 3.589105753594298e-05, "Pretrain/Loss": 2.0285286903381348, "Pretrain/Loss (Raw)": 2.1693077087402344, "Pretrain/Step": 7168, "Pretrain/Step Time": 8.482507890090346} +{"Pretrain/Learning Rate": 3.588723622065547e-05, "Pretrain/Loss": 2.029714584350586, "Pretrain/Loss (Raw)": 1.8913675546646118, "Pretrain/Step": 7169, "Pretrain/Step Time": 8.483883682638407} +{"Pretrain/Learning Rate": 3.588341459144218e-05, "Pretrain/Loss": 2.0305380821228027, "Pretrain/Loss (Raw)": 2.0074784755706787, "Pretrain/Step": 7170, "Pretrain/Step Time": 8.481852499768138} +{"Pretrain/Learning Rate": 3.58795926484133e-05, "Pretrain/Loss": 2.0310115814208984, "Pretrain/Loss (Raw)": 2.1646718978881836, "Pretrain/Step": 7171, "Pretrain/Step Time": 8.482962960377336} +{"Pretrain/Learning Rate": 3.587577039167904e-05, "Pretrain/Loss": 2.0299439430236816, "Pretrain/Loss (Raw)": 1.9784369468688965, "Pretrain/Step": 7172, "Pretrain/Step Time": 8.476993702352047} +{"Pretrain/Learning Rate": 3.587194782134961e-05, "Pretrain/Loss": 2.032773494720459, "Pretrain/Loss (Raw)": 2.5472772121429443, "Pretrain/Step": 7173, "Pretrain/Step Time": 8.475469252094626} +{"Pretrain/Learning Rate": 3.5868124937535215e-05, "Pretrain/Loss": 2.031900405883789, "Pretrain/Loss (Raw)": 1.9315197467803955, "Pretrain/Step": 7174, "Pretrain/Step Time": 8.478067938238382} +{"Pretrain/Learning Rate": 3.586430174034611e-05, "Pretrain/Loss": 2.032017230987549, "Pretrain/Loss (Raw)": 2.130413055419922, "Pretrain/Step": 7175, "Pretrain/Step Time": 8.47581129334867} +{"Pretrain/Learning Rate": 3.586047822989253e-05, "Pretrain/Loss": 2.0378975868225098, "Pretrain/Loss (Raw)": 2.7486042976379395, "Pretrain/Step": 7176, "Pretrain/Step Time": 8.47322547622025} +{"Pretrain/Learning Rate": 3.585665440628469e-05, "Pretrain/Loss": 2.0383810997009277, "Pretrain/Loss (Raw)": 2.068727493286133, "Pretrain/Step": 7177, "Pretrain/Step Time": 8.465760888531804} +{"Pretrain/Learning Rate": 3.58528302696329e-05, "Pretrain/Loss": 2.038095474243164, "Pretrain/Loss (Raw)": 2.0282442569732666, "Pretrain/Step": 7178, "Pretrain/Step Time": 8.467789141461253} +{"Pretrain/Learning Rate": 3.584900582004739e-05, "Pretrain/Loss": 2.0376148223876953, "Pretrain/Loss (Raw)": 2.0183238983154297, "Pretrain/Step": 7179, "Pretrain/Step Time": 8.467529634013772} +{"Pretrain/Learning Rate": 3.5845181057638446e-05, "Pretrain/Loss": 2.0368411540985107, "Pretrain/Loss (Raw)": 2.099321126937866, "Pretrain/Step": 7180, "Pretrain/Step Time": 8.471112819388509} +{"Pretrain/Learning Rate": 3.584135598251636e-05, "Pretrain/Loss": 2.036367893218994, "Pretrain/Loss (Raw)": 2.059952974319458, "Pretrain/Step": 7181, "Pretrain/Step Time": 8.471240753307939} +{"Pretrain/Learning Rate": 3.58375305947914e-05, "Pretrain/Loss": 2.037501811981201, "Pretrain/Loss (Raw)": 2.2740063667297363, "Pretrain/Step": 7182, "Pretrain/Step Time": 8.468941098079085} +{"Pretrain/Learning Rate": 3.583370489457389e-05, "Pretrain/Loss": 2.0382933616638184, "Pretrain/Loss (Raw)": 2.107665777206421, "Pretrain/Step": 7183, "Pretrain/Step Time": 8.467740697786212} +{"Pretrain/Learning Rate": 3.582987888197414e-05, "Pretrain/Loss": 2.03741192817688, "Pretrain/Loss (Raw)": 1.9214587211608887, "Pretrain/Step": 7184, "Pretrain/Step Time": 8.46595580689609} +{"Pretrain/Learning Rate": 3.582605255710247e-05, "Pretrain/Loss": 2.0389404296875, "Pretrain/Loss (Raw)": 2.135887622833252, "Pretrain/Step": 7185, "Pretrain/Step Time": 8.469834513962269} +{"Pretrain/Learning Rate": 3.582222592006921e-05, "Pretrain/Loss": 2.0389552116394043, "Pretrain/Loss (Raw)": 2.207942485809326, "Pretrain/Step": 7186, "Pretrain/Step Time": 8.466747676953673} +{"Pretrain/Learning Rate": 3.581839897098468e-05, "Pretrain/Loss": 2.0365936756134033, "Pretrain/Loss (Raw)": 1.796337604522705, "Pretrain/Step": 7187, "Pretrain/Step Time": 8.469233591109514} +{"Pretrain/Learning Rate": 3.5814571709959254e-05, "Pretrain/Loss": 2.0348315238952637, "Pretrain/Loss (Raw)": 1.8102285861968994, "Pretrain/Step": 7188, "Pretrain/Step Time": 8.466444859281182} +{"Pretrain/Learning Rate": 3.581074413710327e-05, "Pretrain/Loss": 2.03393816947937, "Pretrain/Loss (Raw)": 1.9864706993103027, "Pretrain/Step": 7189, "Pretrain/Step Time": 8.46716490201652} +{"Pretrain/Learning Rate": 3.5806916252527106e-05, "Pretrain/Loss": 2.034973382949829, "Pretrain/Loss (Raw)": 2.015981674194336, "Pretrain/Step": 7190, "Pretrain/Step Time": 8.463172057643533} +{"Pretrain/Learning Rate": 3.580308805634113e-05, "Pretrain/Loss": 2.031629800796509, "Pretrain/Loss (Raw)": 2.030665874481201, "Pretrain/Step": 7191, "Pretrain/Step Time": 8.47087438032031} +{"Pretrain/Learning Rate": 3.579925954865572e-05, "Pretrain/Loss": 2.035637855529785, "Pretrain/Loss (Raw)": 2.130788803100586, "Pretrain/Step": 7192, "Pretrain/Step Time": 8.464475199580193} +{"Pretrain/Learning Rate": 3.579543072958128e-05, "Pretrain/Loss": 2.0347037315368652, "Pretrain/Loss (Raw)": 1.9777888059616089, "Pretrain/Step": 7193, "Pretrain/Step Time": 8.46473098360002} +{"Pretrain/Learning Rate": 3.5791601599228194e-05, "Pretrain/Loss": 2.035327911376953, "Pretrain/Loss (Raw)": 2.019049882888794, "Pretrain/Step": 7194, "Pretrain/Step Time": 8.460710354149342} +{"Pretrain/Learning Rate": 3.57877721577069e-05, "Pretrain/Loss": 2.0322673320770264, "Pretrain/Loss (Raw)": 2.089425802230835, "Pretrain/Step": 7195, "Pretrain/Step Time": 8.462431106716394} +{"Pretrain/Learning Rate": 3.578394240512779e-05, "Pretrain/Loss": 2.031756639480591, "Pretrain/Loss (Raw)": 1.9765150547027588, "Pretrain/Step": 7196, "Pretrain/Step Time": 8.466284373775125} +{"Pretrain/Learning Rate": 3.578011234160131e-05, "Pretrain/Loss": 2.033414602279663, "Pretrain/Loss (Raw)": 2.253641128540039, "Pretrain/Step": 7197, "Pretrain/Step Time": 8.46855022199452} +{"Pretrain/Learning Rate": 3.577628196723789e-05, "Pretrain/Loss": 2.02791690826416, "Pretrain/Loss (Raw)": 1.66836416721344, "Pretrain/Step": 7198, "Pretrain/Step Time": 8.465947499498725} +{"Pretrain/Learning Rate": 3.5772451282147965e-05, "Pretrain/Loss": 2.0274553298950195, "Pretrain/Loss (Raw)": 2.1015877723693848, "Pretrain/Step": 7199, "Pretrain/Step Time": 8.466952444985509} +{"Pretrain/Learning Rate": 3.576862028644201e-05, "Pretrain/Loss": 2.0250110626220703, "Pretrain/Loss (Raw)": 1.9832572937011719, "Pretrain/Step": 7200, "Pretrain/Step Time": 8.463738799095154} +{"Pretrain/Learning Rate": 3.576478898023048e-05, "Pretrain/Loss": 2.0243468284606934, "Pretrain/Loss (Raw)": 2.10758900642395, "Pretrain/Step": 7201, "Pretrain/Step Time": 8.466303933411837} +{"Pretrain/Learning Rate": 3.5760957363623846e-05, "Pretrain/Loss": 2.023493528366089, "Pretrain/Loss (Raw)": 2.159672975540161, "Pretrain/Step": 7202, "Pretrain/Step Time": 8.467139530926943} +{"Pretrain/Learning Rate": 3.575712543673259e-05, "Pretrain/Loss": 2.021914482116699, "Pretrain/Loss (Raw)": 1.9394580125808716, "Pretrain/Step": 7203, "Pretrain/Step Time": 8.46529072523117} +{"Pretrain/Learning Rate": 3.575329319966721e-05, "Pretrain/Loss": 2.022392511367798, "Pretrain/Loss (Raw)": 2.0421359539031982, "Pretrain/Step": 7204, "Pretrain/Step Time": 8.465640258044004} +{"Pretrain/Learning Rate": 3.57494606525382e-05, "Pretrain/Loss": 2.024742841720581, "Pretrain/Loss (Raw)": 2.0178096294403076, "Pretrain/Step": 7205, "Pretrain/Step Time": 8.46111004985869} +{"Pretrain/Learning Rate": 3.5745627795456074e-05, "Pretrain/Loss": 2.0273962020874023, "Pretrain/Loss (Raw)": 2.2408127784729004, "Pretrain/Step": 7206, "Pretrain/Step Time": 8.464840441942215} +{"Pretrain/Learning Rate": 3.574179462853134e-05, "Pretrain/Loss": 2.0276427268981934, "Pretrain/Loss (Raw)": 2.0463521480560303, "Pretrain/Step": 7207, "Pretrain/Step Time": 8.455665925517678} +{"Pretrain/Learning Rate": 3.5737961151874534e-05, "Pretrain/Loss": 2.030679225921631, "Pretrain/Loss (Raw)": 2.5314180850982666, "Pretrain/Step": 7208, "Pretrain/Step Time": 8.45849473029375} +{"Pretrain/Learning Rate": 3.573412736559618e-05, "Pretrain/Loss": 2.0313658714294434, "Pretrain/Loss (Raw)": 1.992256999015808, "Pretrain/Step": 7209, "Pretrain/Step Time": 8.462107826024294} +{"Pretrain/Learning Rate": 3.5730293269806834e-05, "Pretrain/Loss": 2.032020092010498, "Pretrain/Loss (Raw)": 2.0861456394195557, "Pretrain/Step": 7210, "Pretrain/Step Time": 8.459808768704534} +{"Pretrain/Learning Rate": 3.572645886461705e-05, "Pretrain/Loss": 2.032095432281494, "Pretrain/Loss (Raw)": 2.1903653144836426, "Pretrain/Step": 7211, "Pretrain/Step Time": 8.462513010948896} +{"Pretrain/Learning Rate": 3.5722624150137384e-05, "Pretrain/Loss": 2.033184051513672, "Pretrain/Loss (Raw)": 2.0698556900024414, "Pretrain/Step": 7212, "Pretrain/Step Time": 8.456034367904067} +{"Pretrain/Learning Rate": 3.5718789126478415e-05, "Pretrain/Loss": 2.0347445011138916, "Pretrain/Loss (Raw)": 1.962303876876831, "Pretrain/Step": 7213, "Pretrain/Step Time": 8.458996392786503} +{"Pretrain/Learning Rate": 3.57149537937507e-05, "Pretrain/Loss": 2.0365724563598633, "Pretrain/Loss (Raw)": 2.2738537788391113, "Pretrain/Step": 7214, "Pretrain/Step Time": 8.457015629857779} +{"Pretrain/Learning Rate": 3.5711118152064864e-05, "Pretrain/Loss": 2.03743839263916, "Pretrain/Loss (Raw)": 2.0931317806243896, "Pretrain/Step": 7215, "Pretrain/Step Time": 8.46174274198711} +{"Pretrain/Learning Rate": 3.5707282201531487e-05, "Pretrain/Loss": 2.037522792816162, "Pretrain/Loss (Raw)": 2.1178879737854004, "Pretrain/Step": 7216, "Pretrain/Step Time": 8.458805970847607} +{"Pretrain/Learning Rate": 3.5703445942261166e-05, "Pretrain/Loss": 2.038266181945801, "Pretrain/Loss (Raw)": 1.9462676048278809, "Pretrain/Step": 7217, "Pretrain/Step Time": 8.458909561857581} +{"Pretrain/Learning Rate": 3.569960937436453e-05, "Pretrain/Loss": 2.038696050643921, "Pretrain/Loss (Raw)": 1.9882595539093018, "Pretrain/Step": 7218, "Pretrain/Step Time": 8.461251340806484} +{"Pretrain/Learning Rate": 3.5695772497952206e-05, "Pretrain/Loss": 2.0367789268493652, "Pretrain/Loss (Raw)": 1.9689782857894897, "Pretrain/Step": 7219, "Pretrain/Step Time": 8.459681695327163} +{"Pretrain/Learning Rate": 3.569193531313482e-05, "Pretrain/Loss": 2.0364575386047363, "Pretrain/Loss (Raw)": 2.142155647277832, "Pretrain/Step": 7220, "Pretrain/Step Time": 8.45923014357686} +{"Pretrain/Learning Rate": 3.568809782002301e-05, "Pretrain/Loss": 2.0350594520568848, "Pretrain/Loss (Raw)": 1.8742129802703857, "Pretrain/Step": 7221, "Pretrain/Step Time": 8.457468576729298} +{"Pretrain/Learning Rate": 3.5684260018727435e-05, "Pretrain/Loss": 2.034503936767578, "Pretrain/Loss (Raw)": 2.0970468521118164, "Pretrain/Step": 7222, "Pretrain/Step Time": 8.458160184323788} +{"Pretrain/Learning Rate": 3.5680421909358765e-05, "Pretrain/Loss": 2.0344252586364746, "Pretrain/Loss (Raw)": 2.102140188217163, "Pretrain/Step": 7223, "Pretrain/Step Time": 8.457562677562237} +{"Pretrain/Learning Rate": 3.5676583492027646e-05, "Pretrain/Loss": 2.0333189964294434, "Pretrain/Loss (Raw)": 2.0662553310394287, "Pretrain/Step": 7224, "Pretrain/Step Time": 8.459998717531562} +{"Pretrain/Learning Rate": 3.5672744766844774e-05, "Pretrain/Loss": 2.0365147590637207, "Pretrain/Loss (Raw)": 2.126394748687744, "Pretrain/Step": 7225, "Pretrain/Step Time": 8.453685449436307} +{"Pretrain/Learning Rate": 3.5668905733920825e-05, "Pretrain/Loss": 2.039386749267578, "Pretrain/Loss (Raw)": 2.2032315731048584, "Pretrain/Step": 7226, "Pretrain/Step Time": 8.450755968689919} +{"Pretrain/Learning Rate": 3.566506639336651e-05, "Pretrain/Loss": 2.03932523727417, "Pretrain/Loss (Raw)": 1.988542079925537, "Pretrain/Step": 7227, "Pretrain/Step Time": 8.452891636639833} +{"Pretrain/Learning Rate": 3.566122674529252e-05, "Pretrain/Loss": 2.0382862091064453, "Pretrain/Loss (Raw)": 1.9959003925323486, "Pretrain/Step": 7228, "Pretrain/Step Time": 8.44704114459455} +{"Pretrain/Learning Rate": 3.5657386789809567e-05, "Pretrain/Loss": 2.035879611968994, "Pretrain/Loss (Raw)": 1.8208966255187988, "Pretrain/Step": 7229, "Pretrain/Step Time": 8.45918420702219} +{"Pretrain/Learning Rate": 3.565354652702838e-05, "Pretrain/Loss": 2.036590099334717, "Pretrain/Loss (Raw)": 2.205141067504883, "Pretrain/Step": 7230, "Pretrain/Step Time": 8.456269342452288} +{"Pretrain/Learning Rate": 3.56497059570597e-05, "Pretrain/Loss": 2.0382823944091797, "Pretrain/Loss (Raw)": 2.1551241874694824, "Pretrain/Step": 7231, "Pretrain/Step Time": 8.455377349629998} +{"Pretrain/Learning Rate": 3.564586508001424e-05, "Pretrain/Loss": 2.035794734954834, "Pretrain/Loss (Raw)": 1.7483619451522827, "Pretrain/Step": 7232, "Pretrain/Step Time": 8.45797954313457} +{"Pretrain/Learning Rate": 3.564202389600278e-05, "Pretrain/Loss": 2.036525249481201, "Pretrain/Loss (Raw)": 1.8985248804092407, "Pretrain/Step": 7233, "Pretrain/Step Time": 8.456894967705011} +{"Pretrain/Learning Rate": 3.563818240513605e-05, "Pretrain/Loss": 2.0360159873962402, "Pretrain/Loss (Raw)": 1.7727820873260498, "Pretrain/Step": 7234, "Pretrain/Step Time": 8.460950072854757} +{"Pretrain/Learning Rate": 3.563434060752484e-05, "Pretrain/Loss": 2.0350866317749023, "Pretrain/Loss (Raw)": 1.9449856281280518, "Pretrain/Step": 7235, "Pretrain/Step Time": 8.458715436980128} +{"Pretrain/Learning Rate": 3.563049850327991e-05, "Pretrain/Loss": 2.03410005569458, "Pretrain/Loss (Raw)": 1.7397961616516113, "Pretrain/Step": 7236, "Pretrain/Step Time": 8.460265269502997} +{"Pretrain/Learning Rate": 3.562665609251206e-05, "Pretrain/Loss": 2.036540985107422, "Pretrain/Loss (Raw)": 2.0609071254730225, "Pretrain/Step": 7237, "Pretrain/Step Time": 8.459524221718311} +{"Pretrain/Learning Rate": 3.5622813375332065e-05, "Pretrain/Loss": 2.035460948944092, "Pretrain/Loss (Raw)": 2.0065948963165283, "Pretrain/Step": 7238, "Pretrain/Step Time": 8.4574443846941} +{"Pretrain/Learning Rate": 3.5618970351850734e-05, "Pretrain/Loss": 2.0347657203674316, "Pretrain/Loss (Raw)": 2.085195541381836, "Pretrain/Step": 7239, "Pretrain/Step Time": 8.45278748869896} +{"Pretrain/Learning Rate": 3.561512702217888e-05, "Pretrain/Loss": 2.033492088317871, "Pretrain/Loss (Raw)": 1.9914054870605469, "Pretrain/Step": 7240, "Pretrain/Step Time": 8.447539497166872} +{"Pretrain/Learning Rate": 3.5611283386427316e-05, "Pretrain/Loss": 2.032527446746826, "Pretrain/Loss (Raw)": 1.8597962856292725, "Pretrain/Step": 7241, "Pretrain/Step Time": 8.45058393664658} +{"Pretrain/Learning Rate": 3.560743944470688e-05, "Pretrain/Loss": 2.030968189239502, "Pretrain/Loss (Raw)": 1.9849900007247925, "Pretrain/Step": 7242, "Pretrain/Step Time": 8.451561257243156} +{"Pretrain/Learning Rate": 3.560359519712841e-05, "Pretrain/Loss": 2.0299081802368164, "Pretrain/Loss (Raw)": 1.8632636070251465, "Pretrain/Step": 7243, "Pretrain/Step Time": 8.450564417988062} +{"Pretrain/Learning Rate": 3.559975064380274e-05, "Pretrain/Loss": 2.0329017639160156, "Pretrain/Loss (Raw)": 2.0508077144622803, "Pretrain/Step": 7244, "Pretrain/Step Time": 8.450784148648381} +{"Pretrain/Learning Rate": 3.559590578484074e-05, "Pretrain/Loss": 2.0329413414001465, "Pretrain/Loss (Raw)": 2.085355758666992, "Pretrain/Step": 7245, "Pretrain/Step Time": 8.451187605038285} +{"Pretrain/Learning Rate": 3.559206062035326e-05, "Pretrain/Loss": 2.033989191055298, "Pretrain/Loss (Raw)": 2.196211576461792, "Pretrain/Step": 7246, "Pretrain/Step Time": 8.453820381313562} +{"Pretrain/Learning Rate": 3.5588215150451185e-05, "Pretrain/Loss": 2.0336968898773193, "Pretrain/Loss (Raw)": 1.9537557363510132, "Pretrain/Step": 7247, "Pretrain/Step Time": 8.452574538066983} +{"Pretrain/Learning Rate": 3.558436937524539e-05, "Pretrain/Loss": 2.033169746398926, "Pretrain/Loss (Raw)": 1.8660681247711182, "Pretrain/Step": 7248, "Pretrain/Step Time": 8.45398075133562} +{"Pretrain/Learning Rate": 3.558052329484676e-05, "Pretrain/Loss": 2.033780097961426, "Pretrain/Loss (Raw)": 2.130197286605835, "Pretrain/Step": 7249, "Pretrain/Step Time": 8.451703315600753} +{"Pretrain/Learning Rate": 3.5576676909366206e-05, "Pretrain/Loss": 2.0330843925476074, "Pretrain/Loss (Raw)": 2.031214952468872, "Pretrain/Step": 7250, "Pretrain/Step Time": 8.452455596998334} +{"Pretrain/Learning Rate": 3.557283021891462e-05, "Pretrain/Loss": 2.0328898429870605, "Pretrain/Loss (Raw)": 1.853532314300537, "Pretrain/Step": 7251, "Pretrain/Step Time": 8.44767190888524} +{"Pretrain/Learning Rate": 3.5568983223602933e-05, "Pretrain/Loss": 2.037611484527588, "Pretrain/Loss (Raw)": 2.5748660564422607, "Pretrain/Step": 7252, "Pretrain/Step Time": 8.453429985791445} +{"Pretrain/Learning Rate": 3.5565135923542064e-05, "Pretrain/Loss": 2.0390353202819824, "Pretrain/Loss (Raw)": 2.1717474460601807, "Pretrain/Step": 7253, "Pretrain/Step Time": 8.450799925252795} +{"Pretrain/Learning Rate": 3.556128831884295e-05, "Pretrain/Loss": 2.040663719177246, "Pretrain/Loss (Raw)": 2.190946340560913, "Pretrain/Step": 7254, "Pretrain/Step Time": 8.455686179921031} +{"Pretrain/Learning Rate": 3.5557440409616536e-05, "Pretrain/Loss": 2.0447440147399902, "Pretrain/Loss (Raw)": 2.1445043087005615, "Pretrain/Step": 7255, "Pretrain/Step Time": 8.451042821630836} +{"Pretrain/Learning Rate": 3.555359219597377e-05, "Pretrain/Loss": 2.047008991241455, "Pretrain/Loss (Raw)": 2.147740364074707, "Pretrain/Step": 7256, "Pretrain/Step Time": 8.448972893878818} +{"Pretrain/Learning Rate": 3.55497436780256e-05, "Pretrain/Loss": 2.0470309257507324, "Pretrain/Loss (Raw)": 2.0333967208862305, "Pretrain/Step": 7257, "Pretrain/Step Time": 8.449283061549067} +{"Pretrain/Learning Rate": 3.5545894855883023e-05, "Pretrain/Loss": 2.048224449157715, "Pretrain/Loss (Raw)": 2.08891224861145, "Pretrain/Step": 7258, "Pretrain/Step Time": 8.451914757490158} +{"Pretrain/Learning Rate": 3.554204572965699e-05, "Pretrain/Loss": 2.0488109588623047, "Pretrain/Loss (Raw)": 1.9950600862503052, "Pretrain/Step": 7259, "Pretrain/Step Time": 8.452340967953205} +{"Pretrain/Learning Rate": 3.553819629945852e-05, "Pretrain/Loss": 2.0502686500549316, "Pretrain/Loss (Raw)": 2.0653810501098633, "Pretrain/Step": 7260, "Pretrain/Step Time": 8.447498146444559} +{"Pretrain/Learning Rate": 3.553434656539857e-05, "Pretrain/Loss": 2.050534248352051, "Pretrain/Loss (Raw)": 2.1202666759490967, "Pretrain/Step": 7261, "Pretrain/Step Time": 8.447757354006171} +{"Pretrain/Learning Rate": 3.553049652758817e-05, "Pretrain/Loss": 2.0518651008605957, "Pretrain/Loss (Raw)": 2.2646126747131348, "Pretrain/Step": 7262, "Pretrain/Step Time": 8.446882106363773} +{"Pretrain/Learning Rate": 3.552664618613832e-05, "Pretrain/Loss": 2.0515575408935547, "Pretrain/Loss (Raw)": 1.9900449514389038, "Pretrain/Step": 7263, "Pretrain/Step Time": 8.447152454406023} +{"Pretrain/Learning Rate": 3.552279554116005e-05, "Pretrain/Loss": 2.051945686340332, "Pretrain/Loss (Raw)": 2.0927858352661133, "Pretrain/Step": 7264, "Pretrain/Step Time": 8.446121331304312} +{"Pretrain/Learning Rate": 3.55189445927644e-05, "Pretrain/Loss": 2.0508873462677, "Pretrain/Loss (Raw)": 2.2688839435577393, "Pretrain/Step": 7265, "Pretrain/Step Time": 8.449414420872927} +{"Pretrain/Learning Rate": 3.5515093341062386e-05, "Pretrain/Loss": 2.051114320755005, "Pretrain/Loss (Raw)": 2.1222541332244873, "Pretrain/Step": 7266, "Pretrain/Step Time": 8.454910112544894} +{"Pretrain/Learning Rate": 3.551124178616507e-05, "Pretrain/Loss": 2.05184268951416, "Pretrain/Loss (Raw)": 2.1519882678985596, "Pretrain/Step": 7267, "Pretrain/Step Time": 8.452725173905492} +{"Pretrain/Learning Rate": 3.550738992818351e-05, "Pretrain/Loss": 2.051118850708008, "Pretrain/Loss (Raw)": 2.0323643684387207, "Pretrain/Step": 7268, "Pretrain/Step Time": 8.4539736174047} +{"Pretrain/Learning Rate": 3.550353776722877e-05, "Pretrain/Loss": 2.0498740673065186, "Pretrain/Loss (Raw)": 2.07202410697937, "Pretrain/Step": 7269, "Pretrain/Step Time": 8.457326946780086} +{"Pretrain/Learning Rate": 3.5499685303411925e-05, "Pretrain/Loss": 2.0486598014831543, "Pretrain/Loss (Raw)": 1.7438395023345947, "Pretrain/Step": 7270, "Pretrain/Step Time": 8.452237727120519} +{"Pretrain/Learning Rate": 3.549583253684405e-05, "Pretrain/Loss": 2.049213409423828, "Pretrain/Loss (Raw)": 2.0832395553588867, "Pretrain/Step": 7271, "Pretrain/Step Time": 8.451680392026901} +{"Pretrain/Learning Rate": 3.5491979467636246e-05, "Pretrain/Loss": 2.049565315246582, "Pretrain/Loss (Raw)": 2.0495095252990723, "Pretrain/Step": 7272, "Pretrain/Step Time": 8.447829628363252} +{"Pretrain/Learning Rate": 3.54881260958996e-05, "Pretrain/Loss": 2.048208236694336, "Pretrain/Loss (Raw)": 1.7880134582519531, "Pretrain/Step": 7273, "Pretrain/Step Time": 8.447245510295033} +{"Pretrain/Learning Rate": 3.5484272421745245e-05, "Pretrain/Loss": 2.0478734970092773, "Pretrain/Loss (Raw)": 2.1049556732177734, "Pretrain/Step": 7274, "Pretrain/Step Time": 8.45117748901248} +{"Pretrain/Learning Rate": 3.548041844528429e-05, "Pretrain/Loss": 2.0501325130462646, "Pretrain/Loss (Raw)": 2.111733913421631, "Pretrain/Step": 7275, "Pretrain/Step Time": 8.448967603966594} +{"Pretrain/Learning Rate": 3.547656416662784e-05, "Pretrain/Loss": 2.0534274578094482, "Pretrain/Loss (Raw)": 2.3721091747283936, "Pretrain/Step": 7276, "Pretrain/Step Time": 8.452297186478972} +{"Pretrain/Learning Rate": 3.547270958588705e-05, "Pretrain/Loss": 2.05544114112854, "Pretrain/Loss (Raw)": 2.0651140213012695, "Pretrain/Step": 7277, "Pretrain/Step Time": 8.451749878004193} +{"Pretrain/Learning Rate": 3.546885470317307e-05, "Pretrain/Loss": 2.0572214126586914, "Pretrain/Loss (Raw)": 2.2216672897338867, "Pretrain/Step": 7278, "Pretrain/Step Time": 8.448070710524917} +{"Pretrain/Learning Rate": 3.546499951859705e-05, "Pretrain/Loss": 2.0593461990356445, "Pretrain/Loss (Raw)": 2.1286065578460693, "Pretrain/Step": 7279, "Pretrain/Step Time": 8.445071691647172} +{"Pretrain/Learning Rate": 3.546114403227014e-05, "Pretrain/Loss": 2.0611395835876465, "Pretrain/Loss (Raw)": 2.16508150100708, "Pretrain/Step": 7280, "Pretrain/Step Time": 8.452713062986732} +{"Pretrain/Learning Rate": 3.545728824430352e-05, "Pretrain/Loss": 2.0606560707092285, "Pretrain/Loss (Raw)": 2.0499625205993652, "Pretrain/Step": 7281, "Pretrain/Step Time": 8.454781690612435} +{"Pretrain/Learning Rate": 3.545343215480836e-05, "Pretrain/Loss": 2.0636277198791504, "Pretrain/Loss (Raw)": 2.0841007232666016, "Pretrain/Step": 7282, "Pretrain/Step Time": 8.450294034555554} +{"Pretrain/Learning Rate": 3.5449575763895856e-05, "Pretrain/Loss": 2.0647501945495605, "Pretrain/Loss (Raw)": 2.2155873775482178, "Pretrain/Step": 7283, "Pretrain/Step Time": 8.45217046700418} +{"Pretrain/Learning Rate": 3.54457190716772e-05, "Pretrain/Loss": 2.065398931503296, "Pretrain/Loss (Raw)": 2.067697763442993, "Pretrain/Step": 7284, "Pretrain/Step Time": 8.450223112478852} +{"Pretrain/Learning Rate": 3.544186207826359e-05, "Pretrain/Loss": 2.0663912296295166, "Pretrain/Loss (Raw)": 2.235645294189453, "Pretrain/Step": 7285, "Pretrain/Step Time": 8.453274993225932} +{"Pretrain/Learning Rate": 3.5438004783766253e-05, "Pretrain/Loss": 2.069821834564209, "Pretrain/Loss (Raw)": 2.3559792041778564, "Pretrain/Step": 7286, "Pretrain/Step Time": 8.454014278948307} +{"Pretrain/Learning Rate": 3.5434147188296416e-05, "Pretrain/Loss": 2.0694899559020996, "Pretrain/Loss (Raw)": 1.8510979413986206, "Pretrain/Step": 7287, "Pretrain/Step Time": 8.455876033753157} +{"Pretrain/Learning Rate": 3.543028929196529e-05, "Pretrain/Loss": 2.068647861480713, "Pretrain/Loss (Raw)": 2.1237151622772217, "Pretrain/Step": 7288, "Pretrain/Step Time": 8.458687020465732} +{"Pretrain/Learning Rate": 3.5426431094884124e-05, "Pretrain/Loss": 2.0678329467773438, "Pretrain/Loss (Raw)": 1.8614721298217773, "Pretrain/Step": 7289, "Pretrain/Step Time": 8.453848162665963} +{"Pretrain/Learning Rate": 3.5422572597164176e-05, "Pretrain/Loss": 2.0667576789855957, "Pretrain/Loss (Raw)": 2.0188140869140625, "Pretrain/Step": 7290, "Pretrain/Step Time": 8.449499009177089} +{"Pretrain/Learning Rate": 3.5418713798916694e-05, "Pretrain/Loss": 2.0671119689941406, "Pretrain/Loss (Raw)": 2.183405876159668, "Pretrain/Step": 7291, "Pretrain/Step Time": 8.451781444251537} +{"Pretrain/Learning Rate": 3.5414854700252945e-05, "Pretrain/Loss": 2.065530300140381, "Pretrain/Loss (Raw)": 1.939855694770813, "Pretrain/Step": 7292, "Pretrain/Step Time": 8.449686128646135} +{"Pretrain/Learning Rate": 3.5410995301284195e-05, "Pretrain/Loss": 2.0657896995544434, "Pretrain/Loss (Raw)": 2.080923318862915, "Pretrain/Step": 7293, "Pretrain/Step Time": 8.450364632532} +{"Pretrain/Learning Rate": 3.540713560212173e-05, "Pretrain/Loss": 2.0662894248962402, "Pretrain/Loss (Raw)": 1.9829856157302856, "Pretrain/Step": 7294, "Pretrain/Step Time": 8.445891903713346} +{"Pretrain/Learning Rate": 3.5403275602876864e-05, "Pretrain/Loss": 2.0670721530914307, "Pretrain/Loss (Raw)": 2.166282892227173, "Pretrain/Step": 7295, "Pretrain/Step Time": 8.449972171336412} +{"Pretrain/Learning Rate": 3.5399415303660864e-05, "Pretrain/Loss": 2.0628952980041504, "Pretrain/Loss (Raw)": 1.634695291519165, "Pretrain/Step": 7296, "Pretrain/Step Time": 8.44893417134881} +{"Pretrain/Learning Rate": 3.539555470458506e-05, "Pretrain/Loss": 2.064608097076416, "Pretrain/Loss (Raw)": 2.1105856895446777, "Pretrain/Step": 7297, "Pretrain/Step Time": 8.447534209117293} +{"Pretrain/Learning Rate": 3.5391693805760775e-05, "Pretrain/Loss": 2.0662198066711426, "Pretrain/Loss (Raw)": 2.2137553691864014, "Pretrain/Step": 7298, "Pretrain/Step Time": 8.45094077475369} +{"Pretrain/Learning Rate": 3.538783260729931e-05, "Pretrain/Loss": 2.0654489994049072, "Pretrain/Loss (Raw)": 2.066023588180542, "Pretrain/Step": 7299, "Pretrain/Step Time": 8.448343776166439} +{"Pretrain/Learning Rate": 3.538397110931202e-05, "Pretrain/Loss": 2.0666558742523193, "Pretrain/Loss (Raw)": 2.132920980453491, "Pretrain/Step": 7300, "Pretrain/Step Time": 8.450437502935529} +{"Pretrain/Learning Rate": 3.538010931191024e-05, "Pretrain/Loss": 2.0635290145874023, "Pretrain/Loss (Raw)": 2.147038459777832, "Pretrain/Step": 7301, "Pretrain/Step Time": 8.44766472838819} +{"Pretrain/Learning Rate": 3.537624721520534e-05, "Pretrain/Loss": 2.063681125640869, "Pretrain/Loss (Raw)": 1.95098876953125, "Pretrain/Step": 7302, "Pretrain/Step Time": 8.451436035335064} +{"Pretrain/Learning Rate": 3.5372384819308654e-05, "Pretrain/Loss": 2.063870429992676, "Pretrain/Loss (Raw)": 2.154618501663208, "Pretrain/Step": 7303, "Pretrain/Step Time": 8.450165800750256} +{"Pretrain/Learning Rate": 3.536852212433156e-05, "Pretrain/Loss": 2.058239459991455, "Pretrain/Loss (Raw)": 2.0278737545013428, "Pretrain/Step": 7304, "Pretrain/Step Time": 8.453329876065254} +{"Pretrain/Learning Rate": 3.536465913038545e-05, "Pretrain/Loss": 2.057581901550293, "Pretrain/Loss (Raw)": 1.9845402240753174, "Pretrain/Step": 7305, "Pretrain/Step Time": 8.456196840852499} +{"Pretrain/Learning Rate": 3.536079583758169e-05, "Pretrain/Loss": 2.056881904602051, "Pretrain/Loss (Raw)": 1.9386695623397827, "Pretrain/Step": 7306, "Pretrain/Step Time": 8.454395718872547} +{"Pretrain/Learning Rate": 3.535693224603169e-05, "Pretrain/Loss": 2.057466506958008, "Pretrain/Loss (Raw)": 2.0931220054626465, "Pretrain/Step": 7307, "Pretrain/Step Time": 8.458697889000177} +{"Pretrain/Learning Rate": 3.535306835584686e-05, "Pretrain/Loss": 2.0581247806549072, "Pretrain/Loss (Raw)": 2.1835949420928955, "Pretrain/Step": 7308, "Pretrain/Step Time": 8.456221379339695} +{"Pretrain/Learning Rate": 3.534920416713859e-05, "Pretrain/Loss": 2.060349941253662, "Pretrain/Loss (Raw)": 2.344783067703247, "Pretrain/Step": 7309, "Pretrain/Step Time": 8.454417757689953} +{"Pretrain/Learning Rate": 3.534533968001832e-05, "Pretrain/Loss": 2.0576391220092773, "Pretrain/Loss (Raw)": 1.9270224571228027, "Pretrain/Step": 7310, "Pretrain/Step Time": 8.453604204580188} +{"Pretrain/Learning Rate": 3.534147489459746e-05, "Pretrain/Loss": 2.058833122253418, "Pretrain/Loss (Raw)": 2.260493755340576, "Pretrain/Step": 7311, "Pretrain/Step Time": 8.456267546862364} +{"Pretrain/Learning Rate": 3.533760981098748e-05, "Pretrain/Loss": 2.058481216430664, "Pretrain/Loss (Raw)": 1.8764090538024902, "Pretrain/Step": 7312, "Pretrain/Step Time": 8.459243616089225} +{"Pretrain/Learning Rate": 3.53337444292998e-05, "Pretrain/Loss": 2.0611915588378906, "Pretrain/Loss (Raw)": 2.482797145843506, "Pretrain/Step": 7313, "Pretrain/Step Time": 8.456847012043} +{"Pretrain/Learning Rate": 3.5329878749645885e-05, "Pretrain/Loss": 2.058546781539917, "Pretrain/Loss (Raw)": 1.8694339990615845, "Pretrain/Step": 7314, "Pretrain/Step Time": 8.463635377585888} +{"Pretrain/Learning Rate": 3.53260127721372e-05, "Pretrain/Loss": 2.0597615242004395, "Pretrain/Loss (Raw)": 1.9518295526504517, "Pretrain/Step": 7315, "Pretrain/Step Time": 8.465468984097242} +{"Pretrain/Learning Rate": 3.532214649688521e-05, "Pretrain/Loss": 2.059189796447754, "Pretrain/Loss (Raw)": 1.7370175123214722, "Pretrain/Step": 7316, "Pretrain/Step Time": 8.466684065759182} +{"Pretrain/Learning Rate": 3.531827992400141e-05, "Pretrain/Loss": 2.059140205383301, "Pretrain/Loss (Raw)": 1.9801372289657593, "Pretrain/Step": 7317, "Pretrain/Step Time": 8.465661657974124} +{"Pretrain/Learning Rate": 3.531441305359728e-05, "Pretrain/Loss": 2.05954647064209, "Pretrain/Loss (Raw)": 2.0679852962493896, "Pretrain/Step": 7318, "Pretrain/Step Time": 8.469997957348824} +{"Pretrain/Learning Rate": 3.531054588578432e-05, "Pretrain/Loss": 2.059730052947998, "Pretrain/Loss (Raw)": 2.054176092147827, "Pretrain/Step": 7319, "Pretrain/Step Time": 8.46434379182756} +{"Pretrain/Learning Rate": 3.530667842067404e-05, "Pretrain/Loss": 2.059230327606201, "Pretrain/Loss (Raw)": 2.0668087005615234, "Pretrain/Step": 7320, "Pretrain/Step Time": 8.46840226277709} +{"Pretrain/Learning Rate": 3.530281065837795e-05, "Pretrain/Loss": 2.0594372749328613, "Pretrain/Loss (Raw)": 2.0042645931243896, "Pretrain/Step": 7321, "Pretrain/Step Time": 8.467313077300787} +{"Pretrain/Learning Rate": 3.529894259900758e-05, "Pretrain/Loss": 2.0593924522399902, "Pretrain/Loss (Raw)": 2.0133213996887207, "Pretrain/Step": 7322, "Pretrain/Step Time": 8.467222336679697} +{"Pretrain/Learning Rate": 3.529507424267446e-05, "Pretrain/Loss": 2.0585060119628906, "Pretrain/Loss (Raw)": 1.975999116897583, "Pretrain/Step": 7323, "Pretrain/Step Time": 8.464641284197569} +{"Pretrain/Learning Rate": 3.529120558949014e-05, "Pretrain/Loss": 2.059823989868164, "Pretrain/Loss (Raw)": 2.1452202796936035, "Pretrain/Step": 7324, "Pretrain/Step Time": 8.466101663187146} +{"Pretrain/Learning Rate": 3.528733663956615e-05, "Pretrain/Loss": 2.0582759380340576, "Pretrain/Loss (Raw)": 2.0554792881011963, "Pretrain/Step": 7325, "Pretrain/Step Time": 8.463764457032084} +{"Pretrain/Learning Rate": 3.5283467393014057e-05, "Pretrain/Loss": 2.0610361099243164, "Pretrain/Loss (Raw)": 2.0216593742370605, "Pretrain/Step": 7326, "Pretrain/Step Time": 8.46523160673678} +{"Pretrain/Learning Rate": 3.527959784994544e-05, "Pretrain/Loss": 2.0605647563934326, "Pretrain/Loss (Raw)": 2.041240930557251, "Pretrain/Step": 7327, "Pretrain/Step Time": 8.46281012520194} +{"Pretrain/Learning Rate": 3.527572801047186e-05, "Pretrain/Loss": 2.0597758293151855, "Pretrain/Loss (Raw)": 1.8823118209838867, "Pretrain/Step": 7328, "Pretrain/Step Time": 8.463039902970195} +{"Pretrain/Learning Rate": 3.5271857874704917e-05, "Pretrain/Loss": 2.0589098930358887, "Pretrain/Loss (Raw)": 1.9967137575149536, "Pretrain/Step": 7329, "Pretrain/Step Time": 8.467819640412927} +{"Pretrain/Learning Rate": 3.526798744275618e-05, "Pretrain/Loss": 2.0578980445861816, "Pretrain/Loss (Raw)": 2.030174493789673, "Pretrain/Step": 7330, "Pretrain/Step Time": 8.465883580967784} +{"Pretrain/Learning Rate": 3.5264116714737274e-05, "Pretrain/Loss": 2.0578064918518066, "Pretrain/Loss (Raw)": 1.9277170896530151, "Pretrain/Step": 7331, "Pretrain/Step Time": 8.470327975228429} +{"Pretrain/Learning Rate": 3.526024569075979e-05, "Pretrain/Loss": 2.0581061840057373, "Pretrain/Loss (Raw)": 2.080510377883911, "Pretrain/Step": 7332, "Pretrain/Step Time": 8.471505671739578} +{"Pretrain/Learning Rate": 3.525637437093536e-05, "Pretrain/Loss": 2.059408664703369, "Pretrain/Loss (Raw)": 2.184535026550293, "Pretrain/Step": 7333, "Pretrain/Step Time": 8.469585966318846} +{"Pretrain/Learning Rate": 3.525250275537561e-05, "Pretrain/Loss": 2.0572965145111084, "Pretrain/Loss (Raw)": 1.9704570770263672, "Pretrain/Step": 7334, "Pretrain/Step Time": 8.470708465203643} +{"Pretrain/Learning Rate": 3.524863084419216e-05, "Pretrain/Loss": 2.055964946746826, "Pretrain/Loss (Raw)": 1.8758889436721802, "Pretrain/Step": 7335, "Pretrain/Step Time": 8.47215137258172} +{"Pretrain/Learning Rate": 3.5244758637496664e-05, "Pretrain/Loss": 2.052304744720459, "Pretrain/Loss (Raw)": 2.062950849533081, "Pretrain/Step": 7336, "Pretrain/Step Time": 8.471703892573714} +{"Pretrain/Learning Rate": 3.524088613540078e-05, "Pretrain/Loss": 2.0515499114990234, "Pretrain/Loss (Raw)": 1.895628571510315, "Pretrain/Step": 7337, "Pretrain/Step Time": 8.47033534385264} +{"Pretrain/Learning Rate": 3.523701333801616e-05, "Pretrain/Loss": 2.0514190196990967, "Pretrain/Loss (Raw)": 2.0693790912628174, "Pretrain/Step": 7338, "Pretrain/Step Time": 8.472758673131466} +{"Pretrain/Learning Rate": 3.523314024545449e-05, "Pretrain/Loss": 2.0503835678100586, "Pretrain/Loss (Raw)": 2.057840585708618, "Pretrain/Step": 7339, "Pretrain/Step Time": 8.471660740673542} +{"Pretrain/Learning Rate": 3.522926685782742e-05, "Pretrain/Loss": 2.049874782562256, "Pretrain/Loss (Raw)": 2.0047178268432617, "Pretrain/Step": 7340, "Pretrain/Step Time": 8.472005315124989} +{"Pretrain/Learning Rate": 3.5225393175246655e-05, "Pretrain/Loss": 2.050273895263672, "Pretrain/Loss (Raw)": 2.0134024620056152, "Pretrain/Step": 7341, "Pretrain/Step Time": 8.47352153249085} +{"Pretrain/Learning Rate": 3.522151919782389e-05, "Pretrain/Loss": 2.0475914478302, "Pretrain/Loss (Raw)": 1.9304932355880737, "Pretrain/Step": 7342, "Pretrain/Step Time": 8.475887956097722} +{"Pretrain/Learning Rate": 3.5217644925670815e-05, "Pretrain/Loss": 2.0476956367492676, "Pretrain/Loss (Raw)": 2.1064817905426025, "Pretrain/Step": 7343, "Pretrain/Step Time": 8.467964654788375} +{"Pretrain/Learning Rate": 3.521377035889916e-05, "Pretrain/Loss": 2.0449728965759277, "Pretrain/Loss (Raw)": 1.769361138343811, "Pretrain/Step": 7344, "Pretrain/Step Time": 8.468203347176313} +{"Pretrain/Learning Rate": 3.520989549762064e-05, "Pretrain/Loss": 2.0458765029907227, "Pretrain/Loss (Raw)": 2.0619444847106934, "Pretrain/Step": 7345, "Pretrain/Step Time": 8.471677489578724} +{"Pretrain/Learning Rate": 3.520602034194698e-05, "Pretrain/Loss": 2.0457992553710938, "Pretrain/Loss (Raw)": 1.9783207178115845, "Pretrain/Step": 7346, "Pretrain/Step Time": 8.469822699204087} +{"Pretrain/Learning Rate": 3.5202144891989905e-05, "Pretrain/Loss": 2.045034170150757, "Pretrain/Loss (Raw)": 1.8710838556289673, "Pretrain/Step": 7347, "Pretrain/Step Time": 8.4702044185251} +{"Pretrain/Learning Rate": 3.519826914786118e-05, "Pretrain/Loss": 2.0460965633392334, "Pretrain/Loss (Raw)": 2.2781314849853516, "Pretrain/Step": 7348, "Pretrain/Step Time": 8.469924727454782} +{"Pretrain/Learning Rate": 3.519439310967256e-05, "Pretrain/Loss": 2.047553777694702, "Pretrain/Loss (Raw)": 2.0607705116271973, "Pretrain/Step": 7349, "Pretrain/Step Time": 8.470495605841279} +{"Pretrain/Learning Rate": 3.51905167775358e-05, "Pretrain/Loss": 2.0455386638641357, "Pretrain/Loss (Raw)": 1.8390823602676392, "Pretrain/Step": 7350, "Pretrain/Step Time": 8.467573828995228} +{"Pretrain/Learning Rate": 3.518664015156267e-05, "Pretrain/Loss": 2.0451483726501465, "Pretrain/Loss (Raw)": 2.052184820175171, "Pretrain/Step": 7351, "Pretrain/Step Time": 8.468556018546224} +{"Pretrain/Learning Rate": 3.518276323186496e-05, "Pretrain/Loss": 2.0450825691223145, "Pretrain/Loss (Raw)": 2.057831048965454, "Pretrain/Step": 7352, "Pretrain/Step Time": 8.470005437731743} +{"Pretrain/Learning Rate": 3.517888601855444e-05, "Pretrain/Loss": 2.0447425842285156, "Pretrain/Loss (Raw)": 2.082876443862915, "Pretrain/Step": 7353, "Pretrain/Step Time": 8.471244363114238} +{"Pretrain/Learning Rate": 3.517500851174292e-05, "Pretrain/Loss": 2.0437800884246826, "Pretrain/Loss (Raw)": 2.0800278186798096, "Pretrain/Step": 7354, "Pretrain/Step Time": 8.470842001959682} +{"Pretrain/Learning Rate": 3.51711307115422e-05, "Pretrain/Loss": 2.044343948364258, "Pretrain/Loss (Raw)": 2.0607171058654785, "Pretrain/Step": 7355, "Pretrain/Step Time": 8.474253779277205} +{"Pretrain/Learning Rate": 3.5167252618064105e-05, "Pretrain/Loss": 2.043038845062256, "Pretrain/Loss (Raw)": 1.8288432359695435, "Pretrain/Step": 7356, "Pretrain/Step Time": 8.477242354303598} +{"Pretrain/Learning Rate": 3.5163374231420445e-05, "Pretrain/Loss": 2.044437885284424, "Pretrain/Loss (Raw)": 1.9999850988388062, "Pretrain/Step": 7357, "Pretrain/Step Time": 8.464962905272841} +{"Pretrain/Learning Rate": 3.515949555172305e-05, "Pretrain/Loss": 2.043301820755005, "Pretrain/Loss (Raw)": 2.0597307682037354, "Pretrain/Step": 7358, "Pretrain/Step Time": 8.469802716746926} +{"Pretrain/Learning Rate": 3.515561657908376e-05, "Pretrain/Loss": 2.04192852973938, "Pretrain/Loss (Raw)": 1.9793243408203125, "Pretrain/Step": 7359, "Pretrain/Step Time": 8.47187028080225} +{"Pretrain/Learning Rate": 3.5151737313614435e-05, "Pretrain/Loss": 2.0427703857421875, "Pretrain/Loss (Raw)": 1.8561121225357056, "Pretrain/Step": 7360, "Pretrain/Step Time": 8.46502335369587} +{"Pretrain/Learning Rate": 3.5147857755426915e-05, "Pretrain/Loss": 2.042834997177124, "Pretrain/Loss (Raw)": 1.9068224430084229, "Pretrain/Step": 7361, "Pretrain/Step Time": 8.470398912206292} +{"Pretrain/Learning Rate": 3.514397790463307e-05, "Pretrain/Loss": 2.0474765300750732, "Pretrain/Loss (Raw)": 2.366858959197998, "Pretrain/Step": 7362, "Pretrain/Step Time": 8.465391632169485} +{"Pretrain/Learning Rate": 3.5140097761344774e-05, "Pretrain/Loss": 2.048950433731079, "Pretrain/Loss (Raw)": 2.1336669921875, "Pretrain/Step": 7363, "Pretrain/Step Time": 8.463784515857697} +{"Pretrain/Learning Rate": 3.5136217325673906e-05, "Pretrain/Loss": 2.0509207248687744, "Pretrain/Loss (Raw)": 1.991985559463501, "Pretrain/Step": 7364, "Pretrain/Step Time": 8.463373582810163} +{"Pretrain/Learning Rate": 3.513233659773236e-05, "Pretrain/Loss": 2.050384759902954, "Pretrain/Loss (Raw)": 1.9923248291015625, "Pretrain/Step": 7365, "Pretrain/Step Time": 8.465780204162002} +{"Pretrain/Learning Rate": 3.5128455577632036e-05, "Pretrain/Loss": 2.0511090755462646, "Pretrain/Loss (Raw)": 2.099278688430786, "Pretrain/Step": 7366, "Pretrain/Step Time": 8.465588128194213} +{"Pretrain/Learning Rate": 3.5124574265484826e-05, "Pretrain/Loss": 2.052107810974121, "Pretrain/Loss (Raw)": 2.2130537033081055, "Pretrain/Step": 7367, "Pretrain/Step Time": 8.46572301350534} +{"Pretrain/Learning Rate": 3.512069266140266e-05, "Pretrain/Loss": 2.051069736480713, "Pretrain/Loss (Raw)": 1.858535885810852, "Pretrain/Step": 7368, "Pretrain/Step Time": 8.466743126511574} +{"Pretrain/Learning Rate": 3.511681076549745e-05, "Pretrain/Loss": 2.0501391887664795, "Pretrain/Loss (Raw)": 1.7406706809997559, "Pretrain/Step": 7369, "Pretrain/Step Time": 8.467242240905762} +{"Pretrain/Learning Rate": 3.511292857788113e-05, "Pretrain/Loss": 2.0512804985046387, "Pretrain/Loss (Raw)": 2.1310579776763916, "Pretrain/Step": 7370, "Pretrain/Step Time": 8.47037166543305} +{"Pretrain/Learning Rate": 3.510904609866566e-05, "Pretrain/Loss": 2.0526270866394043, "Pretrain/Loss (Raw)": 2.0356485843658447, "Pretrain/Step": 7371, "Pretrain/Step Time": 8.469042129814625} +{"Pretrain/Learning Rate": 3.510516332796296e-05, "Pretrain/Loss": 2.053215503692627, "Pretrain/Loss (Raw)": 2.1261308193206787, "Pretrain/Step": 7372, "Pretrain/Step Time": 8.469451991841197} +{"Pretrain/Learning Rate": 3.5101280265885e-05, "Pretrain/Loss": 2.052907943725586, "Pretrain/Loss (Raw)": 2.0459835529327393, "Pretrain/Step": 7373, "Pretrain/Step Time": 8.467358296737075} +{"Pretrain/Learning Rate": 3.5097396912543745e-05, "Pretrain/Loss": 2.051513671875, "Pretrain/Loss (Raw)": 2.0177388191223145, "Pretrain/Step": 7374, "Pretrain/Step Time": 8.465376827865839} +{"Pretrain/Learning Rate": 3.509351326805117e-05, "Pretrain/Loss": 2.051267147064209, "Pretrain/Loss (Raw)": 1.9222084283828735, "Pretrain/Step": 7375, "Pretrain/Step Time": 8.469800617545843} +{"Pretrain/Learning Rate": 3.508962933251926e-05, "Pretrain/Loss": 2.0533742904663086, "Pretrain/Loss (Raw)": 2.135776996612549, "Pretrain/Step": 7376, "Pretrain/Step Time": 8.468576239421964} +{"Pretrain/Learning Rate": 3.508574510605999e-05, "Pretrain/Loss": 2.052276134490967, "Pretrain/Loss (Raw)": 1.9896318912506104, "Pretrain/Step": 7377, "Pretrain/Step Time": 8.47001437842846} +{"Pretrain/Learning Rate": 3.508186058878537e-05, "Pretrain/Loss": 2.0523900985717773, "Pretrain/Loss (Raw)": 2.045793294906616, "Pretrain/Step": 7378, "Pretrain/Step Time": 8.468821259215474} +{"Pretrain/Learning Rate": 3.5077975780807416e-05, "Pretrain/Loss": 2.052380084991455, "Pretrain/Loss (Raw)": 1.8522502183914185, "Pretrain/Step": 7379, "Pretrain/Step Time": 8.4734728038311} +{"Pretrain/Learning Rate": 3.507409068223813e-05, "Pretrain/Loss": 2.0480706691741943, "Pretrain/Loss (Raw)": 2.0232748985290527, "Pretrain/Step": 7380, "Pretrain/Step Time": 8.468085039407015} +{"Pretrain/Learning Rate": 3.507020529318954e-05, "Pretrain/Loss": 2.0478649139404297, "Pretrain/Loss (Raw)": 2.1454050540924072, "Pretrain/Step": 7381, "Pretrain/Step Time": 8.473991300910711} +{"Pretrain/Learning Rate": 3.506631961377369e-05, "Pretrain/Loss": 2.0436794757843018, "Pretrain/Loss (Raw)": 1.6552289724349976, "Pretrain/Step": 7382, "Pretrain/Step Time": 8.472158044576645} +{"Pretrain/Learning Rate": 3.50624336441026e-05, "Pretrain/Loss": 2.0417888164520264, "Pretrain/Loss (Raw)": 1.9024906158447266, "Pretrain/Step": 7383, "Pretrain/Step Time": 8.47768484055996} +{"Pretrain/Learning Rate": 3.505854738428833e-05, "Pretrain/Loss": 2.0397682189941406, "Pretrain/Loss (Raw)": 1.8891172409057617, "Pretrain/Step": 7384, "Pretrain/Step Time": 8.47864730656147} +{"Pretrain/Learning Rate": 3.505466083444294e-05, "Pretrain/Loss": 2.0386428833007812, "Pretrain/Loss (Raw)": 1.8893448114395142, "Pretrain/Step": 7385, "Pretrain/Step Time": 8.474861469119787} +{"Pretrain/Learning Rate": 3.505077399467849e-05, "Pretrain/Loss": 2.0364532470703125, "Pretrain/Loss (Raw)": 1.80862557888031, "Pretrain/Step": 7386, "Pretrain/Step Time": 8.47581440769136} +{"Pretrain/Learning Rate": 3.504688686510706e-05, "Pretrain/Loss": 2.035534381866455, "Pretrain/Loss (Raw)": 1.8774285316467285, "Pretrain/Step": 7387, "Pretrain/Step Time": 8.478134363889694} +{"Pretrain/Learning Rate": 3.504299944584073e-05, "Pretrain/Loss": 2.036432981491089, "Pretrain/Loss (Raw)": 2.180424928665161, "Pretrain/Step": 7388, "Pretrain/Step Time": 8.47669417411089} +{"Pretrain/Learning Rate": 3.503911173699159e-05, "Pretrain/Loss": 2.036740303039551, "Pretrain/Loss (Raw)": 2.1595962047576904, "Pretrain/Step": 7389, "Pretrain/Step Time": 8.47798709012568} +{"Pretrain/Learning Rate": 3.5035223738671733e-05, "Pretrain/Loss": 2.0383524894714355, "Pretrain/Loss (Raw)": 2.4709787368774414, "Pretrain/Step": 7390, "Pretrain/Step Time": 8.479752091690898} +{"Pretrain/Learning Rate": 3.503133545099328e-05, "Pretrain/Loss": 2.0392448902130127, "Pretrain/Loss (Raw)": 2.1042704582214355, "Pretrain/Step": 7391, "Pretrain/Step Time": 8.479343922808766} +{"Pretrain/Learning Rate": 3.5027446874068344e-05, "Pretrain/Loss": 2.0414505004882812, "Pretrain/Loss (Raw)": 2.3751182556152344, "Pretrain/Step": 7392, "Pretrain/Step Time": 8.47889095544815} +{"Pretrain/Learning Rate": 3.502355800800904e-05, "Pretrain/Loss": 2.038770914077759, "Pretrain/Loss (Raw)": 1.9258875846862793, "Pretrain/Step": 7393, "Pretrain/Step Time": 8.479606127366424} +{"Pretrain/Learning Rate": 3.501966885292751e-05, "Pretrain/Loss": 2.03940749168396, "Pretrain/Loss (Raw)": 2.203740119934082, "Pretrain/Step": 7394, "Pretrain/Step Time": 8.471772151067853} +{"Pretrain/Learning Rate": 3.501577940893589e-05, "Pretrain/Loss": 2.0391883850097656, "Pretrain/Loss (Raw)": 2.1239283084869385, "Pretrain/Step": 7395, "Pretrain/Step Time": 8.477111233398318} +{"Pretrain/Learning Rate": 3.501188967614634e-05, "Pretrain/Loss": 2.039341926574707, "Pretrain/Loss (Raw)": 2.052006721496582, "Pretrain/Step": 7396, "Pretrain/Step Time": 8.476396711543202} +{"Pretrain/Learning Rate": 3.5007999654671004e-05, "Pretrain/Loss": 2.0375099182128906, "Pretrain/Loss (Raw)": 1.8375786542892456, "Pretrain/Step": 7397, "Pretrain/Step Time": 8.47769203223288} +{"Pretrain/Learning Rate": 3.5004109344622047e-05, "Pretrain/Loss": 2.0406088829040527, "Pretrain/Loss (Raw)": 2.1405110359191895, "Pretrain/Step": 7398, "Pretrain/Step Time": 8.481386166065931} +{"Pretrain/Learning Rate": 3.5000218746111655e-05, "Pretrain/Loss": 2.041191577911377, "Pretrain/Loss (Raw)": 2.157806873321533, "Pretrain/Step": 7399, "Pretrain/Step Time": 8.478053642436862} +{"Pretrain/Learning Rate": 3.4996327859252004e-05, "Pretrain/Loss": 2.0414648056030273, "Pretrain/Loss (Raw)": 2.0844643115997314, "Pretrain/Step": 7400, "Pretrain/Step Time": 8.482759796082973} +{"Pretrain/Learning Rate": 3.499243668415528e-05, "Pretrain/Loss": 2.0451135635375977, "Pretrain/Loss (Raw)": 2.255089044570923, "Pretrain/Step": 7401, "Pretrain/Step Time": 8.482448816299438} +{"Pretrain/Learning Rate": 3.4988545220933706e-05, "Pretrain/Loss": 2.0453381538391113, "Pretrain/Loss (Raw)": 2.133671760559082, "Pretrain/Step": 7402, "Pretrain/Step Time": 8.484033789485693} +{"Pretrain/Learning Rate": 3.4984653469699456e-05, "Pretrain/Loss": 2.0445399284362793, "Pretrain/Loss (Raw)": 2.009538412094116, "Pretrain/Step": 7403, "Pretrain/Step Time": 8.482349663972855} +{"Pretrain/Learning Rate": 3.4980761430564766e-05, "Pretrain/Loss": 2.0413737297058105, "Pretrain/Loss (Raw)": 1.966876745223999, "Pretrain/Step": 7404, "Pretrain/Step Time": 8.483003383502364} +{"Pretrain/Learning Rate": 3.497686910364186e-05, "Pretrain/Loss": 2.0416598320007324, "Pretrain/Loss (Raw)": 2.101724147796631, "Pretrain/Step": 7405, "Pretrain/Step Time": 8.48146609030664} +{"Pretrain/Learning Rate": 3.497297648904297e-05, "Pretrain/Loss": 2.039395809173584, "Pretrain/Loss (Raw)": 1.9318712949752808, "Pretrain/Step": 7406, "Pretrain/Step Time": 8.485303299501538} +{"Pretrain/Learning Rate": 3.496908358688033e-05, "Pretrain/Loss": 2.039487600326538, "Pretrain/Loss (Raw)": 2.1403567790985107, "Pretrain/Step": 7407, "Pretrain/Step Time": 8.484013648703694} +{"Pretrain/Learning Rate": 3.496519039726619e-05, "Pretrain/Loss": 2.037144660949707, "Pretrain/Loss (Raw)": 1.8651728630065918, "Pretrain/Step": 7408, "Pretrain/Step Time": 8.475584588944912} +{"Pretrain/Learning Rate": 3.4961296920312806e-05, "Pretrain/Loss": 2.0393259525299072, "Pretrain/Loss (Raw)": 2.329177141189575, "Pretrain/Step": 7409, "Pretrain/Step Time": 8.476010780781507} +{"Pretrain/Learning Rate": 3.495740315613245e-05, "Pretrain/Loss": 2.038952589035034, "Pretrain/Loss (Raw)": 2.0363142490386963, "Pretrain/Step": 7410, "Pretrain/Step Time": 8.47636810876429} +{"Pretrain/Learning Rate": 3.49535091048374e-05, "Pretrain/Loss": 2.038634777069092, "Pretrain/Loss (Raw)": 2.1748876571655273, "Pretrain/Step": 7411, "Pretrain/Step Time": 8.47437122836709} +{"Pretrain/Learning Rate": 3.4949614766539914e-05, "Pretrain/Loss": 2.038803815841675, "Pretrain/Loss (Raw)": 2.0893354415893555, "Pretrain/Step": 7412, "Pretrain/Step Time": 8.477387260645628} +{"Pretrain/Learning Rate": 3.494572014135232e-05, "Pretrain/Loss": 2.036571502685547, "Pretrain/Loss (Raw)": 1.9499214887619019, "Pretrain/Step": 7413, "Pretrain/Step Time": 8.47381210885942} +{"Pretrain/Learning Rate": 3.4941825229386896e-05, "Pretrain/Loss": 2.0341341495513916, "Pretrain/Loss (Raw)": 2.0439934730529785, "Pretrain/Step": 7414, "Pretrain/Step Time": 8.471571683883667} +{"Pretrain/Learning Rate": 3.493793003075594e-05, "Pretrain/Loss": 2.032170534133911, "Pretrain/Loss (Raw)": 1.599770426750183, "Pretrain/Step": 7415, "Pretrain/Step Time": 8.470921587198973} +{"Pretrain/Learning Rate": 3.4934034545571774e-05, "Pretrain/Loss": 2.032181739807129, "Pretrain/Loss (Raw)": 2.1251420974731445, "Pretrain/Step": 7416, "Pretrain/Step Time": 8.475852191448212} +{"Pretrain/Learning Rate": 3.493013877394673e-05, "Pretrain/Loss": 2.032242774963379, "Pretrain/Loss (Raw)": 1.8692845106124878, "Pretrain/Step": 7417, "Pretrain/Step Time": 8.475901395082474} +{"Pretrain/Learning Rate": 3.492624271599314e-05, "Pretrain/Loss": 2.0355114936828613, "Pretrain/Loss (Raw)": 2.4372334480285645, "Pretrain/Step": 7418, "Pretrain/Step Time": 8.477470517158508} +{"Pretrain/Learning Rate": 3.492234637182334e-05, "Pretrain/Loss": 2.03779935836792, "Pretrain/Loss (Raw)": 2.47623348236084, "Pretrain/Step": 7419, "Pretrain/Step Time": 8.482053434476256} +{"Pretrain/Learning Rate": 3.4918449741549666e-05, "Pretrain/Loss": 2.038770914077759, "Pretrain/Loss (Raw)": 2.0642213821411133, "Pretrain/Step": 7420, "Pretrain/Step Time": 8.478522647172213} +{"Pretrain/Learning Rate": 3.49145528252845e-05, "Pretrain/Loss": 2.039179801940918, "Pretrain/Loss (Raw)": 2.133232593536377, "Pretrain/Step": 7421, "Pretrain/Step Time": 8.482253739610314} +{"Pretrain/Learning Rate": 3.491065562314018e-05, "Pretrain/Loss": 2.0423083305358887, "Pretrain/Loss (Raw)": 2.383467435836792, "Pretrain/Step": 7422, "Pretrain/Step Time": 8.485420743003488} +{"Pretrain/Learning Rate": 3.4906758135229096e-05, "Pretrain/Loss": 2.0428719520568848, "Pretrain/Loss (Raw)": 2.238412618637085, "Pretrain/Step": 7423, "Pretrain/Step Time": 8.480525089427829} +{"Pretrain/Learning Rate": 3.490286036166363e-05, "Pretrain/Loss": 2.0463364124298096, "Pretrain/Loss (Raw)": 2.0781514644622803, "Pretrain/Step": 7424, "Pretrain/Step Time": 8.477184649556875} +{"Pretrain/Learning Rate": 3.489896230255616e-05, "Pretrain/Loss": 2.0468201637268066, "Pretrain/Loss (Raw)": 2.1725013256073, "Pretrain/Step": 7425, "Pretrain/Step Time": 8.483577089384198} +{"Pretrain/Learning Rate": 3.4895063958019094e-05, "Pretrain/Loss": 2.044771671295166, "Pretrain/Loss (Raw)": 1.9515445232391357, "Pretrain/Step": 7426, "Pretrain/Step Time": 8.481734357774258} +{"Pretrain/Learning Rate": 3.489116532816483e-05, "Pretrain/Loss": 2.0434646606445312, "Pretrain/Loss (Raw)": 1.8987263441085815, "Pretrain/Step": 7427, "Pretrain/Step Time": 8.482172075659037} +{"Pretrain/Learning Rate": 3.488726641310579e-05, "Pretrain/Loss": 2.044083595275879, "Pretrain/Loss (Raw)": 2.2121503353118896, "Pretrain/Step": 7428, "Pretrain/Step Time": 8.48608597740531} +{"Pretrain/Learning Rate": 3.488336721295439e-05, "Pretrain/Loss": 2.0405783653259277, "Pretrain/Loss (Raw)": 1.6983776092529297, "Pretrain/Step": 7429, "Pretrain/Step Time": 8.484447898343205} +{"Pretrain/Learning Rate": 3.487946772782307e-05, "Pretrain/Loss": 2.040496349334717, "Pretrain/Loss (Raw)": 1.940497636795044, "Pretrain/Step": 7430, "Pretrain/Step Time": 8.482127873227} +{"Pretrain/Learning Rate": 3.487556795782426e-05, "Pretrain/Loss": 2.0390753746032715, "Pretrain/Loss (Raw)": 1.9727169275283813, "Pretrain/Step": 7431, "Pretrain/Step Time": 8.484779670834541} +{"Pretrain/Learning Rate": 3.487166790307041e-05, "Pretrain/Loss": 2.0396103858947754, "Pretrain/Loss (Raw)": 2.096329689025879, "Pretrain/Step": 7432, "Pretrain/Step Time": 8.484622612595558} +{"Pretrain/Learning Rate": 3.486776756367397e-05, "Pretrain/Loss": 2.040208339691162, "Pretrain/Loss (Raw)": 2.061079263687134, "Pretrain/Step": 7433, "Pretrain/Step Time": 8.486607363447547} +{"Pretrain/Learning Rate": 3.4863866939747416e-05, "Pretrain/Loss": 2.0404064655303955, "Pretrain/Loss (Raw)": 1.9640650749206543, "Pretrain/Step": 7434, "Pretrain/Step Time": 8.487790498882532} +{"Pretrain/Learning Rate": 3.48599660314032e-05, "Pretrain/Loss": 2.0408613681793213, "Pretrain/Loss (Raw)": 2.1513376235961914, "Pretrain/Step": 7435, "Pretrain/Step Time": 8.48617048189044} +{"Pretrain/Learning Rate": 3.4856064838753825e-05, "Pretrain/Loss": 2.0398497581481934, "Pretrain/Loss (Raw)": 2.0540974140167236, "Pretrain/Step": 7436, "Pretrain/Step Time": 8.483189111575484} +{"Pretrain/Learning Rate": 3.4852163361911764e-05, "Pretrain/Loss": 2.037102699279785, "Pretrain/Loss (Raw)": 1.9931501150131226, "Pretrain/Step": 7437, "Pretrain/Step Time": 8.486775605008006} +{"Pretrain/Learning Rate": 3.4848261600989524e-05, "Pretrain/Loss": 2.0389904975891113, "Pretrain/Loss (Raw)": 2.168674945831299, "Pretrain/Step": 7438, "Pretrain/Step Time": 8.489105362445116} +{"Pretrain/Learning Rate": 3.48443595560996e-05, "Pretrain/Loss": 2.036813735961914, "Pretrain/Loss (Raw)": 1.9818648099899292, "Pretrain/Step": 7439, "Pretrain/Step Time": 8.485885540023446} +{"Pretrain/Learning Rate": 3.484045722735451e-05, "Pretrain/Loss": 2.037820816040039, "Pretrain/Loss (Raw)": 2.0053110122680664, "Pretrain/Step": 7440, "Pretrain/Step Time": 8.483951048925519} +{"Pretrain/Learning Rate": 3.4836554614866765e-05, "Pretrain/Loss": 2.0320591926574707, "Pretrain/Loss (Raw)": 1.7453027963638306, "Pretrain/Step": 7441, "Pretrain/Step Time": 8.4894760530442} +{"Pretrain/Learning Rate": 3.483265171874891e-05, "Pretrain/Loss": 2.032097578048706, "Pretrain/Loss (Raw)": 1.8743618726730347, "Pretrain/Step": 7442, "Pretrain/Step Time": 8.484814403578639} +{"Pretrain/Learning Rate": 3.482874853911347e-05, "Pretrain/Loss": 2.033688545227051, "Pretrain/Loss (Raw)": 2.1554672718048096, "Pretrain/Step": 7443, "Pretrain/Step Time": 8.482352931052446} +{"Pretrain/Learning Rate": 3.4824845076073e-05, "Pretrain/Loss": 2.036191463470459, "Pretrain/Loss (Raw)": 2.057403087615967, "Pretrain/Step": 7444, "Pretrain/Step Time": 8.483547072857618} +{"Pretrain/Learning Rate": 3.482094132974004e-05, "Pretrain/Loss": 2.0370125770568848, "Pretrain/Loss (Raw)": 2.085244655609131, "Pretrain/Step": 7445, "Pretrain/Step Time": 8.483738753944635} +{"Pretrain/Learning Rate": 3.4817037300227166e-05, "Pretrain/Loss": 2.033673048019409, "Pretrain/Loss (Raw)": 1.6405224800109863, "Pretrain/Step": 7446, "Pretrain/Step Time": 8.482118550688028} +{"Pretrain/Learning Rate": 3.4813132987646943e-05, "Pretrain/Loss": 2.0343568325042725, "Pretrain/Loss (Raw)": 2.141709089279175, "Pretrain/Step": 7447, "Pretrain/Step Time": 8.481516821309924} +{"Pretrain/Learning Rate": 3.480922839211195e-05, "Pretrain/Loss": 2.0320286750793457, "Pretrain/Loss (Raw)": 1.7687891721725464, "Pretrain/Step": 7448, "Pretrain/Step Time": 8.485246740281582} +{"Pretrain/Learning Rate": 3.480532351373476e-05, "Pretrain/Loss": 2.0289535522460938, "Pretrain/Loss (Raw)": 1.6106510162353516, "Pretrain/Step": 7449, "Pretrain/Step Time": 8.489722354337573} +{"Pretrain/Learning Rate": 3.480141835262799e-05, "Pretrain/Loss": 2.032697916030884, "Pretrain/Loss (Raw)": 2.4925918579101562, "Pretrain/Step": 7450, "Pretrain/Step Time": 8.490220034494996} +{"Pretrain/Learning Rate": 3.479751290890423e-05, "Pretrain/Loss": 2.0329346656799316, "Pretrain/Loss (Raw)": 2.0063254833221436, "Pretrain/Step": 7451, "Pretrain/Step Time": 8.491411590948701} +{"Pretrain/Learning Rate": 3.479360718267608e-05, "Pretrain/Loss": 2.0312795639038086, "Pretrain/Loss (Raw)": 1.933351993560791, "Pretrain/Step": 7452, "Pretrain/Step Time": 8.487000498920679} +{"Pretrain/Learning Rate": 3.478970117405619e-05, "Pretrain/Loss": 2.030930519104004, "Pretrain/Loss (Raw)": 2.0108180046081543, "Pretrain/Step": 7453, "Pretrain/Step Time": 8.490407723933458} +{"Pretrain/Learning Rate": 3.478579488315715e-05, "Pretrain/Loss": 2.030712842941284, "Pretrain/Loss (Raw)": 1.9937788248062134, "Pretrain/Step": 7454, "Pretrain/Step Time": 8.48663423396647} +{"Pretrain/Learning Rate": 3.478188831009163e-05, "Pretrain/Loss": 2.0297622680664062, "Pretrain/Loss (Raw)": 1.919568419456482, "Pretrain/Step": 7455, "Pretrain/Step Time": 8.48983277194202} +{"Pretrain/Learning Rate": 3.477798145497224e-05, "Pretrain/Loss": 2.0318827629089355, "Pretrain/Loss (Raw)": 2.15374493598938, "Pretrain/Step": 7456, "Pretrain/Step Time": 8.486724741756916} +{"Pretrain/Learning Rate": 3.477407431791166e-05, "Pretrain/Loss": 2.031472682952881, "Pretrain/Loss (Raw)": 1.944199562072754, "Pretrain/Step": 7457, "Pretrain/Step Time": 8.482076512649655} +{"Pretrain/Learning Rate": 3.477016689902253e-05, "Pretrain/Loss": 2.031709671020508, "Pretrain/Loss (Raw)": 2.060542583465576, "Pretrain/Step": 7458, "Pretrain/Step Time": 8.484520547091961} +{"Pretrain/Learning Rate": 3.476625919841753e-05, "Pretrain/Loss": 2.031731605529785, "Pretrain/Loss (Raw)": 1.9304852485656738, "Pretrain/Step": 7459, "Pretrain/Step Time": 8.4834228400141} +{"Pretrain/Learning Rate": 3.4762351216209324e-05, "Pretrain/Loss": 2.0308425426483154, "Pretrain/Loss (Raw)": 1.9667394161224365, "Pretrain/Step": 7460, "Pretrain/Step Time": 8.480377109721303} +{"Pretrain/Learning Rate": 3.475844295251061e-05, "Pretrain/Loss": 2.0296645164489746, "Pretrain/Loss (Raw)": 2.0337107181549072, "Pretrain/Step": 7461, "Pretrain/Step Time": 8.485506461933255} +{"Pretrain/Learning Rate": 3.475453440743407e-05, "Pretrain/Loss": 2.03110671043396, "Pretrain/Loss (Raw)": 2.155085802078247, "Pretrain/Step": 7462, "Pretrain/Step Time": 8.481553567573428} +{"Pretrain/Learning Rate": 3.4750625581092406e-05, "Pretrain/Loss": 2.032349109649658, "Pretrain/Loss (Raw)": 2.0349042415618896, "Pretrain/Step": 7463, "Pretrain/Step Time": 8.482386518269777} +{"Pretrain/Learning Rate": 3.474671647359833e-05, "Pretrain/Loss": 2.0283236503601074, "Pretrain/Loss (Raw)": 1.5477172136306763, "Pretrain/Step": 7464, "Pretrain/Step Time": 8.481184227392077} +{"Pretrain/Learning Rate": 3.474280708506455e-05, "Pretrain/Loss": 2.0284786224365234, "Pretrain/Loss (Raw)": 1.91544771194458, "Pretrain/Step": 7465, "Pretrain/Step Time": 8.480021772906184} +{"Pretrain/Learning Rate": 3.47388974156038e-05, "Pretrain/Loss": 2.028045177459717, "Pretrain/Loss (Raw)": 2.013903856277466, "Pretrain/Step": 7466, "Pretrain/Step Time": 8.481496840715408} +{"Pretrain/Learning Rate": 3.473498746532881e-05, "Pretrain/Loss": 2.028209924697876, "Pretrain/Loss (Raw)": 2.078932523727417, "Pretrain/Step": 7467, "Pretrain/Step Time": 8.479222796857357} +{"Pretrain/Learning Rate": 3.473107723435231e-05, "Pretrain/Loss": 2.0270519256591797, "Pretrain/Loss (Raw)": 1.8565090894699097, "Pretrain/Step": 7468, "Pretrain/Step Time": 8.479578448459506} +{"Pretrain/Learning Rate": 3.472716672278707e-05, "Pretrain/Loss": 2.027606964111328, "Pretrain/Loss (Raw)": 2.084437131881714, "Pretrain/Step": 7469, "Pretrain/Step Time": 8.474835354834795} +{"Pretrain/Learning Rate": 3.472325593074583e-05, "Pretrain/Loss": 2.0290632247924805, "Pretrain/Loss (Raw)": 2.1168720722198486, "Pretrain/Step": 7470, "Pretrain/Step Time": 8.475197764113545} +{"Pretrain/Learning Rate": 3.4719344858341364e-05, "Pretrain/Loss": 2.0293822288513184, "Pretrain/Loss (Raw)": 2.147339344024658, "Pretrain/Step": 7471, "Pretrain/Step Time": 8.476045951247215} +{"Pretrain/Learning Rate": 3.4715433505686435e-05, "Pretrain/Loss": 2.031425952911377, "Pretrain/Loss (Raw)": 2.03094482421875, "Pretrain/Step": 7472, "Pretrain/Step Time": 8.477762658149004} +{"Pretrain/Learning Rate": 3.4711521872893824e-05, "Pretrain/Loss": 2.0286426544189453, "Pretrain/Loss (Raw)": 1.7056736946105957, "Pretrain/Step": 7473, "Pretrain/Step Time": 8.475022926926613} +{"Pretrain/Learning Rate": 3.470760996007633e-05, "Pretrain/Loss": 2.030195713043213, "Pretrain/Loss (Raw)": 2.177116632461548, "Pretrain/Step": 7474, "Pretrain/Step Time": 8.477938272058964} +{"Pretrain/Learning Rate": 3.4703697767346754e-05, "Pretrain/Loss": 2.031073808670044, "Pretrain/Loss (Raw)": 1.9834791421890259, "Pretrain/Step": 7475, "Pretrain/Step Time": 8.478875920176506} +{"Pretrain/Learning Rate": 3.469978529481789e-05, "Pretrain/Loss": 2.030059337615967, "Pretrain/Loss (Raw)": 2.1483154296875, "Pretrain/Step": 7476, "Pretrain/Step Time": 8.476287821307778} +{"Pretrain/Learning Rate": 3.4695872542602555e-05, "Pretrain/Loss": 2.0301618576049805, "Pretrain/Loss (Raw)": 2.0738437175750732, "Pretrain/Step": 7477, "Pretrain/Step Time": 8.47575513087213} +{"Pretrain/Learning Rate": 3.4691959510813567e-05, "Pretrain/Loss": 2.0308074951171875, "Pretrain/Loss (Raw)": 1.921748399734497, "Pretrain/Step": 7478, "Pretrain/Step Time": 8.478276446461678} +{"Pretrain/Learning Rate": 3.468804619956376e-05, "Pretrain/Loss": 2.0291783809661865, "Pretrain/Loss (Raw)": 1.8436599969863892, "Pretrain/Step": 7479, "Pretrain/Step Time": 8.478446645662189} +{"Pretrain/Learning Rate": 3.468413260896597e-05, "Pretrain/Loss": 2.027830123901367, "Pretrain/Loss (Raw)": 1.885231852531433, "Pretrain/Step": 7480, "Pretrain/Step Time": 8.473303129896522} +{"Pretrain/Learning Rate": 3.468021873913304e-05, "Pretrain/Loss": 2.026965856552124, "Pretrain/Loss (Raw)": 1.972254991531372, "Pretrain/Step": 7481, "Pretrain/Step Time": 8.478525917977095} +{"Pretrain/Learning Rate": 3.467630459017783e-05, "Pretrain/Loss": 2.0258750915527344, "Pretrain/Loss (Raw)": 1.9404487609863281, "Pretrain/Step": 7482, "Pretrain/Step Time": 8.480810197070241} +{"Pretrain/Learning Rate": 3.46723901622132e-05, "Pretrain/Loss": 2.0248985290527344, "Pretrain/Loss (Raw)": 1.9356712102890015, "Pretrain/Step": 7483, "Pretrain/Step Time": 8.479266252368689} +{"Pretrain/Learning Rate": 3.4668475455352024e-05, "Pretrain/Loss": 2.0280675888061523, "Pretrain/Loss (Raw)": 2.2344958782196045, "Pretrain/Step": 7484, "Pretrain/Step Time": 8.477787904441357} +{"Pretrain/Learning Rate": 3.466456046970716e-05, "Pretrain/Loss": 2.028155565261841, "Pretrain/Loss (Raw)": 2.0112626552581787, "Pretrain/Step": 7485, "Pretrain/Step Time": 8.478529013693333} +{"Pretrain/Learning Rate": 3.466064520539152e-05, "Pretrain/Loss": 2.0281858444213867, "Pretrain/Loss (Raw)": 2.063579797744751, "Pretrain/Step": 7486, "Pretrain/Step Time": 8.47615241073072} +{"Pretrain/Learning Rate": 3.465672966251798e-05, "Pretrain/Loss": 2.02810001373291, "Pretrain/Loss (Raw)": 1.968363642692566, "Pretrain/Step": 7487, "Pretrain/Step Time": 8.474085371941328} +{"Pretrain/Learning Rate": 3.465281384119945e-05, "Pretrain/Loss": 2.0284509658813477, "Pretrain/Loss (Raw)": 1.9010460376739502, "Pretrain/Step": 7488, "Pretrain/Step Time": 8.47792205773294} +{"Pretrain/Learning Rate": 3.464889774154884e-05, "Pretrain/Loss": 2.0298843383789062, "Pretrain/Loss (Raw)": 2.0902693271636963, "Pretrain/Step": 7489, "Pretrain/Step Time": 8.47705203667283} +{"Pretrain/Learning Rate": 3.4644981363679064e-05, "Pretrain/Loss": 2.029120922088623, "Pretrain/Loss (Raw)": 2.2691469192504883, "Pretrain/Step": 7490, "Pretrain/Step Time": 8.477578096091747} +{"Pretrain/Learning Rate": 3.4641064707703045e-05, "Pretrain/Loss": 2.028010606765747, "Pretrain/Loss (Raw)": 1.9915424585342407, "Pretrain/Step": 7491, "Pretrain/Step Time": 8.47922976501286} +{"Pretrain/Learning Rate": 3.463714777373373e-05, "Pretrain/Loss": 2.0264317989349365, "Pretrain/Loss (Raw)": 1.7898997068405151, "Pretrain/Step": 7492, "Pretrain/Step Time": 8.476936550810933} +{"Pretrain/Learning Rate": 3.463323056188404e-05, "Pretrain/Loss": 2.0262062549591064, "Pretrain/Loss (Raw)": 1.9634507894515991, "Pretrain/Step": 7493, "Pretrain/Step Time": 8.475930979475379} +{"Pretrain/Learning Rate": 3.462931307226695e-05, "Pretrain/Loss": 2.0254263877868652, "Pretrain/Loss (Raw)": 1.9994652271270752, "Pretrain/Step": 7494, "Pretrain/Step Time": 8.476406881585717} +{"Pretrain/Learning Rate": 3.46253953049954e-05, "Pretrain/Loss": 2.02408504486084, "Pretrain/Loss (Raw)": 2.041341543197632, "Pretrain/Step": 7495, "Pretrain/Step Time": 8.481480618938804} +{"Pretrain/Learning Rate": 3.462147726018236e-05, "Pretrain/Loss": 2.0234756469726562, "Pretrain/Loss (Raw)": 1.780550241470337, "Pretrain/Step": 7496, "Pretrain/Step Time": 8.480378814041615} +{"Pretrain/Learning Rate": 3.461755893794081e-05, "Pretrain/Loss": 2.0235483646392822, "Pretrain/Loss (Raw)": 1.7499821186065674, "Pretrain/Step": 7497, "Pretrain/Step Time": 8.480865694582462} +{"Pretrain/Learning Rate": 3.461364033838373e-05, "Pretrain/Loss": 2.0223264694213867, "Pretrain/Loss (Raw)": 1.974647879600525, "Pretrain/Step": 7498, "Pretrain/Step Time": 8.477665670216084} +{"Pretrain/Learning Rate": 3.46097214616241e-05, "Pretrain/Loss": 2.023299217224121, "Pretrain/Loss (Raw)": 2.1601476669311523, "Pretrain/Step": 7499, "Pretrain/Step Time": 8.481010796502233} +{"Pretrain/Learning Rate": 3.460580230777493e-05, "Pretrain/Loss": 2.0226664543151855, "Pretrain/Loss (Raw)": 2.045149564743042, "Pretrain/Step": 7500, "Pretrain/Step Time": 8.478946344926953} +{"Pretrain/Learning Rate": 3.4601882876949225e-05, "Pretrain/Loss": 2.0218923091888428, "Pretrain/Loss (Raw)": 1.9469119310379028, "Pretrain/Step": 7501, "Pretrain/Step Time": 8.478823099285364} +{"Pretrain/Learning Rate": 3.4597963169259994e-05, "Pretrain/Loss": 2.02219295501709, "Pretrain/Loss (Raw)": 2.056218385696411, "Pretrain/Step": 7502, "Pretrain/Step Time": 8.480076052248478} +{"Pretrain/Learning Rate": 3.4594043184820264e-05, "Pretrain/Loss": 2.022955894470215, "Pretrain/Loss (Raw)": 2.019845724105835, "Pretrain/Step": 7503, "Pretrain/Step Time": 8.478580648079515} +{"Pretrain/Learning Rate": 3.4590122923743056e-05, "Pretrain/Loss": 2.0224337577819824, "Pretrain/Loss (Raw)": 2.068962335586548, "Pretrain/Step": 7504, "Pretrain/Step Time": 8.478494234383106} +{"Pretrain/Learning Rate": 3.458620238614142e-05, "Pretrain/Loss": 2.022327423095703, "Pretrain/Loss (Raw)": 1.9759838581085205, "Pretrain/Step": 7505, "Pretrain/Step Time": 8.481176758185029} +{"Pretrain/Learning Rate": 3.4582281572128395e-05, "Pretrain/Loss": 2.022663116455078, "Pretrain/Loss (Raw)": 2.0887861251831055, "Pretrain/Step": 7506, "Pretrain/Step Time": 8.482933761551976} +{"Pretrain/Learning Rate": 3.457836048181703e-05, "Pretrain/Loss": 2.022887706756592, "Pretrain/Loss (Raw)": 1.8809962272644043, "Pretrain/Step": 7507, "Pretrain/Step Time": 8.483938552439213} +{"Pretrain/Learning Rate": 3.45744391153204e-05, "Pretrain/Loss": 2.0224692821502686, "Pretrain/Loss (Raw)": 1.9697208404541016, "Pretrain/Step": 7508, "Pretrain/Step Time": 8.481156412512064} +{"Pretrain/Learning Rate": 3.457051747275156e-05, "Pretrain/Loss": 2.021656036376953, "Pretrain/Loss (Raw)": 2.0413084030151367, "Pretrain/Step": 7509, "Pretrain/Step Time": 8.47997578792274} +{"Pretrain/Learning Rate": 3.45665955542236e-05, "Pretrain/Loss": 2.0254979133605957, "Pretrain/Loss (Raw)": 2.1470000743865967, "Pretrain/Step": 7510, "Pretrain/Step Time": 8.478649444878101} +{"Pretrain/Learning Rate": 3.456267335984961e-05, "Pretrain/Loss": 2.0263805389404297, "Pretrain/Loss (Raw)": 2.0154662132263184, "Pretrain/Step": 7511, "Pretrain/Step Time": 8.476261680945754} +{"Pretrain/Learning Rate": 3.455875088974266e-05, "Pretrain/Loss": 2.0268280506134033, "Pretrain/Loss (Raw)": 1.946384310722351, "Pretrain/Step": 7512, "Pretrain/Step Time": 8.477802177891135} +{"Pretrain/Learning Rate": 3.455482814401587e-05, "Pretrain/Loss": 2.0267598628997803, "Pretrain/Loss (Raw)": 1.8806228637695312, "Pretrain/Step": 7513, "Pretrain/Step Time": 8.479406334459782} +{"Pretrain/Learning Rate": 3.4550905122782354e-05, "Pretrain/Loss": 2.0285556316375732, "Pretrain/Loss (Raw)": 2.0384809970855713, "Pretrain/Step": 7514, "Pretrain/Step Time": 8.479364166036248} +{"Pretrain/Learning Rate": 3.454698182615522e-05, "Pretrain/Loss": 2.030543088912964, "Pretrain/Loss (Raw)": 2.1318211555480957, "Pretrain/Step": 7515, "Pretrain/Step Time": 8.47773146443069} +{"Pretrain/Learning Rate": 3.454305825424759e-05, "Pretrain/Loss": 2.0295028686523438, "Pretrain/Loss (Raw)": 2.047302484512329, "Pretrain/Step": 7516, "Pretrain/Step Time": 8.47837276943028} +{"Pretrain/Learning Rate": 3.45391344071726e-05, "Pretrain/Loss": 2.027493715286255, "Pretrain/Loss (Raw)": 1.9024169445037842, "Pretrain/Step": 7517, "Pretrain/Step Time": 8.48099159449339} +{"Pretrain/Learning Rate": 3.4535210285043394e-05, "Pretrain/Loss": 2.0255978107452393, "Pretrain/Loss (Raw)": 2.228304862976074, "Pretrain/Step": 7518, "Pretrain/Step Time": 8.479412158951163} +{"Pretrain/Learning Rate": 3.453128588797313e-05, "Pretrain/Loss": 2.0260720252990723, "Pretrain/Loss (Raw)": 2.164947748184204, "Pretrain/Step": 7519, "Pretrain/Step Time": 8.480217596516013} +{"Pretrain/Learning Rate": 3.452736121607496e-05, "Pretrain/Loss": 2.0241615772247314, "Pretrain/Loss (Raw)": 2.1305932998657227, "Pretrain/Step": 7520, "Pretrain/Step Time": 8.48219795525074} +{"Pretrain/Learning Rate": 3.452343626946203e-05, "Pretrain/Loss": 2.0252890586853027, "Pretrain/Loss (Raw)": 2.0702173709869385, "Pretrain/Step": 7521, "Pretrain/Step Time": 8.482569644227624} +{"Pretrain/Learning Rate": 3.4519511048247536e-05, "Pretrain/Loss": 2.023347854614258, "Pretrain/Loss (Raw)": 1.9552586078643799, "Pretrain/Step": 7522, "Pretrain/Step Time": 8.48499546572566} +{"Pretrain/Learning Rate": 3.4515585552544655e-05, "Pretrain/Loss": 2.022156238555908, "Pretrain/Loss (Raw)": 1.971406102180481, "Pretrain/Step": 7523, "Pretrain/Step Time": 8.479691453278065} +{"Pretrain/Learning Rate": 3.451165978246657e-05, "Pretrain/Loss": 2.0237298011779785, "Pretrain/Loss (Raw)": 2.253390073776245, "Pretrain/Step": 7524, "Pretrain/Step Time": 8.484592208638787} +{"Pretrain/Learning Rate": 3.450773373812648e-05, "Pretrain/Loss": 2.0220110416412354, "Pretrain/Loss (Raw)": 1.6175973415374756, "Pretrain/Step": 7525, "Pretrain/Step Time": 8.482058700174093} +{"Pretrain/Learning Rate": 3.450380741963759e-05, "Pretrain/Loss": 2.0208094120025635, "Pretrain/Loss (Raw)": 1.9867099523544312, "Pretrain/Step": 7526, "Pretrain/Step Time": 8.479483902454376} +{"Pretrain/Learning Rate": 3.449988082711312e-05, "Pretrain/Loss": 2.0192437171936035, "Pretrain/Loss (Raw)": 1.9573725461959839, "Pretrain/Step": 7527, "Pretrain/Step Time": 8.487227434292436} +{"Pretrain/Learning Rate": 3.4495953960666274e-05, "Pretrain/Loss": 2.0174946784973145, "Pretrain/Loss (Raw)": 1.8606021404266357, "Pretrain/Step": 7528, "Pretrain/Step Time": 8.480269853025675} +{"Pretrain/Learning Rate": 3.4492026820410294e-05, "Pretrain/Loss": 2.013608694076538, "Pretrain/Loss (Raw)": 1.7576918601989746, "Pretrain/Step": 7529, "Pretrain/Step Time": 8.48192842118442} +{"Pretrain/Learning Rate": 3.4488099406458406e-05, "Pretrain/Loss": 2.0111188888549805, "Pretrain/Loss (Raw)": 1.814965844154358, "Pretrain/Step": 7530, "Pretrain/Step Time": 8.482405837625265} +{"Pretrain/Learning Rate": 3.4484171718923874e-05, "Pretrain/Loss": 2.012235164642334, "Pretrain/Loss (Raw)": 2.1524298191070557, "Pretrain/Step": 7531, "Pretrain/Step Time": 8.484400132670999} +{"Pretrain/Learning Rate": 3.4480243757919924e-05, "Pretrain/Loss": 2.013115406036377, "Pretrain/Loss (Raw)": 2.079573392868042, "Pretrain/Step": 7532, "Pretrain/Step Time": 8.480105597525835} +{"Pretrain/Learning Rate": 3.4476315523559835e-05, "Pretrain/Loss": 2.013638973236084, "Pretrain/Loss (Raw)": 2.1687214374542236, "Pretrain/Step": 7533, "Pretrain/Step Time": 8.479085929691792} +{"Pretrain/Learning Rate": 3.4472387015956864e-05, "Pretrain/Loss": 2.015096426010132, "Pretrain/Loss (Raw)": 2.118431568145752, "Pretrain/Step": 7534, "Pretrain/Step Time": 8.478359835222363} +{"Pretrain/Learning Rate": 3.446845823522429e-05, "Pretrain/Loss": 2.014375686645508, "Pretrain/Loss (Raw)": 2.0480973720550537, "Pretrain/Step": 7535, "Pretrain/Step Time": 8.478798117488623} +{"Pretrain/Learning Rate": 3.44645291814754e-05, "Pretrain/Loss": 2.013934373855591, "Pretrain/Loss (Raw)": 1.80867338180542, "Pretrain/Step": 7536, "Pretrain/Step Time": 8.481083111837506} +{"Pretrain/Learning Rate": 3.4460599854823486e-05, "Pretrain/Loss": 2.0114052295684814, "Pretrain/Loss (Raw)": 2.005449056625366, "Pretrain/Step": 7537, "Pretrain/Step Time": 8.483663354068995} +{"Pretrain/Learning Rate": 3.445667025538184e-05, "Pretrain/Loss": 2.010200023651123, "Pretrain/Loss (Raw)": 1.882035493850708, "Pretrain/Step": 7538, "Pretrain/Step Time": 8.486480740830302} +{"Pretrain/Learning Rate": 3.445274038326377e-05, "Pretrain/Loss": 2.0084311962127686, "Pretrain/Loss (Raw)": 1.948480486869812, "Pretrain/Step": 7539, "Pretrain/Step Time": 8.484673820436} +{"Pretrain/Learning Rate": 3.444881023858261e-05, "Pretrain/Loss": 2.006978988647461, "Pretrain/Loss (Raw)": 1.903439998626709, "Pretrain/Step": 7540, "Pretrain/Step Time": 8.483668092638254} +{"Pretrain/Learning Rate": 3.444487982145165e-05, "Pretrain/Loss": 2.008636951446533, "Pretrain/Loss (Raw)": 2.1621735095977783, "Pretrain/Step": 7541, "Pretrain/Step Time": 8.48509375192225} +{"Pretrain/Learning Rate": 3.4440949131984245e-05, "Pretrain/Loss": 2.006270408630371, "Pretrain/Loss (Raw)": 1.741066813468933, "Pretrain/Step": 7542, "Pretrain/Step Time": 8.484402613714337} +{"Pretrain/Learning Rate": 3.443701817029373e-05, "Pretrain/Loss": 2.0101680755615234, "Pretrain/Loss (Raw)": 2.0986740589141846, "Pretrain/Step": 7543, "Pretrain/Step Time": 8.483826311305165} +{"Pretrain/Learning Rate": 3.4433086936493446e-05, "Pretrain/Loss": 2.009742498397827, "Pretrain/Loss (Raw)": 2.0706615447998047, "Pretrain/Step": 7544, "Pretrain/Step Time": 8.481153415516019} +{"Pretrain/Learning Rate": 3.442915543069675e-05, "Pretrain/Loss": 2.012092113494873, "Pretrain/Loss (Raw)": 2.1700618267059326, "Pretrain/Step": 7545, "Pretrain/Step Time": 8.480041889473796} +{"Pretrain/Learning Rate": 3.442522365301701e-05, "Pretrain/Loss": 2.0089471340179443, "Pretrain/Loss (Raw)": 2.0346450805664062, "Pretrain/Step": 7546, "Pretrain/Step Time": 8.481545712798834} +{"Pretrain/Learning Rate": 3.442129160356759e-05, "Pretrain/Loss": 2.002978801727295, "Pretrain/Loss (Raw)": 1.7123140096664429, "Pretrain/Step": 7547, "Pretrain/Step Time": 8.479569608345628} +{"Pretrain/Learning Rate": 3.441735928246186e-05, "Pretrain/Loss": 2.0036377906799316, "Pretrain/Loss (Raw)": 2.148555278778076, "Pretrain/Step": 7548, "Pretrain/Step Time": 8.482314176857471} +{"Pretrain/Learning Rate": 3.441342668981321e-05, "Pretrain/Loss": 2.0021679401397705, "Pretrain/Loss (Raw)": 1.9450973272323608, "Pretrain/Step": 7549, "Pretrain/Step Time": 8.477905919775367} +{"Pretrain/Learning Rate": 3.440949382573505e-05, "Pretrain/Loss": 1.999087929725647, "Pretrain/Loss (Raw)": 1.9892122745513916, "Pretrain/Step": 7550, "Pretrain/Step Time": 8.47492653131485} +{"Pretrain/Learning Rate": 3.440556069034077e-05, "Pretrain/Loss": 1.9975416660308838, "Pretrain/Loss (Raw)": 2.04049015045166, "Pretrain/Step": 7551, "Pretrain/Step Time": 8.475776528939605} +{"Pretrain/Learning Rate": 3.4401627283743765e-05, "Pretrain/Loss": 1.9965890645980835, "Pretrain/Loss (Raw)": 1.9562166929244995, "Pretrain/Step": 7552, "Pretrain/Step Time": 8.480781430378556} +{"Pretrain/Learning Rate": 3.439769360605747e-05, "Pretrain/Loss": 1.995436668395996, "Pretrain/Loss (Raw)": 2.024995803833008, "Pretrain/Step": 7553, "Pretrain/Step Time": 8.476656360551715} +{"Pretrain/Learning Rate": 3.4393759657395305e-05, "Pretrain/Loss": 1.9943461418151855, "Pretrain/Loss (Raw)": 1.8119572401046753, "Pretrain/Step": 7554, "Pretrain/Step Time": 8.482857147231698} +{"Pretrain/Learning Rate": 3.43898254378707e-05, "Pretrain/Loss": 1.9961552619934082, "Pretrain/Loss (Raw)": 2.130303144454956, "Pretrain/Step": 7555, "Pretrain/Step Time": 8.480410557240248} +{"Pretrain/Learning Rate": 3.438589094759711e-05, "Pretrain/Loss": 1.995739221572876, "Pretrain/Loss (Raw)": 2.1588757038116455, "Pretrain/Step": 7556, "Pretrain/Step Time": 8.477315410971642} +{"Pretrain/Learning Rate": 3.438195618668796e-05, "Pretrain/Loss": 1.9987791776657104, "Pretrain/Loss (Raw)": 2.087510824203491, "Pretrain/Step": 7557, "Pretrain/Step Time": 8.478881875053048} +{"Pretrain/Learning Rate": 3.437802115525672e-05, "Pretrain/Loss": 1.9982037544250488, "Pretrain/Loss (Raw)": 1.8668421506881714, "Pretrain/Step": 7558, "Pretrain/Step Time": 8.478601584210992} +{"Pretrain/Learning Rate": 3.437408585341686e-05, "Pretrain/Loss": 1.9983859062194824, "Pretrain/Loss (Raw)": 1.9960291385650635, "Pretrain/Step": 7559, "Pretrain/Step Time": 8.47838039137423} +{"Pretrain/Learning Rate": 3.437015028128183e-05, "Pretrain/Loss": 1.9977740049362183, "Pretrain/Loss (Raw)": 2.017996311187744, "Pretrain/Step": 7560, "Pretrain/Step Time": 8.473064230754972} +{"Pretrain/Learning Rate": 3.436621443896513e-05, "Pretrain/Loss": 1.9973952770233154, "Pretrain/Loss (Raw)": 2.012618064880371, "Pretrain/Step": 7561, "Pretrain/Step Time": 8.473253147676587} +{"Pretrain/Learning Rate": 3.4362278326580235e-05, "Pretrain/Loss": 1.9982393980026245, "Pretrain/Loss (Raw)": 2.072096347808838, "Pretrain/Step": 7562, "Pretrain/Step Time": 8.474489636719227} +{"Pretrain/Learning Rate": 3.435834194424064e-05, "Pretrain/Loss": 1.9984713792800903, "Pretrain/Loss (Raw)": 2.181048631668091, "Pretrain/Step": 7563, "Pretrain/Step Time": 8.475598314777017} +{"Pretrain/Learning Rate": 3.435440529205985e-05, "Pretrain/Loss": 1.9978138208389282, "Pretrain/Loss (Raw)": 1.9699100255966187, "Pretrain/Step": 7564, "Pretrain/Step Time": 8.478242119774222} +{"Pretrain/Learning Rate": 3.435046837015139e-05, "Pretrain/Loss": 1.9972213506698608, "Pretrain/Loss (Raw)": 1.917325496673584, "Pretrain/Step": 7565, "Pretrain/Step Time": 8.473270969465375} +{"Pretrain/Learning Rate": 3.4346531178628764e-05, "Pretrain/Loss": 1.9947208166122437, "Pretrain/Loss (Raw)": 1.8486084938049316, "Pretrain/Step": 7566, "Pretrain/Step Time": 8.47581629641354} +{"Pretrain/Learning Rate": 3.43425937176055e-05, "Pretrain/Loss": 1.9954302310943604, "Pretrain/Loss (Raw)": 2.0726730823516846, "Pretrain/Step": 7567, "Pretrain/Step Time": 8.477031588554382} +{"Pretrain/Learning Rate": 3.433865598719513e-05, "Pretrain/Loss": 1.995509147644043, "Pretrain/Loss (Raw)": 2.0154221057891846, "Pretrain/Step": 7568, "Pretrain/Step Time": 8.475549386814237} +{"Pretrain/Learning Rate": 3.4334717987511195e-05, "Pretrain/Loss": 1.9971166849136353, "Pretrain/Loss (Raw)": 1.9510642290115356, "Pretrain/Step": 7569, "Pretrain/Step Time": 8.470928560942411} +{"Pretrain/Learning Rate": 3.433077971866725e-05, "Pretrain/Loss": 1.9949675798416138, "Pretrain/Loss (Raw)": 1.5992740392684937, "Pretrain/Step": 7570, "Pretrain/Step Time": 8.469723239541054} +{"Pretrain/Learning Rate": 3.432684118077685e-05, "Pretrain/Loss": 1.993204116821289, "Pretrain/Loss (Raw)": 1.9297304153442383, "Pretrain/Step": 7571, "Pretrain/Step Time": 8.469732888042927} +{"Pretrain/Learning Rate": 3.432290237395356e-05, "Pretrain/Loss": 1.9938974380493164, "Pretrain/Loss (Raw)": 2.146149158477783, "Pretrain/Step": 7572, "Pretrain/Step Time": 8.47089040465653} +{"Pretrain/Learning Rate": 3.431896329831096e-05, "Pretrain/Loss": 1.992350459098816, "Pretrain/Loss (Raw)": 1.8872393369674683, "Pretrain/Step": 7573, "Pretrain/Step Time": 8.472365342080593} +{"Pretrain/Learning Rate": 3.431502395396261e-05, "Pretrain/Loss": 1.9950127601623535, "Pretrain/Loss (Raw)": 1.9812896251678467, "Pretrain/Step": 7574, "Pretrain/Step Time": 8.475160213187337} +{"Pretrain/Learning Rate": 3.431108434102211e-05, "Pretrain/Loss": 1.9941834211349487, "Pretrain/Loss (Raw)": 2.0355544090270996, "Pretrain/Step": 7575, "Pretrain/Step Time": 8.474901823326945} +{"Pretrain/Learning Rate": 3.430714445960307e-05, "Pretrain/Loss": 1.995427131652832, "Pretrain/Loss (Raw)": 1.927986979484558, "Pretrain/Step": 7576, "Pretrain/Step Time": 8.46971870213747} +{"Pretrain/Learning Rate": 3.430320430981907e-05, "Pretrain/Loss": 1.9992789030075073, "Pretrain/Loss (Raw)": 2.103685140609741, "Pretrain/Step": 7577, "Pretrain/Step Time": 8.467737814411521} +{"Pretrain/Learning Rate": 3.429926389178374e-05, "Pretrain/Loss": 1.9953936338424683, "Pretrain/Loss (Raw)": 1.9952749013900757, "Pretrain/Step": 7578, "Pretrain/Step Time": 8.468281907960773} +{"Pretrain/Learning Rate": 3.429532320561069e-05, "Pretrain/Loss": 1.995305061340332, "Pretrain/Loss (Raw)": 1.9949740171432495, "Pretrain/Step": 7579, "Pretrain/Step Time": 8.469883291050792} +{"Pretrain/Learning Rate": 3.429138225141354e-05, "Pretrain/Loss": 1.9968208074569702, "Pretrain/Loss (Raw)": 2.1273720264434814, "Pretrain/Step": 7580, "Pretrain/Step Time": 8.469815198332071} +{"Pretrain/Learning Rate": 3.4287441029305936e-05, "Pretrain/Loss": 1.9985785484313965, "Pretrain/Loss (Raw)": 2.2358012199401855, "Pretrain/Step": 7581, "Pretrain/Step Time": 8.469215327873826} +{"Pretrain/Learning Rate": 3.428349953940151e-05, "Pretrain/Loss": 1.9987812042236328, "Pretrain/Loss (Raw)": 2.0197296142578125, "Pretrain/Step": 7582, "Pretrain/Step Time": 8.47298645786941} +{"Pretrain/Learning Rate": 3.4279557781813936e-05, "Pretrain/Loss": 2.000493288040161, "Pretrain/Loss (Raw)": 2.1387157440185547, "Pretrain/Step": 7583, "Pretrain/Step Time": 8.473309447988868} +{"Pretrain/Learning Rate": 3.4275615756656844e-05, "Pretrain/Loss": 2.000171184539795, "Pretrain/Loss (Raw)": 2.1125376224517822, "Pretrain/Step": 7584, "Pretrain/Step Time": 8.473056886345148} +{"Pretrain/Learning Rate": 3.4271673464043916e-05, "Pretrain/Loss": 2.0002405643463135, "Pretrain/Loss (Raw)": 1.9530619382858276, "Pretrain/Step": 7585, "Pretrain/Step Time": 8.474226059392095} +{"Pretrain/Learning Rate": 3.4267730904088815e-05, "Pretrain/Loss": 1.9993091821670532, "Pretrain/Loss (Raw)": 1.9413102865219116, "Pretrain/Step": 7586, "Pretrain/Step Time": 8.474698353558779} +{"Pretrain/Learning Rate": 3.426378807690522e-05, "Pretrain/Loss": 2.000619649887085, "Pretrain/Loss (Raw)": 2.0982413291931152, "Pretrain/Step": 7587, "Pretrain/Step Time": 8.472422020509839} +{"Pretrain/Learning Rate": 3.425984498260684e-05, "Pretrain/Loss": 2.0020692348480225, "Pretrain/Loss (Raw)": 2.1522867679595947, "Pretrain/Step": 7588, "Pretrain/Step Time": 8.478895826265216} +{"Pretrain/Learning Rate": 3.4255901621307355e-05, "Pretrain/Loss": 2.0032529830932617, "Pretrain/Loss (Raw)": 2.18522572517395, "Pretrain/Step": 7589, "Pretrain/Step Time": 8.480491261929274} +{"Pretrain/Learning Rate": 3.425195799312047e-05, "Pretrain/Loss": 2.0036208629608154, "Pretrain/Loss (Raw)": 2.202165365219116, "Pretrain/Step": 7590, "Pretrain/Step Time": 8.478716228157282} +{"Pretrain/Learning Rate": 3.42480140981599e-05, "Pretrain/Loss": 2.0043036937713623, "Pretrain/Loss (Raw)": 2.1223220825195312, "Pretrain/Step": 7591, "Pretrain/Step Time": 8.478805782273412} +{"Pretrain/Learning Rate": 3.424406993653936e-05, "Pretrain/Loss": 2.0087389945983887, "Pretrain/Loss (Raw)": 2.1154556274414062, "Pretrain/Step": 7592, "Pretrain/Step Time": 8.479927407577634} +{"Pretrain/Learning Rate": 3.424012550837258e-05, "Pretrain/Loss": 2.0096237659454346, "Pretrain/Loss (Raw)": 2.02866792678833, "Pretrain/Step": 7593, "Pretrain/Step Time": 8.478202356025577} +{"Pretrain/Learning Rate": 3.423618081377329e-05, "Pretrain/Loss": 2.0116159915924072, "Pretrain/Loss (Raw)": 2.2689003944396973, "Pretrain/Step": 7594, "Pretrain/Step Time": 8.479349292814732} +{"Pretrain/Learning Rate": 3.4232235852855245e-05, "Pretrain/Loss": 2.011115074157715, "Pretrain/Loss (Raw)": 2.014836072921753, "Pretrain/Step": 7595, "Pretrain/Step Time": 8.48464105091989} +{"Pretrain/Learning Rate": 3.4228290625732185e-05, "Pretrain/Loss": 2.0115103721618652, "Pretrain/Loss (Raw)": 1.907082200050354, "Pretrain/Step": 7596, "Pretrain/Step Time": 8.481746295467019} +{"Pretrain/Learning Rate": 3.422434513251787e-05, "Pretrain/Loss": 2.0105910301208496, "Pretrain/Loss (Raw)": 1.9667742252349854, "Pretrain/Step": 7597, "Pretrain/Step Time": 8.485110914334655} +{"Pretrain/Learning Rate": 3.422039937332607e-05, "Pretrain/Loss": 2.0094354152679443, "Pretrain/Loss (Raw)": 1.9689538478851318, "Pretrain/Step": 7598, "Pretrain/Step Time": 8.485343778505921} +{"Pretrain/Learning Rate": 3.421645334827055e-05, "Pretrain/Loss": 2.0081920623779297, "Pretrain/Loss (Raw)": 1.9881954193115234, "Pretrain/Step": 7599, "Pretrain/Step Time": 8.483161812648177} +{"Pretrain/Learning Rate": 3.421250705746509e-05, "Pretrain/Loss": 2.008713722229004, "Pretrain/Loss (Raw)": 2.097710371017456, "Pretrain/Step": 7600, "Pretrain/Step Time": 8.483972121030092} +{"Pretrain/Learning Rate": 3.420856050102349e-05, "Pretrain/Loss": 2.01265811920166, "Pretrain/Loss (Raw)": 2.2105495929718018, "Pretrain/Step": 7601, "Pretrain/Step Time": 8.487031999975443} +{"Pretrain/Learning Rate": 3.420461367905954e-05, "Pretrain/Loss": 2.010328769683838, "Pretrain/Loss (Raw)": 1.8789702653884888, "Pretrain/Step": 7602, "Pretrain/Step Time": 8.484167275950313} +{"Pretrain/Learning Rate": 3.4200666591687045e-05, "Pretrain/Loss": 2.011723518371582, "Pretrain/Loss (Raw)": 2.161979913711548, "Pretrain/Step": 7603, "Pretrain/Step Time": 8.486116265878081} +{"Pretrain/Learning Rate": 3.419671923901981e-05, "Pretrain/Loss": 2.0115535259246826, "Pretrain/Loss (Raw)": 2.1265931129455566, "Pretrain/Step": 7604, "Pretrain/Step Time": 8.485961578786373} +{"Pretrain/Learning Rate": 3.419277162117166e-05, "Pretrain/Loss": 2.0112786293029785, "Pretrain/Loss (Raw)": 2.038663148880005, "Pretrain/Step": 7605, "Pretrain/Step Time": 8.487336130812764} +{"Pretrain/Learning Rate": 3.418882373825642e-05, "Pretrain/Loss": 2.011420249938965, "Pretrain/Loss (Raw)": 1.9398730993270874, "Pretrain/Step": 7606, "Pretrain/Step Time": 8.486537862569094} +{"Pretrain/Learning Rate": 3.4184875590387924e-05, "Pretrain/Loss": 2.0119924545288086, "Pretrain/Loss (Raw)": 1.9168986082077026, "Pretrain/Step": 7607, "Pretrain/Step Time": 8.49067241512239} +{"Pretrain/Learning Rate": 3.4180927177680025e-05, "Pretrain/Loss": 2.013840675354004, "Pretrain/Loss (Raw)": 2.121812582015991, "Pretrain/Step": 7608, "Pretrain/Step Time": 8.487994607537985} +{"Pretrain/Learning Rate": 3.4176978500246554e-05, "Pretrain/Loss": 2.012932062149048, "Pretrain/Loss (Raw)": 1.8559250831604004, "Pretrain/Step": 7609, "Pretrain/Step Time": 8.484426023438573} +{"Pretrain/Learning Rate": 3.417302955820137e-05, "Pretrain/Loss": 2.012803792953491, "Pretrain/Loss (Raw)": 1.9240309000015259, "Pretrain/Step": 7610, "Pretrain/Step Time": 8.484703185036778} +{"Pretrain/Learning Rate": 3.416908035165836e-05, "Pretrain/Loss": 2.0133509635925293, "Pretrain/Loss (Raw)": 2.005715847015381, "Pretrain/Step": 7611, "Pretrain/Step Time": 8.481282467022538} +{"Pretrain/Learning Rate": 3.416513088073138e-05, "Pretrain/Loss": 2.011897087097168, "Pretrain/Loss (Raw)": 2.0484085083007812, "Pretrain/Step": 7612, "Pretrain/Step Time": 8.483083916828036} +{"Pretrain/Learning Rate": 3.41611811455343e-05, "Pretrain/Loss": 2.011352062225342, "Pretrain/Loss (Raw)": 1.94147527217865, "Pretrain/Step": 7613, "Pretrain/Step Time": 8.489180674776435} +{"Pretrain/Learning Rate": 3.415723114618104e-05, "Pretrain/Loss": 2.012423515319824, "Pretrain/Loss (Raw)": 2.200739860534668, "Pretrain/Step": 7614, "Pretrain/Step Time": 8.485778078436852} +{"Pretrain/Learning Rate": 3.415328088278546e-05, "Pretrain/Loss": 2.0136213302612305, "Pretrain/Loss (Raw)": 2.1216964721679688, "Pretrain/Step": 7615, "Pretrain/Step Time": 8.488708520308137} +{"Pretrain/Learning Rate": 3.414933035546149e-05, "Pretrain/Loss": 2.012505054473877, "Pretrain/Loss (Raw)": 1.7581595182418823, "Pretrain/Step": 7616, "Pretrain/Step Time": 8.49020447768271} +{"Pretrain/Learning Rate": 3.414537956432301e-05, "Pretrain/Loss": 2.012740135192871, "Pretrain/Loss (Raw)": 2.1203737258911133, "Pretrain/Step": 7617, "Pretrain/Step Time": 8.482230247929692} +{"Pretrain/Learning Rate": 3.414142850948397e-05, "Pretrain/Loss": 2.0107789039611816, "Pretrain/Loss (Raw)": 2.0180907249450684, "Pretrain/Step": 7618, "Pretrain/Step Time": 8.487616240978241} +{"Pretrain/Learning Rate": 3.413747719105828e-05, "Pretrain/Loss": 2.011592149734497, "Pretrain/Loss (Raw)": 2.095646381378174, "Pretrain/Step": 7619, "Pretrain/Step Time": 8.4887351449579} +{"Pretrain/Learning Rate": 3.413352560915988e-05, "Pretrain/Loss": 2.0152406692504883, "Pretrain/Loss (Raw)": 2.256897211074829, "Pretrain/Step": 7620, "Pretrain/Step Time": 8.488590111956} +{"Pretrain/Learning Rate": 3.412957376390271e-05, "Pretrain/Loss": 2.0156800746917725, "Pretrain/Loss (Raw)": 2.019704580307007, "Pretrain/Step": 7621, "Pretrain/Step Time": 8.488724205642939} +{"Pretrain/Learning Rate": 3.412562165540071e-05, "Pretrain/Loss": 2.0159833431243896, "Pretrain/Loss (Raw)": 2.038292407989502, "Pretrain/Step": 7622, "Pretrain/Step Time": 8.490147618576884} +{"Pretrain/Learning Rate": 3.4121669283767846e-05, "Pretrain/Loss": 2.0160746574401855, "Pretrain/Loss (Raw)": 2.0529909133911133, "Pretrain/Step": 7623, "Pretrain/Step Time": 8.483815448358655} +{"Pretrain/Learning Rate": 3.411771664911807e-05, "Pretrain/Loss": 2.0190083980560303, "Pretrain/Loss (Raw)": 2.156095027923584, "Pretrain/Step": 7624, "Pretrain/Step Time": 8.488220475614071} +{"Pretrain/Learning Rate": 3.411376375156537e-05, "Pretrain/Loss": 2.0210342407226562, "Pretrain/Loss (Raw)": 2.0092885494232178, "Pretrain/Step": 7625, "Pretrain/Step Time": 8.484015801921487} +{"Pretrain/Learning Rate": 3.410981059122372e-05, "Pretrain/Loss": 2.0224990844726562, "Pretrain/Loss (Raw)": 2.16213059425354, "Pretrain/Step": 7626, "Pretrain/Step Time": 8.481860285624862} +{"Pretrain/Learning Rate": 3.41058571682071e-05, "Pretrain/Loss": 2.024397373199463, "Pretrain/Loss (Raw)": 2.403135061264038, "Pretrain/Step": 7627, "Pretrain/Step Time": 8.482575038447976} +{"Pretrain/Learning Rate": 3.41019034826295e-05, "Pretrain/Loss": 2.0241920948028564, "Pretrain/Loss (Raw)": 2.018867015838623, "Pretrain/Step": 7628, "Pretrain/Step Time": 8.48323405906558} +{"Pretrain/Learning Rate": 3.4097949534604945e-05, "Pretrain/Loss": 2.024712562561035, "Pretrain/Loss (Raw)": 2.013538122177124, "Pretrain/Step": 7629, "Pretrain/Step Time": 8.484624331817031} +{"Pretrain/Learning Rate": 3.4093995324247426e-05, "Pretrain/Loss": 2.024311065673828, "Pretrain/Loss (Raw)": 2.004864454269409, "Pretrain/Step": 7630, "Pretrain/Step Time": 8.483857044950128} +{"Pretrain/Learning Rate": 3.409004085167096e-05, "Pretrain/Loss": 2.0258302688598633, "Pretrain/Loss (Raw)": 2.2142672538757324, "Pretrain/Step": 7631, "Pretrain/Step Time": 8.484091687947512} +{"Pretrain/Learning Rate": 3.408608611698956e-05, "Pretrain/Loss": 2.0236544609069824, "Pretrain/Loss (Raw)": 1.7904881238937378, "Pretrain/Step": 7632, "Pretrain/Step Time": 8.490396853536367} +{"Pretrain/Learning Rate": 3.4082131120317285e-05, "Pretrain/Loss": 2.022716999053955, "Pretrain/Loss (Raw)": 1.8559751510620117, "Pretrain/Step": 7633, "Pretrain/Step Time": 8.48542425967753} +{"Pretrain/Learning Rate": 3.407817586176816e-05, "Pretrain/Loss": 2.021909713745117, "Pretrain/Loss (Raw)": 1.985426664352417, "Pretrain/Step": 7634, "Pretrain/Step Time": 8.48372284322977} +{"Pretrain/Learning Rate": 3.407422034145624e-05, "Pretrain/Loss": 2.022336483001709, "Pretrain/Loss (Raw)": 1.9356729984283447, "Pretrain/Step": 7635, "Pretrain/Step Time": 8.483255688101053} +{"Pretrain/Learning Rate": 3.407026455949557e-05, "Pretrain/Loss": 2.0224757194519043, "Pretrain/Loss (Raw)": 1.9874869585037231, "Pretrain/Step": 7636, "Pretrain/Step Time": 8.488974500447512} +{"Pretrain/Learning Rate": 3.406630851600021e-05, "Pretrain/Loss": 2.024440288543701, "Pretrain/Loss (Raw)": 2.292790651321411, "Pretrain/Step": 7637, "Pretrain/Step Time": 8.487635925412178} +{"Pretrain/Learning Rate": 3.406235221108424e-05, "Pretrain/Loss": 2.0238211154937744, "Pretrain/Loss (Raw)": 2.0677576065063477, "Pretrain/Step": 7638, "Pretrain/Step Time": 8.484911061823368} +{"Pretrain/Learning Rate": 3.4058395644861726e-05, "Pretrain/Loss": 2.024984121322632, "Pretrain/Loss (Raw)": 2.1643259525299072, "Pretrain/Step": 7639, "Pretrain/Step Time": 8.483686376363039} +{"Pretrain/Learning Rate": 3.405443881744677e-05, "Pretrain/Loss": 2.0232176780700684, "Pretrain/Loss (Raw)": 1.7202731370925903, "Pretrain/Step": 7640, "Pretrain/Step Time": 8.483225541189313} +{"Pretrain/Learning Rate": 3.405048172895345e-05, "Pretrain/Loss": 2.0231776237487793, "Pretrain/Loss (Raw)": 1.8755053281784058, "Pretrain/Step": 7641, "Pretrain/Step Time": 8.48232988268137} +{"Pretrain/Learning Rate": 3.4046524379495865e-05, "Pretrain/Loss": 2.0236406326293945, "Pretrain/Loss (Raw)": 2.0977587699890137, "Pretrain/Step": 7642, "Pretrain/Step Time": 8.483404399827123} +{"Pretrain/Learning Rate": 3.404256676918813e-05, "Pretrain/Loss": 2.0244696140289307, "Pretrain/Loss (Raw)": 2.2379119396209717, "Pretrain/Step": 7643, "Pretrain/Step Time": 8.482099754735827} +{"Pretrain/Learning Rate": 3.403860889814435e-05, "Pretrain/Loss": 2.024216413497925, "Pretrain/Loss (Raw)": 2.0148956775665283, "Pretrain/Step": 7644, "Pretrain/Step Time": 8.48424612544477} +{"Pretrain/Learning Rate": 3.403465076647866e-05, "Pretrain/Loss": 2.0255703926086426, "Pretrain/Loss (Raw)": 2.0757057666778564, "Pretrain/Step": 7645, "Pretrain/Step Time": 8.480068570002913} +{"Pretrain/Learning Rate": 3.403069237430519e-05, "Pretrain/Loss": 2.0233583450317383, "Pretrain/Loss (Raw)": 1.9451894760131836, "Pretrain/Step": 7646, "Pretrain/Step Time": 8.480121225118637} +{"Pretrain/Learning Rate": 3.4026733721738066e-05, "Pretrain/Loss": 2.0209577083587646, "Pretrain/Loss (Raw)": 1.8576626777648926, "Pretrain/Step": 7647, "Pretrain/Step Time": 8.479674650356174} +{"Pretrain/Learning Rate": 3.402277480889144e-05, "Pretrain/Loss": 2.018101215362549, "Pretrain/Loss (Raw)": 1.7649486064910889, "Pretrain/Step": 7648, "Pretrain/Step Time": 8.483350107446313} +{"Pretrain/Learning Rate": 3.401881563587946e-05, "Pretrain/Loss": 2.017289638519287, "Pretrain/Loss (Raw)": 1.96632719039917, "Pretrain/Step": 7649, "Pretrain/Step Time": 8.479383878409863} +{"Pretrain/Learning Rate": 3.4014856202816284e-05, "Pretrain/Loss": 2.0183818340301514, "Pretrain/Loss (Raw)": 2.0950777530670166, "Pretrain/Step": 7650, "Pretrain/Step Time": 8.480276891961694} +{"Pretrain/Learning Rate": 3.40108965098161e-05, "Pretrain/Loss": 2.0181877613067627, "Pretrain/Loss (Raw)": 1.9465728998184204, "Pretrain/Step": 7651, "Pretrain/Step Time": 8.48828711360693} +{"Pretrain/Learning Rate": 3.400693655699306e-05, "Pretrain/Loss": 2.01694917678833, "Pretrain/Loss (Raw)": 2.094860553741455, "Pretrain/Step": 7652, "Pretrain/Step Time": 8.481544760987163} +{"Pretrain/Learning Rate": 3.4002976344461344e-05, "Pretrain/Loss": 2.020663261413574, "Pretrain/Loss (Raw)": 2.092973232269287, "Pretrain/Step": 7653, "Pretrain/Step Time": 8.484807638451457} +{"Pretrain/Learning Rate": 3.399901587233516e-05, "Pretrain/Loss": 2.0205631256103516, "Pretrain/Loss (Raw)": 1.9738831520080566, "Pretrain/Step": 7654, "Pretrain/Step Time": 8.484349740669131} +{"Pretrain/Learning Rate": 3.3995055140728696e-05, "Pretrain/Loss": 2.021913528442383, "Pretrain/Loss (Raw)": 2.1302695274353027, "Pretrain/Step": 7655, "Pretrain/Step Time": 8.47949805110693} +{"Pretrain/Learning Rate": 3.399109414975616e-05, "Pretrain/Loss": 2.0239696502685547, "Pretrain/Loss (Raw)": 2.12378191947937, "Pretrain/Step": 7656, "Pretrain/Step Time": 8.481145765632391} +{"Pretrain/Learning Rate": 3.398713289953177e-05, "Pretrain/Loss": 2.025376081466675, "Pretrain/Loss (Raw)": 1.9376972913742065, "Pretrain/Step": 7657, "Pretrain/Step Time": 8.48012606985867} +{"Pretrain/Learning Rate": 3.398317139016973e-05, "Pretrain/Loss": 2.025866985321045, "Pretrain/Loss (Raw)": 1.8777861595153809, "Pretrain/Step": 7658, "Pretrain/Step Time": 8.47608813457191} +{"Pretrain/Learning Rate": 3.397920962178428e-05, "Pretrain/Loss": 2.0253407955169678, "Pretrain/Loss (Raw)": 2.085092067718506, "Pretrain/Step": 7659, "Pretrain/Step Time": 8.474818659946322} +{"Pretrain/Learning Rate": 3.397524759448965e-05, "Pretrain/Loss": 2.025672197341919, "Pretrain/Loss (Raw)": 2.1220130920410156, "Pretrain/Step": 7660, "Pretrain/Step Time": 8.476489605382085} +{"Pretrain/Learning Rate": 3.397128530840007e-05, "Pretrain/Loss": 2.026538372039795, "Pretrain/Loss (Raw)": 2.2795464992523193, "Pretrain/Step": 7661, "Pretrain/Step Time": 8.476140098646283} +{"Pretrain/Learning Rate": 3.396732276362982e-05, "Pretrain/Loss": 2.0266926288604736, "Pretrain/Loss (Raw)": 2.1382100582122803, "Pretrain/Step": 7662, "Pretrain/Step Time": 8.474428506568074} +{"Pretrain/Learning Rate": 3.3963359960293126e-05, "Pretrain/Loss": 2.026423454284668, "Pretrain/Loss (Raw)": 2.013627529144287, "Pretrain/Step": 7663, "Pretrain/Step Time": 8.477219494059682} +{"Pretrain/Learning Rate": 3.3959396898504274e-05, "Pretrain/Loss": 2.0264620780944824, "Pretrain/Loss (Raw)": 1.8136152029037476, "Pretrain/Step": 7664, "Pretrain/Step Time": 8.478321023285389} +{"Pretrain/Learning Rate": 3.395543357837753e-05, "Pretrain/Loss": 2.0269546508789062, "Pretrain/Loss (Raw)": 2.068497657775879, "Pretrain/Step": 7665, "Pretrain/Step Time": 8.475225845351815} +{"Pretrain/Learning Rate": 3.3951470000027166e-05, "Pretrain/Loss": 2.026343822479248, "Pretrain/Loss (Raw)": 1.8038439750671387, "Pretrain/Step": 7666, "Pretrain/Step Time": 8.473595583811402} +{"Pretrain/Learning Rate": 3.394750616356748e-05, "Pretrain/Loss": 2.0263712406158447, "Pretrain/Loss (Raw)": 1.9520035982131958, "Pretrain/Step": 7667, "Pretrain/Step Time": 8.475251153111458} +{"Pretrain/Learning Rate": 3.394354206911275e-05, "Pretrain/Loss": 2.0265488624572754, "Pretrain/Loss (Raw)": 1.926175594329834, "Pretrain/Step": 7668, "Pretrain/Step Time": 8.479394050315022} +{"Pretrain/Learning Rate": 3.39395777167773e-05, "Pretrain/Loss": 2.0255887508392334, "Pretrain/Loss (Raw)": 2.039273977279663, "Pretrain/Step": 7669, "Pretrain/Step Time": 8.477339535951614} +{"Pretrain/Learning Rate": 3.393561310667542e-05, "Pretrain/Loss": 2.0274643898010254, "Pretrain/Loss (Raw)": 1.9811570644378662, "Pretrain/Step": 7670, "Pretrain/Step Time": 8.479981061071157} +{"Pretrain/Learning Rate": 3.393164823892144e-05, "Pretrain/Loss": 2.0263664722442627, "Pretrain/Loss (Raw)": 1.9581427574157715, "Pretrain/Step": 7671, "Pretrain/Step Time": 8.479011146351695} +{"Pretrain/Learning Rate": 3.392768311362969e-05, "Pretrain/Loss": 2.0265161991119385, "Pretrain/Loss (Raw)": 2.0898194313049316, "Pretrain/Step": 7672, "Pretrain/Step Time": 8.476108709350228} +{"Pretrain/Learning Rate": 3.392371773091448e-05, "Pretrain/Loss": 2.0225868225097656, "Pretrain/Loss (Raw)": 1.667106032371521, "Pretrain/Step": 7673, "Pretrain/Step Time": 8.480209613218904} +{"Pretrain/Learning Rate": 3.391975209089016e-05, "Pretrain/Loss": 2.022904872894287, "Pretrain/Loss (Raw)": 2.0753798484802246, "Pretrain/Step": 7674, "Pretrain/Step Time": 8.477534526959062} +{"Pretrain/Learning Rate": 3.391578619367108e-05, "Pretrain/Loss": 2.0262582302093506, "Pretrain/Loss (Raw)": 2.1415228843688965, "Pretrain/Step": 7675, "Pretrain/Step Time": 8.474513933062553} +{"Pretrain/Learning Rate": 3.3911820039371586e-05, "Pretrain/Loss": 2.0267159938812256, "Pretrain/Loss (Raw)": 2.2071642875671387, "Pretrain/Step": 7676, "Pretrain/Step Time": 8.471793366596103} +{"Pretrain/Learning Rate": 3.3907853628106046e-05, "Pretrain/Loss": 2.026262044906616, "Pretrain/Loss (Raw)": 1.886957049369812, "Pretrain/Step": 7677, "Pretrain/Step Time": 8.47647294215858} +{"Pretrain/Learning Rate": 3.390388695998883e-05, "Pretrain/Loss": 2.027573347091675, "Pretrain/Loss (Raw)": 2.157078504562378, "Pretrain/Step": 7678, "Pretrain/Step Time": 8.4828295186162} +{"Pretrain/Learning Rate": 3.389992003513431e-05, "Pretrain/Loss": 2.028763771057129, "Pretrain/Loss (Raw)": 2.1928555965423584, "Pretrain/Step": 7679, "Pretrain/Step Time": 8.482805190607905} +{"Pretrain/Learning Rate": 3.3895952853656864e-05, "Pretrain/Loss": 2.029256582260132, "Pretrain/Loss (Raw)": 2.0192933082580566, "Pretrain/Step": 7680, "Pretrain/Step Time": 8.481766073033214} +{"Pretrain/Learning Rate": 3.389198541567089e-05, "Pretrain/Loss": 2.0291051864624023, "Pretrain/Loss (Raw)": 2.005617141723633, "Pretrain/Step": 7681, "Pretrain/Step Time": 8.484853200614452} +{"Pretrain/Learning Rate": 3.388801772129079e-05, "Pretrain/Loss": 2.029142379760742, "Pretrain/Loss (Raw)": 1.8167237043380737, "Pretrain/Step": 7682, "Pretrain/Step Time": 8.479499803856015} +{"Pretrain/Learning Rate": 3.388404977063096e-05, "Pretrain/Loss": 2.02713680267334, "Pretrain/Loss (Raw)": 1.8736143112182617, "Pretrain/Step": 7683, "Pretrain/Step Time": 8.47784398496151} +{"Pretrain/Learning Rate": 3.388008156380582e-05, "Pretrain/Loss": 2.0269360542297363, "Pretrain/Loss (Raw)": 2.133169412612915, "Pretrain/Step": 7684, "Pretrain/Step Time": 8.48166548088193} +{"Pretrain/Learning Rate": 3.3876113100929784e-05, "Pretrain/Loss": 2.0259079933166504, "Pretrain/Loss (Raw)": 1.9558823108673096, "Pretrain/Step": 7685, "Pretrain/Step Time": 8.48017650283873} +{"Pretrain/Learning Rate": 3.387214438211729e-05, "Pretrain/Loss": 2.027628183364868, "Pretrain/Loss (Raw)": 2.0870392322540283, "Pretrain/Step": 7686, "Pretrain/Step Time": 8.480675829574466} +{"Pretrain/Learning Rate": 3.3868175407482764e-05, "Pretrain/Loss": 2.0279862880706787, "Pretrain/Loss (Raw)": 2.041872262954712, "Pretrain/Step": 7687, "Pretrain/Step Time": 8.480536185204983} +{"Pretrain/Learning Rate": 3.386420617714065e-05, "Pretrain/Loss": 2.027310371398926, "Pretrain/Loss (Raw)": 1.9314919710159302, "Pretrain/Step": 7688, "Pretrain/Step Time": 8.483292914927006} +{"Pretrain/Learning Rate": 3.38602366912054e-05, "Pretrain/Loss": 2.0273263454437256, "Pretrain/Loss (Raw)": 2.014666795730591, "Pretrain/Step": 7689, "Pretrain/Step Time": 8.483455056324601} +{"Pretrain/Learning Rate": 3.385626694979147e-05, "Pretrain/Loss": 2.028151512145996, "Pretrain/Loss (Raw)": 2.177717447280884, "Pretrain/Step": 7690, "Pretrain/Step Time": 8.478532258421183} +{"Pretrain/Learning Rate": 3.385229695301333e-05, "Pretrain/Loss": 2.0252373218536377, "Pretrain/Loss (Raw)": 1.808021903038025, "Pretrain/Step": 7691, "Pretrain/Step Time": 8.478923216462135} +{"Pretrain/Learning Rate": 3.384832670098544e-05, "Pretrain/Loss": 2.025021553039551, "Pretrain/Loss (Raw)": 1.942294716835022, "Pretrain/Step": 7692, "Pretrain/Step Time": 8.475351680070162} +{"Pretrain/Learning Rate": 3.3844356193822304e-05, "Pretrain/Loss": 2.024507999420166, "Pretrain/Loss (Raw)": 1.851563811302185, "Pretrain/Step": 7693, "Pretrain/Step Time": 8.473898639902472} +{"Pretrain/Learning Rate": 3.3840385431638375e-05, "Pretrain/Loss": 2.0259954929351807, "Pretrain/Loss (Raw)": 2.039029359817505, "Pretrain/Step": 7694, "Pretrain/Step Time": 8.475223949179053} +{"Pretrain/Learning Rate": 3.3836414414548175e-05, "Pretrain/Loss": 2.026394844055176, "Pretrain/Loss (Raw)": 2.1237707138061523, "Pretrain/Step": 7695, "Pretrain/Step Time": 8.472167506814003} +{"Pretrain/Learning Rate": 3.383244314266619e-05, "Pretrain/Loss": 2.0251593589782715, "Pretrain/Loss (Raw)": 1.8572778701782227, "Pretrain/Step": 7696, "Pretrain/Step Time": 8.480271423235536} +{"Pretrain/Learning Rate": 3.382847161610693e-05, "Pretrain/Loss": 2.026557445526123, "Pretrain/Loss (Raw)": 2.1300621032714844, "Pretrain/Step": 7697, "Pretrain/Step Time": 8.48219982534647} +{"Pretrain/Learning Rate": 3.3824499834984925e-05, "Pretrain/Loss": 2.0343799591064453, "Pretrain/Loss (Raw)": 2.6005191802978516, "Pretrain/Step": 7698, "Pretrain/Step Time": 8.47954423353076} +{"Pretrain/Learning Rate": 3.382052779941468e-05, "Pretrain/Loss": 2.0340514183044434, "Pretrain/Loss (Raw)": 1.8877060413360596, "Pretrain/Step": 7699, "Pretrain/Step Time": 8.482484703883529} +{"Pretrain/Learning Rate": 3.3816555509510736e-05, "Pretrain/Loss": 2.0314860343933105, "Pretrain/Loss (Raw)": 1.8177728652954102, "Pretrain/Step": 7700, "Pretrain/Step Time": 8.48489024490118} +{"Pretrain/Learning Rate": 3.381258296538763e-05, "Pretrain/Loss": 2.034019947052002, "Pretrain/Loss (Raw)": 2.2115635871887207, "Pretrain/Step": 7701, "Pretrain/Step Time": 8.483696615323424} +{"Pretrain/Learning Rate": 3.3808610167159907e-05, "Pretrain/Loss": 2.0337204933166504, "Pretrain/Loss (Raw)": 1.9429458379745483, "Pretrain/Step": 7702, "Pretrain/Step Time": 8.478672794997692} +{"Pretrain/Learning Rate": 3.380463711494211e-05, "Pretrain/Loss": 2.0355911254882812, "Pretrain/Loss (Raw)": 2.2750117778778076, "Pretrain/Step": 7703, "Pretrain/Step Time": 8.47822523675859} +{"Pretrain/Learning Rate": 3.380066380884882e-05, "Pretrain/Loss": 2.037550687789917, "Pretrain/Loss (Raw)": 2.1788065433502197, "Pretrain/Step": 7704, "Pretrain/Step Time": 8.481054220348597} +{"Pretrain/Learning Rate": 3.379669024899459e-05, "Pretrain/Loss": 2.0364840030670166, "Pretrain/Loss (Raw)": 1.9671825170516968, "Pretrain/Step": 7705, "Pretrain/Step Time": 8.480779575183988} +{"Pretrain/Learning Rate": 3.3792716435494e-05, "Pretrain/Loss": 2.0380845069885254, "Pretrain/Loss (Raw)": 2.2001261711120605, "Pretrain/Step": 7706, "Pretrain/Step Time": 8.481978440657258} +{"Pretrain/Learning Rate": 3.378874236846162e-05, "Pretrain/Loss": 2.04048752784729, "Pretrain/Loss (Raw)": 2.3025665283203125, "Pretrain/Step": 7707, "Pretrain/Step Time": 8.478695563971996} +{"Pretrain/Learning Rate": 3.378476804801206e-05, "Pretrain/Loss": 2.039807081222534, "Pretrain/Loss (Raw)": 2.0402672290802, "Pretrain/Step": 7708, "Pretrain/Step Time": 8.47993852943182} +{"Pretrain/Learning Rate": 3.37807934742599e-05, "Pretrain/Loss": 2.036689281463623, "Pretrain/Loss (Raw)": 1.836711049079895, "Pretrain/Step": 7709, "Pretrain/Step Time": 8.477265732362866} +{"Pretrain/Learning Rate": 3.377681864731976e-05, "Pretrain/Loss": 2.035432815551758, "Pretrain/Loss (Raw)": 1.8589164018630981, "Pretrain/Step": 7710, "Pretrain/Step Time": 8.480394687503576} +{"Pretrain/Learning Rate": 3.377284356730623e-05, "Pretrain/Loss": 2.032496690750122, "Pretrain/Loss (Raw)": 1.7628737688064575, "Pretrain/Step": 7711, "Pretrain/Step Time": 8.478808568790555} +{"Pretrain/Learning Rate": 3.376886823433395e-05, "Pretrain/Loss": 2.0317752361297607, "Pretrain/Loss (Raw)": 2.020186185836792, "Pretrain/Step": 7712, "Pretrain/Step Time": 8.48984189517796} +{"Pretrain/Learning Rate": 3.3764892648517526e-05, "Pretrain/Loss": 2.0321044921875, "Pretrain/Loss (Raw)": 1.9952117204666138, "Pretrain/Step": 7713, "Pretrain/Step Time": 8.486426781862974} +{"Pretrain/Learning Rate": 3.3760916809971604e-05, "Pretrain/Loss": 2.0322155952453613, "Pretrain/Loss (Raw)": 1.9555264711380005, "Pretrain/Step": 7714, "Pretrain/Step Time": 8.48429917730391} +{"Pretrain/Learning Rate": 3.375694071881083e-05, "Pretrain/Loss": 2.0310399532318115, "Pretrain/Loss (Raw)": 1.9477851390838623, "Pretrain/Step": 7715, "Pretrain/Step Time": 8.48322506248951} +{"Pretrain/Learning Rate": 3.375296437514984e-05, "Pretrain/Loss": 2.034318208694458, "Pretrain/Loss (Raw)": 2.571876049041748, "Pretrain/Step": 7716, "Pretrain/Step Time": 8.482716843485832} +{"Pretrain/Learning Rate": 3.3748987779103286e-05, "Pretrain/Loss": 2.032514810562134, "Pretrain/Loss (Raw)": 1.9544175863265991, "Pretrain/Step": 7717, "Pretrain/Step Time": 8.479781934991479} +{"Pretrain/Learning Rate": 3.374501093078584e-05, "Pretrain/Loss": 2.0305914878845215, "Pretrain/Loss (Raw)": 1.95595121383667, "Pretrain/Step": 7718, "Pretrain/Step Time": 8.483382731676102} +{"Pretrain/Learning Rate": 3.3741033830312176e-05, "Pretrain/Loss": 2.029177188873291, "Pretrain/Loss (Raw)": 1.9412970542907715, "Pretrain/Step": 7719, "Pretrain/Step Time": 8.480992322787642} +{"Pretrain/Learning Rate": 3.373705647779696e-05, "Pretrain/Loss": 2.029453754425049, "Pretrain/Loss (Raw)": 2.1508419513702393, "Pretrain/Step": 7720, "Pretrain/Step Time": 8.479738913476467} +{"Pretrain/Learning Rate": 3.373307887335487e-05, "Pretrain/Loss": 2.029106616973877, "Pretrain/Loss (Raw)": 1.9842712879180908, "Pretrain/Step": 7721, "Pretrain/Step Time": 8.4804975874722} +{"Pretrain/Learning Rate": 3.372910101710062e-05, "Pretrain/Loss": 2.0293707847595215, "Pretrain/Loss (Raw)": 2.3027236461639404, "Pretrain/Step": 7722, "Pretrain/Step Time": 8.47960646264255} +{"Pretrain/Learning Rate": 3.372512290914889e-05, "Pretrain/Loss": 2.0295028686523438, "Pretrain/Loss (Raw)": 2.0317025184631348, "Pretrain/Step": 7723, "Pretrain/Step Time": 8.478040212765336} +{"Pretrain/Learning Rate": 3.372114454961439e-05, "Pretrain/Loss": 2.030404567718506, "Pretrain/Loss (Raw)": 2.0225203037261963, "Pretrain/Step": 7724, "Pretrain/Step Time": 8.480360738933086} +{"Pretrain/Learning Rate": 3.371716593861184e-05, "Pretrain/Loss": 2.0324575901031494, "Pretrain/Loss (Raw)": 2.2295663356781006, "Pretrain/Step": 7725, "Pretrain/Step Time": 8.476346036419272} +{"Pretrain/Learning Rate": 3.371318707625595e-05, "Pretrain/Loss": 2.032802104949951, "Pretrain/Loss (Raw)": 2.013042688369751, "Pretrain/Step": 7726, "Pretrain/Step Time": 8.477540455758572} +{"Pretrain/Learning Rate": 3.3709207962661454e-05, "Pretrain/Loss": 2.0330076217651367, "Pretrain/Loss (Raw)": 2.0144846439361572, "Pretrain/Step": 7727, "Pretrain/Step Time": 8.479269228875637} +{"Pretrain/Learning Rate": 3.370522859794308e-05, "Pretrain/Loss": 2.0357251167297363, "Pretrain/Loss (Raw)": 2.4455556869506836, "Pretrain/Step": 7728, "Pretrain/Step Time": 8.489668073132634} +{"Pretrain/Learning Rate": 3.370124898221559e-05, "Pretrain/Loss": 2.0343151092529297, "Pretrain/Loss (Raw)": 2.0300776958465576, "Pretrain/Step": 7729, "Pretrain/Step Time": 8.48597295023501} +{"Pretrain/Learning Rate": 3.3697269115593714e-05, "Pretrain/Loss": 2.0358452796936035, "Pretrain/Loss (Raw)": 2.0748372077941895, "Pretrain/Step": 7730, "Pretrain/Step Time": 8.486222259700298} +{"Pretrain/Learning Rate": 3.3693288998192216e-05, "Pretrain/Loss": 2.033437728881836, "Pretrain/Loss (Raw)": 1.853834867477417, "Pretrain/Step": 7731, "Pretrain/Step Time": 8.484738981351256} +{"Pretrain/Learning Rate": 3.3689308630125846e-05, "Pretrain/Loss": 2.032353162765503, "Pretrain/Loss (Raw)": 1.987734079360962, "Pretrain/Step": 7732, "Pretrain/Step Time": 8.48535150103271} +{"Pretrain/Learning Rate": 3.36853280115094e-05, "Pretrain/Loss": 2.0335092544555664, "Pretrain/Loss (Raw)": 2.1866672039031982, "Pretrain/Step": 7733, "Pretrain/Step Time": 8.483976874500513} +{"Pretrain/Learning Rate": 3.368134714245764e-05, "Pretrain/Loss": 2.0359537601470947, "Pretrain/Loss (Raw)": 2.2527530193328857, "Pretrain/Step": 7734, "Pretrain/Step Time": 8.483710223808885} +{"Pretrain/Learning Rate": 3.367736602308536e-05, "Pretrain/Loss": 2.038334846496582, "Pretrain/Loss (Raw)": 2.221689462661743, "Pretrain/Step": 7735, "Pretrain/Step Time": 8.478430243209004} +{"Pretrain/Learning Rate": 3.3673384653507343e-05, "Pretrain/Loss": 2.038919687271118, "Pretrain/Loss (Raw)": 2.196678876876831, "Pretrain/Step": 7736, "Pretrain/Step Time": 8.48182307742536} +{"Pretrain/Learning Rate": 3.366940303383839e-05, "Pretrain/Loss": 2.037662982940674, "Pretrain/Loss (Raw)": 1.6950597763061523, "Pretrain/Step": 7737, "Pretrain/Step Time": 8.478289553895593} +{"Pretrain/Learning Rate": 3.3665421164193314e-05, "Pretrain/Loss": 2.0398519039154053, "Pretrain/Loss (Raw)": 2.2042112350463867, "Pretrain/Step": 7738, "Pretrain/Step Time": 8.478280007839203} +{"Pretrain/Learning Rate": 3.3661439044686933e-05, "Pretrain/Loss": 2.039957284927368, "Pretrain/Loss (Raw)": 2.019197463989258, "Pretrain/Step": 7739, "Pretrain/Step Time": 8.480136862024665} +{"Pretrain/Learning Rate": 3.365745667543406e-05, "Pretrain/Loss": 2.040513277053833, "Pretrain/Loss (Raw)": 2.1195671558380127, "Pretrain/Step": 7740, "Pretrain/Step Time": 8.477785862982273} +{"Pretrain/Learning Rate": 3.365347405654953e-05, "Pretrain/Loss": 2.0408289432525635, "Pretrain/Loss (Raw)": 1.981881856918335, "Pretrain/Step": 7741, "Pretrain/Step Time": 8.474210064858198} +{"Pretrain/Learning Rate": 3.3649491188148175e-05, "Pretrain/Loss": 2.039355754852295, "Pretrain/Loss (Raw)": 2.0121984481811523, "Pretrain/Step": 7742, "Pretrain/Step Time": 8.476274386048317} +{"Pretrain/Learning Rate": 3.3645508070344836e-05, "Pretrain/Loss": 2.0395166873931885, "Pretrain/Loss (Raw)": 2.142284870147705, "Pretrain/Step": 7743, "Pretrain/Step Time": 8.478588474914432} +{"Pretrain/Learning Rate": 3.364152470325436e-05, "Pretrain/Loss": 2.040147542953491, "Pretrain/Loss (Raw)": 1.8389145135879517, "Pretrain/Step": 7744, "Pretrain/Step Time": 8.476986180990934} +{"Pretrain/Learning Rate": 3.363754108699162e-05, "Pretrain/Loss": 2.0397186279296875, "Pretrain/Loss (Raw)": 2.0654518604278564, "Pretrain/Step": 7745, "Pretrain/Step Time": 8.47963248565793} +{"Pretrain/Learning Rate": 3.363355722167147e-05, "Pretrain/Loss": 2.040724992752075, "Pretrain/Loss (Raw)": 2.1469216346740723, "Pretrain/Step": 7746, "Pretrain/Step Time": 8.475048772990704} +{"Pretrain/Learning Rate": 3.3629573107408786e-05, "Pretrain/Loss": 2.039659261703491, "Pretrain/Loss (Raw)": 1.9592255353927612, "Pretrain/Step": 7747, "Pretrain/Step Time": 8.474560985341668} +{"Pretrain/Learning Rate": 3.3625588744318445e-05, "Pretrain/Loss": 2.0380611419677734, "Pretrain/Loss (Raw)": 2.0523126125335693, "Pretrain/Step": 7748, "Pretrain/Step Time": 8.47416416555643} +{"Pretrain/Learning Rate": 3.3621604132515324e-05, "Pretrain/Loss": 2.0393919944763184, "Pretrain/Loss (Raw)": 2.1900689601898193, "Pretrain/Step": 7749, "Pretrain/Step Time": 8.477743245661259} +{"Pretrain/Learning Rate": 3.361761927211433e-05, "Pretrain/Loss": 2.03916072845459, "Pretrain/Loss (Raw)": 2.0086870193481445, "Pretrain/Step": 7750, "Pretrain/Step Time": 8.475039327517152} +{"Pretrain/Learning Rate": 3.361363416323037e-05, "Pretrain/Loss": 2.0381453037261963, "Pretrain/Loss (Raw)": 1.9230544567108154, "Pretrain/Step": 7751, "Pretrain/Step Time": 8.477524379268289} +{"Pretrain/Learning Rate": 3.360964880597833e-05, "Pretrain/Loss": 2.0366246700286865, "Pretrain/Loss (Raw)": 1.961439609527588, "Pretrain/Step": 7752, "Pretrain/Step Time": 8.474833158776164} +{"Pretrain/Learning Rate": 3.360566320047314e-05, "Pretrain/Loss": 2.036954402923584, "Pretrain/Loss (Raw)": 2.0514907836914062, "Pretrain/Step": 7753, "Pretrain/Step Time": 8.475033266469836} +{"Pretrain/Learning Rate": 3.360167734682971e-05, "Pretrain/Loss": 2.0369582176208496, "Pretrain/Loss (Raw)": 2.1625983715057373, "Pretrain/Step": 7754, "Pretrain/Step Time": 8.47757675498724} +{"Pretrain/Learning Rate": 3.359769124516299e-05, "Pretrain/Loss": 2.0329580307006836, "Pretrain/Loss (Raw)": 1.8911458253860474, "Pretrain/Step": 7755, "Pretrain/Step Time": 8.474520487710834} +{"Pretrain/Learning Rate": 3.35937048955879e-05, "Pretrain/Loss": 2.0320520401000977, "Pretrain/Loss (Raw)": 1.9028561115264893, "Pretrain/Step": 7756, "Pretrain/Step Time": 8.474431907758117} +{"Pretrain/Learning Rate": 3.3589718298219386e-05, "Pretrain/Loss": 2.031157970428467, "Pretrain/Loss (Raw)": 1.899124026298523, "Pretrain/Step": 7757, "Pretrain/Step Time": 8.473373353481293} +{"Pretrain/Learning Rate": 3.3585731453172396e-05, "Pretrain/Loss": 2.0329599380493164, "Pretrain/Loss (Raw)": 2.2354962825775146, "Pretrain/Step": 7758, "Pretrain/Step Time": 8.471656613051891} +{"Pretrain/Learning Rate": 3.358174436056189e-05, "Pretrain/Loss": 2.0308146476745605, "Pretrain/Loss (Raw)": 1.9396809339523315, "Pretrain/Step": 7759, "Pretrain/Step Time": 8.468073172494769} +{"Pretrain/Learning Rate": 3.357775702050285e-05, "Pretrain/Loss": 2.031287431716919, "Pretrain/Loss (Raw)": 1.851021409034729, "Pretrain/Step": 7760, "Pretrain/Step Time": 8.469593161717057} +{"Pretrain/Learning Rate": 3.357376943311022e-05, "Pretrain/Loss": 2.0317578315734863, "Pretrain/Loss (Raw)": 1.9161924123764038, "Pretrain/Step": 7761, "Pretrain/Step Time": 8.474006285890937} +{"Pretrain/Learning Rate": 3.3569781598499e-05, "Pretrain/Loss": 2.030038833618164, "Pretrain/Loss (Raw)": 1.765382170677185, "Pretrain/Step": 7762, "Pretrain/Step Time": 8.475770834833384} +{"Pretrain/Learning Rate": 3.356579351678416e-05, "Pretrain/Loss": 2.0310096740722656, "Pretrain/Loss (Raw)": 2.0599186420440674, "Pretrain/Step": 7763, "Pretrain/Step Time": 8.472444824874401} +{"Pretrain/Learning Rate": 3.356180518808071e-05, "Pretrain/Loss": 2.029909133911133, "Pretrain/Loss (Raw)": 1.8466377258300781, "Pretrain/Step": 7764, "Pretrain/Step Time": 8.471371181309223} +{"Pretrain/Learning Rate": 3.355781661250364e-05, "Pretrain/Loss": 2.028446912765503, "Pretrain/Loss (Raw)": 2.105605125427246, "Pretrain/Step": 7765, "Pretrain/Step Time": 8.469843234866858} +{"Pretrain/Learning Rate": 3.355382779016797e-05, "Pretrain/Loss": 2.028049945831299, "Pretrain/Loss (Raw)": 2.016991138458252, "Pretrain/Step": 7766, "Pretrain/Step Time": 8.4709946885705} +{"Pretrain/Learning Rate": 3.35498387211887e-05, "Pretrain/Loss": 2.027376413345337, "Pretrain/Loss (Raw)": 2.0780980587005615, "Pretrain/Step": 7767, "Pretrain/Step Time": 8.469811407849193} +{"Pretrain/Learning Rate": 3.3545849405680854e-05, "Pretrain/Loss": 2.030409336090088, "Pretrain/Loss (Raw)": 2.1084601879119873, "Pretrain/Step": 7768, "Pretrain/Step Time": 8.472990281879902} +{"Pretrain/Learning Rate": 3.354185984375946e-05, "Pretrain/Loss": 2.0298023223876953, "Pretrain/Loss (Raw)": 1.7978249788284302, "Pretrain/Step": 7769, "Pretrain/Step Time": 8.47285258024931} +{"Pretrain/Learning Rate": 3.353787003553957e-05, "Pretrain/Loss": 2.0291123390197754, "Pretrain/Loss (Raw)": 2.0094358921051025, "Pretrain/Step": 7770, "Pretrain/Step Time": 8.468295089900494} +{"Pretrain/Learning Rate": 3.353387998113621e-05, "Pretrain/Loss": 2.0292904376983643, "Pretrain/Loss (Raw)": 2.26072359085083, "Pretrain/Step": 7771, "Pretrain/Step Time": 8.471182314679027} +{"Pretrain/Learning Rate": 3.352988968066444e-05, "Pretrain/Loss": 2.0296521186828613, "Pretrain/Loss (Raw)": 2.0611648559570312, "Pretrain/Step": 7772, "Pretrain/Step Time": 8.467134952545166} +{"Pretrain/Learning Rate": 3.3525899134239314e-05, "Pretrain/Loss": 2.0307722091674805, "Pretrain/Loss (Raw)": 2.2191109657287598, "Pretrain/Step": 7773, "Pretrain/Step Time": 8.47052233852446} +{"Pretrain/Learning Rate": 3.3521908341975895e-05, "Pretrain/Loss": 2.0308308601379395, "Pretrain/Loss (Raw)": 1.9527018070220947, "Pretrain/Step": 7774, "Pretrain/Step Time": 8.468740168958902} +{"Pretrain/Learning Rate": 3.3517917303989255e-05, "Pretrain/Loss": 2.0304598808288574, "Pretrain/Loss (Raw)": 1.810171127319336, "Pretrain/Step": 7775, "Pretrain/Step Time": 8.470773492008448} +{"Pretrain/Learning Rate": 3.3513926020394475e-05, "Pretrain/Loss": 2.0317907333374023, "Pretrain/Loss (Raw)": 1.9352856874465942, "Pretrain/Step": 7776, "Pretrain/Step Time": 8.464180752635002} +{"Pretrain/Learning Rate": 3.350993449130664e-05, "Pretrain/Loss": 2.032794952392578, "Pretrain/Loss (Raw)": 2.094883918762207, "Pretrain/Step": 7777, "Pretrain/Step Time": 8.46798351407051} +{"Pretrain/Learning Rate": 3.350594271684085e-05, "Pretrain/Loss": 2.0322580337524414, "Pretrain/Loss (Raw)": 2.0263354778289795, "Pretrain/Step": 7778, "Pretrain/Step Time": 8.469616506248713} +{"Pretrain/Learning Rate": 3.35019506971122e-05, "Pretrain/Loss": 2.033909797668457, "Pretrain/Loss (Raw)": 2.157992362976074, "Pretrain/Step": 7779, "Pretrain/Step Time": 8.46268168836832} +{"Pretrain/Learning Rate": 3.349795843223578e-05, "Pretrain/Loss": 2.0336661338806152, "Pretrain/Loss (Raw)": 2.063652515411377, "Pretrain/Step": 7780, "Pretrain/Step Time": 8.462381955236197} +{"Pretrain/Learning Rate": 3.349396592232673e-05, "Pretrain/Loss": 2.0307602882385254, "Pretrain/Loss (Raw)": 1.7210545539855957, "Pretrain/Step": 7781, "Pretrain/Step Time": 8.46164378337562} +{"Pretrain/Learning Rate": 3.348997316750015e-05, "Pretrain/Loss": 2.0307207107543945, "Pretrain/Loss (Raw)": 1.968808650970459, "Pretrain/Step": 7782, "Pretrain/Step Time": 8.461985010653734} +{"Pretrain/Learning Rate": 3.348598016787119e-05, "Pretrain/Loss": 2.0304722785949707, "Pretrain/Loss (Raw)": 2.0984597206115723, "Pretrain/Step": 7783, "Pretrain/Step Time": 8.459231454879045} +{"Pretrain/Learning Rate": 3.348198692355498e-05, "Pretrain/Loss": 2.0293803215026855, "Pretrain/Loss (Raw)": 1.9840161800384521, "Pretrain/Step": 7784, "Pretrain/Step Time": 8.462600510567427} +{"Pretrain/Learning Rate": 3.347799343466664e-05, "Pretrain/Loss": 2.030313491821289, "Pretrain/Loss (Raw)": 2.0571625232696533, "Pretrain/Step": 7785, "Pretrain/Step Time": 8.463098801672459} +{"Pretrain/Learning Rate": 3.347399970132135e-05, "Pretrain/Loss": 2.033329963684082, "Pretrain/Loss (Raw)": 2.2638931274414062, "Pretrain/Step": 7786, "Pretrain/Step Time": 8.463341489434242} +{"Pretrain/Learning Rate": 3.3470005723634237e-05, "Pretrain/Loss": 2.033033847808838, "Pretrain/Loss (Raw)": 2.0471549034118652, "Pretrain/Step": 7787, "Pretrain/Step Time": 8.46285848133266} +{"Pretrain/Learning Rate": 3.346601150172048e-05, "Pretrain/Loss": 2.032921552658081, "Pretrain/Loss (Raw)": 2.107671022415161, "Pretrain/Step": 7788, "Pretrain/Step Time": 8.462407423183322} +{"Pretrain/Learning Rate": 3.346201703569527e-05, "Pretrain/Loss": 2.0310049057006836, "Pretrain/Loss (Raw)": 2.034217119216919, "Pretrain/Step": 7789, "Pretrain/Step Time": 8.462567312642932} +{"Pretrain/Learning Rate": 3.345802232567375e-05, "Pretrain/Loss": 2.030665874481201, "Pretrain/Loss (Raw)": 2.094811201095581, "Pretrain/Step": 7790, "Pretrain/Step Time": 8.463992591947317} +{"Pretrain/Learning Rate": 3.345402737177112e-05, "Pretrain/Loss": 2.031379222869873, "Pretrain/Loss (Raw)": 2.1049351692199707, "Pretrain/Step": 7791, "Pretrain/Step Time": 8.464108211919665} +{"Pretrain/Learning Rate": 3.345003217410257e-05, "Pretrain/Loss": 2.033128261566162, "Pretrain/Loss (Raw)": 2.037489891052246, "Pretrain/Step": 7792, "Pretrain/Step Time": 8.460601143538952} +{"Pretrain/Learning Rate": 3.3446036732783297e-05, "Pretrain/Loss": 2.0315234661102295, "Pretrain/Loss (Raw)": 1.8630698919296265, "Pretrain/Step": 7793, "Pretrain/Step Time": 8.465527635067701} +{"Pretrain/Learning Rate": 3.344204104792852e-05, "Pretrain/Loss": 2.0337486267089844, "Pretrain/Loss (Raw)": 2.088672637939453, "Pretrain/Step": 7794, "Pretrain/Step Time": 8.468501521274447} +{"Pretrain/Learning Rate": 3.343804511965343e-05, "Pretrain/Loss": 2.0344297885894775, "Pretrain/Loss (Raw)": 2.039191484451294, "Pretrain/Step": 7795, "Pretrain/Step Time": 8.464833365753293} +{"Pretrain/Learning Rate": 3.343404894807326e-05, "Pretrain/Loss": 2.0340309143066406, "Pretrain/Loss (Raw)": 1.8751083612442017, "Pretrain/Step": 7796, "Pretrain/Step Time": 8.460534365847707} +{"Pretrain/Learning Rate": 3.343005253330323e-05, "Pretrain/Loss": 2.031707525253296, "Pretrain/Loss (Raw)": 1.7419034242630005, "Pretrain/Step": 7797, "Pretrain/Step Time": 8.469888692721725} +{"Pretrain/Learning Rate": 3.3426055875458585e-05, "Pretrain/Loss": 2.032069683074951, "Pretrain/Loss (Raw)": 2.0274879932403564, "Pretrain/Step": 7798, "Pretrain/Step Time": 8.46422960050404} +{"Pretrain/Learning Rate": 3.342205897465456e-05, "Pretrain/Loss": 2.0337133407592773, "Pretrain/Loss (Raw)": 2.168536424636841, "Pretrain/Step": 7799, "Pretrain/Step Time": 8.468417314812541} +{"Pretrain/Learning Rate": 3.341806183100639e-05, "Pretrain/Loss": 2.035219669342041, "Pretrain/Loss (Raw)": 2.2826499938964844, "Pretrain/Step": 7800, "Pretrain/Step Time": 8.46507953107357} +{"Pretrain/Learning Rate": 3.341406444462935e-05, "Pretrain/Loss": 2.0367722511291504, "Pretrain/Loss (Raw)": 1.8658217191696167, "Pretrain/Step": 7801, "Pretrain/Step Time": 8.46851272135973} +{"Pretrain/Learning Rate": 3.341006681563869e-05, "Pretrain/Loss": 2.0364670753479004, "Pretrain/Loss (Raw)": 2.036289930343628, "Pretrain/Step": 7802, "Pretrain/Step Time": 8.46855429187417} +{"Pretrain/Learning Rate": 3.3406068944149684e-05, "Pretrain/Loss": 2.0352835655212402, "Pretrain/Loss (Raw)": 1.990057110786438, "Pretrain/Step": 7803, "Pretrain/Step Time": 8.466661736369133} +{"Pretrain/Learning Rate": 3.340207083027761e-05, "Pretrain/Loss": 2.0340375900268555, "Pretrain/Loss (Raw)": 2.047689437866211, "Pretrain/Step": 7804, "Pretrain/Step Time": 8.468239875510335} +{"Pretrain/Learning Rate": 3.339807247413774e-05, "Pretrain/Loss": 2.0373148918151855, "Pretrain/Loss (Raw)": 2.3064682483673096, "Pretrain/Step": 7805, "Pretrain/Step Time": 8.466006826609373} +{"Pretrain/Learning Rate": 3.3394073875845375e-05, "Pretrain/Loss": 2.035153388977051, "Pretrain/Loss (Raw)": 1.8803906440734863, "Pretrain/Step": 7806, "Pretrain/Step Time": 8.459921095520258} +{"Pretrain/Learning Rate": 3.33900750355158e-05, "Pretrain/Loss": 2.032801628112793, "Pretrain/Loss (Raw)": 1.891838788986206, "Pretrain/Step": 7807, "Pretrain/Step Time": 8.464593721553683} +{"Pretrain/Learning Rate": 3.338607595326434e-05, "Pretrain/Loss": 2.0336830615997314, "Pretrain/Loss (Raw)": 2.132105827331543, "Pretrain/Step": 7808, "Pretrain/Step Time": 8.463100612163544} +{"Pretrain/Learning Rate": 3.338207662920628e-05, "Pretrain/Loss": 2.033316135406494, "Pretrain/Loss (Raw)": 1.9586238861083984, "Pretrain/Step": 7809, "Pretrain/Step Time": 8.46205285936594} +{"Pretrain/Learning Rate": 3.337807706345695e-05, "Pretrain/Loss": 2.034512758255005, "Pretrain/Loss (Raw)": 1.9699127674102783, "Pretrain/Step": 7810, "Pretrain/Step Time": 8.462397685274482} +{"Pretrain/Learning Rate": 3.337407725613168e-05, "Pretrain/Loss": 2.0344605445861816, "Pretrain/Loss (Raw)": 1.8669350147247314, "Pretrain/Step": 7811, "Pretrain/Step Time": 8.465352544561028} +{"Pretrain/Learning Rate": 3.337007720734579e-05, "Pretrain/Loss": 2.0344595909118652, "Pretrain/Loss (Raw)": 2.1330442428588867, "Pretrain/Step": 7812, "Pretrain/Step Time": 8.458453599363565} +{"Pretrain/Learning Rate": 3.336607691721463e-05, "Pretrain/Loss": 2.0347740650177, "Pretrain/Loss (Raw)": 1.996128797531128, "Pretrain/Step": 7813, "Pretrain/Step Time": 8.461575025692582} +{"Pretrain/Learning Rate": 3.336207638585354e-05, "Pretrain/Loss": 2.033442497253418, "Pretrain/Loss (Raw)": 1.9166017770767212, "Pretrain/Step": 7814, "Pretrain/Step Time": 8.462325435131788} +{"Pretrain/Learning Rate": 3.3358075613377865e-05, "Pretrain/Loss": 2.0325889587402344, "Pretrain/Loss (Raw)": 1.9326646327972412, "Pretrain/Step": 7815, "Pretrain/Step Time": 8.463660564273596} +{"Pretrain/Learning Rate": 3.3354074599902976e-05, "Pretrain/Loss": 2.0330958366394043, "Pretrain/Loss (Raw)": 1.996324896812439, "Pretrain/Step": 7816, "Pretrain/Step Time": 8.461712857708335} +{"Pretrain/Learning Rate": 3.335007334554423e-05, "Pretrain/Loss": 2.0323472023010254, "Pretrain/Loss (Raw)": 1.9188498258590698, "Pretrain/Step": 7817, "Pretrain/Step Time": 8.460355618968606} +{"Pretrain/Learning Rate": 3.334607185041701e-05, "Pretrain/Loss": 2.0303001403808594, "Pretrain/Loss (Raw)": 1.9157041311264038, "Pretrain/Step": 7818, "Pretrain/Step Time": 8.460843851789832} +{"Pretrain/Learning Rate": 3.334207011463669e-05, "Pretrain/Loss": 2.034327745437622, "Pretrain/Loss (Raw)": 2.323565721511841, "Pretrain/Step": 7819, "Pretrain/Step Time": 8.458438467234373} +{"Pretrain/Learning Rate": 3.333806813831867e-05, "Pretrain/Loss": 2.0343680381774902, "Pretrain/Loss (Raw)": 1.9474191665649414, "Pretrain/Step": 7820, "Pretrain/Step Time": 8.461160216480494} +{"Pretrain/Learning Rate": 3.333406592157832e-05, "Pretrain/Loss": 2.035365104675293, "Pretrain/Loss (Raw)": 1.9791946411132812, "Pretrain/Step": 7821, "Pretrain/Step Time": 8.463382413610816} +{"Pretrain/Learning Rate": 3.3330063464531056e-05, "Pretrain/Loss": 2.035027503967285, "Pretrain/Loss (Raw)": 1.9958164691925049, "Pretrain/Step": 7822, "Pretrain/Step Time": 8.460973279550672} +{"Pretrain/Learning Rate": 3.3326060767292286e-05, "Pretrain/Loss": 2.034414291381836, "Pretrain/Loss (Raw)": 2.045287609100342, "Pretrain/Step": 7823, "Pretrain/Step Time": 8.463094230741262} +{"Pretrain/Learning Rate": 3.3322057829977424e-05, "Pretrain/Loss": 2.0335025787353516, "Pretrain/Loss (Raw)": 1.740572452545166, "Pretrain/Step": 7824, "Pretrain/Step Time": 8.457219861447811} +{"Pretrain/Learning Rate": 3.331805465270189e-05, "Pretrain/Loss": 2.032869577407837, "Pretrain/Loss (Raw)": 2.049039602279663, "Pretrain/Step": 7825, "Pretrain/Step Time": 8.453710613772273} +{"Pretrain/Learning Rate": 3.3314051235581126e-05, "Pretrain/Loss": 2.0310733318328857, "Pretrain/Loss (Raw)": 2.3705990314483643, "Pretrain/Step": 7826, "Pretrain/Step Time": 8.458675980567932} +{"Pretrain/Learning Rate": 3.331004757873054e-05, "Pretrain/Loss": 2.033322334289551, "Pretrain/Loss (Raw)": 2.1755778789520264, "Pretrain/Step": 7827, "Pretrain/Step Time": 8.455994211137295} +{"Pretrain/Learning Rate": 3.33060436822656e-05, "Pretrain/Loss": 2.0359041690826416, "Pretrain/Loss (Raw)": 2.1482601165771484, "Pretrain/Step": 7828, "Pretrain/Step Time": 8.45073276385665} +{"Pretrain/Learning Rate": 3.330203954630173e-05, "Pretrain/Loss": 2.0343706607818604, "Pretrain/Loss (Raw)": 2.0152623653411865, "Pretrain/Step": 7829, "Pretrain/Step Time": 8.451077470555902} +{"Pretrain/Learning Rate": 3.329803517095442e-05, "Pretrain/Loss": 2.0356078147888184, "Pretrain/Loss (Raw)": 2.1013007164001465, "Pretrain/Step": 7830, "Pretrain/Step Time": 8.452948573976755} +{"Pretrain/Learning Rate": 3.3294030556339106e-05, "Pretrain/Loss": 2.034447193145752, "Pretrain/Loss (Raw)": 2.1264595985412598, "Pretrain/Step": 7831, "Pretrain/Step Time": 8.451458675786853} +{"Pretrain/Learning Rate": 3.329002570257127e-05, "Pretrain/Loss": 2.032409191131592, "Pretrain/Loss (Raw)": 1.91791570186615, "Pretrain/Step": 7832, "Pretrain/Step Time": 8.452606488019228} +{"Pretrain/Learning Rate": 3.328602060976639e-05, "Pretrain/Loss": 2.0330300331115723, "Pretrain/Loss (Raw)": 2.0466811656951904, "Pretrain/Step": 7833, "Pretrain/Step Time": 8.449821036309004} +{"Pretrain/Learning Rate": 3.328201527803994e-05, "Pretrain/Loss": 2.0328474044799805, "Pretrain/Loss (Raw)": 2.176743984222412, "Pretrain/Step": 7834, "Pretrain/Step Time": 8.449273182079196} +{"Pretrain/Learning Rate": 3.327800970750742e-05, "Pretrain/Loss": 2.0306293964385986, "Pretrain/Loss (Raw)": 2.0186593532562256, "Pretrain/Step": 7835, "Pretrain/Step Time": 8.451208231970668} +{"Pretrain/Learning Rate": 3.327400389828433e-05, "Pretrain/Loss": 2.027310371398926, "Pretrain/Loss (Raw)": 1.615422010421753, "Pretrain/Step": 7836, "Pretrain/Step Time": 8.456465436145663} +{"Pretrain/Learning Rate": 3.326999785048617e-05, "Pretrain/Loss": 2.027212142944336, "Pretrain/Loss (Raw)": 1.8241599798202515, "Pretrain/Step": 7837, "Pretrain/Step Time": 8.457765243947506} +{"Pretrain/Learning Rate": 3.326599156422845e-05, "Pretrain/Loss": 2.0292601585388184, "Pretrain/Loss (Raw)": 2.121056318283081, "Pretrain/Step": 7838, "Pretrain/Step Time": 8.451824381947517} +{"Pretrain/Learning Rate": 3.326198503962669e-05, "Pretrain/Loss": 2.0315322875976562, "Pretrain/Loss (Raw)": 2.053722858428955, "Pretrain/Step": 7839, "Pretrain/Step Time": 8.449554830789566} +{"Pretrain/Learning Rate": 3.3257978276796414e-05, "Pretrain/Loss": 2.0329980850219727, "Pretrain/Loss (Raw)": 2.2077865600585938, "Pretrain/Step": 7840, "Pretrain/Step Time": 8.441671328619123} +{"Pretrain/Learning Rate": 3.3253971275853163e-05, "Pretrain/Loss": 2.0343713760375977, "Pretrain/Loss (Raw)": 2.1709840297698975, "Pretrain/Step": 7841, "Pretrain/Step Time": 8.445290388539433} +{"Pretrain/Learning Rate": 3.324996403691246e-05, "Pretrain/Loss": 2.0353190898895264, "Pretrain/Loss (Raw)": 2.076836347579956, "Pretrain/Step": 7842, "Pretrain/Step Time": 8.4471450522542} +{"Pretrain/Learning Rate": 3.324595656008986e-05, "Pretrain/Loss": 2.037808895111084, "Pretrain/Loss (Raw)": 2.266500234603882, "Pretrain/Step": 7843, "Pretrain/Step Time": 8.44696980342269} +{"Pretrain/Learning Rate": 3.3241948845500924e-05, "Pretrain/Loss": 2.0336081981658936, "Pretrain/Loss (Raw)": 2.0341787338256836, "Pretrain/Step": 7844, "Pretrain/Step Time": 8.443477304652333} +{"Pretrain/Learning Rate": 3.32379408932612e-05, "Pretrain/Loss": 2.0328476428985596, "Pretrain/Loss (Raw)": 1.8570609092712402, "Pretrain/Step": 7845, "Pretrain/Step Time": 8.444970775395632} +{"Pretrain/Learning Rate": 3.3233932703486255e-05, "Pretrain/Loss": 2.0348358154296875, "Pretrain/Loss (Raw)": 2.210447311401367, "Pretrain/Step": 7846, "Pretrain/Step Time": 8.443201733753085} +{"Pretrain/Learning Rate": 3.322992427629167e-05, "Pretrain/Loss": 2.034254789352417, "Pretrain/Loss (Raw)": 1.8669129610061646, "Pretrain/Step": 7847, "Pretrain/Step Time": 8.444522371515632} +{"Pretrain/Learning Rate": 3.322591561179301e-05, "Pretrain/Loss": 2.03299617767334, "Pretrain/Loss (Raw)": 1.9897466897964478, "Pretrain/Step": 7848, "Pretrain/Step Time": 8.445648638531566} +{"Pretrain/Learning Rate": 3.322190671010588e-05, "Pretrain/Loss": 2.0339691638946533, "Pretrain/Loss (Raw)": 2.1087844371795654, "Pretrain/Step": 7849, "Pretrain/Step Time": 8.444917952641845} +{"Pretrain/Learning Rate": 3.3217897571345865e-05, "Pretrain/Loss": 2.033937931060791, "Pretrain/Loss (Raw)": 2.298724412918091, "Pretrain/Step": 7850, "Pretrain/Step Time": 8.442701509222388} +{"Pretrain/Learning Rate": 3.321388819562856e-05, "Pretrain/Loss": 2.0323634147644043, "Pretrain/Loss (Raw)": 1.8301702737808228, "Pretrain/Step": 7851, "Pretrain/Step Time": 8.4456601832062} +{"Pretrain/Learning Rate": 3.32098785830696e-05, "Pretrain/Loss": 2.0319106578826904, "Pretrain/Loss (Raw)": 1.964581847190857, "Pretrain/Step": 7852, "Pretrain/Step Time": 8.443193910643458} +{"Pretrain/Learning Rate": 3.320586873378456e-05, "Pretrain/Loss": 2.030402660369873, "Pretrain/Loss (Raw)": 2.036555051803589, "Pretrain/Step": 7853, "Pretrain/Step Time": 8.44322009012103} +{"Pretrain/Learning Rate": 3.320185864788908e-05, "Pretrain/Loss": 2.0302953720092773, "Pretrain/Loss (Raw)": 1.999315619468689, "Pretrain/Step": 7854, "Pretrain/Step Time": 8.44267295487225} +{"Pretrain/Learning Rate": 3.319784832549879e-05, "Pretrain/Loss": 2.032794237136841, "Pretrain/Loss (Raw)": 2.3343262672424316, "Pretrain/Step": 7855, "Pretrain/Step Time": 8.442349802702665} +{"Pretrain/Learning Rate": 3.319383776672933e-05, "Pretrain/Loss": 2.032282590866089, "Pretrain/Loss (Raw)": 2.380053758621216, "Pretrain/Step": 7856, "Pretrain/Step Time": 8.43132969737053} +{"Pretrain/Learning Rate": 3.318982697169633e-05, "Pretrain/Loss": 2.0326812267303467, "Pretrain/Loss (Raw)": 2.081115245819092, "Pretrain/Step": 7857, "Pretrain/Step Time": 8.4335503783077} +{"Pretrain/Learning Rate": 3.318581594051544e-05, "Pretrain/Loss": 2.0330631732940674, "Pretrain/Loss (Raw)": 2.1237196922302246, "Pretrain/Step": 7858, "Pretrain/Step Time": 8.431621342897415} +{"Pretrain/Learning Rate": 3.318180467330232e-05, "Pretrain/Loss": 2.0346450805664062, "Pretrain/Loss (Raw)": 2.056332588195801, "Pretrain/Step": 7859, "Pretrain/Step Time": 8.429941043257713} +{"Pretrain/Learning Rate": 3.3177793170172626e-05, "Pretrain/Loss": 2.0352060794830322, "Pretrain/Loss (Raw)": 2.059537887573242, "Pretrain/Step": 7860, "Pretrain/Step Time": 8.429729916155338} +{"Pretrain/Learning Rate": 3.3173781431242036e-05, "Pretrain/Loss": 2.0346579551696777, "Pretrain/Loss (Raw)": 2.116501569747925, "Pretrain/Step": 7861, "Pretrain/Step Time": 8.430976282805204} +{"Pretrain/Learning Rate": 3.316976945662622e-05, "Pretrain/Loss": 2.0338077545166016, "Pretrain/Loss (Raw)": 2.1439340114593506, "Pretrain/Step": 7862, "Pretrain/Step Time": 8.427849369123578} +{"Pretrain/Learning Rate": 3.3165757246440864e-05, "Pretrain/Loss": 2.0326004028320312, "Pretrain/Loss (Raw)": 2.0671632289886475, "Pretrain/Step": 7863, "Pretrain/Step Time": 8.429377505555749} +{"Pretrain/Learning Rate": 3.316174480080165e-05, "Pretrain/Loss": 2.0313913822174072, "Pretrain/Loss (Raw)": 2.041903257369995, "Pretrain/Step": 7864, "Pretrain/Step Time": 8.429535415023565} +{"Pretrain/Learning Rate": 3.315773211982427e-05, "Pretrain/Loss": 2.0337412357330322, "Pretrain/Loss (Raw)": 1.9958258867263794, "Pretrain/Step": 7865, "Pretrain/Step Time": 8.430996099486947} +{"Pretrain/Learning Rate": 3.315371920362445e-05, "Pretrain/Loss": 2.0334715843200684, "Pretrain/Loss (Raw)": 2.1697256565093994, "Pretrain/Step": 7866, "Pretrain/Step Time": 8.432259092107415} +{"Pretrain/Learning Rate": 3.3149706052317886e-05, "Pretrain/Loss": 2.0323898792266846, "Pretrain/Loss (Raw)": 1.8807332515716553, "Pretrain/Step": 7867, "Pretrain/Step Time": 8.432069003582} +{"Pretrain/Learning Rate": 3.314569266602029e-05, "Pretrain/Loss": 2.0316994190216064, "Pretrain/Loss (Raw)": 2.031174659729004, "Pretrain/Step": 7868, "Pretrain/Step Time": 8.434394670650363} +{"Pretrain/Learning Rate": 3.3141679044847376e-05, "Pretrain/Loss": 2.032128095626831, "Pretrain/Loss (Raw)": 2.0367519855499268, "Pretrain/Step": 7869, "Pretrain/Step Time": 8.430927956476808} +{"Pretrain/Learning Rate": 3.3137665188914894e-05, "Pretrain/Loss": 2.032806158065796, "Pretrain/Loss (Raw)": 2.098999261856079, "Pretrain/Step": 7870, "Pretrain/Step Time": 8.429583156481385} +{"Pretrain/Learning Rate": 3.313365109833858e-05, "Pretrain/Loss": 2.032541036605835, "Pretrain/Loss (Raw)": 2.108344316482544, "Pretrain/Step": 7871, "Pretrain/Step Time": 8.428465204313397} +{"Pretrain/Learning Rate": 3.312963677323416e-05, "Pretrain/Loss": 2.0333023071289062, "Pretrain/Loss (Raw)": 1.9363356828689575, "Pretrain/Step": 7872, "Pretrain/Step Time": 8.429641045629978} +{"Pretrain/Learning Rate": 3.31256222137174e-05, "Pretrain/Loss": 2.0332627296447754, "Pretrain/Loss (Raw)": 2.060417890548706, "Pretrain/Step": 7873, "Pretrain/Step Time": 8.42980275861919} +{"Pretrain/Learning Rate": 3.312160741990405e-05, "Pretrain/Loss": 2.0343592166900635, "Pretrain/Loss (Raw)": 2.2872722148895264, "Pretrain/Step": 7874, "Pretrain/Step Time": 8.429056832566857} +{"Pretrain/Learning Rate": 3.3117592391909874e-05, "Pretrain/Loss": 2.0343546867370605, "Pretrain/Loss (Raw)": 1.9586567878723145, "Pretrain/Step": 7875, "Pretrain/Step Time": 8.4284733440727} +{"Pretrain/Learning Rate": 3.311357712985065e-05, "Pretrain/Loss": 2.0337166786193848, "Pretrain/Loss (Raw)": 1.9706387519836426, "Pretrain/Step": 7876, "Pretrain/Step Time": 8.43071836605668} +{"Pretrain/Learning Rate": 3.310956163384214e-05, "Pretrain/Loss": 2.032472610473633, "Pretrain/Loss (Raw)": 2.0308194160461426, "Pretrain/Step": 7877, "Pretrain/Step Time": 8.428556699305773} +{"Pretrain/Learning Rate": 3.310554590400014e-05, "Pretrain/Loss": 2.03354549407959, "Pretrain/Loss (Raw)": 2.146040439605713, "Pretrain/Step": 7878, "Pretrain/Step Time": 8.427907455712557} +{"Pretrain/Learning Rate": 3.310152994044045e-05, "Pretrain/Loss": 2.0353622436523438, "Pretrain/Loss (Raw)": 2.1555938720703125, "Pretrain/Step": 7879, "Pretrain/Step Time": 8.423614356666803} +{"Pretrain/Learning Rate": 3.309751374327884e-05, "Pretrain/Loss": 2.0341386795043945, "Pretrain/Loss (Raw)": 1.804824709892273, "Pretrain/Step": 7880, "Pretrain/Step Time": 8.424265557900071} +{"Pretrain/Learning Rate": 3.3093497312631136e-05, "Pretrain/Loss": 2.0324816703796387, "Pretrain/Loss (Raw)": 1.8393412828445435, "Pretrain/Step": 7881, "Pretrain/Step Time": 8.426086753606796} +{"Pretrain/Learning Rate": 3.3089480648613136e-05, "Pretrain/Loss": 2.0302414894104004, "Pretrain/Loss (Raw)": 1.8758949041366577, "Pretrain/Step": 7882, "Pretrain/Step Time": 8.423709513619542} +{"Pretrain/Learning Rate": 3.3085463751340666e-05, "Pretrain/Loss": 2.029444694519043, "Pretrain/Loss (Raw)": 1.7891336679458618, "Pretrain/Step": 7883, "Pretrain/Step Time": 8.423912348225713} +{"Pretrain/Learning Rate": 3.3081446620929554e-05, "Pretrain/Loss": 2.0321950912475586, "Pretrain/Loss (Raw)": 2.2549092769622803, "Pretrain/Step": 7884, "Pretrain/Step Time": 8.422460861504078} +{"Pretrain/Learning Rate": 3.3077429257495626e-05, "Pretrain/Loss": 2.031935930252075, "Pretrain/Loss (Raw)": 1.865949273109436, "Pretrain/Step": 7885, "Pretrain/Step Time": 8.42623358592391} +{"Pretrain/Learning Rate": 3.3073411661154715e-05, "Pretrain/Loss": 2.029390573501587, "Pretrain/Loss (Raw)": 1.9097087383270264, "Pretrain/Step": 7886, "Pretrain/Step Time": 8.424820261076093} +{"Pretrain/Learning Rate": 3.3069393832022676e-05, "Pretrain/Loss": 2.031545639038086, "Pretrain/Loss (Raw)": 2.215519428253174, "Pretrain/Step": 7887, "Pretrain/Step Time": 8.43183759227395} +{"Pretrain/Learning Rate": 3.306537577021535e-05, "Pretrain/Loss": 2.03391170501709, "Pretrain/Loss (Raw)": 2.1539080142974854, "Pretrain/Step": 7888, "Pretrain/Step Time": 8.42489055916667} +{"Pretrain/Learning Rate": 3.3061357475848606e-05, "Pretrain/Loss": 2.033356189727783, "Pretrain/Loss (Raw)": 1.8450448513031006, "Pretrain/Step": 7889, "Pretrain/Step Time": 8.424619322642684} +{"Pretrain/Learning Rate": 3.305733894903829e-05, "Pretrain/Loss": 2.0366714000701904, "Pretrain/Loss (Raw)": 2.189751386642456, "Pretrain/Step": 7890, "Pretrain/Step Time": 8.424885146319866} +{"Pretrain/Learning Rate": 3.305332018990029e-05, "Pretrain/Loss": 2.0366504192352295, "Pretrain/Loss (Raw)": 2.0572338104248047, "Pretrain/Step": 7891, "Pretrain/Step Time": 8.422809824347496} +{"Pretrain/Learning Rate": 3.3049301198550484e-05, "Pretrain/Loss": 2.0381970405578613, "Pretrain/Loss (Raw)": 2.0445902347564697, "Pretrain/Step": 7892, "Pretrain/Step Time": 8.427278535440564} +{"Pretrain/Learning Rate": 3.3045281975104744e-05, "Pretrain/Loss": 2.0347418785095215, "Pretrain/Loss (Raw)": 1.6633574962615967, "Pretrain/Step": 7893, "Pretrain/Step Time": 8.429451797157526} +{"Pretrain/Learning Rate": 3.304126251967899e-05, "Pretrain/Loss": 2.035097360610962, "Pretrain/Loss (Raw)": 2.062486171722412, "Pretrain/Step": 7894, "Pretrain/Step Time": 8.42833018116653} +{"Pretrain/Learning Rate": 3.303724283238907e-05, "Pretrain/Loss": 2.03458309173584, "Pretrain/Loss (Raw)": 2.0122618675231934, "Pretrain/Step": 7895, "Pretrain/Step Time": 8.431065211072564} +{"Pretrain/Learning Rate": 3.303322291335094e-05, "Pretrain/Loss": 2.0348761081695557, "Pretrain/Loss (Raw)": 2.1459927558898926, "Pretrain/Step": 7896, "Pretrain/Step Time": 8.426484758034348} +{"Pretrain/Learning Rate": 3.3029202762680484e-05, "Pretrain/Loss": 2.037353992462158, "Pretrain/Loss (Raw)": 2.1149864196777344, "Pretrain/Step": 7897, "Pretrain/Step Time": 8.425482492893934} +{"Pretrain/Learning Rate": 3.3025182380493625e-05, "Pretrain/Loss": 2.037003993988037, "Pretrain/Loss (Raw)": 1.9646093845367432, "Pretrain/Step": 7898, "Pretrain/Step Time": 8.426672482863069} +{"Pretrain/Learning Rate": 3.3021161766906295e-05, "Pretrain/Loss": 2.0352206230163574, "Pretrain/Loss (Raw)": 2.0324788093566895, "Pretrain/Step": 7899, "Pretrain/Step Time": 8.430550644174218} +{"Pretrain/Learning Rate": 3.301714092203442e-05, "Pretrain/Loss": 2.0346434116363525, "Pretrain/Loss (Raw)": 1.9872756004333496, "Pretrain/Step": 7900, "Pretrain/Step Time": 8.433977147564292} +{"Pretrain/Learning Rate": 3.301311984599393e-05, "Pretrain/Loss": 2.031564235687256, "Pretrain/Loss (Raw)": 1.8249670267105103, "Pretrain/Step": 7901, "Pretrain/Step Time": 8.433678656816483} +{"Pretrain/Learning Rate": 3.300909853890078e-05, "Pretrain/Loss": 2.032867670059204, "Pretrain/Loss (Raw)": 2.11954665184021, "Pretrain/Step": 7902, "Pretrain/Step Time": 8.432955464348197} +{"Pretrain/Learning Rate": 3.300507700087092e-05, "Pretrain/Loss": 2.0388941764831543, "Pretrain/Loss (Raw)": 2.581573009490967, "Pretrain/Step": 7903, "Pretrain/Step Time": 8.429755613207817} +{"Pretrain/Learning Rate": 3.300105523202032e-05, "Pretrain/Loss": 2.039228916168213, "Pretrain/Loss (Raw)": 1.978145956993103, "Pretrain/Step": 7904, "Pretrain/Step Time": 8.433188807219267} +{"Pretrain/Learning Rate": 3.2997033232464926e-05, "Pretrain/Loss": 2.0386128425598145, "Pretrain/Loss (Raw)": 2.0159854888916016, "Pretrain/Step": 7905, "Pretrain/Step Time": 8.432269550859928} +{"Pretrain/Learning Rate": 3.2993011002320705e-05, "Pretrain/Loss": 2.039388656616211, "Pretrain/Loss (Raw)": 2.125659704208374, "Pretrain/Step": 7906, "Pretrain/Step Time": 8.431107154116035} +{"Pretrain/Learning Rate": 3.298898854170366e-05, "Pretrain/Loss": 2.0387895107269287, "Pretrain/Loss (Raw)": 2.0813066959381104, "Pretrain/Step": 7907, "Pretrain/Step Time": 8.435496306046844} +{"Pretrain/Learning Rate": 3.298496585072975e-05, "Pretrain/Loss": 2.0378596782684326, "Pretrain/Loss (Raw)": 1.9446097612380981, "Pretrain/Step": 7908, "Pretrain/Step Time": 8.437825253233314} +{"Pretrain/Learning Rate": 3.298094292951499e-05, "Pretrain/Loss": 2.0403966903686523, "Pretrain/Loss (Raw)": 2.0458033084869385, "Pretrain/Step": 7909, "Pretrain/Step Time": 8.437370277941227} +{"Pretrain/Learning Rate": 3.297691977817537e-05, "Pretrain/Loss": 2.040632724761963, "Pretrain/Loss (Raw)": 1.9990211725234985, "Pretrain/Step": 7910, "Pretrain/Step Time": 8.437134690582752} +{"Pretrain/Learning Rate": 3.2972896396826885e-05, "Pretrain/Loss": 2.0406999588012695, "Pretrain/Loss (Raw)": 2.1070549488067627, "Pretrain/Step": 7911, "Pretrain/Step Time": 8.437442699447274} +{"Pretrain/Learning Rate": 3.2968872785585544e-05, "Pretrain/Loss": 2.042288303375244, "Pretrain/Loss (Raw)": 2.1873421669006348, "Pretrain/Step": 7912, "Pretrain/Step Time": 8.43480209261179} +{"Pretrain/Learning Rate": 3.2964848944567386e-05, "Pretrain/Loss": 2.0416131019592285, "Pretrain/Loss (Raw)": 1.970747709274292, "Pretrain/Step": 7913, "Pretrain/Step Time": 8.432028535753489} +{"Pretrain/Learning Rate": 3.2960824873888415e-05, "Pretrain/Loss": 2.040128707885742, "Pretrain/Loss (Raw)": 2.073882579803467, "Pretrain/Step": 7914, "Pretrain/Step Time": 8.435340076684952} +{"Pretrain/Learning Rate": 3.295680057366468e-05, "Pretrain/Loss": 2.0439720153808594, "Pretrain/Loss (Raw)": 2.539079427719116, "Pretrain/Step": 7915, "Pretrain/Step Time": 8.4353994615376} +{"Pretrain/Learning Rate": 3.2952776044012206e-05, "Pretrain/Loss": 2.043266773223877, "Pretrain/Loss (Raw)": 2.017430305480957, "Pretrain/Step": 7916, "Pretrain/Step Time": 8.437243796885014} +{"Pretrain/Learning Rate": 3.294875128504704e-05, "Pretrain/Loss": 2.043058156967163, "Pretrain/Loss (Raw)": 2.007498025894165, "Pretrain/Step": 7917, "Pretrain/Step Time": 8.439028007909656} +{"Pretrain/Learning Rate": 3.294472629688524e-05, "Pretrain/Loss": 2.0414655208587646, "Pretrain/Loss (Raw)": 1.8909496068954468, "Pretrain/Step": 7918, "Pretrain/Step Time": 8.445725126191974} +{"Pretrain/Learning Rate": 3.2940701079642846e-05, "Pretrain/Loss": 2.0406930446624756, "Pretrain/Loss (Raw)": 2.006068468093872, "Pretrain/Step": 7919, "Pretrain/Step Time": 8.442163832485676} +{"Pretrain/Learning Rate": 3.293667563343594e-05, "Pretrain/Loss": 2.0405616760253906, "Pretrain/Loss (Raw)": 2.020684003829956, "Pretrain/Step": 7920, "Pretrain/Step Time": 8.442387208342552} +{"Pretrain/Learning Rate": 3.293264995838059e-05, "Pretrain/Loss": 2.038896083831787, "Pretrain/Loss (Raw)": 1.649875283241272, "Pretrain/Step": 7921, "Pretrain/Step Time": 8.437519650906324} +{"Pretrain/Learning Rate": 3.2928624054592873e-05, "Pretrain/Loss": 2.0391769409179688, "Pretrain/Loss (Raw)": 2.124601364135742, "Pretrain/Step": 7922, "Pretrain/Step Time": 8.43491922877729} +{"Pretrain/Learning Rate": 3.292459792218886e-05, "Pretrain/Loss": 2.0393569469451904, "Pretrain/Loss (Raw)": 2.0622503757476807, "Pretrain/Step": 7923, "Pretrain/Step Time": 8.435257509350777} +{"Pretrain/Learning Rate": 3.292057156128466e-05, "Pretrain/Loss": 2.041438341140747, "Pretrain/Loss (Raw)": 2.141512155532837, "Pretrain/Step": 7924, "Pretrain/Step Time": 8.439258022233844} +{"Pretrain/Learning Rate": 3.291654497199636e-05, "Pretrain/Loss": 2.043771743774414, "Pretrain/Loss (Raw)": 2.0405635833740234, "Pretrain/Step": 7925, "Pretrain/Step Time": 8.431097533553839} +{"Pretrain/Learning Rate": 3.291251815444007e-05, "Pretrain/Loss": 2.044126510620117, "Pretrain/Loss (Raw)": 2.072922468185425, "Pretrain/Step": 7926, "Pretrain/Step Time": 8.431416196748614} +{"Pretrain/Learning Rate": 3.290849110873189e-05, "Pretrain/Loss": 2.0433390140533447, "Pretrain/Loss (Raw)": 2.067720651626587, "Pretrain/Step": 7927, "Pretrain/Step Time": 8.435594625771046} +{"Pretrain/Learning Rate": 3.290446383498795e-05, "Pretrain/Loss": 2.0403122901916504, "Pretrain/Loss (Raw)": 1.8952322006225586, "Pretrain/Step": 7928, "Pretrain/Step Time": 8.438092002645135} +{"Pretrain/Learning Rate": 3.2900436333324364e-05, "Pretrain/Loss": 2.041806221008301, "Pretrain/Loss (Raw)": 2.05704665184021, "Pretrain/Step": 7929, "Pretrain/Step Time": 8.43292417936027} +{"Pretrain/Learning Rate": 3.289640860385726e-05, "Pretrain/Loss": 2.0420279502868652, "Pretrain/Loss (Raw)": 2.0647034645080566, "Pretrain/Step": 7930, "Pretrain/Step Time": 8.432809269055724} +{"Pretrain/Learning Rate": 3.28923806467028e-05, "Pretrain/Loss": 2.041409492492676, "Pretrain/Loss (Raw)": 1.9108775854110718, "Pretrain/Step": 7931, "Pretrain/Step Time": 8.435930678620934} +{"Pretrain/Learning Rate": 3.288835246197709e-05, "Pretrain/Loss": 2.0405044555664062, "Pretrain/Loss (Raw)": 1.9318041801452637, "Pretrain/Step": 7932, "Pretrain/Step Time": 8.438356034457684} +{"Pretrain/Learning Rate": 3.288432404979631e-05, "Pretrain/Loss": 2.0371570587158203, "Pretrain/Loss (Raw)": 1.8780505657196045, "Pretrain/Step": 7933, "Pretrain/Step Time": 8.438070975244045} +{"Pretrain/Learning Rate": 3.2880295410276594e-05, "Pretrain/Loss": 2.0384867191314697, "Pretrain/Loss (Raw)": 2.0505545139312744, "Pretrain/Step": 7934, "Pretrain/Step Time": 8.446588553488255} +{"Pretrain/Learning Rate": 3.287626654353412e-05, "Pretrain/Loss": 2.0386624336242676, "Pretrain/Loss (Raw)": 1.914353609085083, "Pretrain/Step": 7935, "Pretrain/Step Time": 8.440871367231011} +{"Pretrain/Learning Rate": 3.2872237449685056e-05, "Pretrain/Loss": 2.0362565517425537, "Pretrain/Loss (Raw)": 1.824150562286377, "Pretrain/Step": 7936, "Pretrain/Step Time": 8.441592875868082} +{"Pretrain/Learning Rate": 3.286820812884557e-05, "Pretrain/Loss": 2.0365066528320312, "Pretrain/Loss (Raw)": 1.990609884262085, "Pretrain/Step": 7937, "Pretrain/Step Time": 8.438105987384915} +{"Pretrain/Learning Rate": 3.286417858113185e-05, "Pretrain/Loss": 2.036160945892334, "Pretrain/Loss (Raw)": 1.9256916046142578, "Pretrain/Step": 7938, "Pretrain/Step Time": 8.43911479972303} +{"Pretrain/Learning Rate": 3.286014880666008e-05, "Pretrain/Loss": 2.0380241870880127, "Pretrain/Loss (Raw)": 2.105433702468872, "Pretrain/Step": 7939, "Pretrain/Step Time": 8.440789954736829} +{"Pretrain/Learning Rate": 3.285611880554647e-05, "Pretrain/Loss": 2.037583827972412, "Pretrain/Loss (Raw)": 2.076652765274048, "Pretrain/Step": 7940, "Pretrain/Step Time": 8.443406770005822} +{"Pretrain/Learning Rate": 3.2852088577907206e-05, "Pretrain/Loss": 2.0363337993621826, "Pretrain/Loss (Raw)": 1.8361226320266724, "Pretrain/Step": 7941, "Pretrain/Step Time": 8.442268846556544} +{"Pretrain/Learning Rate": 3.2848058123858504e-05, "Pretrain/Loss": 2.0363993644714355, "Pretrain/Loss (Raw)": 1.924972653388977, "Pretrain/Step": 7942, "Pretrain/Step Time": 8.440293367952108} +{"Pretrain/Learning Rate": 3.284402744351658e-05, "Pretrain/Loss": 2.036456346511841, "Pretrain/Loss (Raw)": 1.939990758895874, "Pretrain/Step": 7943, "Pretrain/Step Time": 8.44159267283976} +{"Pretrain/Learning Rate": 3.2839996536997645e-05, "Pretrain/Loss": 2.033559799194336, "Pretrain/Loss (Raw)": 1.6255580186843872, "Pretrain/Step": 7944, "Pretrain/Step Time": 8.442874973639846} +{"Pretrain/Learning Rate": 3.283596540441795e-05, "Pretrain/Loss": 2.034472942352295, "Pretrain/Loss (Raw)": 2.035737991333008, "Pretrain/Step": 7945, "Pretrain/Step Time": 8.445891909301281} +{"Pretrain/Learning Rate": 3.283193404589371e-05, "Pretrain/Loss": 2.0357742309570312, "Pretrain/Loss (Raw)": 2.082287549972534, "Pretrain/Step": 7946, "Pretrain/Step Time": 8.446292223408818} +{"Pretrain/Learning Rate": 3.282790246154117e-05, "Pretrain/Loss": 2.0316033363342285, "Pretrain/Loss (Raw)": 1.7896829843521118, "Pretrain/Step": 7947, "Pretrain/Step Time": 8.44525589235127} +{"Pretrain/Learning Rate": 3.282387065147659e-05, "Pretrain/Loss": 2.030609369277954, "Pretrain/Loss (Raw)": 1.8201814889907837, "Pretrain/Step": 7948, "Pretrain/Step Time": 8.442941350862384} +{"Pretrain/Learning Rate": 3.2819838615816206e-05, "Pretrain/Loss": 2.0318570137023926, "Pretrain/Loss (Raw)": 2.138890027999878, "Pretrain/Step": 7949, "Pretrain/Step Time": 8.441692374646664} +{"Pretrain/Learning Rate": 3.281580635467629e-05, "Pretrain/Loss": 2.032700777053833, "Pretrain/Loss (Raw)": 2.103809118270874, "Pretrain/Step": 7950, "Pretrain/Step Time": 8.448456786572933} +{"Pretrain/Learning Rate": 3.281177386817311e-05, "Pretrain/Loss": 2.031113624572754, "Pretrain/Loss (Raw)": 1.8421300649642944, "Pretrain/Step": 7951, "Pretrain/Step Time": 8.447999436408281} +{"Pretrain/Learning Rate": 3.280774115642294e-05, "Pretrain/Loss": 2.033419132232666, "Pretrain/Loss (Raw)": 2.035705089569092, "Pretrain/Step": 7952, "Pretrain/Step Time": 8.45280785113573} +{"Pretrain/Learning Rate": 3.2803708219542064e-05, "Pretrain/Loss": 2.032273292541504, "Pretrain/Loss (Raw)": 1.9023476839065552, "Pretrain/Step": 7953, "Pretrain/Step Time": 8.454755866900086} +{"Pretrain/Learning Rate": 3.2799675057646754e-05, "Pretrain/Loss": 2.0307817459106445, "Pretrain/Loss (Raw)": 2.179689645767212, "Pretrain/Step": 7954, "Pretrain/Step Time": 8.453817339614034} +{"Pretrain/Learning Rate": 3.2795641670853307e-05, "Pretrain/Loss": 2.02956485748291, "Pretrain/Loss (Raw)": 2.0198447704315186, "Pretrain/Step": 7955, "Pretrain/Step Time": 8.454826902598143} +{"Pretrain/Learning Rate": 3.279160805927804e-05, "Pretrain/Loss": 2.027998447418213, "Pretrain/Loss (Raw)": 1.9477475881576538, "Pretrain/Step": 7956, "Pretrain/Step Time": 8.456821613013744} +{"Pretrain/Learning Rate": 3.278757422303723e-05, "Pretrain/Loss": 2.0283312797546387, "Pretrain/Loss (Raw)": 2.0578672885894775, "Pretrain/Step": 7957, "Pretrain/Step Time": 8.456085350364447} +{"Pretrain/Learning Rate": 3.278354016224722e-05, "Pretrain/Loss": 2.027461051940918, "Pretrain/Loss (Raw)": 1.9898961782455444, "Pretrain/Step": 7958, "Pretrain/Step Time": 8.455253222957253} +{"Pretrain/Learning Rate": 3.277950587702432e-05, "Pretrain/Loss": 2.025120258331299, "Pretrain/Loss (Raw)": 1.826828122138977, "Pretrain/Step": 7959, "Pretrain/Step Time": 8.46265865676105} +{"Pretrain/Learning Rate": 3.2775471367484836e-05, "Pretrain/Loss": 2.0249147415161133, "Pretrain/Loss (Raw)": 1.8915941715240479, "Pretrain/Step": 7960, "Pretrain/Step Time": 8.462075367569923} +{"Pretrain/Learning Rate": 3.2771436633745126e-05, "Pretrain/Loss": 2.0222342014312744, "Pretrain/Loss (Raw)": 1.7036070823669434, "Pretrain/Step": 7961, "Pretrain/Step Time": 8.465039350092411} +{"Pretrain/Learning Rate": 3.276740167592152e-05, "Pretrain/Loss": 2.0227909088134766, "Pretrain/Loss (Raw)": 2.2479889392852783, "Pretrain/Step": 7962, "Pretrain/Step Time": 8.461449293419719} +{"Pretrain/Learning Rate": 3.276336649413037e-05, "Pretrain/Loss": 2.020267963409424, "Pretrain/Loss (Raw)": 1.6957149505615234, "Pretrain/Step": 7963, "Pretrain/Step Time": 8.461506146937609} +{"Pretrain/Learning Rate": 3.275933108848801e-05, "Pretrain/Loss": 2.023390531539917, "Pretrain/Loss (Raw)": 2.0151216983795166, "Pretrain/Step": 7964, "Pretrain/Step Time": 8.45590160600841} +{"Pretrain/Learning Rate": 3.2755295459110805e-05, "Pretrain/Loss": 2.0253796577453613, "Pretrain/Loss (Raw)": 2.0787813663482666, "Pretrain/Step": 7965, "Pretrain/Step Time": 8.454551875591278} +{"Pretrain/Learning Rate": 3.2751259606115134e-05, "Pretrain/Loss": 2.023406982421875, "Pretrain/Loss (Raw)": 1.8685202598571777, "Pretrain/Step": 7966, "Pretrain/Step Time": 8.456035489216447} +{"Pretrain/Learning Rate": 3.2747223529617345e-05, "Pretrain/Loss": 2.0231881141662598, "Pretrain/Loss (Raw)": 2.0257115364074707, "Pretrain/Step": 7967, "Pretrain/Step Time": 8.456458812579513} +{"Pretrain/Learning Rate": 3.274318722973384e-05, "Pretrain/Loss": 2.0202584266662598, "Pretrain/Loss (Raw)": 1.8328261375427246, "Pretrain/Step": 7968, "Pretrain/Step Time": 8.457116050645709} +{"Pretrain/Learning Rate": 3.2739150706580976e-05, "Pretrain/Loss": 2.0198748111724854, "Pretrain/Loss (Raw)": 2.1218740940093994, "Pretrain/Step": 7969, "Pretrain/Step Time": 8.453031657263637} +{"Pretrain/Learning Rate": 3.273511396027517e-05, "Pretrain/Loss": 2.0199294090270996, "Pretrain/Loss (Raw)": 2.083824396133423, "Pretrain/Step": 7970, "Pretrain/Step Time": 8.454570228233933} +{"Pretrain/Learning Rate": 3.273107699093279e-05, "Pretrain/Loss": 2.0166075229644775, "Pretrain/Loss (Raw)": 1.8412877321243286, "Pretrain/Step": 7971, "Pretrain/Step Time": 8.45629027672112} +{"Pretrain/Learning Rate": 3.2727039798670266e-05, "Pretrain/Loss": 2.0155954360961914, "Pretrain/Loss (Raw)": 1.9046307802200317, "Pretrain/Step": 7972, "Pretrain/Step Time": 8.458362063392997} +{"Pretrain/Learning Rate": 3.2723002383603994e-05, "Pretrain/Loss": 2.017987012863159, "Pretrain/Loss (Raw)": 2.163186550140381, "Pretrain/Step": 7973, "Pretrain/Step Time": 8.456621391698718} +{"Pretrain/Learning Rate": 3.2718964745850394e-05, "Pretrain/Loss": 2.01686954498291, "Pretrain/Loss (Raw)": 2.067422389984131, "Pretrain/Step": 7974, "Pretrain/Step Time": 8.45727352052927} +{"Pretrain/Learning Rate": 3.271492688552589e-05, "Pretrain/Loss": 2.0203747749328613, "Pretrain/Loss (Raw)": 2.3155581951141357, "Pretrain/Step": 7975, "Pretrain/Step Time": 8.457936381921172} +{"Pretrain/Learning Rate": 3.27108888027469e-05, "Pretrain/Loss": 2.0212345123291016, "Pretrain/Loss (Raw)": 2.0998058319091797, "Pretrain/Step": 7976, "Pretrain/Step Time": 8.45964802801609} +{"Pretrain/Learning Rate": 3.270685049762987e-05, "Pretrain/Loss": 2.020951271057129, "Pretrain/Loss (Raw)": 2.072533369064331, "Pretrain/Step": 7977, "Pretrain/Step Time": 8.462777134031057} +{"Pretrain/Learning Rate": 3.2702811970291235e-05, "Pretrain/Loss": 2.0181124210357666, "Pretrain/Loss (Raw)": 1.9353399276733398, "Pretrain/Step": 7978, "Pretrain/Step Time": 8.462903693318367} +{"Pretrain/Learning Rate": 3.269877322084746e-05, "Pretrain/Loss": 2.0199265480041504, "Pretrain/Loss (Raw)": 2.062407970428467, "Pretrain/Step": 7979, "Pretrain/Step Time": 8.45592762157321} +{"Pretrain/Learning Rate": 3.2694734249414974e-05, "Pretrain/Loss": 2.0181074142456055, "Pretrain/Loss (Raw)": 1.731703519821167, "Pretrain/Step": 7980, "Pretrain/Step Time": 8.459689561277628} +{"Pretrain/Learning Rate": 3.269069505611026e-05, "Pretrain/Loss": 2.0187506675720215, "Pretrain/Loss (Raw)": 2.1188929080963135, "Pretrain/Step": 7981, "Pretrain/Step Time": 8.464153921231627} +{"Pretrain/Learning Rate": 3.268665564104977e-05, "Pretrain/Loss": 2.0182623863220215, "Pretrain/Loss (Raw)": 1.936798095703125, "Pretrain/Step": 7982, "Pretrain/Step Time": 8.463378259912133} +{"Pretrain/Learning Rate": 3.268261600434998e-05, "Pretrain/Loss": 2.015559434890747, "Pretrain/Loss (Raw)": 1.9883646965026855, "Pretrain/Step": 7983, "Pretrain/Step Time": 8.460478998720646} +{"Pretrain/Learning Rate": 3.267857614612738e-05, "Pretrain/Loss": 2.0142455101013184, "Pretrain/Loss (Raw)": 2.2118709087371826, "Pretrain/Step": 7984, "Pretrain/Step Time": 8.459181992337108} +{"Pretrain/Learning Rate": 3.267453606649845e-05, "Pretrain/Loss": 2.0154976844787598, "Pretrain/Loss (Raw)": 2.2413923740386963, "Pretrain/Step": 7985, "Pretrain/Step Time": 8.457949940115213} +{"Pretrain/Learning Rate": 3.2670495765579675e-05, "Pretrain/Loss": 2.0125479698181152, "Pretrain/Loss (Raw)": 1.7461702823638916, "Pretrain/Step": 7986, "Pretrain/Step Time": 8.462320160120726} +{"Pretrain/Learning Rate": 3.266645524348757e-05, "Pretrain/Loss": 2.0120420455932617, "Pretrain/Loss (Raw)": 1.9915697574615479, "Pretrain/Step": 7987, "Pretrain/Step Time": 8.459719343110919} +{"Pretrain/Learning Rate": 3.266241450033863e-05, "Pretrain/Loss": 2.0155253410339355, "Pretrain/Loss (Raw)": 2.5053913593292236, "Pretrain/Step": 7988, "Pretrain/Step Time": 8.461698185652494} +{"Pretrain/Learning Rate": 3.265837353624937e-05, "Pretrain/Loss": 2.0166962146759033, "Pretrain/Loss (Raw)": 2.2663745880126953, "Pretrain/Step": 7989, "Pretrain/Step Time": 8.45902363397181} +{"Pretrain/Learning Rate": 3.26543323513363e-05, "Pretrain/Loss": 2.016052722930908, "Pretrain/Loss (Raw)": 2.0615761280059814, "Pretrain/Step": 7990, "Pretrain/Step Time": 8.462259963154793} +{"Pretrain/Learning Rate": 3.2650290945715966e-05, "Pretrain/Loss": 2.0152482986450195, "Pretrain/Loss (Raw)": 1.9642070531845093, "Pretrain/Step": 7991, "Pretrain/Step Time": 8.466031258925796} +{"Pretrain/Learning Rate": 3.264624931950487e-05, "Pretrain/Loss": 2.0175633430480957, "Pretrain/Loss (Raw)": 2.338240385055542, "Pretrain/Step": 7992, "Pretrain/Step Time": 8.462977202609181} +{"Pretrain/Learning Rate": 3.264220747281958e-05, "Pretrain/Loss": 2.016632318496704, "Pretrain/Loss (Raw)": 1.87662672996521, "Pretrain/Step": 7993, "Pretrain/Step Time": 8.465979855507612} +{"Pretrain/Learning Rate": 3.263816540577662e-05, "Pretrain/Loss": 2.0147693157196045, "Pretrain/Loss (Raw)": 1.9312639236450195, "Pretrain/Step": 7994, "Pretrain/Step Time": 8.465742399916053} +{"Pretrain/Learning Rate": 3.263412311849255e-05, "Pretrain/Loss": 2.0158095359802246, "Pretrain/Loss (Raw)": 2.0138659477233887, "Pretrain/Step": 7995, "Pretrain/Step Time": 8.46623732149601} +{"Pretrain/Learning Rate": 3.2630080611083913e-05, "Pretrain/Loss": 2.0166847705841064, "Pretrain/Loss (Raw)": 2.143216133117676, "Pretrain/Step": 7996, "Pretrain/Step Time": 8.463388420641422} +{"Pretrain/Learning Rate": 3.262603788366728e-05, "Pretrain/Loss": 2.01668119430542, "Pretrain/Loss (Raw)": 2.0363070964813232, "Pretrain/Step": 7997, "Pretrain/Step Time": 8.470554230734706} +{"Pretrain/Learning Rate": 3.262199493635923e-05, "Pretrain/Loss": 2.0152223110198975, "Pretrain/Loss (Raw)": 1.9122501611709595, "Pretrain/Step": 7998, "Pretrain/Step Time": 8.470717331394553} +{"Pretrain/Learning Rate": 3.261795176927632e-05, "Pretrain/Loss": 2.0149693489074707, "Pretrain/Loss (Raw)": 2.0759735107421875, "Pretrain/Step": 7999, "Pretrain/Step Time": 8.46855110861361} +{"Pretrain/Learning Rate": 3.261390838253515e-05, "Pretrain/Loss": 2.014965534210205, "Pretrain/Loss (Raw)": 1.9358408451080322, "Pretrain/Step": 8000, "Pretrain/Step Time": 8.466922981664538} +{"Pretrain/Learning Rate": 3.260986477625229e-05, "Pretrain/Loss": 2.0119810104370117, "Pretrain/Loss (Raw)": 1.6784242391586304, "Pretrain/Step": 8001, "Pretrain/Step Time": 8.470750946551561} +{"Pretrain/Learning Rate": 3.2605820950544344e-05, "Pretrain/Loss": 2.009922504425049, "Pretrain/Loss (Raw)": 2.023773431777954, "Pretrain/Step": 8002, "Pretrain/Step Time": 8.472276791930199} +{"Pretrain/Learning Rate": 3.2601776905527916e-05, "Pretrain/Loss": 2.010838031768799, "Pretrain/Loss (Raw)": 2.075828790664673, "Pretrain/Step": 8003, "Pretrain/Step Time": 8.471954630687833} +{"Pretrain/Learning Rate": 3.2597732641319614e-05, "Pretrain/Loss": 2.0112991333007812, "Pretrain/Loss (Raw)": 2.029670238494873, "Pretrain/Step": 8004, "Pretrain/Step Time": 8.472890507429838} +{"Pretrain/Learning Rate": 3.259368815803604e-05, "Pretrain/Loss": 2.01176118850708, "Pretrain/Loss (Raw)": 2.0899596214294434, "Pretrain/Step": 8005, "Pretrain/Step Time": 8.475101122632623} +{"Pretrain/Learning Rate": 3.258964345579383e-05, "Pretrain/Loss": 2.012490749359131, "Pretrain/Loss (Raw)": 2.2394208908081055, "Pretrain/Step": 8006, "Pretrain/Step Time": 8.475863091647625} +{"Pretrain/Learning Rate": 3.2585598534709595e-05, "Pretrain/Loss": 2.0098745822906494, "Pretrain/Loss (Raw)": 1.8207201957702637, "Pretrain/Step": 8007, "Pretrain/Step Time": 8.480602461844683} +{"Pretrain/Learning Rate": 3.2581553394899965e-05, "Pretrain/Loss": 2.011039972305298, "Pretrain/Loss (Raw)": 1.954002857208252, "Pretrain/Step": 8008, "Pretrain/Step Time": 8.477958787232637} +{"Pretrain/Learning Rate": 3.2577508036481593e-05, "Pretrain/Loss": 2.0137393474578857, "Pretrain/Loss (Raw)": 2.184842109680176, "Pretrain/Step": 8009, "Pretrain/Step Time": 8.476687779650092} +{"Pretrain/Learning Rate": 3.257346245957113e-05, "Pretrain/Loss": 2.014944314956665, "Pretrain/Loss (Raw)": 2.0301549434661865, "Pretrain/Step": 8010, "Pretrain/Step Time": 8.475686646997929} +{"Pretrain/Learning Rate": 3.2569416664285213e-05, "Pretrain/Loss": 2.015859365463257, "Pretrain/Loss (Raw)": 1.9062414169311523, "Pretrain/Step": 8011, "Pretrain/Step Time": 8.479375701397657} +{"Pretrain/Learning Rate": 3.256537065074049e-05, "Pretrain/Loss": 2.0130457878112793, "Pretrain/Loss (Raw)": 1.8947662115097046, "Pretrain/Step": 8012, "Pretrain/Step Time": 8.480736631900072} +{"Pretrain/Learning Rate": 3.256132441905365e-05, "Pretrain/Loss": 2.0141217708587646, "Pretrain/Loss (Raw)": 2.0036869049072266, "Pretrain/Step": 8013, "Pretrain/Step Time": 8.475025417283177} +{"Pretrain/Learning Rate": 3.2557277969341345e-05, "Pretrain/Loss": 2.01572847366333, "Pretrain/Loss (Raw)": 2.1153621673583984, "Pretrain/Step": 8014, "Pretrain/Step Time": 8.482102205976844} +{"Pretrain/Learning Rate": 3.2553231301720254e-05, "Pretrain/Loss": 2.012592315673828, "Pretrain/Loss (Raw)": 1.8141118288040161, "Pretrain/Step": 8015, "Pretrain/Step Time": 8.479998322203755} +{"Pretrain/Learning Rate": 3.254918441630707e-05, "Pretrain/Loss": 2.0137672424316406, "Pretrain/Loss (Raw)": 2.3042984008789062, "Pretrain/Step": 8016, "Pretrain/Step Time": 8.477209810167551} +{"Pretrain/Learning Rate": 3.2545137313218475e-05, "Pretrain/Loss": 2.014578342437744, "Pretrain/Loss (Raw)": 1.9488579034805298, "Pretrain/Step": 8017, "Pretrain/Step Time": 8.476952765136957} +{"Pretrain/Learning Rate": 3.254108999257116e-05, "Pretrain/Loss": 2.0122342109680176, "Pretrain/Loss (Raw)": 1.8896994590759277, "Pretrain/Step": 8018, "Pretrain/Step Time": 8.473617536947131} +{"Pretrain/Learning Rate": 3.253704245448183e-05, "Pretrain/Loss": 2.0123848915100098, "Pretrain/Loss (Raw)": 2.076528787612915, "Pretrain/Step": 8019, "Pretrain/Step Time": 8.479933770373464} +{"Pretrain/Learning Rate": 3.25329946990672e-05, "Pretrain/Loss": 2.0118942260742188, "Pretrain/Loss (Raw)": 1.9817570447921753, "Pretrain/Step": 8020, "Pretrain/Step Time": 8.480541968718171} +{"Pretrain/Learning Rate": 3.2528946726443976e-05, "Pretrain/Loss": 2.015407085418701, "Pretrain/Loss (Raw)": 2.113006353378296, "Pretrain/Step": 8021, "Pretrain/Step Time": 8.477984154596925} +{"Pretrain/Learning Rate": 3.2524898536728884e-05, "Pretrain/Loss": 2.0153403282165527, "Pretrain/Loss (Raw)": 2.0539355278015137, "Pretrain/Step": 8022, "Pretrain/Step Time": 8.486032079905272} +{"Pretrain/Learning Rate": 3.252085013003864e-05, "Pretrain/Loss": 2.014756917953491, "Pretrain/Loss (Raw)": 1.9375925064086914, "Pretrain/Step": 8023, "Pretrain/Step Time": 8.481522988528013} +{"Pretrain/Learning Rate": 3.251680150648999e-05, "Pretrain/Loss": 2.0128254890441895, "Pretrain/Loss (Raw)": 1.898764729499817, "Pretrain/Step": 8024, "Pretrain/Step Time": 8.48362328670919} +{"Pretrain/Learning Rate": 3.251275266619967e-05, "Pretrain/Loss": 2.010255813598633, "Pretrain/Loss (Raw)": 1.7860878705978394, "Pretrain/Step": 8025, "Pretrain/Step Time": 8.48459586314857} +{"Pretrain/Learning Rate": 3.250870360928441e-05, "Pretrain/Loss": 2.011003017425537, "Pretrain/Loss (Raw)": 2.060253858566284, "Pretrain/Step": 8026, "Pretrain/Step Time": 8.489095658063889} +{"Pretrain/Learning Rate": 3.2504654335860986e-05, "Pretrain/Loss": 2.0096378326416016, "Pretrain/Loss (Raw)": 1.8577485084533691, "Pretrain/Step": 8027, "Pretrain/Step Time": 8.482067953795195} +{"Pretrain/Learning Rate": 3.250060484604614e-05, "Pretrain/Loss": 2.009476900100708, "Pretrain/Loss (Raw)": 1.9666566848754883, "Pretrain/Step": 8028, "Pretrain/Step Time": 8.483992720022798} +{"Pretrain/Learning Rate": 3.249655513995664e-05, "Pretrain/Loss": 2.0102553367614746, "Pretrain/Loss (Raw)": 1.9246265888214111, "Pretrain/Step": 8029, "Pretrain/Step Time": 8.483358627185225} +{"Pretrain/Learning Rate": 3.249250521770926e-05, "Pretrain/Loss": 2.0091769695281982, "Pretrain/Loss (Raw)": 1.9814924001693726, "Pretrain/Step": 8030, "Pretrain/Step Time": 8.48160700686276} +{"Pretrain/Learning Rate": 3.248845507942078e-05, "Pretrain/Loss": 2.0044517517089844, "Pretrain/Loss (Raw)": 1.9767463207244873, "Pretrain/Step": 8031, "Pretrain/Step Time": 8.481969434767962} +{"Pretrain/Learning Rate": 3.2484404725207974e-05, "Pretrain/Loss": 2.00382399559021, "Pretrain/Loss (Raw)": 1.8977965116500854, "Pretrain/Step": 8032, "Pretrain/Step Time": 8.487634291872382} +{"Pretrain/Learning Rate": 3.2480354155187626e-05, "Pretrain/Loss": 2.002713918685913, "Pretrain/Loss (Raw)": 1.8738927841186523, "Pretrain/Step": 8033, "Pretrain/Step Time": 8.489147242158651} +{"Pretrain/Learning Rate": 3.247630336947654e-05, "Pretrain/Loss": 2.0020532608032227, "Pretrain/Loss (Raw)": 2.0411033630371094, "Pretrain/Step": 8034, "Pretrain/Step Time": 8.48595073260367} +{"Pretrain/Learning Rate": 3.247225236819153e-05, "Pretrain/Loss": 2.001218795776367, "Pretrain/Loss (Raw)": 1.9744853973388672, "Pretrain/Step": 8035, "Pretrain/Step Time": 8.485182909294963} +{"Pretrain/Learning Rate": 3.246820115144938e-05, "Pretrain/Loss": 2.0026540756225586, "Pretrain/Loss (Raw)": 2.128331422805786, "Pretrain/Step": 8036, "Pretrain/Step Time": 8.48638528957963} +{"Pretrain/Learning Rate": 3.246414971936692e-05, "Pretrain/Loss": 2.0033035278320312, "Pretrain/Loss (Raw)": 2.1289074420928955, "Pretrain/Step": 8037, "Pretrain/Step Time": 8.48276992700994} +{"Pretrain/Learning Rate": 3.2460098072060954e-05, "Pretrain/Loss": 2.002683639526367, "Pretrain/Loss (Raw)": 1.9196947813034058, "Pretrain/Step": 8038, "Pretrain/Step Time": 8.485417054966092} +{"Pretrain/Learning Rate": 3.245604620964833e-05, "Pretrain/Loss": 2.001573085784912, "Pretrain/Loss (Raw)": 1.964887022972107, "Pretrain/Step": 8039, "Pretrain/Step Time": 8.4859832059592} +{"Pretrain/Learning Rate": 3.245199413224586e-05, "Pretrain/Loss": 1.998290777206421, "Pretrain/Loss (Raw)": 1.7672213315963745, "Pretrain/Step": 8040, "Pretrain/Step Time": 8.487446710467339} +{"Pretrain/Learning Rate": 3.24479418399704e-05, "Pretrain/Loss": 1.996457576751709, "Pretrain/Loss (Raw)": 1.7361152172088623, "Pretrain/Step": 8041, "Pretrain/Step Time": 8.491923449561} +{"Pretrain/Learning Rate": 3.244388933293878e-05, "Pretrain/Loss": 1.994512677192688, "Pretrain/Loss (Raw)": 1.824919581413269, "Pretrain/Step": 8042, "Pretrain/Step Time": 8.487191338092089} +{"Pretrain/Learning Rate": 3.243983661126787e-05, "Pretrain/Loss": 1.9921901226043701, "Pretrain/Loss (Raw)": 2.2418053150177, "Pretrain/Step": 8043, "Pretrain/Step Time": 8.48797838203609} +{"Pretrain/Learning Rate": 3.243578367507451e-05, "Pretrain/Loss": 1.992584466934204, "Pretrain/Loss (Raw)": 2.0678889751434326, "Pretrain/Step": 8044, "Pretrain/Step Time": 8.48798931017518} +{"Pretrain/Learning Rate": 3.243173052447557e-05, "Pretrain/Loss": 1.9915552139282227, "Pretrain/Loss (Raw)": 1.875776767730713, "Pretrain/Step": 8045, "Pretrain/Step Time": 8.486566573381424} +{"Pretrain/Learning Rate": 3.242767715958792e-05, "Pretrain/Loss": 1.9910244941711426, "Pretrain/Loss (Raw)": 1.8230167627334595, "Pretrain/Step": 8046, "Pretrain/Step Time": 8.476669261232018} +{"Pretrain/Learning Rate": 3.2423623580528425e-05, "Pretrain/Loss": 1.9901282787322998, "Pretrain/Loss (Raw)": 1.8913389444351196, "Pretrain/Step": 8047, "Pretrain/Step Time": 8.481042694300413} +{"Pretrain/Learning Rate": 3.2419569787414e-05, "Pretrain/Loss": 1.9917432069778442, "Pretrain/Loss (Raw)": 2.2274065017700195, "Pretrain/Step": 8048, "Pretrain/Step Time": 8.48300807364285} +{"Pretrain/Learning Rate": 3.2415515780361496e-05, "Pretrain/Loss": 1.9943037033081055, "Pretrain/Loss (Raw)": 1.9776062965393066, "Pretrain/Step": 8049, "Pretrain/Step Time": 8.485509498044848} +{"Pretrain/Learning Rate": 3.241146155948782e-05, "Pretrain/Loss": 1.9932044744491577, "Pretrain/Loss (Raw)": 1.9838978052139282, "Pretrain/Step": 8050, "Pretrain/Step Time": 8.482603652402759} +{"Pretrain/Learning Rate": 3.240740712490988e-05, "Pretrain/Loss": 1.9935345649719238, "Pretrain/Loss (Raw)": 2.1045098304748535, "Pretrain/Step": 8051, "Pretrain/Step Time": 8.487680157646537} +{"Pretrain/Learning Rate": 3.240335247674457e-05, "Pretrain/Loss": 1.9920995235443115, "Pretrain/Loss (Raw)": 1.9578322172164917, "Pretrain/Step": 8052, "Pretrain/Step Time": 8.483151426538825} +{"Pretrain/Learning Rate": 3.239929761510882e-05, "Pretrain/Loss": 1.9901026487350464, "Pretrain/Loss (Raw)": 1.7849509716033936, "Pretrain/Step": 8053, "Pretrain/Step Time": 8.48436850309372} +{"Pretrain/Learning Rate": 3.239524254011954e-05, "Pretrain/Loss": 1.9901262521743774, "Pretrain/Loss (Raw)": 2.0759501457214355, "Pretrain/Step": 8054, "Pretrain/Step Time": 8.487283799797297} +{"Pretrain/Learning Rate": 3.2391187251893646e-05, "Pretrain/Loss": 1.9912352561950684, "Pretrain/Loss (Raw)": 2.209665536880493, "Pretrain/Step": 8055, "Pretrain/Step Time": 8.482831861823797} +{"Pretrain/Learning Rate": 3.238713175054808e-05, "Pretrain/Loss": 1.993760108947754, "Pretrain/Loss (Raw)": 2.2184135913848877, "Pretrain/Step": 8056, "Pretrain/Step Time": 8.48522819019854} +{"Pretrain/Learning Rate": 3.2383076036199775e-05, "Pretrain/Loss": 1.9933054447174072, "Pretrain/Loss (Raw)": 1.9988468885421753, "Pretrain/Step": 8057, "Pretrain/Step Time": 8.489194139838219} +{"Pretrain/Learning Rate": 3.2379020108965684e-05, "Pretrain/Loss": 1.9930167198181152, "Pretrain/Loss (Raw)": 2.027749538421631, "Pretrain/Step": 8058, "Pretrain/Step Time": 8.491257084533572} +{"Pretrain/Learning Rate": 3.237496396896275e-05, "Pretrain/Loss": 1.9951469898223877, "Pretrain/Loss (Raw)": 2.183566093444824, "Pretrain/Step": 8059, "Pretrain/Step Time": 8.487833807244897} +{"Pretrain/Learning Rate": 3.2370907616307926e-05, "Pretrain/Loss": 1.9972560405731201, "Pretrain/Loss (Raw)": 2.201765537261963, "Pretrain/Step": 8060, "Pretrain/Step Time": 8.491645837202668} +{"Pretrain/Learning Rate": 3.236685105111818e-05, "Pretrain/Loss": 1.9998064041137695, "Pretrain/Loss (Raw)": 2.2044920921325684, "Pretrain/Step": 8061, "Pretrain/Step Time": 8.488501962274313} +{"Pretrain/Learning Rate": 3.2362794273510474e-05, "Pretrain/Loss": 1.9982867240905762, "Pretrain/Loss (Raw)": 1.856046199798584, "Pretrain/Step": 8062, "Pretrain/Step Time": 8.482870941981673} +{"Pretrain/Learning Rate": 3.235873728360179e-05, "Pretrain/Loss": 2.0005288124084473, "Pretrain/Loss (Raw)": 2.201298475265503, "Pretrain/Step": 8063, "Pretrain/Step Time": 8.484786977991462} +{"Pretrain/Learning Rate": 3.2354680081509095e-05, "Pretrain/Loss": 2.001755714416504, "Pretrain/Loss (Raw)": 1.9812475442886353, "Pretrain/Step": 8064, "Pretrain/Step Time": 8.487782765179873} +{"Pretrain/Learning Rate": 3.23506226673494e-05, "Pretrain/Loss": 2.0020508766174316, "Pretrain/Loss (Raw)": 2.028369903564453, "Pretrain/Step": 8065, "Pretrain/Step Time": 8.488404707983136} +{"Pretrain/Learning Rate": 3.234656504123966e-05, "Pretrain/Loss": 2.0016846656799316, "Pretrain/Loss (Raw)": 1.8788117170333862, "Pretrain/Step": 8066, "Pretrain/Step Time": 8.487794324755669} +{"Pretrain/Learning Rate": 3.234250720329691e-05, "Pretrain/Loss": 2.000931978225708, "Pretrain/Loss (Raw)": 2.009089469909668, "Pretrain/Step": 8067, "Pretrain/Step Time": 8.485594341531396} +{"Pretrain/Learning Rate": 3.2338449153638145e-05, "Pretrain/Loss": 2.0007877349853516, "Pretrain/Loss (Raw)": 2.058215618133545, "Pretrain/Step": 8068, "Pretrain/Step Time": 8.485345741733909} +{"Pretrain/Learning Rate": 3.233439089238036e-05, "Pretrain/Loss": 2.001932382583618, "Pretrain/Loss (Raw)": 1.9826173782348633, "Pretrain/Step": 8069, "Pretrain/Step Time": 8.49059641547501} +{"Pretrain/Learning Rate": 3.23303324196406e-05, "Pretrain/Loss": 2.0021095275878906, "Pretrain/Loss (Raw)": 1.947656512260437, "Pretrain/Step": 8070, "Pretrain/Step Time": 8.488005874678493} +{"Pretrain/Learning Rate": 3.2326273735535854e-05, "Pretrain/Loss": 2.0030455589294434, "Pretrain/Loss (Raw)": 2.059788227081299, "Pretrain/Step": 8071, "Pretrain/Step Time": 8.487344540655613} +{"Pretrain/Learning Rate": 3.232221484018318e-05, "Pretrain/Loss": 2.005448341369629, "Pretrain/Loss (Raw)": 1.933109164237976, "Pretrain/Step": 8072, "Pretrain/Step Time": 8.486846722662449} +{"Pretrain/Learning Rate": 3.23181557336996e-05, "Pretrain/Loss": 2.0048367977142334, "Pretrain/Loss (Raw)": 1.9574424028396606, "Pretrain/Step": 8073, "Pretrain/Step Time": 8.481157658621669} +{"Pretrain/Learning Rate": 3.231409641620216e-05, "Pretrain/Loss": 2.005279541015625, "Pretrain/Loss (Raw)": 2.138984441757202, "Pretrain/Step": 8074, "Pretrain/Step Time": 8.483951287344098} +{"Pretrain/Learning Rate": 3.2310036887807906e-05, "Pretrain/Loss": 2.006662368774414, "Pretrain/Loss (Raw)": 1.9666863679885864, "Pretrain/Step": 8075, "Pretrain/Step Time": 8.484031714498997} +{"Pretrain/Learning Rate": 3.230597714863389e-05, "Pretrain/Loss": 2.008289098739624, "Pretrain/Loss (Raw)": 2.028398036956787, "Pretrain/Step": 8076, "Pretrain/Step Time": 8.48606133274734} +{"Pretrain/Learning Rate": 3.230191719879717e-05, "Pretrain/Loss": 2.0114433765411377, "Pretrain/Loss (Raw)": 2.5426223278045654, "Pretrain/Step": 8077, "Pretrain/Step Time": 8.48938051238656} +{"Pretrain/Learning Rate": 3.2297857038414825e-05, "Pretrain/Loss": 2.010514497756958, "Pretrain/Loss (Raw)": 1.984938621520996, "Pretrain/Step": 8078, "Pretrain/Step Time": 8.480429276823997} +{"Pretrain/Learning Rate": 3.2293796667603906e-05, "Pretrain/Loss": 2.0125107765197754, "Pretrain/Loss (Raw)": 2.097611427307129, "Pretrain/Step": 8079, "Pretrain/Step Time": 8.477503459900618} +{"Pretrain/Learning Rate": 3.228973608648152e-05, "Pretrain/Loss": 2.012610912322998, "Pretrain/Loss (Raw)": 2.0485541820526123, "Pretrain/Step": 8080, "Pretrain/Step Time": 8.478221183642745} +{"Pretrain/Learning Rate": 3.228567529516471e-05, "Pretrain/Loss": 2.0148606300354004, "Pretrain/Loss (Raw)": 2.1902878284454346, "Pretrain/Step": 8081, "Pretrain/Step Time": 8.477368434891105} +{"Pretrain/Learning Rate": 3.22816142937706e-05, "Pretrain/Loss": 2.014101028442383, "Pretrain/Loss (Raw)": 2.0824813842773438, "Pretrain/Step": 8082, "Pretrain/Step Time": 8.474012680351734} +{"Pretrain/Learning Rate": 3.2277553082416274e-05, "Pretrain/Loss": 2.012035846710205, "Pretrain/Loss (Raw)": 1.75550377368927, "Pretrain/Step": 8083, "Pretrain/Step Time": 8.47522602416575} +{"Pretrain/Learning Rate": 3.227349166121883e-05, "Pretrain/Loss": 2.0130157470703125, "Pretrain/Loss (Raw)": 2.073197603225708, "Pretrain/Step": 8084, "Pretrain/Step Time": 8.47656849771738} +{"Pretrain/Learning Rate": 3.2269430030295396e-05, "Pretrain/Loss": 2.0119404792785645, "Pretrain/Loss (Raw)": 1.9201980829238892, "Pretrain/Step": 8085, "Pretrain/Step Time": 8.478005917742848} +{"Pretrain/Learning Rate": 3.2265368189763065e-05, "Pretrain/Loss": 2.013284683227539, "Pretrain/Loss (Raw)": 2.161961078643799, "Pretrain/Step": 8086, "Pretrain/Step Time": 8.477906556800008} +{"Pretrain/Learning Rate": 3.2261306139738954e-05, "Pretrain/Loss": 2.0153443813323975, "Pretrain/Loss (Raw)": 2.0904595851898193, "Pretrain/Step": 8087, "Pretrain/Step Time": 8.472905587404966} +{"Pretrain/Learning Rate": 3.2257243880340205e-05, "Pretrain/Loss": 2.016157627105713, "Pretrain/Loss (Raw)": 1.9957149028778076, "Pretrain/Step": 8088, "Pretrain/Step Time": 8.469576170668006} +{"Pretrain/Learning Rate": 3.2253181411683945e-05, "Pretrain/Loss": 2.017348289489746, "Pretrain/Loss (Raw)": 1.8559842109680176, "Pretrain/Step": 8089, "Pretrain/Step Time": 8.466149721294641} +{"Pretrain/Learning Rate": 3.2249118733887315e-05, "Pretrain/Loss": 2.0152993202209473, "Pretrain/Loss (Raw)": 1.985718846321106, "Pretrain/Step": 8090, "Pretrain/Step Time": 8.474706426262856} +{"Pretrain/Learning Rate": 3.224505584706746e-05, "Pretrain/Loss": 2.0178258419036865, "Pretrain/Loss (Raw)": 2.019129514694214, "Pretrain/Step": 8091, "Pretrain/Step Time": 8.47462958842516} +{"Pretrain/Learning Rate": 3.224099275134152e-05, "Pretrain/Loss": 2.0175390243530273, "Pretrain/Loss (Raw)": 1.9784101247787476, "Pretrain/Step": 8092, "Pretrain/Step Time": 8.475755535066128} +{"Pretrain/Learning Rate": 3.223692944682666e-05, "Pretrain/Loss": 2.0161280632019043, "Pretrain/Loss (Raw)": 1.8981598615646362, "Pretrain/Step": 8093, "Pretrain/Step Time": 8.47930633276701} +{"Pretrain/Learning Rate": 3.223286593364004e-05, "Pretrain/Loss": 2.0161798000335693, "Pretrain/Loss (Raw)": 1.8751652240753174, "Pretrain/Step": 8094, "Pretrain/Step Time": 8.476575415581465} +{"Pretrain/Learning Rate": 3.2228802211898835e-05, "Pretrain/Loss": 2.0160913467407227, "Pretrain/Loss (Raw)": 2.0144102573394775, "Pretrain/Step": 8095, "Pretrain/Step Time": 8.478268368169665} +{"Pretrain/Learning Rate": 3.222473828172021e-05, "Pretrain/Loss": 2.017411231994629, "Pretrain/Loss (Raw)": 2.00173020362854, "Pretrain/Step": 8096, "Pretrain/Step Time": 8.482785968109965} +{"Pretrain/Learning Rate": 3.222067414322135e-05, "Pretrain/Loss": 2.018263101577759, "Pretrain/Loss (Raw)": 2.2309374809265137, "Pretrain/Step": 8097, "Pretrain/Step Time": 8.483229983597994} +{"Pretrain/Learning Rate": 3.2216609796519437e-05, "Pretrain/Loss": 2.0187790393829346, "Pretrain/Loss (Raw)": 2.1498517990112305, "Pretrain/Step": 8098, "Pretrain/Step Time": 8.479789273813367} +{"Pretrain/Learning Rate": 3.221254524173167e-05, "Pretrain/Loss": 2.019350051879883, "Pretrain/Loss (Raw)": 1.9144046306610107, "Pretrain/Step": 8099, "Pretrain/Step Time": 8.483449744060636} +{"Pretrain/Learning Rate": 3.220848047897526e-05, "Pretrain/Loss": 2.02126407623291, "Pretrain/Loss (Raw)": 2.149592399597168, "Pretrain/Step": 8100, "Pretrain/Step Time": 8.48562465980649} +{"Pretrain/Learning Rate": 3.220441550836738e-05, "Pretrain/Loss": 2.0210819244384766, "Pretrain/Loss (Raw)": 2.139885425567627, "Pretrain/Step": 8101, "Pretrain/Step Time": 8.481386544182897} +{"Pretrain/Learning Rate": 3.220035033002527e-05, "Pretrain/Loss": 2.0208349227905273, "Pretrain/Loss (Raw)": 2.035813093185425, "Pretrain/Step": 8102, "Pretrain/Step Time": 8.482712220400572} +{"Pretrain/Learning Rate": 3.219628494406612e-05, "Pretrain/Loss": 2.018897533416748, "Pretrain/Loss (Raw)": 2.067553758621216, "Pretrain/Step": 8103, "Pretrain/Step Time": 8.481926349923015} +{"Pretrain/Learning Rate": 3.219221935060717e-05, "Pretrain/Loss": 2.0178184509277344, "Pretrain/Loss (Raw)": 1.9617012739181519, "Pretrain/Step": 8104, "Pretrain/Step Time": 8.478904956951737} +{"Pretrain/Learning Rate": 3.218815354976565e-05, "Pretrain/Loss": 2.01735782623291, "Pretrain/Loss (Raw)": 2.0135467052459717, "Pretrain/Step": 8105, "Pretrain/Step Time": 8.479460438713431} +{"Pretrain/Learning Rate": 3.218408754165879e-05, "Pretrain/Loss": 2.019351005554199, "Pretrain/Loss (Raw)": 2.190457344055176, "Pretrain/Step": 8106, "Pretrain/Step Time": 8.476864792406559} +{"Pretrain/Learning Rate": 3.218002132640383e-05, "Pretrain/Loss": 2.0165445804595947, "Pretrain/Loss (Raw)": 1.7031993865966797, "Pretrain/Step": 8107, "Pretrain/Step Time": 8.48063306324184} +{"Pretrain/Learning Rate": 3.2175954904118014e-05, "Pretrain/Loss": 2.0187883377075195, "Pretrain/Loss (Raw)": 2.018904685974121, "Pretrain/Step": 8108, "Pretrain/Step Time": 8.479714212939143} +{"Pretrain/Learning Rate": 3.2171888274918594e-05, "Pretrain/Loss": 2.017209529876709, "Pretrain/Loss (Raw)": 1.9167925119400024, "Pretrain/Step": 8109, "Pretrain/Step Time": 8.47484197281301} +{"Pretrain/Learning Rate": 3.2167821438922835e-05, "Pretrain/Loss": 2.016874074935913, "Pretrain/Loss (Raw)": 1.8938761949539185, "Pretrain/Step": 8110, "Pretrain/Step Time": 8.47356167808175} +{"Pretrain/Learning Rate": 3.2163754396248e-05, "Pretrain/Loss": 2.0171096324920654, "Pretrain/Loss (Raw)": 2.018547773361206, "Pretrain/Step": 8111, "Pretrain/Step Time": 8.475856613367796} +{"Pretrain/Learning Rate": 3.215968714701136e-05, "Pretrain/Loss": 2.0152177810668945, "Pretrain/Loss (Raw)": 1.9696624279022217, "Pretrain/Step": 8112, "Pretrain/Step Time": 8.48254226706922} +{"Pretrain/Learning Rate": 3.215561969133018e-05, "Pretrain/Loss": 2.0152015686035156, "Pretrain/Loss (Raw)": 2.239363431930542, "Pretrain/Step": 8113, "Pretrain/Step Time": 8.47922688163817} +{"Pretrain/Learning Rate": 3.2151552029321754e-05, "Pretrain/Loss": 2.015773296356201, "Pretrain/Loss (Raw)": 1.8193447589874268, "Pretrain/Step": 8114, "Pretrain/Step Time": 8.478958673775196} +{"Pretrain/Learning Rate": 3.214748416110337e-05, "Pretrain/Loss": 2.016606569290161, "Pretrain/Loss (Raw)": 2.0982229709625244, "Pretrain/Step": 8115, "Pretrain/Step Time": 8.481139335781336} +{"Pretrain/Learning Rate": 3.2143416086792313e-05, "Pretrain/Loss": 2.0126984119415283, "Pretrain/Loss (Raw)": 2.005129337310791, "Pretrain/Step": 8116, "Pretrain/Step Time": 8.484083903953433} +{"Pretrain/Learning Rate": 3.213934780650589e-05, "Pretrain/Loss": 2.0123493671417236, "Pretrain/Loss (Raw)": 2.2217020988464355, "Pretrain/Step": 8117, "Pretrain/Step Time": 8.485409440472722} +{"Pretrain/Learning Rate": 3.213527932036141e-05, "Pretrain/Loss": 2.012115240097046, "Pretrain/Loss (Raw)": 2.031606674194336, "Pretrain/Step": 8118, "Pretrain/Step Time": 8.483461184427142} +{"Pretrain/Learning Rate": 3.213121062847618e-05, "Pretrain/Loss": 2.0116238594055176, "Pretrain/Loss (Raw)": 1.9013011455535889, "Pretrain/Step": 8119, "Pretrain/Step Time": 8.480797611176968} +{"Pretrain/Learning Rate": 3.2127141730967524e-05, "Pretrain/Loss": 2.007925033569336, "Pretrain/Loss (Raw)": 1.8648197650909424, "Pretrain/Step": 8120, "Pretrain/Step Time": 8.484203238040209} +{"Pretrain/Learning Rate": 3.212307262795275e-05, "Pretrain/Loss": 2.0102343559265137, "Pretrain/Loss (Raw)": 2.172212839126587, "Pretrain/Step": 8121, "Pretrain/Step Time": 8.483400600031018} +{"Pretrain/Learning Rate": 3.211900331954921e-05, "Pretrain/Loss": 2.010500907897949, "Pretrain/Loss (Raw)": 1.9653857946395874, "Pretrain/Step": 8122, "Pretrain/Step Time": 8.482097713276744} +{"Pretrain/Learning Rate": 3.211493380587422e-05, "Pretrain/Loss": 2.0109822750091553, "Pretrain/Loss (Raw)": 2.0754690170288086, "Pretrain/Step": 8123, "Pretrain/Step Time": 8.479729885235429} +{"Pretrain/Learning Rate": 3.211086408704512e-05, "Pretrain/Loss": 2.0091803073883057, "Pretrain/Loss (Raw)": 1.912577748298645, "Pretrain/Step": 8124, "Pretrain/Step Time": 8.482993803918362} +{"Pretrain/Learning Rate": 3.210679416317928e-05, "Pretrain/Loss": 2.0104103088378906, "Pretrain/Loss (Raw)": 2.1937601566314697, "Pretrain/Step": 8125, "Pretrain/Step Time": 8.481477295979857} +{"Pretrain/Learning Rate": 3.2102724034394036e-05, "Pretrain/Loss": 2.0103838443756104, "Pretrain/Loss (Raw)": 1.9088214635849, "Pretrain/Step": 8126, "Pretrain/Step Time": 8.48171054199338} +{"Pretrain/Learning Rate": 3.209865370080676e-05, "Pretrain/Loss": 2.0115110874176025, "Pretrain/Loss (Raw)": 2.2202951908111572, "Pretrain/Step": 8127, "Pretrain/Step Time": 8.482904793694615} +{"Pretrain/Learning Rate": 3.20945831625348e-05, "Pretrain/Loss": 2.011092185974121, "Pretrain/Loss (Raw)": 1.8822234869003296, "Pretrain/Step": 8128, "Pretrain/Step Time": 8.487225875258446} +{"Pretrain/Learning Rate": 3.209051241969553e-05, "Pretrain/Loss": 2.0146126747131348, "Pretrain/Loss (Raw)": 2.1290502548217773, "Pretrain/Step": 8129, "Pretrain/Step Time": 8.479251394048333} +{"Pretrain/Learning Rate": 3.208644147240634e-05, "Pretrain/Loss": 2.0152673721313477, "Pretrain/Loss (Raw)": 2.1075632572174072, "Pretrain/Step": 8130, "Pretrain/Step Time": 8.480851840227842} +{"Pretrain/Learning Rate": 3.2082370320784605e-05, "Pretrain/Loss": 2.0158843994140625, "Pretrain/Loss (Raw)": 2.154806137084961, "Pretrain/Step": 8131, "Pretrain/Step Time": 8.486964512616396} +{"Pretrain/Learning Rate": 3.2078298964947715e-05, "Pretrain/Loss": 2.0147948265075684, "Pretrain/Loss (Raw)": 1.8901941776275635, "Pretrain/Step": 8132, "Pretrain/Step Time": 8.485670072957873} +{"Pretrain/Learning Rate": 3.207422740501307e-05, "Pretrain/Loss": 2.0138754844665527, "Pretrain/Loss (Raw)": 1.9722965955734253, "Pretrain/Step": 8133, "Pretrain/Step Time": 8.483498234301805} +{"Pretrain/Learning Rate": 3.2070155641098055e-05, "Pretrain/Loss": 2.0145628452301025, "Pretrain/Loss (Raw)": 2.327385187149048, "Pretrain/Step": 8134, "Pretrain/Step Time": 8.485180102288723} +{"Pretrain/Learning Rate": 3.206608367332009e-05, "Pretrain/Loss": 2.015855312347412, "Pretrain/Loss (Raw)": 1.9861750602722168, "Pretrain/Step": 8135, "Pretrain/Step Time": 8.483213419094682} +{"Pretrain/Learning Rate": 3.206201150179658e-05, "Pretrain/Loss": 2.016270160675049, "Pretrain/Loss (Raw)": 2.007075786590576, "Pretrain/Step": 8136, "Pretrain/Step Time": 8.485275618731976} +{"Pretrain/Learning Rate": 3.2057939126644955e-05, "Pretrain/Loss": 2.0160210132598877, "Pretrain/Loss (Raw)": 2.1529743671417236, "Pretrain/Step": 8137, "Pretrain/Step Time": 8.486356183886528} +{"Pretrain/Learning Rate": 3.205386654798263e-05, "Pretrain/Loss": 2.0170154571533203, "Pretrain/Loss (Raw)": 2.157447576522827, "Pretrain/Step": 8138, "Pretrain/Step Time": 8.492365635931492} +{"Pretrain/Learning Rate": 3.204979376592703e-05, "Pretrain/Loss": 2.0204532146453857, "Pretrain/Loss (Raw)": 2.3462798595428467, "Pretrain/Step": 8139, "Pretrain/Step Time": 8.487906411290169} +{"Pretrain/Learning Rate": 3.20457207805956e-05, "Pretrain/Loss": 2.021561622619629, "Pretrain/Loss (Raw)": 2.0366404056549072, "Pretrain/Step": 8140, "Pretrain/Step Time": 8.492540590465069} +{"Pretrain/Learning Rate": 3.2041647592105775e-05, "Pretrain/Loss": 2.0208559036254883, "Pretrain/Loss (Raw)": 1.9133546352386475, "Pretrain/Step": 8141, "Pretrain/Step Time": 8.493712518364191} +{"Pretrain/Learning Rate": 3.2037574200575005e-05, "Pretrain/Loss": 2.021331548690796, "Pretrain/Loss (Raw)": 2.176225185394287, "Pretrain/Step": 8142, "Pretrain/Step Time": 8.485349994152784} +{"Pretrain/Learning Rate": 3.203350060612075e-05, "Pretrain/Loss": 2.023131847381592, "Pretrain/Loss (Raw)": 2.044548273086548, "Pretrain/Step": 8143, "Pretrain/Step Time": 8.490517288446426} +{"Pretrain/Learning Rate": 3.202942680886045e-05, "Pretrain/Loss": 2.0229341983795166, "Pretrain/Loss (Raw)": 2.2790138721466064, "Pretrain/Step": 8144, "Pretrain/Step Time": 8.495842507109046} +{"Pretrain/Learning Rate": 3.2025352808911595e-05, "Pretrain/Loss": 2.023560047149658, "Pretrain/Loss (Raw)": 2.0289435386657715, "Pretrain/Step": 8145, "Pretrain/Step Time": 8.491899000480771} +{"Pretrain/Learning Rate": 3.202127860639165e-05, "Pretrain/Loss": 2.026038408279419, "Pretrain/Loss (Raw)": 2.2069592475891113, "Pretrain/Step": 8146, "Pretrain/Step Time": 8.494485491886735} +{"Pretrain/Learning Rate": 3.201720420141807e-05, "Pretrain/Loss": 2.0261783599853516, "Pretrain/Loss (Raw)": 2.0944063663482666, "Pretrain/Step": 8147, "Pretrain/Step Time": 8.490804018452764} +{"Pretrain/Learning Rate": 3.201312959410837e-05, "Pretrain/Loss": 2.027146339416504, "Pretrain/Loss (Raw)": 2.105658769607544, "Pretrain/Step": 8148, "Pretrain/Step Time": 8.485409574583173} +{"Pretrain/Learning Rate": 3.2009054784580014e-05, "Pretrain/Loss": 2.027514934539795, "Pretrain/Loss (Raw)": 2.1601855754852295, "Pretrain/Step": 8149, "Pretrain/Step Time": 8.488980984315276} +{"Pretrain/Learning Rate": 3.20049797729505e-05, "Pretrain/Loss": 2.0288209915161133, "Pretrain/Loss (Raw)": 2.221125602722168, "Pretrain/Step": 8150, "Pretrain/Step Time": 8.482409045100212} +{"Pretrain/Learning Rate": 3.200090455933734e-05, "Pretrain/Loss": 2.027580738067627, "Pretrain/Loss (Raw)": 1.7788288593292236, "Pretrain/Step": 8151, "Pretrain/Step Time": 8.489456688985229} +{"Pretrain/Learning Rate": 3.199682914385803e-05, "Pretrain/Loss": 2.03399920463562, "Pretrain/Loss (Raw)": 2.7203543186187744, "Pretrain/Step": 8152, "Pretrain/Step Time": 8.483071818947792} +{"Pretrain/Learning Rate": 3.1992753526630085e-05, "Pretrain/Loss": 2.036130666732788, "Pretrain/Loss (Raw)": 2.0588979721069336, "Pretrain/Step": 8153, "Pretrain/Step Time": 8.483897870406508} +{"Pretrain/Learning Rate": 3.198867770777102e-05, "Pretrain/Loss": 2.0350570678710938, "Pretrain/Loss (Raw)": 1.9228781461715698, "Pretrain/Step": 8154, "Pretrain/Step Time": 8.482024503871799} +{"Pretrain/Learning Rate": 3.1984601687398355e-05, "Pretrain/Loss": 2.0362401008605957, "Pretrain/Loss (Raw)": 2.0091609954833984, "Pretrain/Step": 8155, "Pretrain/Step Time": 8.484606644138694} +{"Pretrain/Learning Rate": 3.198052546562963e-05, "Pretrain/Loss": 2.038238525390625, "Pretrain/Loss (Raw)": 2.2224156856536865, "Pretrain/Step": 8156, "Pretrain/Step Time": 8.481362571939826} +{"Pretrain/Learning Rate": 3.197644904258237e-05, "Pretrain/Loss": 2.0388832092285156, "Pretrain/Loss (Raw)": 2.0071778297424316, "Pretrain/Step": 8157, "Pretrain/Step Time": 8.476147212088108} +{"Pretrain/Learning Rate": 3.197237241837413e-05, "Pretrain/Loss": 2.0415568351745605, "Pretrain/Loss (Raw)": 2.323709487915039, "Pretrain/Step": 8158, "Pretrain/Step Time": 8.476577445864677} +{"Pretrain/Learning Rate": 3.196829559312244e-05, "Pretrain/Loss": 2.041276216506958, "Pretrain/Loss (Raw)": 1.9408026933670044, "Pretrain/Step": 8159, "Pretrain/Step Time": 8.477373335510492} +{"Pretrain/Learning Rate": 3.196421856694486e-05, "Pretrain/Loss": 2.0413968563079834, "Pretrain/Loss (Raw)": 1.9132696390151978, "Pretrain/Step": 8160, "Pretrain/Step Time": 8.470848713070154} +{"Pretrain/Learning Rate": 3.1960141339958935e-05, "Pretrain/Loss": 2.043193817138672, "Pretrain/Loss (Raw)": 2.1039066314697266, "Pretrain/Step": 8161, "Pretrain/Step Time": 8.467461192980409} +{"Pretrain/Learning Rate": 3.195606391228226e-05, "Pretrain/Loss": 2.0434985160827637, "Pretrain/Loss (Raw)": 2.080094337463379, "Pretrain/Step": 8162, "Pretrain/Step Time": 8.46742120757699} +{"Pretrain/Learning Rate": 3.195198628403238e-05, "Pretrain/Loss": 2.045971632003784, "Pretrain/Loss (Raw)": 2.2910282611846924, "Pretrain/Step": 8163, "Pretrain/Step Time": 8.46503859385848} +{"Pretrain/Learning Rate": 3.194790845532687e-05, "Pretrain/Loss": 2.045133113861084, "Pretrain/Loss (Raw)": 2.0209908485412598, "Pretrain/Step": 8164, "Pretrain/Step Time": 8.463946780189872} +{"Pretrain/Learning Rate": 3.194383042628333e-05, "Pretrain/Loss": 2.045304298400879, "Pretrain/Loss (Raw)": 2.150843620300293, "Pretrain/Step": 8165, "Pretrain/Step Time": 8.469003189355135} +{"Pretrain/Learning Rate": 3.1939752197019326e-05, "Pretrain/Loss": 2.0465877056121826, "Pretrain/Loss (Raw)": 2.083967685699463, "Pretrain/Step": 8166, "Pretrain/Step Time": 8.46660091355443} +{"Pretrain/Learning Rate": 3.1935673767652454e-05, "Pretrain/Loss": 2.048090934753418, "Pretrain/Loss (Raw)": 2.1573233604431152, "Pretrain/Step": 8167, "Pretrain/Step Time": 8.469661124050617} +{"Pretrain/Learning Rate": 3.1931595138300325e-05, "Pretrain/Loss": 2.049981117248535, "Pretrain/Loss (Raw)": 2.0091280937194824, "Pretrain/Step": 8168, "Pretrain/Step Time": 8.46655653975904} +{"Pretrain/Learning Rate": 3.192751630908054e-05, "Pretrain/Loss": 2.050906181335449, "Pretrain/Loss (Raw)": 1.8545383214950562, "Pretrain/Step": 8169, "Pretrain/Step Time": 8.463883347809315} +{"Pretrain/Learning Rate": 3.19234372801107e-05, "Pretrain/Loss": 2.0531911849975586, "Pretrain/Loss (Raw)": 2.117410659790039, "Pretrain/Step": 8170, "Pretrain/Step Time": 8.462232675403357} +{"Pretrain/Learning Rate": 3.191935805150843e-05, "Pretrain/Loss": 2.0493431091308594, "Pretrain/Loss (Raw)": 1.7492395639419556, "Pretrain/Step": 8171, "Pretrain/Step Time": 8.463496126234531} +{"Pretrain/Learning Rate": 3.191527862339134e-05, "Pretrain/Loss": 2.048015832901001, "Pretrain/Loss (Raw)": 1.8979926109313965, "Pretrain/Step": 8172, "Pretrain/Step Time": 8.462098106741905} +{"Pretrain/Learning Rate": 3.1911198995877075e-05, "Pretrain/Loss": 2.0496907234191895, "Pretrain/Loss (Raw)": 2.0901682376861572, "Pretrain/Step": 8173, "Pretrain/Step Time": 8.461392072960734} +{"Pretrain/Learning Rate": 3.1907119169083264e-05, "Pretrain/Loss": 2.0508501529693604, "Pretrain/Loss (Raw)": 1.971430778503418, "Pretrain/Step": 8174, "Pretrain/Step Time": 8.460966754704714} +{"Pretrain/Learning Rate": 3.190303914312753e-05, "Pretrain/Loss": 2.051945209503174, "Pretrain/Loss (Raw)": 2.0314955711364746, "Pretrain/Step": 8175, "Pretrain/Step Time": 8.45985753275454} +{"Pretrain/Learning Rate": 3.189895891812753e-05, "Pretrain/Loss": 2.050625801086426, "Pretrain/Loss (Raw)": 2.0585532188415527, "Pretrain/Step": 8176, "Pretrain/Step Time": 8.461237413808703} +{"Pretrain/Learning Rate": 3.189487849420091e-05, "Pretrain/Loss": 2.050541877746582, "Pretrain/Loss (Raw)": 1.9668368101119995, "Pretrain/Step": 8177, "Pretrain/Step Time": 8.463305847719312} +{"Pretrain/Learning Rate": 3.1890797871465336e-05, "Pretrain/Loss": 2.0512776374816895, "Pretrain/Loss (Raw)": 2.0780930519104004, "Pretrain/Step": 8178, "Pretrain/Step Time": 8.460843749344349} +{"Pretrain/Learning Rate": 3.188671705003846e-05, "Pretrain/Loss": 2.0498929023742676, "Pretrain/Loss (Raw)": 1.927233099937439, "Pretrain/Step": 8179, "Pretrain/Step Time": 8.458291839808226} +{"Pretrain/Learning Rate": 3.188263603003796e-05, "Pretrain/Loss": 2.0498833656311035, "Pretrain/Loss (Raw)": 1.9566267728805542, "Pretrain/Step": 8180, "Pretrain/Step Time": 8.463493838906288} +{"Pretrain/Learning Rate": 3.18785548115815e-05, "Pretrain/Loss": 2.0504086017608643, "Pretrain/Loss (Raw)": 1.8521732091903687, "Pretrain/Step": 8181, "Pretrain/Step Time": 8.4633150678128} +{"Pretrain/Learning Rate": 3.187447339478675e-05, "Pretrain/Loss": 2.0501816272735596, "Pretrain/Loss (Raw)": 2.0469141006469727, "Pretrain/Step": 8182, "Pretrain/Step Time": 8.466550962999463} +{"Pretrain/Learning Rate": 3.187039177977141e-05, "Pretrain/Loss": 2.048807382583618, "Pretrain/Loss (Raw)": 2.0337533950805664, "Pretrain/Step": 8183, "Pretrain/Step Time": 8.464805787429214} +{"Pretrain/Learning Rate": 3.186630996665317e-05, "Pretrain/Loss": 2.0469040870666504, "Pretrain/Loss (Raw)": 1.974801778793335, "Pretrain/Step": 8184, "Pretrain/Step Time": 8.460407892242074} +{"Pretrain/Learning Rate": 3.186222795554973e-05, "Pretrain/Loss": 2.048556089401245, "Pretrain/Loss (Raw)": 2.2102885246276855, "Pretrain/Step": 8185, "Pretrain/Step Time": 8.458067694678903} +{"Pretrain/Learning Rate": 3.185814574657878e-05, "Pretrain/Loss": 2.048358678817749, "Pretrain/Loss (Raw)": 2.0024900436401367, "Pretrain/Step": 8186, "Pretrain/Step Time": 8.462320366874337} +{"Pretrain/Learning Rate": 3.185406333985802e-05, "Pretrain/Loss": 2.047970771789551, "Pretrain/Loss (Raw)": 2.133906841278076, "Pretrain/Step": 8187, "Pretrain/Step Time": 8.463960748165846} +{"Pretrain/Learning Rate": 3.184998073550518e-05, "Pretrain/Loss": 2.0468497276306152, "Pretrain/Loss (Raw)": 2.058277130126953, "Pretrain/Step": 8188, "Pretrain/Step Time": 8.458991285413504} +{"Pretrain/Learning Rate": 3.184589793363798e-05, "Pretrain/Loss": 2.04699444770813, "Pretrain/Loss (Raw)": 2.223006010055542, "Pretrain/Step": 8189, "Pretrain/Step Time": 8.462131638079882} +{"Pretrain/Learning Rate": 3.184181493437415e-05, "Pretrain/Loss": 2.048079013824463, "Pretrain/Loss (Raw)": 1.9948759078979492, "Pretrain/Step": 8190, "Pretrain/Step Time": 8.45875247195363} +{"Pretrain/Learning Rate": 3.1837731737831386e-05, "Pretrain/Loss": 2.0467123985290527, "Pretrain/Loss (Raw)": 2.0263772010803223, "Pretrain/Step": 8191, "Pretrain/Step Time": 8.458553275093436} +{"Pretrain/Learning Rate": 3.183364834412747e-05, "Pretrain/Loss": 2.0475821495056152, "Pretrain/Loss (Raw)": 2.0925910472869873, "Pretrain/Step": 8192, "Pretrain/Step Time": 8.459465324878693} +{"Pretrain/Learning Rate": 3.1829564753380105e-05, "Pretrain/Loss": 2.0476818084716797, "Pretrain/Loss (Raw)": 2.0411174297332764, "Pretrain/Step": 8193, "Pretrain/Step Time": 8.458382565528154} +{"Pretrain/Learning Rate": 3.1825480965707055e-05, "Pretrain/Loss": 2.048123836517334, "Pretrain/Loss (Raw)": 1.9353818893432617, "Pretrain/Step": 8194, "Pretrain/Step Time": 8.456339504569769} +{"Pretrain/Learning Rate": 3.182139698122608e-05, "Pretrain/Loss": 2.047794818878174, "Pretrain/Loss (Raw)": 1.9669883251190186, "Pretrain/Step": 8195, "Pretrain/Step Time": 8.457773078233004} +{"Pretrain/Learning Rate": 3.181731280005493e-05, "Pretrain/Loss": 2.0476441383361816, "Pretrain/Loss (Raw)": 2.038907289505005, "Pretrain/Step": 8196, "Pretrain/Step Time": 8.46021518856287} +{"Pretrain/Learning Rate": 3.181322842231137e-05, "Pretrain/Loss": 2.050150156021118, "Pretrain/Loss (Raw)": 2.3033664226531982, "Pretrain/Step": 8197, "Pretrain/Step Time": 8.454747758805752} +{"Pretrain/Learning Rate": 3.180914384811317e-05, "Pretrain/Loss": 2.0493335723876953, "Pretrain/Loss (Raw)": 1.8431482315063477, "Pretrain/Step": 8198, "Pretrain/Step Time": 8.45655433088541} +{"Pretrain/Learning Rate": 3.1805059077578114e-05, "Pretrain/Loss": 2.0480148792266846, "Pretrain/Loss (Raw)": 1.890993356704712, "Pretrain/Step": 8199, "Pretrain/Step Time": 8.453973576426506} +{"Pretrain/Learning Rate": 3.180097411082397e-05, "Pretrain/Loss": 2.0486340522766113, "Pretrain/Loss (Raw)": 2.012357711791992, "Pretrain/Step": 8200, "Pretrain/Step Time": 8.45707280561328} +{"Pretrain/Learning Rate": 3.179688894796854e-05, "Pretrain/Loss": 2.0483322143554688, "Pretrain/Loss (Raw)": 1.9188152551651, "Pretrain/Step": 8201, "Pretrain/Step Time": 8.457191972061992} +{"Pretrain/Learning Rate": 3.17928035891296e-05, "Pretrain/Loss": 2.047666549682617, "Pretrain/Loss (Raw)": 2.053806781768799, "Pretrain/Step": 8202, "Pretrain/Step Time": 8.45693545602262} +{"Pretrain/Learning Rate": 3.1788718034424956e-05, "Pretrain/Loss": 2.048908233642578, "Pretrain/Loss (Raw)": 2.1256353855133057, "Pretrain/Step": 8203, "Pretrain/Step Time": 8.458511365577579} +{"Pretrain/Learning Rate": 3.1784632283972425e-05, "Pretrain/Loss": 2.0487611293792725, "Pretrain/Loss (Raw)": 2.009542226791382, "Pretrain/Step": 8204, "Pretrain/Step Time": 8.457405220717192} +{"Pretrain/Learning Rate": 3.1780546337889795e-05, "Pretrain/Loss": 2.042463541030884, "Pretrain/Loss (Raw)": 1.736531376838684, "Pretrain/Step": 8205, "Pretrain/Step Time": 8.45460674725473} +{"Pretrain/Learning Rate": 3.17764601962949e-05, "Pretrain/Loss": 2.0421290397644043, "Pretrain/Loss (Raw)": 1.9421236515045166, "Pretrain/Step": 8206, "Pretrain/Step Time": 8.455076515674591} +{"Pretrain/Learning Rate": 3.177237385930554e-05, "Pretrain/Loss": 2.0420076847076416, "Pretrain/Loss (Raw)": 2.0820789337158203, "Pretrain/Step": 8207, "Pretrain/Step Time": 8.459949029609561} +{"Pretrain/Learning Rate": 3.176828732703956e-05, "Pretrain/Loss": 2.0417141914367676, "Pretrain/Loss (Raw)": 2.0109810829162598, "Pretrain/Step": 8208, "Pretrain/Step Time": 8.453720290213823} +{"Pretrain/Learning Rate": 3.176420059961479e-05, "Pretrain/Loss": 2.038983106613159, "Pretrain/Loss (Raw)": 1.8407093286514282, "Pretrain/Step": 8209, "Pretrain/Step Time": 8.453179571777582} +{"Pretrain/Learning Rate": 3.1760113677149055e-05, "Pretrain/Loss": 2.0375423431396484, "Pretrain/Loss (Raw)": 1.8980756998062134, "Pretrain/Step": 8210, "Pretrain/Step Time": 8.457945069298148} +{"Pretrain/Learning Rate": 3.175602655976021e-05, "Pretrain/Loss": 2.039240598678589, "Pretrain/Loss (Raw)": 1.9728585481643677, "Pretrain/Step": 8211, "Pretrain/Step Time": 8.45479173772037} +{"Pretrain/Learning Rate": 3.175193924756612e-05, "Pretrain/Loss": 2.0391154289245605, "Pretrain/Loss (Raw)": 2.057201385498047, "Pretrain/Step": 8212, "Pretrain/Step Time": 8.45449236407876} +{"Pretrain/Learning Rate": 3.17478517406846e-05, "Pretrain/Loss": 2.040147066116333, "Pretrain/Loss (Raw)": 2.052229166030884, "Pretrain/Step": 8213, "Pretrain/Step Time": 8.452465936541557} +{"Pretrain/Learning Rate": 3.174376403923354e-05, "Pretrain/Loss": 2.0395748615264893, "Pretrain/Loss (Raw)": 2.0887253284454346, "Pretrain/Step": 8214, "Pretrain/Step Time": 8.449388256296515} +{"Pretrain/Learning Rate": 3.173967614333079e-05, "Pretrain/Loss": 2.0385892391204834, "Pretrain/Loss (Raw)": 1.9642924070358276, "Pretrain/Step": 8215, "Pretrain/Step Time": 8.458667263388634} +{"Pretrain/Learning Rate": 3.1735588053094236e-05, "Pretrain/Loss": 2.0385472774505615, "Pretrain/Loss (Raw)": 1.990336537361145, "Pretrain/Step": 8216, "Pretrain/Step Time": 8.455723343417048} +{"Pretrain/Learning Rate": 3.173149976864175e-05, "Pretrain/Loss": 2.041179895401001, "Pretrain/Loss (Raw)": 2.1929662227630615, "Pretrain/Step": 8217, "Pretrain/Step Time": 8.458498045802116} +{"Pretrain/Learning Rate": 3.1727411290091214e-05, "Pretrain/Loss": 2.043797254562378, "Pretrain/Loss (Raw)": 2.3207480907440186, "Pretrain/Step": 8218, "Pretrain/Step Time": 8.457252418622375} +{"Pretrain/Learning Rate": 3.1723322617560516e-05, "Pretrain/Loss": 2.0436410903930664, "Pretrain/Loss (Raw)": 1.9991695880889893, "Pretrain/Step": 8219, "Pretrain/Step Time": 8.457696663215756} +{"Pretrain/Learning Rate": 3.1719233751167544e-05, "Pretrain/Loss": 2.0439720153808594, "Pretrain/Loss (Raw)": 2.0207419395446777, "Pretrain/Step": 8220, "Pretrain/Step Time": 8.455936213955283} +{"Pretrain/Learning Rate": 3.1715144691030205e-05, "Pretrain/Loss": 2.0463619232177734, "Pretrain/Loss (Raw)": 2.204049587249756, "Pretrain/Step": 8221, "Pretrain/Step Time": 8.45267765969038} +{"Pretrain/Learning Rate": 3.171105543726641e-05, "Pretrain/Loss": 2.0493006706237793, "Pretrain/Loss (Raw)": 2.251352310180664, "Pretrain/Step": 8222, "Pretrain/Step Time": 8.453598611056805} +{"Pretrain/Learning Rate": 3.170696598999406e-05, "Pretrain/Loss": 2.0482354164123535, "Pretrain/Loss (Raw)": 1.878064751625061, "Pretrain/Step": 8223, "Pretrain/Step Time": 8.451661264523864} +{"Pretrain/Learning Rate": 3.170287634933107e-05, "Pretrain/Loss": 2.049774408340454, "Pretrain/Loss (Raw)": 2.198680877685547, "Pretrain/Step": 8224, "Pretrain/Step Time": 8.451835922896862} +{"Pretrain/Learning Rate": 3.169878651539537e-05, "Pretrain/Loss": 2.0484097003936768, "Pretrain/Loss (Raw)": 2.056269407272339, "Pretrain/Step": 8225, "Pretrain/Step Time": 8.451881540939212} +{"Pretrain/Learning Rate": 3.1694696488304874e-05, "Pretrain/Loss": 2.046976327896118, "Pretrain/Loss (Raw)": 1.9663891792297363, "Pretrain/Step": 8226, "Pretrain/Step Time": 8.451102916151285} +{"Pretrain/Learning Rate": 3.169060626817754e-05, "Pretrain/Loss": 2.0478811264038086, "Pretrain/Loss (Raw)": 2.0302071571350098, "Pretrain/Step": 8227, "Pretrain/Step Time": 8.4499806817621} +{"Pretrain/Learning Rate": 3.168651585513128e-05, "Pretrain/Loss": 2.046452522277832, "Pretrain/Loss (Raw)": 1.9667561054229736, "Pretrain/Step": 8228, "Pretrain/Step Time": 8.443782297894359} +{"Pretrain/Learning Rate": 3.168242524928405e-05, "Pretrain/Loss": 2.044257640838623, "Pretrain/Loss (Raw)": 1.8589352369308472, "Pretrain/Step": 8229, "Pretrain/Step Time": 8.450134148821235} +{"Pretrain/Learning Rate": 3.167833445075379e-05, "Pretrain/Loss": 2.0458641052246094, "Pretrain/Loss (Raw)": 2.2414133548736572, "Pretrain/Step": 8230, "Pretrain/Step Time": 8.448418950662017} +{"Pretrain/Learning Rate": 3.1674243459658475e-05, "Pretrain/Loss": 2.0470032691955566, "Pretrain/Loss (Raw)": 2.213402032852173, "Pretrain/Step": 8231, "Pretrain/Step Time": 8.451591370627284} +{"Pretrain/Learning Rate": 3.167015227611606e-05, "Pretrain/Loss": 2.047348976135254, "Pretrain/Loss (Raw)": 2.0059382915496826, "Pretrain/Step": 8232, "Pretrain/Step Time": 8.452099427580833} +{"Pretrain/Learning Rate": 3.16660609002445e-05, "Pretrain/Loss": 2.047257900238037, "Pretrain/Loss (Raw)": 2.001878261566162, "Pretrain/Step": 8233, "Pretrain/Step Time": 8.452777490019798} +{"Pretrain/Learning Rate": 3.1661969332161766e-05, "Pretrain/Loss": 2.0458297729492188, "Pretrain/Loss (Raw)": 2.007650136947632, "Pretrain/Step": 8234, "Pretrain/Step Time": 8.455045215785503} +{"Pretrain/Learning Rate": 3.165787757198585e-05, "Pretrain/Loss": 2.048219680786133, "Pretrain/Loss (Raw)": 2.009143114089966, "Pretrain/Step": 8235, "Pretrain/Step Time": 8.45542424172163} +{"Pretrain/Learning Rate": 3.1653785619834734e-05, "Pretrain/Loss": 2.0466668605804443, "Pretrain/Loss (Raw)": 1.8201050758361816, "Pretrain/Step": 8236, "Pretrain/Step Time": 8.453242162242532} +{"Pretrain/Learning Rate": 3.164969347582639e-05, "Pretrain/Loss": 2.048713445663452, "Pretrain/Loss (Raw)": 2.1787655353546143, "Pretrain/Step": 8237, "Pretrain/Step Time": 8.452404187992215} +{"Pretrain/Learning Rate": 3.164560114007883e-05, "Pretrain/Loss": 2.0502824783325195, "Pretrain/Loss (Raw)": 2.094724178314209, "Pretrain/Step": 8238, "Pretrain/Step Time": 8.454389529302716} +{"Pretrain/Learning Rate": 3.164150861271004e-05, "Pretrain/Loss": 2.0511207580566406, "Pretrain/Loss (Raw)": 2.1258366107940674, "Pretrain/Step": 8239, "Pretrain/Step Time": 8.451890686526895} +{"Pretrain/Learning Rate": 3.163741589383803e-05, "Pretrain/Loss": 2.051270008087158, "Pretrain/Loss (Raw)": 1.9887439012527466, "Pretrain/Step": 8240, "Pretrain/Step Time": 8.448777634650469} +{"Pretrain/Learning Rate": 3.163332298358081e-05, "Pretrain/Loss": 2.0512588024139404, "Pretrain/Loss (Raw)": 2.2379469871520996, "Pretrain/Step": 8241, "Pretrain/Step Time": 8.450458897277713} +{"Pretrain/Learning Rate": 3.162922988205641e-05, "Pretrain/Loss": 2.0507493019104004, "Pretrain/Loss (Raw)": 1.7541468143463135, "Pretrain/Step": 8242, "Pretrain/Step Time": 8.447012780234218} +{"Pretrain/Learning Rate": 3.162513658938283e-05, "Pretrain/Loss": 2.0495975017547607, "Pretrain/Loss (Raw)": 1.9507808685302734, "Pretrain/Step": 8243, "Pretrain/Step Time": 8.444909546524286} +{"Pretrain/Learning Rate": 3.1621043105678106e-05, "Pretrain/Loss": 2.051816701889038, "Pretrain/Loss (Raw)": 2.289196252822876, "Pretrain/Step": 8244, "Pretrain/Step Time": 8.440445698797703} +{"Pretrain/Learning Rate": 3.161694943106028e-05, "Pretrain/Loss": 2.050232410430908, "Pretrain/Loss (Raw)": 2.01892352104187, "Pretrain/Step": 8245, "Pretrain/Step Time": 8.441264359280467} +{"Pretrain/Learning Rate": 3.1612855565647376e-05, "Pretrain/Loss": 2.050388813018799, "Pretrain/Loss (Raw)": 2.0515966415405273, "Pretrain/Step": 8246, "Pretrain/Step Time": 8.440114758908749} +{"Pretrain/Learning Rate": 3.1608761509557445e-05, "Pretrain/Loss": 2.049232006072998, "Pretrain/Loss (Raw)": 1.7532391548156738, "Pretrain/Step": 8247, "Pretrain/Step Time": 8.438728069886565} +{"Pretrain/Learning Rate": 3.160466726290853e-05, "Pretrain/Loss": 2.0514883995056152, "Pretrain/Loss (Raw)": 2.15366268157959, "Pretrain/Step": 8248, "Pretrain/Step Time": 8.443283470347524} +{"Pretrain/Learning Rate": 3.1600572825818696e-05, "Pretrain/Loss": 2.04838228225708, "Pretrain/Loss (Raw)": 1.7746270895004272, "Pretrain/Step": 8249, "Pretrain/Step Time": 8.441056162118912} +{"Pretrain/Learning Rate": 3.1596478198406e-05, "Pretrain/Loss": 2.0489063262939453, "Pretrain/Loss (Raw)": 2.0324604511260986, "Pretrain/Step": 8250, "Pretrain/Step Time": 8.444980777800083} +{"Pretrain/Learning Rate": 3.15923833807885e-05, "Pretrain/Loss": 2.047961711883545, "Pretrain/Loss (Raw)": 1.9545451402664185, "Pretrain/Step": 8251, "Pretrain/Step Time": 8.447533901780844} +{"Pretrain/Learning Rate": 3.158828837308427e-05, "Pretrain/Loss": 2.049574613571167, "Pretrain/Loss (Raw)": 2.1190311908721924, "Pretrain/Step": 8252, "Pretrain/Step Time": 8.44366392865777} +{"Pretrain/Learning Rate": 3.158419317541139e-05, "Pretrain/Loss": 2.0481343269348145, "Pretrain/Loss (Raw)": 2.0094125270843506, "Pretrain/Step": 8253, "Pretrain/Step Time": 8.442404234781861} +{"Pretrain/Learning Rate": 3.1580097787887955e-05, "Pretrain/Loss": 2.049405097961426, "Pretrain/Loss (Raw)": 2.071490526199341, "Pretrain/Step": 8254, "Pretrain/Step Time": 8.442441815510392} +{"Pretrain/Learning Rate": 3.1576002210632025e-05, "Pretrain/Loss": 2.047494411468506, "Pretrain/Loss (Raw)": 1.9756767749786377, "Pretrain/Step": 8255, "Pretrain/Step Time": 8.442182544618845} +{"Pretrain/Learning Rate": 3.1571906443761704e-05, "Pretrain/Loss": 2.048945426940918, "Pretrain/Loss (Raw)": 2.067972421646118, "Pretrain/Step": 8256, "Pretrain/Step Time": 8.436606146395206} +{"Pretrain/Learning Rate": 3.15678104873951e-05, "Pretrain/Loss": 2.0485591888427734, "Pretrain/Loss (Raw)": 2.079606771469116, "Pretrain/Step": 8257, "Pretrain/Step Time": 8.441150948405266} +{"Pretrain/Learning Rate": 3.1563714341650315e-05, "Pretrain/Loss": 2.04850172996521, "Pretrain/Loss (Raw)": 2.1002230644226074, "Pretrain/Step": 8258, "Pretrain/Step Time": 8.444431269541383} +{"Pretrain/Learning Rate": 3.155961800664545e-05, "Pretrain/Loss": 2.0479960441589355, "Pretrain/Loss (Raw)": 2.0900580883026123, "Pretrain/Step": 8259, "Pretrain/Step Time": 8.435328936204314} +{"Pretrain/Learning Rate": 3.155552148249862e-05, "Pretrain/Loss": 2.0480780601501465, "Pretrain/Loss (Raw)": 1.900712251663208, "Pretrain/Step": 8260, "Pretrain/Step Time": 8.436141530051827} +{"Pretrain/Learning Rate": 3.155142476932795e-05, "Pretrain/Loss": 2.0492796897888184, "Pretrain/Loss (Raw)": 2.1261041164398193, "Pretrain/Step": 8261, "Pretrain/Step Time": 8.437898825854063} +{"Pretrain/Learning Rate": 3.154732786725157e-05, "Pretrain/Loss": 2.0458617210388184, "Pretrain/Loss (Raw)": 1.8898890018463135, "Pretrain/Step": 8262, "Pretrain/Step Time": 8.440722258761525} +{"Pretrain/Learning Rate": 3.15432307763876e-05, "Pretrain/Loss": 2.045214891433716, "Pretrain/Loss (Raw)": 1.9033761024475098, "Pretrain/Step": 8263, "Pretrain/Step Time": 8.44173021055758} +{"Pretrain/Learning Rate": 3.15391334968542e-05, "Pretrain/Loss": 2.045793056488037, "Pretrain/Loss (Raw)": 2.081080198287964, "Pretrain/Step": 8264, "Pretrain/Step Time": 8.440914502367377} +{"Pretrain/Learning Rate": 3.153503602876948e-05, "Pretrain/Loss": 2.0451672077178955, "Pretrain/Loss (Raw)": 2.0728673934936523, "Pretrain/Step": 8265, "Pretrain/Step Time": 8.437766628339887} +{"Pretrain/Learning Rate": 3.1530938372251604e-05, "Pretrain/Loss": 2.043515682220459, "Pretrain/Loss (Raw)": 1.9460506439208984, "Pretrain/Step": 8266, "Pretrain/Step Time": 8.435309134423733} +{"Pretrain/Learning Rate": 3.1526840527418726e-05, "Pretrain/Loss": 2.0402255058288574, "Pretrain/Loss (Raw)": 1.9251326322555542, "Pretrain/Step": 8267, "Pretrain/Step Time": 8.438933188095689} +{"Pretrain/Learning Rate": 3.1522742494389e-05, "Pretrain/Loss": 2.0402722358703613, "Pretrain/Loss (Raw)": 2.04264235496521, "Pretrain/Step": 8268, "Pretrain/Step Time": 8.435352321714163} +{"Pretrain/Learning Rate": 3.15186442732806e-05, "Pretrain/Loss": 2.0413811206817627, "Pretrain/Loss (Raw)": 2.05527400970459, "Pretrain/Step": 8269, "Pretrain/Step Time": 8.4345166310668} +{"Pretrain/Learning Rate": 3.1514545864211684e-05, "Pretrain/Loss": 2.0398433208465576, "Pretrain/Loss (Raw)": 1.9794033765792847, "Pretrain/Step": 8270, "Pretrain/Step Time": 8.435960268601775} +{"Pretrain/Learning Rate": 3.151044726730043e-05, "Pretrain/Loss": 2.038440227508545, "Pretrain/Loss (Raw)": 1.8649147748947144, "Pretrain/Step": 8271, "Pretrain/Step Time": 8.429281057789922} +{"Pretrain/Learning Rate": 3.150634848266501e-05, "Pretrain/Loss": 2.035001754760742, "Pretrain/Loss (Raw)": 1.8388898372650146, "Pretrain/Step": 8272, "Pretrain/Step Time": 8.427119541913271} +{"Pretrain/Learning Rate": 3.150224951042363e-05, "Pretrain/Loss": 2.0339112281799316, "Pretrain/Loss (Raw)": 1.8893779516220093, "Pretrain/Step": 8273, "Pretrain/Step Time": 8.429732726886868} +{"Pretrain/Learning Rate": 3.149815035069447e-05, "Pretrain/Loss": 2.0313949584960938, "Pretrain/Loss (Raw)": 1.8848716020584106, "Pretrain/Step": 8274, "Pretrain/Step Time": 8.432145128026605} +{"Pretrain/Learning Rate": 3.149405100359572e-05, "Pretrain/Loss": 2.032529830932617, "Pretrain/Loss (Raw)": 2.2396857738494873, "Pretrain/Step": 8275, "Pretrain/Step Time": 8.43326305039227} +{"Pretrain/Learning Rate": 3.1489951469245585e-05, "Pretrain/Loss": 2.0334672927856445, "Pretrain/Loss (Raw)": 2.2256200313568115, "Pretrain/Step": 8276, "Pretrain/Step Time": 8.433405498042703} +{"Pretrain/Learning Rate": 3.148585174776228e-05, "Pretrain/Loss": 2.034665584564209, "Pretrain/Loss (Raw)": 2.3135735988616943, "Pretrain/Step": 8277, "Pretrain/Step Time": 8.4301254209131} +{"Pretrain/Learning Rate": 3.148175183926401e-05, "Pretrain/Loss": 2.031721591949463, "Pretrain/Loss (Raw)": 1.844322919845581, "Pretrain/Step": 8278, "Pretrain/Step Time": 8.432218002155423} +{"Pretrain/Learning Rate": 3.1477651743868994e-05, "Pretrain/Loss": 2.033365249633789, "Pretrain/Loss (Raw)": 1.9892023801803589, "Pretrain/Step": 8279, "Pretrain/Step Time": 8.42604797706008} +{"Pretrain/Learning Rate": 3.147355146169546e-05, "Pretrain/Loss": 2.0280089378356934, "Pretrain/Loss (Raw)": 2.0347418785095215, "Pretrain/Step": 8280, "Pretrain/Step Time": 8.434033097699285} +{"Pretrain/Learning Rate": 3.1469450992861627e-05, "Pretrain/Loss": 2.02813720703125, "Pretrain/Loss (Raw)": 2.0753095149993896, "Pretrain/Step": 8281, "Pretrain/Step Time": 8.433205416426063} +{"Pretrain/Learning Rate": 3.146535033748574e-05, "Pretrain/Loss": 2.0258021354675293, "Pretrain/Loss (Raw)": 1.6240129470825195, "Pretrain/Step": 8282, "Pretrain/Step Time": 8.429765006527305} +{"Pretrain/Learning Rate": 3.146124949568603e-05, "Pretrain/Loss": 2.0262365341186523, "Pretrain/Loss (Raw)": 2.0647661685943604, "Pretrain/Step": 8283, "Pretrain/Step Time": 8.429246474057436} +{"Pretrain/Learning Rate": 3.1457148467580746e-05, "Pretrain/Loss": 2.023843765258789, "Pretrain/Loss (Raw)": 1.9161356687545776, "Pretrain/Step": 8284, "Pretrain/Step Time": 8.431357795372605} +{"Pretrain/Learning Rate": 3.145304725328814e-05, "Pretrain/Loss": 2.025634765625, "Pretrain/Loss (Raw)": 2.236424446105957, "Pretrain/Step": 8285, "Pretrain/Step Time": 8.438757989555597} +{"Pretrain/Learning Rate": 3.144894585292647e-05, "Pretrain/Loss": 2.021639823913574, "Pretrain/Loss (Raw)": 1.8123478889465332, "Pretrain/Step": 8286, "Pretrain/Step Time": 8.438246732577682} +{"Pretrain/Learning Rate": 3.144484426661399e-05, "Pretrain/Loss": 2.022463798522949, "Pretrain/Loss (Raw)": 2.046257972717285, "Pretrain/Step": 8287, "Pretrain/Step Time": 8.439121257513762} +{"Pretrain/Learning Rate": 3.144074249446897e-05, "Pretrain/Loss": 2.02162504196167, "Pretrain/Loss (Raw)": 1.805911660194397, "Pretrain/Step": 8288, "Pretrain/Step Time": 8.438005849719048} +{"Pretrain/Learning Rate": 3.1436640536609676e-05, "Pretrain/Loss": 2.0206360816955566, "Pretrain/Loss (Raw)": 1.9773128032684326, "Pretrain/Step": 8289, "Pretrain/Step Time": 8.439387081190944} +{"Pretrain/Learning Rate": 3.1432538393154386e-05, "Pretrain/Loss": 2.0185604095458984, "Pretrain/Loss (Raw)": 1.8144062757492065, "Pretrain/Step": 8290, "Pretrain/Step Time": 8.438414493575692} +{"Pretrain/Learning Rate": 3.14284360642214e-05, "Pretrain/Loss": 2.0158321857452393, "Pretrain/Loss (Raw)": 1.9418506622314453, "Pretrain/Step": 8291, "Pretrain/Step Time": 8.44140120409429} +{"Pretrain/Learning Rate": 3.142433354992898e-05, "Pretrain/Loss": 2.0166068077087402, "Pretrain/Loss (Raw)": 2.1201367378234863, "Pretrain/Step": 8292, "Pretrain/Step Time": 8.438832025974989} +{"Pretrain/Learning Rate": 3.1420230850395434e-05, "Pretrain/Loss": 2.0167832374572754, "Pretrain/Loss (Raw)": 2.173413038253784, "Pretrain/Step": 8293, "Pretrain/Step Time": 8.435782300308347} +{"Pretrain/Learning Rate": 3.141612796573906e-05, "Pretrain/Loss": 2.015448570251465, "Pretrain/Loss (Raw)": 1.9131243228912354, "Pretrain/Step": 8294, "Pretrain/Step Time": 8.438780400902033} +{"Pretrain/Learning Rate": 3.141202489607815e-05, "Pretrain/Loss": 2.012216806411743, "Pretrain/Loss (Raw)": 1.743666648864746, "Pretrain/Step": 8295, "Pretrain/Step Time": 8.434957701712847} +{"Pretrain/Learning Rate": 3.140792164153104e-05, "Pretrain/Loss": 2.0109922885894775, "Pretrain/Loss (Raw)": 1.852388620376587, "Pretrain/Step": 8296, "Pretrain/Step Time": 8.438118701800704} +{"Pretrain/Learning Rate": 3.1403818202216006e-05, "Pretrain/Loss": 2.0132899284362793, "Pretrain/Loss (Raw)": 2.1486520767211914, "Pretrain/Step": 8297, "Pretrain/Step Time": 8.43838400579989} +{"Pretrain/Learning Rate": 3.13997145782514e-05, "Pretrain/Loss": 2.013188362121582, "Pretrain/Loss (Raw)": 2.1044042110443115, "Pretrain/Step": 8298, "Pretrain/Step Time": 8.44180022366345} +{"Pretrain/Learning Rate": 3.139561076975553e-05, "Pretrain/Loss": 2.0142881870269775, "Pretrain/Loss (Raw)": 1.8900327682495117, "Pretrain/Step": 8299, "Pretrain/Step Time": 8.443038636818528} +{"Pretrain/Learning Rate": 3.1391506776846736e-05, "Pretrain/Loss": 2.014775037765503, "Pretrain/Loss (Raw)": 1.960312843322754, "Pretrain/Step": 8300, "Pretrain/Step Time": 8.440143138170242} +{"Pretrain/Learning Rate": 3.138740259964336e-05, "Pretrain/Loss": 2.015714168548584, "Pretrain/Loss (Raw)": 2.210329055786133, "Pretrain/Step": 8301, "Pretrain/Step Time": 8.443685829639435} +{"Pretrain/Learning Rate": 3.1383298238263717e-05, "Pretrain/Loss": 2.017143726348877, "Pretrain/Loss (Raw)": 2.154418706893921, "Pretrain/Step": 8302, "Pretrain/Step Time": 8.44349772296846} +{"Pretrain/Learning Rate": 3.1379193692826175e-05, "Pretrain/Loss": 2.018054485321045, "Pretrain/Loss (Raw)": 2.1481125354766846, "Pretrain/Step": 8303, "Pretrain/Step Time": 8.443684410303831} +{"Pretrain/Learning Rate": 3.137508896344908e-05, "Pretrain/Loss": 2.017314910888672, "Pretrain/Loss (Raw)": 1.963853359222412, "Pretrain/Step": 8304, "Pretrain/Step Time": 8.440698126330972} +{"Pretrain/Learning Rate": 3.137098405025078e-05, "Pretrain/Loss": 2.017637252807617, "Pretrain/Loss (Raw)": 2.0081186294555664, "Pretrain/Step": 8305, "Pretrain/Step Time": 8.43882323242724} +{"Pretrain/Learning Rate": 3.136687895334966e-05, "Pretrain/Loss": 2.0169482231140137, "Pretrain/Loss (Raw)": 1.989869236946106, "Pretrain/Step": 8306, "Pretrain/Step Time": 8.439735567197204} +{"Pretrain/Learning Rate": 3.136277367286407e-05, "Pretrain/Loss": 2.0162670612335205, "Pretrain/Loss (Raw)": 1.8400901556015015, "Pretrain/Step": 8307, "Pretrain/Step Time": 8.44086992368102} +{"Pretrain/Learning Rate": 3.135866820891239e-05, "Pretrain/Loss": 2.0165350437164307, "Pretrain/Loss (Raw)": 1.9909148216247559, "Pretrain/Step": 8308, "Pretrain/Step Time": 8.4356260728091} +{"Pretrain/Learning Rate": 3.135456256161299e-05, "Pretrain/Loss": 2.0178191661834717, "Pretrain/Loss (Raw)": 2.0165138244628906, "Pretrain/Step": 8309, "Pretrain/Step Time": 8.435653420165181} +{"Pretrain/Learning Rate": 3.135045673108426e-05, "Pretrain/Loss": 2.018509864807129, "Pretrain/Loss (Raw)": 2.1353213787078857, "Pretrain/Step": 8310, "Pretrain/Step Time": 8.433181488886476} +{"Pretrain/Learning Rate": 3.1346350717444576e-05, "Pretrain/Loss": 2.0183722972869873, "Pretrain/Loss (Raw)": 2.016169786453247, "Pretrain/Step": 8311, "Pretrain/Step Time": 8.436980433762074} +{"Pretrain/Learning Rate": 3.1342244520812356e-05, "Pretrain/Loss": 2.0177183151245117, "Pretrain/Loss (Raw)": 1.8911149501800537, "Pretrain/Step": 8312, "Pretrain/Step Time": 8.439024187624454} +{"Pretrain/Learning Rate": 3.133813814130598e-05, "Pretrain/Loss": 2.0163588523864746, "Pretrain/Loss (Raw)": 2.0362372398376465, "Pretrain/Step": 8313, "Pretrain/Step Time": 8.438574451953173} +{"Pretrain/Learning Rate": 3.1334031579043866e-05, "Pretrain/Loss": 2.0177698135375977, "Pretrain/Loss (Raw)": 2.1831130981445312, "Pretrain/Step": 8314, "Pretrain/Step Time": 8.433902995660901} +{"Pretrain/Learning Rate": 3.132992483414441e-05, "Pretrain/Loss": 2.016331911087036, "Pretrain/Loss (Raw)": 1.949863076210022, "Pretrain/Step": 8315, "Pretrain/Step Time": 8.433202786371112} +{"Pretrain/Learning Rate": 3.1325817906726026e-05, "Pretrain/Loss": 2.016913414001465, "Pretrain/Loss (Raw)": 2.132718086242676, "Pretrain/Step": 8316, "Pretrain/Step Time": 8.435635954141617} +{"Pretrain/Learning Rate": 3.132171079690716e-05, "Pretrain/Loss": 2.015942335128784, "Pretrain/Loss (Raw)": 2.0986886024475098, "Pretrain/Step": 8317, "Pretrain/Step Time": 8.432375609874725} +{"Pretrain/Learning Rate": 3.131760350480621e-05, "Pretrain/Loss": 2.0158019065856934, "Pretrain/Loss (Raw)": 1.9769177436828613, "Pretrain/Step": 8318, "Pretrain/Step Time": 8.435361258685589} +{"Pretrain/Learning Rate": 3.1313496030541616e-05, "Pretrain/Loss": 2.01796817779541, "Pretrain/Loss (Raw)": 2.303633689880371, "Pretrain/Step": 8319, "Pretrain/Step Time": 8.4342323821038} +{"Pretrain/Learning Rate": 3.130938837423182e-05, "Pretrain/Loss": 2.018301010131836, "Pretrain/Loss (Raw)": 2.1352059841156006, "Pretrain/Step": 8320, "Pretrain/Step Time": 8.429777152836323} +{"Pretrain/Learning Rate": 3.130528053599525e-05, "Pretrain/Loss": 2.0167555809020996, "Pretrain/Loss (Raw)": 1.8432977199554443, "Pretrain/Step": 8321, "Pretrain/Step Time": 8.431322874501348} +{"Pretrain/Learning Rate": 3.1301172515950375e-05, "Pretrain/Loss": 2.0188989639282227, "Pretrain/Loss (Raw)": 2.2097465991973877, "Pretrain/Step": 8322, "Pretrain/Step Time": 8.431719234213233} +{"Pretrain/Learning Rate": 3.129706431421562e-05, "Pretrain/Loss": 2.0189242362976074, "Pretrain/Loss (Raw)": 1.9702123403549194, "Pretrain/Step": 8323, "Pretrain/Step Time": 8.430475916713476} +{"Pretrain/Learning Rate": 3.1292955930909453e-05, "Pretrain/Loss": 2.018599510192871, "Pretrain/Loss (Raw)": 1.997332215309143, "Pretrain/Step": 8324, "Pretrain/Step Time": 8.429441889747977} +{"Pretrain/Learning Rate": 3.128884736615034e-05, "Pretrain/Loss": 2.0167384147644043, "Pretrain/Loss (Raw)": 2.065157175064087, "Pretrain/Step": 8325, "Pretrain/Step Time": 8.427495829761028} +{"Pretrain/Learning Rate": 3.1284738620056747e-05, "Pretrain/Loss": 2.016474723815918, "Pretrain/Loss (Raw)": 1.8093862533569336, "Pretrain/Step": 8326, "Pretrain/Step Time": 8.431598491966724} +{"Pretrain/Learning Rate": 3.1280629692747156e-05, "Pretrain/Loss": 2.0174202919006348, "Pretrain/Loss (Raw)": 2.01204514503479, "Pretrain/Step": 8327, "Pretrain/Step Time": 8.431039879098535} +{"Pretrain/Learning Rate": 3.127652058434002e-05, "Pretrain/Loss": 2.0182576179504395, "Pretrain/Loss (Raw)": 2.1195435523986816, "Pretrain/Step": 8328, "Pretrain/Step Time": 8.430595312267542} +{"Pretrain/Learning Rate": 3.127241129495385e-05, "Pretrain/Loss": 2.0185165405273438, "Pretrain/Loss (Raw)": 1.9519537687301636, "Pretrain/Step": 8329, "Pretrain/Step Time": 8.431767234578729} +{"Pretrain/Learning Rate": 3.126830182470712e-05, "Pretrain/Loss": 2.016134738922119, "Pretrain/Loss (Raw)": 1.748917579650879, "Pretrain/Step": 8330, "Pretrain/Step Time": 8.429494908079505} +{"Pretrain/Learning Rate": 3.126419217371832e-05, "Pretrain/Loss": 2.015270709991455, "Pretrain/Loss (Raw)": 2.0150580406188965, "Pretrain/Step": 8331, "Pretrain/Step Time": 8.431780403479934} +{"Pretrain/Learning Rate": 3.1260082342105955e-05, "Pretrain/Loss": 2.0138320922851562, "Pretrain/Loss (Raw)": 1.8253893852233887, "Pretrain/Step": 8332, "Pretrain/Step Time": 8.43077046982944} +{"Pretrain/Learning Rate": 3.1255972329988536e-05, "Pretrain/Loss": 2.0183026790618896, "Pretrain/Loss (Raw)": 2.3087825775146484, "Pretrain/Step": 8333, "Pretrain/Step Time": 8.430061344057322} +{"Pretrain/Learning Rate": 3.125186213748456e-05, "Pretrain/Loss": 2.017658233642578, "Pretrain/Loss (Raw)": 1.8596333265304565, "Pretrain/Step": 8334, "Pretrain/Step Time": 8.433656508103013} +{"Pretrain/Learning Rate": 3.124775176471255e-05, "Pretrain/Loss": 2.0163822174072266, "Pretrain/Loss (Raw)": 1.9187488555908203, "Pretrain/Step": 8335, "Pretrain/Step Time": 8.4303298573941} +{"Pretrain/Learning Rate": 3.124364121179101e-05, "Pretrain/Loss": 2.014721393585205, "Pretrain/Loss (Raw)": 1.798385739326477, "Pretrain/Step": 8336, "Pretrain/Step Time": 8.432010302320123} +{"Pretrain/Learning Rate": 3.123953047883849e-05, "Pretrain/Loss": 2.017164945602417, "Pretrain/Loss (Raw)": 2.1534676551818848, "Pretrain/Step": 8337, "Pretrain/Step Time": 8.432533403858542} +{"Pretrain/Learning Rate": 3.123541956597351e-05, "Pretrain/Loss": 2.019558906555176, "Pretrain/Loss (Raw)": 2.2045199871063232, "Pretrain/Step": 8338, "Pretrain/Step Time": 8.433632500469685} +{"Pretrain/Learning Rate": 3.123130847331459e-05, "Pretrain/Loss": 2.0191545486450195, "Pretrain/Loss (Raw)": 1.9210885763168335, "Pretrain/Step": 8339, "Pretrain/Step Time": 8.430173225700855} +{"Pretrain/Learning Rate": 3.122719720098029e-05, "Pretrain/Loss": 2.018662452697754, "Pretrain/Loss (Raw)": 1.9942177534103394, "Pretrain/Step": 8340, "Pretrain/Step Time": 8.435357581824064} +{"Pretrain/Learning Rate": 3.122308574908915e-05, "Pretrain/Loss": 2.0151801109313965, "Pretrain/Loss (Raw)": 1.6064846515655518, "Pretrain/Step": 8341, "Pretrain/Step Time": 8.439909311011434} +{"Pretrain/Learning Rate": 3.1218974117759714e-05, "Pretrain/Loss": 2.0150539875030518, "Pretrain/Loss (Raw)": 2.0725796222686768, "Pretrain/Step": 8342, "Pretrain/Step Time": 8.44008106738329} +{"Pretrain/Learning Rate": 3.1214862307110546e-05, "Pretrain/Loss": 2.015730381011963, "Pretrain/Loss (Raw)": 2.0508790016174316, "Pretrain/Step": 8343, "Pretrain/Step Time": 8.431613681837916} +{"Pretrain/Learning Rate": 3.121075031726021e-05, "Pretrain/Loss": 2.01646089553833, "Pretrain/Loss (Raw)": 2.083813428878784, "Pretrain/Step": 8344, "Pretrain/Step Time": 8.434375489130616} +{"Pretrain/Learning Rate": 3.120663814832726e-05, "Pretrain/Loss": 2.0160763263702393, "Pretrain/Loss (Raw)": 2.143764019012451, "Pretrain/Step": 8345, "Pretrain/Step Time": 8.436018804088235} +{"Pretrain/Learning Rate": 3.120252580043027e-05, "Pretrain/Loss": 2.0144295692443848, "Pretrain/Loss (Raw)": 2.1099507808685303, "Pretrain/Step": 8346, "Pretrain/Step Time": 8.431341517716646} +{"Pretrain/Learning Rate": 3.119841327368783e-05, "Pretrain/Loss": 2.015152931213379, "Pretrain/Loss (Raw)": 2.0917739868164062, "Pretrain/Step": 8347, "Pretrain/Step Time": 8.429981676861644} +{"Pretrain/Learning Rate": 3.119430056821851e-05, "Pretrain/Loss": 2.016244411468506, "Pretrain/Loss (Raw)": 2.160451889038086, "Pretrain/Step": 8348, "Pretrain/Step Time": 8.433931969106197} +{"Pretrain/Learning Rate": 3.1190187684140905e-05, "Pretrain/Loss": 2.01654052734375, "Pretrain/Loss (Raw)": 2.2419605255126953, "Pretrain/Step": 8349, "Pretrain/Step Time": 8.431434845551848} +{"Pretrain/Learning Rate": 3.118607462157359e-05, "Pretrain/Loss": 2.015730142593384, "Pretrain/Loss (Raw)": 2.1476094722747803, "Pretrain/Step": 8350, "Pretrain/Step Time": 8.433864368125796} +{"Pretrain/Learning Rate": 3.118196138063518e-05, "Pretrain/Loss": 2.018551826477051, "Pretrain/Loss (Raw)": 2.2392444610595703, "Pretrain/Step": 8351, "Pretrain/Step Time": 8.43410523608327} +{"Pretrain/Learning Rate": 3.1177847961444276e-05, "Pretrain/Loss": 2.0170700550079346, "Pretrain/Loss (Raw)": 2.0090322494506836, "Pretrain/Step": 8352, "Pretrain/Step Time": 8.426260642707348} +{"Pretrain/Learning Rate": 3.1173734364119476e-05, "Pretrain/Loss": 2.0161280632019043, "Pretrain/Loss (Raw)": 1.935686707496643, "Pretrain/Step": 8353, "Pretrain/Step Time": 8.425806123763323} +{"Pretrain/Learning Rate": 3.11696205887794e-05, "Pretrain/Loss": 2.0164847373962402, "Pretrain/Loss (Raw)": 2.012037515640259, "Pretrain/Step": 8354, "Pretrain/Step Time": 8.427308360114694} +{"Pretrain/Learning Rate": 3.1165506635542666e-05, "Pretrain/Loss": 2.01595139503479, "Pretrain/Loss (Raw)": 1.9619518518447876, "Pretrain/Step": 8355, "Pretrain/Step Time": 8.424924133345485} +{"Pretrain/Learning Rate": 3.116139250452789e-05, "Pretrain/Loss": 2.0156099796295166, "Pretrain/Loss (Raw)": 1.9230482578277588, "Pretrain/Step": 8356, "Pretrain/Step Time": 8.426776738837361} +{"Pretrain/Learning Rate": 3.115727819585371e-05, "Pretrain/Loss": 2.0173511505126953, "Pretrain/Loss (Raw)": 2.0817711353302, "Pretrain/Step": 8357, "Pretrain/Step Time": 8.422800770029426} +{"Pretrain/Learning Rate": 3.1153163709638746e-05, "Pretrain/Loss": 2.0136830806732178, "Pretrain/Loss (Raw)": 1.77191162109375, "Pretrain/Step": 8358, "Pretrain/Step Time": 8.423984114080667} +{"Pretrain/Learning Rate": 3.114904904600165e-05, "Pretrain/Loss": 2.0111050605773926, "Pretrain/Loss (Raw)": 1.8834078311920166, "Pretrain/Step": 8359, "Pretrain/Step Time": 8.421086831018329} +{"Pretrain/Learning Rate": 3.114493420506106e-05, "Pretrain/Loss": 2.0116400718688965, "Pretrain/Loss (Raw)": 2.0744526386260986, "Pretrain/Step": 8360, "Pretrain/Step Time": 8.421015992760658} +{"Pretrain/Learning Rate": 3.114081918693562e-05, "Pretrain/Loss": 2.0134475231170654, "Pretrain/Loss (Raw)": 2.2332139015197754, "Pretrain/Step": 8361, "Pretrain/Step Time": 8.420140460133553} +{"Pretrain/Learning Rate": 3.113670399174399e-05, "Pretrain/Loss": 2.0138964653015137, "Pretrain/Loss (Raw)": 2.06512188911438, "Pretrain/Step": 8362, "Pretrain/Step Time": 8.420623503625393} +{"Pretrain/Learning Rate": 3.1132588619604826e-05, "Pretrain/Loss": 2.0143251419067383, "Pretrain/Loss (Raw)": 2.064016342163086, "Pretrain/Step": 8363, "Pretrain/Step Time": 8.418117435649037} +{"Pretrain/Learning Rate": 3.112847307063679e-05, "Pretrain/Loss": 2.0187325477600098, "Pretrain/Loss (Raw)": 2.384246826171875, "Pretrain/Step": 8364, "Pretrain/Step Time": 8.418834157288074} +{"Pretrain/Learning Rate": 3.112435734495856e-05, "Pretrain/Loss": 2.0150556564331055, "Pretrain/Loss (Raw)": 1.7081079483032227, "Pretrain/Step": 8365, "Pretrain/Step Time": 8.4218995179981} +{"Pretrain/Learning Rate": 3.11202414426888e-05, "Pretrain/Loss": 2.0136661529541016, "Pretrain/Loss (Raw)": 1.9168821573257446, "Pretrain/Step": 8366, "Pretrain/Step Time": 8.420373044908047} +{"Pretrain/Learning Rate": 3.1116125363946185e-05, "Pretrain/Loss": 2.0116541385650635, "Pretrain/Loss (Raw)": 1.8683065176010132, "Pretrain/Step": 8367, "Pretrain/Step Time": 8.422341834753752} +{"Pretrain/Learning Rate": 3.111200910884941e-05, "Pretrain/Loss": 2.0118608474731445, "Pretrain/Loss (Raw)": 2.0152058601379395, "Pretrain/Step": 8368, "Pretrain/Step Time": 8.418764412403107} +{"Pretrain/Learning Rate": 3.110789267751717e-05, "Pretrain/Loss": 2.0108373165130615, "Pretrain/Loss (Raw)": 2.106940269470215, "Pretrain/Step": 8369, "Pretrain/Step Time": 8.41601337119937} +{"Pretrain/Learning Rate": 3.1103776070068144e-05, "Pretrain/Loss": 2.0140950679779053, "Pretrain/Loss (Raw)": 2.171133518218994, "Pretrain/Step": 8370, "Pretrain/Step Time": 8.419640764594078} +{"Pretrain/Learning Rate": 3.109965928662104e-05, "Pretrain/Loss": 2.0151920318603516, "Pretrain/Loss (Raw)": 2.0911853313446045, "Pretrain/Step": 8371, "Pretrain/Step Time": 8.424429642036557} +{"Pretrain/Learning Rate": 3.109554232729456e-05, "Pretrain/Loss": 2.01239013671875, "Pretrain/Loss (Raw)": 1.9305567741394043, "Pretrain/Step": 8372, "Pretrain/Step Time": 8.42282179184258} +{"Pretrain/Learning Rate": 3.1091425192207416e-05, "Pretrain/Loss": 2.012158155441284, "Pretrain/Loss (Raw)": 1.989219307899475, "Pretrain/Step": 8373, "Pretrain/Step Time": 8.424849528819323} +{"Pretrain/Learning Rate": 3.108730788147832e-05, "Pretrain/Loss": 2.01228666305542, "Pretrain/Loss (Raw)": 2.068051338195801, "Pretrain/Step": 8374, "Pretrain/Step Time": 8.427491595968604} +{"Pretrain/Learning Rate": 3.108319039522599e-05, "Pretrain/Loss": 2.0145211219787598, "Pretrain/Loss (Raw)": 2.039259195327759, "Pretrain/Step": 8375, "Pretrain/Step Time": 8.425358885899186} +{"Pretrain/Learning Rate": 3.107907273356915e-05, "Pretrain/Loss": 2.013991355895996, "Pretrain/Loss (Raw)": 2.0858261585235596, "Pretrain/Step": 8376, "Pretrain/Step Time": 8.42026298865676} +{"Pretrain/Learning Rate": 3.107495489662654e-05, "Pretrain/Loss": 2.0154075622558594, "Pretrain/Loss (Raw)": 1.9559203386306763, "Pretrain/Step": 8377, "Pretrain/Step Time": 8.423837011680007} +{"Pretrain/Learning Rate": 3.1070836884516885e-05, "Pretrain/Loss": 2.0148580074310303, "Pretrain/Loss (Raw)": 1.9621217250823975, "Pretrain/Step": 8378, "Pretrain/Step Time": 8.422518571838737} +{"Pretrain/Learning Rate": 3.1066718697358927e-05, "Pretrain/Loss": 2.0158753395080566, "Pretrain/Loss (Raw)": 2.084749937057495, "Pretrain/Step": 8379, "Pretrain/Step Time": 8.423779033124447} +{"Pretrain/Learning Rate": 3.1062600335271405e-05, "Pretrain/Loss": 2.0143911838531494, "Pretrain/Loss (Raw)": 1.9290465116500854, "Pretrain/Step": 8380, "Pretrain/Step Time": 8.424060262739658} +{"Pretrain/Learning Rate": 3.1058481798373095e-05, "Pretrain/Loss": 2.0158934593200684, "Pretrain/Loss (Raw)": 2.2017104625701904, "Pretrain/Step": 8381, "Pretrain/Step Time": 8.42380048148334} +{"Pretrain/Learning Rate": 3.1054363086782724e-05, "Pretrain/Loss": 2.0149929523468018, "Pretrain/Loss (Raw)": 1.9562418460845947, "Pretrain/Step": 8382, "Pretrain/Step Time": 8.422426363453269} +{"Pretrain/Learning Rate": 3.105024420061905e-05, "Pretrain/Loss": 2.016361951828003, "Pretrain/Loss (Raw)": 2.1509153842926025, "Pretrain/Step": 8383, "Pretrain/Step Time": 8.424991408362985} +{"Pretrain/Learning Rate": 3.104612514000087e-05, "Pretrain/Loss": 2.0157346725463867, "Pretrain/Loss (Raw)": 1.9876561164855957, "Pretrain/Step": 8384, "Pretrain/Step Time": 8.423984225839376} +{"Pretrain/Learning Rate": 3.104200590504692e-05, "Pretrain/Loss": 2.0153539180755615, "Pretrain/Loss (Raw)": 2.030900001525879, "Pretrain/Step": 8385, "Pretrain/Step Time": 8.424223385751247} +{"Pretrain/Learning Rate": 3.1037886495875996e-05, "Pretrain/Loss": 2.0133187770843506, "Pretrain/Loss (Raw)": 1.8397011756896973, "Pretrain/Step": 8386, "Pretrain/Step Time": 8.417802961543202} +{"Pretrain/Learning Rate": 3.1033766912606865e-05, "Pretrain/Loss": 2.011467218399048, "Pretrain/Loss (Raw)": 1.8530776500701904, "Pretrain/Step": 8387, "Pretrain/Step Time": 8.421946996822953} +{"Pretrain/Learning Rate": 3.102964715535832e-05, "Pretrain/Loss": 2.013888359069824, "Pretrain/Loss (Raw)": 2.2105815410614014, "Pretrain/Step": 8388, "Pretrain/Step Time": 8.420900261029601} +{"Pretrain/Learning Rate": 3.102552722424915e-05, "Pretrain/Loss": 2.012265682220459, "Pretrain/Loss (Raw)": 1.9184490442276, "Pretrain/Step": 8389, "Pretrain/Step Time": 8.418204315006733} +{"Pretrain/Learning Rate": 3.102140711939815e-05, "Pretrain/Loss": 2.0122833251953125, "Pretrain/Loss (Raw)": 1.8921267986297607, "Pretrain/Step": 8390, "Pretrain/Step Time": 8.418728051707149} +{"Pretrain/Learning Rate": 3.1017286840924126e-05, "Pretrain/Loss": 2.013451337814331, "Pretrain/Loss (Raw)": 2.052896738052368, "Pretrain/Step": 8391, "Pretrain/Step Time": 8.416610185056925} +{"Pretrain/Learning Rate": 3.101316638894588e-05, "Pretrain/Loss": 2.01328444480896, "Pretrain/Loss (Raw)": 2.0596823692321777, "Pretrain/Step": 8392, "Pretrain/Step Time": 8.41700902953744} +{"Pretrain/Learning Rate": 3.100904576358221e-05, "Pretrain/Loss": 2.0122323036193848, "Pretrain/Loss (Raw)": 1.9382365942001343, "Pretrain/Step": 8393, "Pretrain/Step Time": 8.420828204602003} +{"Pretrain/Learning Rate": 3.1004924964951945e-05, "Pretrain/Loss": 2.0128257274627686, "Pretrain/Loss (Raw)": 2.0219883918762207, "Pretrain/Step": 8394, "Pretrain/Step Time": 8.41961458697915} +{"Pretrain/Learning Rate": 3.10008039931739e-05, "Pretrain/Loss": 2.0163700580596924, "Pretrain/Loss (Raw)": 2.3788223266601562, "Pretrain/Step": 8395, "Pretrain/Step Time": 8.417367657646537} +{"Pretrain/Learning Rate": 3.099668284836691e-05, "Pretrain/Loss": 2.016805648803711, "Pretrain/Loss (Raw)": 2.0983502864837646, "Pretrain/Step": 8396, "Pretrain/Step Time": 8.417906431481242} +{"Pretrain/Learning Rate": 3.099256153064979e-05, "Pretrain/Loss": 2.016385078430176, "Pretrain/Loss (Raw)": 2.0014917850494385, "Pretrain/Step": 8397, "Pretrain/Step Time": 8.420320574194193} +{"Pretrain/Learning Rate": 3.098844004014138e-05, "Pretrain/Loss": 2.018371820449829, "Pretrain/Loss (Raw)": 2.2336697578430176, "Pretrain/Step": 8398, "Pretrain/Step Time": 8.419656347483397} +{"Pretrain/Learning Rate": 3.098431837696053e-05, "Pretrain/Loss": 2.019609212875366, "Pretrain/Loss (Raw)": 2.0233266353607178, "Pretrain/Step": 8399, "Pretrain/Step Time": 8.418226869776845} +{"Pretrain/Learning Rate": 3.0980196541226075e-05, "Pretrain/Loss": 2.0204288959503174, "Pretrain/Loss (Raw)": 1.943785548210144, "Pretrain/Step": 8400, "Pretrain/Step Time": 8.41958761587739} +{"Pretrain/Learning Rate": 3.0976074533056874e-05, "Pretrain/Loss": 2.019085645675659, "Pretrain/Loss (Raw)": 1.7174749374389648, "Pretrain/Step": 8401, "Pretrain/Step Time": 8.418847473338246} +{"Pretrain/Learning Rate": 3.097195235257177e-05, "Pretrain/Loss": 2.021679639816284, "Pretrain/Loss (Raw)": 2.216862916946411, "Pretrain/Step": 8402, "Pretrain/Step Time": 8.413862250745296} +{"Pretrain/Learning Rate": 3.096782999988963e-05, "Pretrain/Loss": 2.0195512771606445, "Pretrain/Loss (Raw)": 1.9672874212265015, "Pretrain/Step": 8403, "Pretrain/Step Time": 8.417907921597362} +{"Pretrain/Learning Rate": 3.0963707475129324e-05, "Pretrain/Loss": 2.0198044776916504, "Pretrain/Loss (Raw)": 2.2580220699310303, "Pretrain/Step": 8404, "Pretrain/Step Time": 8.416248412802815} +{"Pretrain/Learning Rate": 3.095958477840971e-05, "Pretrain/Loss": 2.0187957286834717, "Pretrain/Loss (Raw)": 2.184455633163452, "Pretrain/Step": 8405, "Pretrain/Step Time": 8.417521268129349} +{"Pretrain/Learning Rate": 3.095546190984968e-05, "Pretrain/Loss": 2.0201244354248047, "Pretrain/Loss (Raw)": 2.0143845081329346, "Pretrain/Step": 8406, "Pretrain/Step Time": 8.417405873537064} +{"Pretrain/Learning Rate": 3.0951338869568096e-05, "Pretrain/Loss": 2.0196359157562256, "Pretrain/Loss (Raw)": 1.9266856908798218, "Pretrain/Step": 8407, "Pretrain/Step Time": 8.418277591466904} +{"Pretrain/Learning Rate": 3.0947215657683857e-05, "Pretrain/Loss": 2.0200278759002686, "Pretrain/Loss (Raw)": 2.0848870277404785, "Pretrain/Step": 8408, "Pretrain/Step Time": 8.421556118875742} +{"Pretrain/Learning Rate": 3.0943092274315845e-05, "Pretrain/Loss": 2.0194106101989746, "Pretrain/Loss (Raw)": 1.9963165521621704, "Pretrain/Step": 8409, "Pretrain/Step Time": 8.42003295570612} +{"Pretrain/Learning Rate": 3.093896871958295e-05, "Pretrain/Loss": 2.0218069553375244, "Pretrain/Loss (Raw)": 1.9307568073272705, "Pretrain/Step": 8410, "Pretrain/Step Time": 8.424812644720078} +{"Pretrain/Learning Rate": 3.0934844993604085e-05, "Pretrain/Loss": 2.021733283996582, "Pretrain/Loss (Raw)": 2.0553336143493652, "Pretrain/Step": 8411, "Pretrain/Step Time": 8.42385465092957} +{"Pretrain/Learning Rate": 3.093072109649815e-05, "Pretrain/Loss": 2.022200584411621, "Pretrain/Loss (Raw)": 1.9759242534637451, "Pretrain/Step": 8412, "Pretrain/Step Time": 8.421927243471146} +{"Pretrain/Learning Rate": 3.0926597028384055e-05, "Pretrain/Loss": 2.02005672454834, "Pretrain/Loss (Raw)": 1.962029218673706, "Pretrain/Step": 8413, "Pretrain/Step Time": 8.42210290953517} +{"Pretrain/Learning Rate": 3.0922472789380704e-05, "Pretrain/Loss": 2.022890567779541, "Pretrain/Loss (Raw)": 2.175060272216797, "Pretrain/Step": 8414, "Pretrain/Step Time": 8.422888504341245} +{"Pretrain/Learning Rate": 3.0918348379607034e-05, "Pretrain/Loss": 2.0202221870422363, "Pretrain/Loss (Raw)": 1.7047300338745117, "Pretrain/Step": 8415, "Pretrain/Step Time": 8.421795753762126} +{"Pretrain/Learning Rate": 3.0914223799181955e-05, "Pretrain/Loss": 2.021979570388794, "Pretrain/Loss (Raw)": 2.030860424041748, "Pretrain/Step": 8416, "Pretrain/Step Time": 8.421525413170457} +{"Pretrain/Learning Rate": 3.09100990482244e-05, "Pretrain/Loss": 2.0213565826416016, "Pretrain/Loss (Raw)": 1.8975499868392944, "Pretrain/Step": 8417, "Pretrain/Step Time": 8.418173400685191} +{"Pretrain/Learning Rate": 3.0905974126853315e-05, "Pretrain/Loss": 2.0255470275878906, "Pretrain/Loss (Raw)": 2.3507885932922363, "Pretrain/Step": 8418, "Pretrain/Step Time": 8.417785875499249} +{"Pretrain/Learning Rate": 3.090184903518762e-05, "Pretrain/Loss": 2.0274808406829834, "Pretrain/Loss (Raw)": 2.189359188079834, "Pretrain/Step": 8419, "Pretrain/Step Time": 8.416030123829842} +{"Pretrain/Learning Rate": 3.089772377334627e-05, "Pretrain/Loss": 2.0275769233703613, "Pretrain/Loss (Raw)": 2.132462978363037, "Pretrain/Step": 8420, "Pretrain/Step Time": 8.419698169454932} +{"Pretrain/Learning Rate": 3.089359834144822e-05, "Pretrain/Loss": 2.026080369949341, "Pretrain/Loss (Raw)": 1.9818580150604248, "Pretrain/Step": 8421, "Pretrain/Step Time": 8.42241220921278} +{"Pretrain/Learning Rate": 3.0889472739612405e-05, "Pretrain/Loss": 2.0249335765838623, "Pretrain/Loss (Raw)": 1.766326665878296, "Pretrain/Step": 8422, "Pretrain/Step Time": 8.421107161790133} +{"Pretrain/Learning Rate": 3.088534696795781e-05, "Pretrain/Loss": 2.0264556407928467, "Pretrain/Loss (Raw)": 1.9384920597076416, "Pretrain/Step": 8423, "Pretrain/Step Time": 8.42472256347537} +{"Pretrain/Learning Rate": 3.088122102660337e-05, "Pretrain/Loss": 2.0291481018066406, "Pretrain/Loss (Raw)": 2.1970114707946777, "Pretrain/Step": 8424, "Pretrain/Step Time": 8.421780934557319} +{"Pretrain/Learning Rate": 3.087709491566807e-05, "Pretrain/Loss": 2.0282552242279053, "Pretrain/Loss (Raw)": 2.034388542175293, "Pretrain/Step": 8425, "Pretrain/Step Time": 8.421050051227212} +{"Pretrain/Learning Rate": 3.087296863527088e-05, "Pretrain/Loss": 2.0265185832977295, "Pretrain/Loss (Raw)": 1.882112979888916, "Pretrain/Step": 8426, "Pretrain/Step Time": 8.420615112408996} +{"Pretrain/Learning Rate": 3.086884218553079e-05, "Pretrain/Loss": 2.026743173599243, "Pretrain/Loss (Raw)": 1.9187591075897217, "Pretrain/Step": 8427, "Pretrain/Step Time": 8.421782199293375} +{"Pretrain/Learning Rate": 3.086471556656677e-05, "Pretrain/Loss": 2.026808261871338, "Pretrain/Loss (Raw)": 1.968639612197876, "Pretrain/Step": 8428, "Pretrain/Step Time": 8.423246208578348} +{"Pretrain/Learning Rate": 3.0860588778497805e-05, "Pretrain/Loss": 2.0248069763183594, "Pretrain/Loss (Raw)": 1.9541923999786377, "Pretrain/Step": 8429, "Pretrain/Step Time": 8.420604096725583} +{"Pretrain/Learning Rate": 3.0856461821442894e-05, "Pretrain/Loss": 2.0253329277038574, "Pretrain/Loss (Raw)": 2.2217345237731934, "Pretrain/Step": 8430, "Pretrain/Step Time": 8.423067340627313} +{"Pretrain/Learning Rate": 3.0852334695521036e-05, "Pretrain/Loss": 2.027644395828247, "Pretrain/Loss (Raw)": 2.443967819213867, "Pretrain/Step": 8431, "Pretrain/Step Time": 8.422864044085145} +{"Pretrain/Learning Rate": 3.0848207400851234e-05, "Pretrain/Loss": 2.0266895294189453, "Pretrain/Loss (Raw)": 1.8416343927383423, "Pretrain/Step": 8432, "Pretrain/Step Time": 8.424744950607419} +{"Pretrain/Learning Rate": 3.08440799375525e-05, "Pretrain/Loss": 2.0276198387145996, "Pretrain/Loss (Raw)": 2.127218723297119, "Pretrain/Step": 8433, "Pretrain/Step Time": 8.426090903580189} +{"Pretrain/Learning Rate": 3.083995230574384e-05, "Pretrain/Loss": 2.0296847820281982, "Pretrain/Loss (Raw)": 2.254168748855591, "Pretrain/Step": 8434, "Pretrain/Step Time": 8.426719283685088} +{"Pretrain/Learning Rate": 3.083582450554426e-05, "Pretrain/Loss": 2.0307159423828125, "Pretrain/Loss (Raw)": 1.9720414876937866, "Pretrain/Step": 8435, "Pretrain/Step Time": 8.425128489732742} +{"Pretrain/Learning Rate": 3.08316965370728e-05, "Pretrain/Loss": 2.0302581787109375, "Pretrain/Loss (Raw)": 1.9323794841766357, "Pretrain/Step": 8436, "Pretrain/Step Time": 8.429527182132006} +{"Pretrain/Learning Rate": 3.082756840044848e-05, "Pretrain/Loss": 2.0291895866394043, "Pretrain/Loss (Raw)": 1.8797228336334229, "Pretrain/Step": 8437, "Pretrain/Step Time": 8.43091244623065} +{"Pretrain/Learning Rate": 3.082344009579034e-05, "Pretrain/Loss": 2.026251792907715, "Pretrain/Loss (Raw)": 1.7592610120773315, "Pretrain/Step": 8438, "Pretrain/Step Time": 8.43285459652543} +{"Pretrain/Learning Rate": 3.081931162321741e-05, "Pretrain/Loss": 2.0256080627441406, "Pretrain/Loss (Raw)": 1.9337761402130127, "Pretrain/Step": 8439, "Pretrain/Step Time": 8.43137932009995} +{"Pretrain/Learning Rate": 3.081518298284873e-05, "Pretrain/Loss": 2.0266032218933105, "Pretrain/Loss (Raw)": 2.0184926986694336, "Pretrain/Step": 8440, "Pretrain/Step Time": 8.4322854783386} +{"Pretrain/Learning Rate": 3.081105417480334e-05, "Pretrain/Loss": 2.024756908416748, "Pretrain/Loss (Raw)": 1.7999317646026611, "Pretrain/Step": 8441, "Pretrain/Step Time": 8.432457733899355} +{"Pretrain/Learning Rate": 3.080692519920031e-05, "Pretrain/Loss": 2.0239007472991943, "Pretrain/Loss (Raw)": 2.0735061168670654, "Pretrain/Step": 8442, "Pretrain/Step Time": 8.43150876276195} +{"Pretrain/Learning Rate": 3.0802796056158676e-05, "Pretrain/Loss": 2.024498462677002, "Pretrain/Loss (Raw)": 2.026376724243164, "Pretrain/Step": 8443, "Pretrain/Step Time": 8.431660132482648} +{"Pretrain/Learning Rate": 3.079866674579752e-05, "Pretrain/Loss": 2.0227913856506348, "Pretrain/Loss (Raw)": 1.9142178297042847, "Pretrain/Step": 8444, "Pretrain/Step Time": 8.42999991774559} +{"Pretrain/Learning Rate": 3.079453726823589e-05, "Pretrain/Loss": 2.0222415924072266, "Pretrain/Loss (Raw)": 2.028313636779785, "Pretrain/Step": 8445, "Pretrain/Step Time": 8.434015780687332} +{"Pretrain/Learning Rate": 3.079040762359286e-05, "Pretrain/Loss": 2.0242581367492676, "Pretrain/Loss (Raw)": 2.2350175380706787, "Pretrain/Step": 8446, "Pretrain/Step Time": 8.433052970096469} +{"Pretrain/Learning Rate": 3.0786277811987505e-05, "Pretrain/Loss": 2.0206832885742188, "Pretrain/Loss (Raw)": 1.8460726737976074, "Pretrain/Step": 8447, "Pretrain/Step Time": 8.432065516710281} +{"Pretrain/Learning Rate": 3.078214783353891e-05, "Pretrain/Loss": 2.0188846588134766, "Pretrain/Loss (Raw)": 1.9049750566482544, "Pretrain/Step": 8448, "Pretrain/Step Time": 8.429223120212555} +{"Pretrain/Learning Rate": 3.0778017688366175e-05, "Pretrain/Loss": 2.0205800533294678, "Pretrain/Loss (Raw)": 2.0603151321411133, "Pretrain/Step": 8449, "Pretrain/Step Time": 8.432854993268847} +{"Pretrain/Learning Rate": 3.077388737658836e-05, "Pretrain/Loss": 2.0207440853118896, "Pretrain/Loss (Raw)": 2.230731725692749, "Pretrain/Step": 8450, "Pretrain/Step Time": 8.432897541671991} +{"Pretrain/Learning Rate": 3.076975689832457e-05, "Pretrain/Loss": 2.0205695629119873, "Pretrain/Loss (Raw)": 1.9478785991668701, "Pretrain/Step": 8451, "Pretrain/Step Time": 8.431667631492019} +{"Pretrain/Learning Rate": 3.0765626253693917e-05, "Pretrain/Loss": 2.0186262130737305, "Pretrain/Loss (Raw)": 1.7485902309417725, "Pretrain/Step": 8452, "Pretrain/Step Time": 8.435542922466993} +{"Pretrain/Learning Rate": 3.076149544281548e-05, "Pretrain/Loss": 2.017845630645752, "Pretrain/Loss (Raw)": 1.9652477502822876, "Pretrain/Step": 8453, "Pretrain/Step Time": 8.435305012390018} +{"Pretrain/Learning Rate": 3.07573644658084e-05, "Pretrain/Loss": 2.0210659503936768, "Pretrain/Loss (Raw)": 2.2215466499328613, "Pretrain/Step": 8454, "Pretrain/Step Time": 8.434918381273746} +{"Pretrain/Learning Rate": 3.075323332279177e-05, "Pretrain/Loss": 2.02048397064209, "Pretrain/Loss (Raw)": 1.9375934600830078, "Pretrain/Step": 8455, "Pretrain/Step Time": 8.435763800516725} +{"Pretrain/Learning Rate": 3.074910201388471e-05, "Pretrain/Loss": 2.019453763961792, "Pretrain/Loss (Raw)": 1.9876532554626465, "Pretrain/Step": 8456, "Pretrain/Step Time": 8.435980577021837} +{"Pretrain/Learning Rate": 3.074497053920635e-05, "Pretrain/Loss": 2.02225923538208, "Pretrain/Loss (Raw)": 2.311048746109009, "Pretrain/Step": 8457, "Pretrain/Step Time": 8.435398437082767} +{"Pretrain/Learning Rate": 3.074083889887581e-05, "Pretrain/Loss": 2.0234506130218506, "Pretrain/Loss (Raw)": 1.9014109373092651, "Pretrain/Step": 8458, "Pretrain/Step Time": 8.435504188761115} +{"Pretrain/Learning Rate": 3.0736707093012226e-05, "Pretrain/Loss": 2.023540735244751, "Pretrain/Loss (Raw)": 2.0266077518463135, "Pretrain/Step": 8459, "Pretrain/Step Time": 8.437085354700685} +{"Pretrain/Learning Rate": 3.0732575121734745e-05, "Pretrain/Loss": 2.0249032974243164, "Pretrain/Loss (Raw)": 1.9998064041137695, "Pretrain/Step": 8460, "Pretrain/Step Time": 8.439786372706294} +{"Pretrain/Learning Rate": 3.072844298516249e-05, "Pretrain/Loss": 2.0236032009124756, "Pretrain/Loss (Raw)": 2.142362594604492, "Pretrain/Step": 8461, "Pretrain/Step Time": 8.440066441893578} +{"Pretrain/Learning Rate": 3.072431068341462e-05, "Pretrain/Loss": 2.025733470916748, "Pretrain/Loss (Raw)": 2.1323115825653076, "Pretrain/Step": 8462, "Pretrain/Step Time": 8.437285920605063} +{"Pretrain/Learning Rate": 3.0720178216610297e-05, "Pretrain/Loss": 2.0270469188690186, "Pretrain/Loss (Raw)": 2.086864948272705, "Pretrain/Step": 8463, "Pretrain/Step Time": 8.440645731985569} +{"Pretrain/Learning Rate": 3.071604558486866e-05, "Pretrain/Loss": 2.0278091430664062, "Pretrain/Loss (Raw)": 1.8959451913833618, "Pretrain/Step": 8464, "Pretrain/Step Time": 8.440315959975123} +{"Pretrain/Learning Rate": 3.0711912788308884e-05, "Pretrain/Loss": 2.0280771255493164, "Pretrain/Loss (Raw)": 2.1877944469451904, "Pretrain/Step": 8465, "Pretrain/Step Time": 8.438276939094067} +{"Pretrain/Learning Rate": 3.0707779827050126e-05, "Pretrain/Loss": 2.025435209274292, "Pretrain/Loss (Raw)": 1.866322636604309, "Pretrain/Step": 8466, "Pretrain/Step Time": 8.437562948092818} +{"Pretrain/Learning Rate": 3.070364670121156e-05, "Pretrain/Loss": 2.0265705585479736, "Pretrain/Loss (Raw)": 2.0664210319519043, "Pretrain/Step": 8467, "Pretrain/Step Time": 8.441518861800432} +{"Pretrain/Learning Rate": 3.069951341091236e-05, "Pretrain/Loss": 2.0263166427612305, "Pretrain/Loss (Raw)": 1.9617249965667725, "Pretrain/Step": 8468, "Pretrain/Step Time": 8.438343327492476} +{"Pretrain/Learning Rate": 3.069537995627172e-05, "Pretrain/Loss": 2.0289230346679688, "Pretrain/Loss (Raw)": 1.9401142597198486, "Pretrain/Step": 8469, "Pretrain/Step Time": 8.434252303093672} +{"Pretrain/Learning Rate": 3.06912463374088e-05, "Pretrain/Loss": 2.03060245513916, "Pretrain/Loss (Raw)": 2.2874951362609863, "Pretrain/Step": 8470, "Pretrain/Step Time": 8.434934619814157} +{"Pretrain/Learning Rate": 3.068711255444281e-05, "Pretrain/Loss": 2.031757354736328, "Pretrain/Loss (Raw)": 2.1987409591674805, "Pretrain/Step": 8471, "Pretrain/Step Time": 8.435958597809076} +{"Pretrain/Learning Rate": 3.068297860749294e-05, "Pretrain/Loss": 2.031126022338867, "Pretrain/Loss (Raw)": 2.0030205249786377, "Pretrain/Step": 8472, "Pretrain/Step Time": 8.436115032061934} +{"Pretrain/Learning Rate": 3.0678844496678384e-05, "Pretrain/Loss": 2.0303611755371094, "Pretrain/Loss (Raw)": 2.0458548069000244, "Pretrain/Step": 8473, "Pretrain/Step Time": 8.432871870696545} +{"Pretrain/Learning Rate": 3.067471022211835e-05, "Pretrain/Loss": 2.0296709537506104, "Pretrain/Loss (Raw)": 2.021584987640381, "Pretrain/Step": 8474, "Pretrain/Step Time": 8.434637689962983} +{"Pretrain/Learning Rate": 3.067057578393205e-05, "Pretrain/Loss": 2.026853322982788, "Pretrain/Loss (Raw)": 1.7311131954193115, "Pretrain/Step": 8475, "Pretrain/Step Time": 8.43398742005229} +{"Pretrain/Learning Rate": 3.06664411822387e-05, "Pretrain/Loss": 2.0260210037231445, "Pretrain/Loss (Raw)": 2.0539441108703613, "Pretrain/Step": 8476, "Pretrain/Step Time": 8.43177629262209} +{"Pretrain/Learning Rate": 3.06623064171575e-05, "Pretrain/Loss": 2.025749921798706, "Pretrain/Loss (Raw)": 2.2072510719299316, "Pretrain/Step": 8477, "Pretrain/Step Time": 8.433568326756358} +{"Pretrain/Learning Rate": 3.0658171488807696e-05, "Pretrain/Loss": 2.025113105773926, "Pretrain/Loss (Raw)": 2.066082000732422, "Pretrain/Step": 8478, "Pretrain/Step Time": 8.430755104869604} +{"Pretrain/Learning Rate": 3.065403639730851e-05, "Pretrain/Loss": 2.0240793228149414, "Pretrain/Loss (Raw)": 2.106924295425415, "Pretrain/Step": 8479, "Pretrain/Step Time": 8.43114390783012} +{"Pretrain/Learning Rate": 3.0649901142779155e-05, "Pretrain/Loss": 2.0239648818969727, "Pretrain/Loss (Raw)": 1.994399070739746, "Pretrain/Step": 8480, "Pretrain/Step Time": 8.43316918052733} +{"Pretrain/Learning Rate": 3.06457657253389e-05, "Pretrain/Loss": 2.0239832401275635, "Pretrain/Loss (Raw)": 1.9380288124084473, "Pretrain/Step": 8481, "Pretrain/Step Time": 8.432130703702569} +{"Pretrain/Learning Rate": 3.064163014510696e-05, "Pretrain/Loss": 2.0235109329223633, "Pretrain/Loss (Raw)": 1.951558232307434, "Pretrain/Step": 8482, "Pretrain/Step Time": 8.434158885851502} +{"Pretrain/Learning Rate": 3.063749440220259e-05, "Pretrain/Loss": 2.0233359336853027, "Pretrain/Loss (Raw)": 1.93955659866333, "Pretrain/Step": 8483, "Pretrain/Step Time": 8.434781869873405} +{"Pretrain/Learning Rate": 3.063335849674505e-05, "Pretrain/Loss": 2.0229458808898926, "Pretrain/Loss (Raw)": 1.8731539249420166, "Pretrain/Step": 8484, "Pretrain/Step Time": 8.434544360265136} +{"Pretrain/Learning Rate": 3.062922242885359e-05, "Pretrain/Loss": 2.0227930545806885, "Pretrain/Loss (Raw)": 2.0621860027313232, "Pretrain/Step": 8485, "Pretrain/Step Time": 8.43326447531581} +{"Pretrain/Learning Rate": 3.062508619864747e-05, "Pretrain/Loss": 2.0243563652038574, "Pretrain/Loss (Raw)": 1.9720021486282349, "Pretrain/Step": 8486, "Pretrain/Step Time": 8.431759111583233} +{"Pretrain/Learning Rate": 3.0620949806245943e-05, "Pretrain/Loss": 2.0282273292541504, "Pretrain/Loss (Raw)": 2.3788816928863525, "Pretrain/Step": 8487, "Pretrain/Step Time": 8.435290636494756} +{"Pretrain/Learning Rate": 3.06168132517683e-05, "Pretrain/Loss": 2.0277366638183594, "Pretrain/Loss (Raw)": 2.0116848945617676, "Pretrain/Step": 8488, "Pretrain/Step Time": 8.431652460247278} +{"Pretrain/Learning Rate": 3.061267653533381e-05, "Pretrain/Loss": 2.0257701873779297, "Pretrain/Loss (Raw)": 1.9815009832382202, "Pretrain/Step": 8489, "Pretrain/Step Time": 8.43307007662952} +{"Pretrain/Learning Rate": 3.060853965706174e-05, "Pretrain/Loss": 2.0245537757873535, "Pretrain/Loss (Raw)": 1.909416913986206, "Pretrain/Step": 8490, "Pretrain/Step Time": 8.434454711154103} +{"Pretrain/Learning Rate": 3.060440261707139e-05, "Pretrain/Loss": 2.022655487060547, "Pretrain/Loss (Raw)": 1.8210139274597168, "Pretrain/Step": 8491, "Pretrain/Step Time": 8.436257898807526} +{"Pretrain/Learning Rate": 3.060026541548204e-05, "Pretrain/Loss": 2.021212577819824, "Pretrain/Loss (Raw)": 2.1995866298675537, "Pretrain/Step": 8492, "Pretrain/Step Time": 8.436096282675862} +{"Pretrain/Learning Rate": 3.0596128052412976e-05, "Pretrain/Loss": 2.0217676162719727, "Pretrain/Loss (Raw)": 1.7791287899017334, "Pretrain/Step": 8493, "Pretrain/Step Time": 8.436525110155344} +{"Pretrain/Learning Rate": 3.0591990527983514e-05, "Pretrain/Loss": 2.0216760635375977, "Pretrain/Loss (Raw)": 1.9051645994186401, "Pretrain/Step": 8494, "Pretrain/Step Time": 8.435710996389389} +{"Pretrain/Learning Rate": 3.058785284231294e-05, "Pretrain/Loss": 2.0200629234313965, "Pretrain/Loss (Raw)": 1.6618186235427856, "Pretrain/Step": 8495, "Pretrain/Step Time": 8.439650049433112} +{"Pretrain/Learning Rate": 3.058371499552058e-05, "Pretrain/Loss": 2.020495653152466, "Pretrain/Loss (Raw)": 2.0706212520599365, "Pretrain/Step": 8496, "Pretrain/Step Time": 8.437479592859745} +{"Pretrain/Learning Rate": 3.0579576987725725e-05, "Pretrain/Loss": 2.019345760345459, "Pretrain/Loss (Raw)": 1.9597309827804565, "Pretrain/Step": 8497, "Pretrain/Step Time": 8.440345199778676} +{"Pretrain/Learning Rate": 3.0575438819047706e-05, "Pretrain/Loss": 2.0179357528686523, "Pretrain/Loss (Raw)": 1.9906567335128784, "Pretrain/Step": 8498, "Pretrain/Step Time": 8.437314506620169} +{"Pretrain/Learning Rate": 3.057130048960584e-05, "Pretrain/Loss": 2.017374038696289, "Pretrain/Loss (Raw)": 2.0192999839782715, "Pretrain/Step": 8499, "Pretrain/Step Time": 8.438817886635661} +{"Pretrain/Learning Rate": 3.0567161999519445e-05, "Pretrain/Loss": 2.0172553062438965, "Pretrain/Loss (Raw)": 1.9153499603271484, "Pretrain/Step": 8500, "Pretrain/Step Time": 8.441396679729223} +{"Pretrain/Learning Rate": 3.056302334890786e-05, "Pretrain/Loss": 2.0175046920776367, "Pretrain/Loss (Raw)": 2.021124839782715, "Pretrain/Step": 8501, "Pretrain/Step Time": 8.438889369368553} +{"Pretrain/Learning Rate": 3.0558884537890424e-05, "Pretrain/Loss": 2.016695499420166, "Pretrain/Loss (Raw)": 1.9645130634307861, "Pretrain/Step": 8502, "Pretrain/Step Time": 8.43649779073894} +{"Pretrain/Learning Rate": 3.055474556658647e-05, "Pretrain/Loss": 2.0148167610168457, "Pretrain/Loss (Raw)": 1.7987474203109741, "Pretrain/Step": 8503, "Pretrain/Step Time": 8.444814642891288} +{"Pretrain/Learning Rate": 3.055060643511534e-05, "Pretrain/Loss": 2.0145862102508545, "Pretrain/Loss (Raw)": 2.0563318729400635, "Pretrain/Step": 8504, "Pretrain/Step Time": 8.446001896634698} +{"Pretrain/Learning Rate": 3.0546467143596384e-05, "Pretrain/Loss": 2.0145115852355957, "Pretrain/Loss (Raw)": 1.9463527202606201, "Pretrain/Step": 8505, "Pretrain/Step Time": 8.44414166174829} +{"Pretrain/Learning Rate": 3.054232769214896e-05, "Pretrain/Loss": 2.0146408081054688, "Pretrain/Loss (Raw)": 1.9786884784698486, "Pretrain/Step": 8506, "Pretrain/Step Time": 8.440948298200965} +{"Pretrain/Learning Rate": 3.053818808089243e-05, "Pretrain/Loss": 2.0145626068115234, "Pretrain/Loss (Raw)": 2.0747287273406982, "Pretrain/Step": 8507, "Pretrain/Step Time": 8.440049713477492} +{"Pretrain/Learning Rate": 3.053404830994615e-05, "Pretrain/Loss": 2.013974905014038, "Pretrain/Loss (Raw)": 1.8538117408752441, "Pretrain/Step": 8508, "Pretrain/Step Time": 8.442390229552984} +{"Pretrain/Learning Rate": 3.0529908379429475e-05, "Pretrain/Loss": 2.0134365558624268, "Pretrain/Loss (Raw)": 2.1328012943267822, "Pretrain/Step": 8509, "Pretrain/Step Time": 8.440488558262587} +{"Pretrain/Learning Rate": 3.0525768289461805e-05, "Pretrain/Loss": 2.014063835144043, "Pretrain/Loss (Raw)": 2.036560535430908, "Pretrain/Step": 8510, "Pretrain/Step Time": 8.443121135234833} +{"Pretrain/Learning Rate": 3.052162804016249e-05, "Pretrain/Loss": 2.013484477996826, "Pretrain/Loss (Raw)": 2.076751708984375, "Pretrain/Step": 8511, "Pretrain/Step Time": 8.441003667190671} +{"Pretrain/Learning Rate": 3.0517487631650932e-05, "Pretrain/Loss": 2.014209032058716, "Pretrain/Loss (Raw)": 2.080392360687256, "Pretrain/Step": 8512, "Pretrain/Step Time": 8.44378438219428} +{"Pretrain/Learning Rate": 3.051334706404651e-05, "Pretrain/Loss": 2.0149080753326416, "Pretrain/Loss (Raw)": 2.120368719100952, "Pretrain/Step": 8513, "Pretrain/Step Time": 8.445898259058595} +{"Pretrain/Learning Rate": 3.0509206337468605e-05, "Pretrain/Loss": 2.017301559448242, "Pretrain/Loss (Raw)": 2.146071195602417, "Pretrain/Step": 8514, "Pretrain/Step Time": 8.445614902302623} +{"Pretrain/Learning Rate": 3.050506545203662e-05, "Pretrain/Loss": 2.015502452850342, "Pretrain/Loss (Raw)": 1.6228026151657104, "Pretrain/Step": 8515, "Pretrain/Step Time": 8.444499688223004} +{"Pretrain/Learning Rate": 3.0500924407869953e-05, "Pretrain/Loss": 2.01491117477417, "Pretrain/Loss (Raw)": 2.134897232055664, "Pretrain/Step": 8516, "Pretrain/Step Time": 8.446210579946637} +{"Pretrain/Learning Rate": 3.0496783205088007e-05, "Pretrain/Loss": 2.0158896446228027, "Pretrain/Loss (Raw)": 2.0436739921569824, "Pretrain/Step": 8517, "Pretrain/Step Time": 8.448648719117045} +{"Pretrain/Learning Rate": 3.04926418438102e-05, "Pretrain/Loss": 2.0162172317504883, "Pretrain/Loss (Raw)": 1.9340554475784302, "Pretrain/Step": 8518, "Pretrain/Step Time": 8.446844412013888} +{"Pretrain/Learning Rate": 3.0488500324155932e-05, "Pretrain/Loss": 2.015641450881958, "Pretrain/Loss (Raw)": 1.979203462600708, "Pretrain/Step": 8519, "Pretrain/Step Time": 8.449191691353917} +{"Pretrain/Learning Rate": 3.0484358646244625e-05, "Pretrain/Loss": 2.0139222145080566, "Pretrain/Loss (Raw)": 1.8396011590957642, "Pretrain/Step": 8520, "Pretrain/Step Time": 8.447665799409151} +{"Pretrain/Learning Rate": 3.0480216810195705e-05, "Pretrain/Loss": 2.0132827758789062, "Pretrain/Loss (Raw)": 1.8563976287841797, "Pretrain/Step": 8521, "Pretrain/Step Time": 8.448922336101532} +{"Pretrain/Learning Rate": 3.0476074816128598e-05, "Pretrain/Loss": 2.016850709915161, "Pretrain/Loss (Raw)": 2.4786970615386963, "Pretrain/Step": 8522, "Pretrain/Step Time": 8.448008745908737} +{"Pretrain/Learning Rate": 3.0471932664162735e-05, "Pretrain/Loss": 2.0130553245544434, "Pretrain/Loss (Raw)": 1.8930044174194336, "Pretrain/Step": 8523, "Pretrain/Step Time": 8.448456577956676} +{"Pretrain/Learning Rate": 3.0467790354417548e-05, "Pretrain/Loss": 2.0127010345458984, "Pretrain/Loss (Raw)": 2.0530240535736084, "Pretrain/Step": 8524, "Pretrain/Step Time": 8.447628255933523} +{"Pretrain/Learning Rate": 3.046364788701248e-05, "Pretrain/Loss": 2.0117952823638916, "Pretrain/Loss (Raw)": 1.8855384588241577, "Pretrain/Step": 8525, "Pretrain/Step Time": 8.448179258033633} +{"Pretrain/Learning Rate": 3.045950526206698e-05, "Pretrain/Loss": 2.0074095726013184, "Pretrain/Loss (Raw)": 1.6723171472549438, "Pretrain/Step": 8526, "Pretrain/Step Time": 8.449487313628197} +{"Pretrain/Learning Rate": 3.045536247970049e-05, "Pretrain/Loss": 2.0072903633117676, "Pretrain/Loss (Raw)": 2.008061170578003, "Pretrain/Step": 8527, "Pretrain/Step Time": 8.449067015200853} +{"Pretrain/Learning Rate": 3.0451219540032472e-05, "Pretrain/Loss": 2.0074920654296875, "Pretrain/Loss (Raw)": 1.9695872068405151, "Pretrain/Step": 8528, "Pretrain/Step Time": 8.448049742728472} +{"Pretrain/Learning Rate": 3.0447076443182383e-05, "Pretrain/Loss": 2.0108721256256104, "Pretrain/Loss (Raw)": 2.1501152515411377, "Pretrain/Step": 8529, "Pretrain/Step Time": 8.446646114811301} +{"Pretrain/Learning Rate": 3.0442933189269678e-05, "Pretrain/Loss": 2.0099949836730957, "Pretrain/Loss (Raw)": 2.104599952697754, "Pretrain/Step": 8530, "Pretrain/Step Time": 8.448500780388713} +{"Pretrain/Learning Rate": 3.0438789778413833e-05, "Pretrain/Loss": 2.0088233947753906, "Pretrain/Loss (Raw)": 1.817345142364502, "Pretrain/Step": 8531, "Pretrain/Step Time": 8.447854535654187} +{"Pretrain/Learning Rate": 3.0434646210734324e-05, "Pretrain/Loss": 2.0066256523132324, "Pretrain/Loss (Raw)": 1.9766792058944702, "Pretrain/Step": 8532, "Pretrain/Step Time": 8.448206696659327} +{"Pretrain/Learning Rate": 3.043050248635062e-05, "Pretrain/Loss": 2.0050621032714844, "Pretrain/Loss (Raw)": 1.9843231439590454, "Pretrain/Step": 8533, "Pretrain/Step Time": 8.447146892547607} +{"Pretrain/Learning Rate": 3.0426358605382205e-05, "Pretrain/Loss": 2.005354404449463, "Pretrain/Loss (Raw)": 2.051795482635498, "Pretrain/Step": 8534, "Pretrain/Step Time": 8.44833154603839} +{"Pretrain/Learning Rate": 3.0422214567948564e-05, "Pretrain/Loss": 2.005887031555176, "Pretrain/Loss (Raw)": 1.9948996305465698, "Pretrain/Step": 8535, "Pretrain/Step Time": 8.448549734428525} +{"Pretrain/Learning Rate": 3.041807037416919e-05, "Pretrain/Loss": 2.0058655738830566, "Pretrain/Loss (Raw)": 2.082120418548584, "Pretrain/Step": 8536, "Pretrain/Step Time": 8.441692717373371} +{"Pretrain/Learning Rate": 3.0413926024163575e-05, "Pretrain/Loss": 2.004263401031494, "Pretrain/Loss (Raw)": 1.7912479639053345, "Pretrain/Step": 8537, "Pretrain/Step Time": 8.445829894393682} +{"Pretrain/Learning Rate": 3.040978151805123e-05, "Pretrain/Loss": 2.0048294067382812, "Pretrain/Loss (Raw)": 2.0032076835632324, "Pretrain/Step": 8538, "Pretrain/Step Time": 8.439680332317948} +{"Pretrain/Learning Rate": 3.0405636855951636e-05, "Pretrain/Loss": 2.0043725967407227, "Pretrain/Loss (Raw)": 1.9968595504760742, "Pretrain/Step": 8539, "Pretrain/Step Time": 8.442833740264177} +{"Pretrain/Learning Rate": 3.0401492037984313e-05, "Pretrain/Loss": 2.0059351921081543, "Pretrain/Loss (Raw)": 2.1759114265441895, "Pretrain/Step": 8540, "Pretrain/Step Time": 8.442630494013429} +{"Pretrain/Learning Rate": 3.0397347064268784e-05, "Pretrain/Loss": 2.008345127105713, "Pretrain/Loss (Raw)": 2.270503044128418, "Pretrain/Step": 8541, "Pretrain/Step Time": 8.437956029549241} +{"Pretrain/Learning Rate": 3.0393201934924554e-05, "Pretrain/Loss": 2.007707118988037, "Pretrain/Loss (Raw)": 2.093413829803467, "Pretrain/Step": 8542, "Pretrain/Step Time": 8.438865222036839} +{"Pretrain/Learning Rate": 3.038905665007114e-05, "Pretrain/Loss": 2.0097713470458984, "Pretrain/Loss (Raw)": 1.9689528942108154, "Pretrain/Step": 8543, "Pretrain/Step Time": 8.442621059715748} +{"Pretrain/Learning Rate": 3.038491120982808e-05, "Pretrain/Loss": 2.0097198486328125, "Pretrain/Loss (Raw)": 2.0242443084716797, "Pretrain/Step": 8544, "Pretrain/Step Time": 8.441967349499464} +{"Pretrain/Learning Rate": 3.038076561431491e-05, "Pretrain/Loss": 2.0109341144561768, "Pretrain/Loss (Raw)": 2.0529847145080566, "Pretrain/Step": 8545, "Pretrain/Step Time": 8.442578425630927} +{"Pretrain/Learning Rate": 3.0376619863651153e-05, "Pretrain/Loss": 2.0100536346435547, "Pretrain/Loss (Raw)": 2.2380776405334473, "Pretrain/Step": 8546, "Pretrain/Step Time": 8.44539787992835} +{"Pretrain/Learning Rate": 3.0372473957956347e-05, "Pretrain/Loss": 2.0095672607421875, "Pretrain/Loss (Raw)": 2.127107620239258, "Pretrain/Step": 8547, "Pretrain/Step Time": 8.445520212873816} +{"Pretrain/Learning Rate": 3.0368327897350048e-05, "Pretrain/Loss": 2.0101685523986816, "Pretrain/Loss (Raw)": 2.2094616889953613, "Pretrain/Step": 8548, "Pretrain/Step Time": 8.44204069674015} +{"Pretrain/Learning Rate": 3.0364181681951794e-05, "Pretrain/Loss": 2.012207508087158, "Pretrain/Loss (Raw)": 2.242827892303467, "Pretrain/Step": 8549, "Pretrain/Step Time": 8.44060186855495} +{"Pretrain/Learning Rate": 3.0360035311881146e-05, "Pretrain/Loss": 2.009026050567627, "Pretrain/Loss (Raw)": 1.3590831756591797, "Pretrain/Step": 8550, "Pretrain/Step Time": 8.438590856269002} +{"Pretrain/Learning Rate": 3.035588878725766e-05, "Pretrain/Loss": 2.0070509910583496, "Pretrain/Loss (Raw)": 1.685732126235962, "Pretrain/Step": 8551, "Pretrain/Step Time": 8.438494618982077} +{"Pretrain/Learning Rate": 3.0351742108200888e-05, "Pretrain/Loss": 2.005831003189087, "Pretrain/Loss (Raw)": 2.0408318042755127, "Pretrain/Step": 8552, "Pretrain/Step Time": 8.442006472498178} +{"Pretrain/Learning Rate": 3.034759527483041e-05, "Pretrain/Loss": 2.0047836303710938, "Pretrain/Loss (Raw)": 1.9003103971481323, "Pretrain/Step": 8553, "Pretrain/Step Time": 8.444829350337386} +{"Pretrain/Learning Rate": 3.0343448287265792e-05, "Pretrain/Loss": 2.005296468734741, "Pretrain/Loss (Raw)": 1.9477449655532837, "Pretrain/Step": 8554, "Pretrain/Step Time": 8.441557513549924} +{"Pretrain/Learning Rate": 3.0339301145626613e-05, "Pretrain/Loss": 2.006131172180176, "Pretrain/Loss (Raw)": 2.025622844696045, "Pretrain/Step": 8555, "Pretrain/Step Time": 8.440753946080804} +{"Pretrain/Learning Rate": 3.033515385003245e-05, "Pretrain/Loss": 2.0062026977539062, "Pretrain/Loss (Raw)": 1.9777653217315674, "Pretrain/Step": 8556, "Pretrain/Step Time": 8.44394139200449} +{"Pretrain/Learning Rate": 3.033100640060288e-05, "Pretrain/Loss": 2.007025957107544, "Pretrain/Loss (Raw)": 2.0595884323120117, "Pretrain/Step": 8557, "Pretrain/Step Time": 8.445166194811463} +{"Pretrain/Learning Rate": 3.0326858797457496e-05, "Pretrain/Loss": 2.0065691471099854, "Pretrain/Loss (Raw)": 2.163273572921753, "Pretrain/Step": 8558, "Pretrain/Step Time": 8.44544450007379} +{"Pretrain/Learning Rate": 3.0322711040715902e-05, "Pretrain/Loss": 2.0036497116088867, "Pretrain/Loss (Raw)": 2.070279598236084, "Pretrain/Step": 8559, "Pretrain/Step Time": 8.446205334737897} +{"Pretrain/Learning Rate": 3.031856313049769e-05, "Pretrain/Loss": 2.0048322677612305, "Pretrain/Loss (Raw)": 1.9930062294006348, "Pretrain/Step": 8560, "Pretrain/Step Time": 8.444143824279308} +{"Pretrain/Learning Rate": 3.0314415066922454e-05, "Pretrain/Loss": 2.000966787338257, "Pretrain/Loss (Raw)": 1.6324321031570435, "Pretrain/Step": 8561, "Pretrain/Step Time": 8.440606337040663} +{"Pretrain/Learning Rate": 3.03102668501098e-05, "Pretrain/Loss": 1.9982843399047852, "Pretrain/Loss (Raw)": 1.9107997417449951, "Pretrain/Step": 8562, "Pretrain/Step Time": 8.44361406005919} +{"Pretrain/Learning Rate": 3.0306118480179353e-05, "Pretrain/Loss": 1.999403715133667, "Pretrain/Loss (Raw)": 2.1153247356414795, "Pretrain/Step": 8563, "Pretrain/Step Time": 8.445865295827389} +{"Pretrain/Learning Rate": 3.0301969957250718e-05, "Pretrain/Loss": 2.000967025756836, "Pretrain/Loss (Raw)": 2.1324782371520996, "Pretrain/Step": 8564, "Pretrain/Step Time": 8.4408637881279} +{"Pretrain/Learning Rate": 3.0297821281443523e-05, "Pretrain/Loss": 2.000047206878662, "Pretrain/Loss (Raw)": 1.7619889974594116, "Pretrain/Step": 8565, "Pretrain/Step Time": 8.441317792981863} +{"Pretrain/Learning Rate": 3.0293672452877374e-05, "Pretrain/Loss": 2.0030770301818848, "Pretrain/Loss (Raw)": 2.147089958190918, "Pretrain/Step": 8566, "Pretrain/Step Time": 8.43974601663649} +{"Pretrain/Learning Rate": 3.028952347167192e-05, "Pretrain/Loss": 2.0046567916870117, "Pretrain/Loss (Raw)": 2.1360113620758057, "Pretrain/Step": 8567, "Pretrain/Step Time": 8.440644565969706} +{"Pretrain/Learning Rate": 3.028537433794678e-05, "Pretrain/Loss": 2.0044775009155273, "Pretrain/Loss (Raw)": 1.9954993724822998, "Pretrain/Step": 8568, "Pretrain/Step Time": 8.438913179561496} +{"Pretrain/Learning Rate": 3.0281225051821604e-05, "Pretrain/Loss": 2.004988670349121, "Pretrain/Loss (Raw)": 1.8653697967529297, "Pretrain/Step": 8569, "Pretrain/Step Time": 8.440110810101032} +{"Pretrain/Learning Rate": 3.0277075613416022e-05, "Pretrain/Loss": 2.0049872398376465, "Pretrain/Loss (Raw)": 2.07330322265625, "Pretrain/Step": 8570, "Pretrain/Step Time": 8.442106243222952} +{"Pretrain/Learning Rate": 3.027292602284969e-05, "Pretrain/Loss": 2.004636764526367, "Pretrain/Loss (Raw)": 1.9815247058868408, "Pretrain/Step": 8571, "Pretrain/Step Time": 8.440891006961465} +{"Pretrain/Learning Rate": 3.0268776280242245e-05, "Pretrain/Loss": 2.0041215419769287, "Pretrain/Loss (Raw)": 1.8482810258865356, "Pretrain/Step": 8572, "Pretrain/Step Time": 8.443721367046237} +{"Pretrain/Learning Rate": 3.0264626385713352e-05, "Pretrain/Loss": 2.005316972732544, "Pretrain/Loss (Raw)": 2.181335926055908, "Pretrain/Step": 8573, "Pretrain/Step Time": 8.44071819074452} +{"Pretrain/Learning Rate": 3.026047633938267e-05, "Pretrain/Loss": 2.0026803016662598, "Pretrain/Loss (Raw)": 1.8975119590759277, "Pretrain/Step": 8574, "Pretrain/Step Time": 8.441282035782933} +{"Pretrain/Learning Rate": 3.0256326141369868e-05, "Pretrain/Loss": 2.004340171813965, "Pretrain/Loss (Raw)": 2.0585455894470215, "Pretrain/Step": 8575, "Pretrain/Step Time": 8.440520968288183} +{"Pretrain/Learning Rate": 3.02521757917946e-05, "Pretrain/Loss": 2.0048160552978516, "Pretrain/Loss (Raw)": 1.9659078121185303, "Pretrain/Step": 8576, "Pretrain/Step Time": 8.449977098032832} +{"Pretrain/Learning Rate": 3.0248025290776545e-05, "Pretrain/Loss": 2.004545211791992, "Pretrain/Loss (Raw)": 2.0256447792053223, "Pretrain/Step": 8577, "Pretrain/Step Time": 8.444132482632995} +{"Pretrain/Learning Rate": 3.0243874638435382e-05, "Pretrain/Loss": 2.0026330947875977, "Pretrain/Loss (Raw)": 1.9859575033187866, "Pretrain/Step": 8578, "Pretrain/Step Time": 8.44816031306982} +{"Pretrain/Learning Rate": 3.023972383489079e-05, "Pretrain/Loss": 2.0040106773376465, "Pretrain/Loss (Raw)": 2.1242117881774902, "Pretrain/Step": 8579, "Pretrain/Step Time": 8.446992859244347} +{"Pretrain/Learning Rate": 3.0235572880262452e-05, "Pretrain/Loss": 2.006542682647705, "Pretrain/Loss (Raw)": 2.0727133750915527, "Pretrain/Step": 8580, "Pretrain/Step Time": 8.441246280446649} +{"Pretrain/Learning Rate": 3.0231421774670073e-05, "Pretrain/Loss": 2.0072739124298096, "Pretrain/Loss (Raw)": 2.058837890625, "Pretrain/Step": 8581, "Pretrain/Step Time": 8.442800479009748} +{"Pretrain/Learning Rate": 3.0227270518233326e-05, "Pretrain/Loss": 2.004549503326416, "Pretrain/Loss (Raw)": 1.8728196620941162, "Pretrain/Step": 8582, "Pretrain/Step Time": 8.446390995755792} +{"Pretrain/Learning Rate": 3.022311911107192e-05, "Pretrain/Loss": 2.005366802215576, "Pretrain/Loss (Raw)": 2.0422098636627197, "Pretrain/Step": 8583, "Pretrain/Step Time": 8.446127196773887} +{"Pretrain/Learning Rate": 3.0218967553305556e-05, "Pretrain/Loss": 2.00388765335083, "Pretrain/Loss (Raw)": 1.7983213663101196, "Pretrain/Step": 8584, "Pretrain/Step Time": 8.441138193011284} +{"Pretrain/Learning Rate": 3.021481584505394e-05, "Pretrain/Loss": 2.0010030269622803, "Pretrain/Loss (Raw)": 1.9417980909347534, "Pretrain/Step": 8585, "Pretrain/Step Time": 8.443498615175486} +{"Pretrain/Learning Rate": 3.0210663986436783e-05, "Pretrain/Loss": 2.002694606781006, "Pretrain/Loss (Raw)": 2.1179468631744385, "Pretrain/Step": 8586, "Pretrain/Step Time": 8.44451248459518} +{"Pretrain/Learning Rate": 3.0206511977573816e-05, "Pretrain/Loss": 2.001457691192627, "Pretrain/Loss (Raw)": 1.868297815322876, "Pretrain/Step": 8587, "Pretrain/Step Time": 8.443405406549573} +{"Pretrain/Learning Rate": 3.020235981858473e-05, "Pretrain/Loss": 2.004223346710205, "Pretrain/Loss (Raw)": 2.353776216506958, "Pretrain/Step": 8588, "Pretrain/Step Time": 8.43932880461216} +{"Pretrain/Learning Rate": 3.0198207509589272e-05, "Pretrain/Loss": 2.0028183460235596, "Pretrain/Loss (Raw)": 1.9625383615493774, "Pretrain/Step": 8589, "Pretrain/Step Time": 8.445303553715348} +{"Pretrain/Learning Rate": 3.019405505070717e-05, "Pretrain/Loss": 2.0025558471679688, "Pretrain/Loss (Raw)": 2.098712205886841, "Pretrain/Step": 8590, "Pretrain/Step Time": 8.445191361010075} +{"Pretrain/Learning Rate": 3.0189902442058143e-05, "Pretrain/Loss": 2.0030901432037354, "Pretrain/Loss (Raw)": 2.1552653312683105, "Pretrain/Step": 8591, "Pretrain/Step Time": 8.441002266481519} +{"Pretrain/Learning Rate": 3.0185749683761948e-05, "Pretrain/Loss": 2.0036470890045166, "Pretrain/Loss (Raw)": 1.9672096967697144, "Pretrain/Step": 8592, "Pretrain/Step Time": 8.43931077606976} +{"Pretrain/Learning Rate": 3.0181596775938316e-05, "Pretrain/Loss": 2.0009703636169434, "Pretrain/Loss (Raw)": 1.845197081565857, "Pretrain/Step": 8593, "Pretrain/Step Time": 8.444107441231608} +{"Pretrain/Learning Rate": 3.0177443718706982e-05, "Pretrain/Loss": 2.0018396377563477, "Pretrain/Loss (Raw)": 1.9775595664978027, "Pretrain/Step": 8594, "Pretrain/Step Time": 8.440296748653054} +{"Pretrain/Learning Rate": 3.017329051218772e-05, "Pretrain/Loss": 2.001316547393799, "Pretrain/Loss (Raw)": 1.9995217323303223, "Pretrain/Step": 8595, "Pretrain/Step Time": 8.437306733801961} +{"Pretrain/Learning Rate": 3.0169137156500267e-05, "Pretrain/Loss": 2.0013437271118164, "Pretrain/Loss (Raw)": 1.9651519060134888, "Pretrain/Step": 8596, "Pretrain/Step Time": 8.434403700754046} +{"Pretrain/Learning Rate": 3.016498365176439e-05, "Pretrain/Loss": 2.0029406547546387, "Pretrain/Loss (Raw)": 2.144534111022949, "Pretrain/Step": 8597, "Pretrain/Step Time": 8.434447458013892} +{"Pretrain/Learning Rate": 3.0160829998099847e-05, "Pretrain/Loss": 2.0002875328063965, "Pretrain/Loss (Raw)": 1.9479074478149414, "Pretrain/Step": 8598, "Pretrain/Step Time": 8.435574831441045} +{"Pretrain/Learning Rate": 3.0156676195626416e-05, "Pretrain/Loss": 1.9993870258331299, "Pretrain/Loss (Raw)": 2.0834708213806152, "Pretrain/Step": 8599, "Pretrain/Step Time": 8.438909420743585} +{"Pretrain/Learning Rate": 3.0152522244463856e-05, "Pretrain/Loss": 1.9986987113952637, "Pretrain/Loss (Raw)": 1.9149065017700195, "Pretrain/Step": 8600, "Pretrain/Step Time": 8.436709066852927} +{"Pretrain/Learning Rate": 3.0148368144731954e-05, "Pretrain/Loss": 1.998410940170288, "Pretrain/Loss (Raw)": 2.009003162384033, "Pretrain/Step": 8601, "Pretrain/Step Time": 8.439863389357924} +{"Pretrain/Learning Rate": 3.0144213896550487e-05, "Pretrain/Loss": 1.9988858699798584, "Pretrain/Loss (Raw)": 2.082397937774658, "Pretrain/Step": 8602, "Pretrain/Step Time": 8.438371798023582} +{"Pretrain/Learning Rate": 3.014005950003923e-05, "Pretrain/Loss": 2.0023300647735596, "Pretrain/Loss (Raw)": 2.1719820499420166, "Pretrain/Step": 8603, "Pretrain/Step Time": 8.438840992748737} +{"Pretrain/Learning Rate": 3.013590495531799e-05, "Pretrain/Loss": 2.0026793479919434, "Pretrain/Loss (Raw)": 2.098621129989624, "Pretrain/Step": 8604, "Pretrain/Step Time": 8.438150880858302} +{"Pretrain/Learning Rate": 3.0131750262506547e-05, "Pretrain/Loss": 2.00061297416687, "Pretrain/Loss (Raw)": 1.9427769184112549, "Pretrain/Step": 8605, "Pretrain/Step Time": 8.442451173439622} +{"Pretrain/Learning Rate": 3.0127595421724703e-05, "Pretrain/Loss": 1.9996660947799683, "Pretrain/Loss (Raw)": 1.944875955581665, "Pretrain/Step": 8606, "Pretrain/Step Time": 8.442594738677144} +{"Pretrain/Learning Rate": 3.0123440433092265e-05, "Pretrain/Loss": 1.999359369277954, "Pretrain/Loss (Raw)": 2.067659854888916, "Pretrain/Step": 8607, "Pretrain/Step Time": 8.44691606797278} +{"Pretrain/Learning Rate": 3.011928529672903e-05, "Pretrain/Loss": 1.9990224838256836, "Pretrain/Loss (Raw)": 1.951289176940918, "Pretrain/Step": 8608, "Pretrain/Step Time": 8.448385812342167} +{"Pretrain/Learning Rate": 3.0115130012754806e-05, "Pretrain/Loss": 1.999965786933899, "Pretrain/Loss (Raw)": 2.0587713718414307, "Pretrain/Step": 8609, "Pretrain/Step Time": 8.450287822633982} +{"Pretrain/Learning Rate": 3.011097458128942e-05, "Pretrain/Loss": 1.99977445602417, "Pretrain/Loss (Raw)": 1.9270554780960083, "Pretrain/Step": 8610, "Pretrain/Step Time": 8.448013719171286} +{"Pretrain/Learning Rate": 3.010681900245268e-05, "Pretrain/Loss": 1.9997210502624512, "Pretrain/Loss (Raw)": 1.9327378273010254, "Pretrain/Step": 8611, "Pretrain/Step Time": 8.448280978947878} +{"Pretrain/Learning Rate": 3.010266327636442e-05, "Pretrain/Loss": 2.0014190673828125, "Pretrain/Loss (Raw)": 2.090493679046631, "Pretrain/Step": 8612, "Pretrain/Step Time": 8.44430959969759} +{"Pretrain/Learning Rate": 3.009850740314446e-05, "Pretrain/Loss": 2.0015954971313477, "Pretrain/Loss (Raw)": 2.0847721099853516, "Pretrain/Step": 8613, "Pretrain/Step Time": 8.446887977421284} +{"Pretrain/Learning Rate": 3.009435138291263e-05, "Pretrain/Loss": 2.002289295196533, "Pretrain/Loss (Raw)": 2.0608057975769043, "Pretrain/Step": 8614, "Pretrain/Step Time": 8.448820773512125} +{"Pretrain/Learning Rate": 3.0090195215788774e-05, "Pretrain/Loss": 1.9989569187164307, "Pretrain/Loss (Raw)": 1.9523488283157349, "Pretrain/Step": 8615, "Pretrain/Step Time": 8.445630514994264} +{"Pretrain/Learning Rate": 3.0086038901892727e-05, "Pretrain/Loss": 2.000920534133911, "Pretrain/Loss (Raw)": 2.263029098510742, "Pretrain/Step": 8616, "Pretrain/Step Time": 8.449019407853484} +{"Pretrain/Learning Rate": 3.0081882441344333e-05, "Pretrain/Loss": 2.0013277530670166, "Pretrain/Loss (Raw)": 2.033595085144043, "Pretrain/Step": 8617, "Pretrain/Step Time": 8.442987021058798} +{"Pretrain/Learning Rate": 3.007772583426344e-05, "Pretrain/Loss": 2.002744197845459, "Pretrain/Loss (Raw)": 2.090723991394043, "Pretrain/Step": 8618, "Pretrain/Step Time": 8.442901063710451} +{"Pretrain/Learning Rate": 3.0073569080769902e-05, "Pretrain/Loss": 2.00506591796875, "Pretrain/Loss (Raw)": 2.1182096004486084, "Pretrain/Step": 8619, "Pretrain/Step Time": 8.444811521098018} +{"Pretrain/Learning Rate": 3.006941218098358e-05, "Pretrain/Loss": 2.0038037300109863, "Pretrain/Loss (Raw)": 2.0380258560180664, "Pretrain/Step": 8620, "Pretrain/Step Time": 8.445273956283927} +{"Pretrain/Learning Rate": 3.0065255135024328e-05, "Pretrain/Loss": 2.0052828788757324, "Pretrain/Loss (Raw)": 1.9684451818466187, "Pretrain/Step": 8621, "Pretrain/Step Time": 8.444752329960465} +{"Pretrain/Learning Rate": 3.0061097943012013e-05, "Pretrain/Loss": 2.0055387020111084, "Pretrain/Loss (Raw)": 1.9379258155822754, "Pretrain/Step": 8622, "Pretrain/Step Time": 8.444216888397932} +{"Pretrain/Learning Rate": 3.0056940605066513e-05, "Pretrain/Loss": 2.011881113052368, "Pretrain/Loss (Raw)": 2.4736526012420654, "Pretrain/Step": 8623, "Pretrain/Step Time": 8.44128573127091} +{"Pretrain/Learning Rate": 3.0052783121307693e-05, "Pretrain/Loss": 2.0130937099456787, "Pretrain/Loss (Raw)": 2.2258284091949463, "Pretrain/Step": 8624, "Pretrain/Step Time": 8.449302705004811} +{"Pretrain/Learning Rate": 3.0048625491855438e-05, "Pretrain/Loss": 2.015929698944092, "Pretrain/Loss (Raw)": 2.3227057456970215, "Pretrain/Step": 8625, "Pretrain/Step Time": 8.448569605126977} +{"Pretrain/Learning Rate": 3.0044467716829617e-05, "Pretrain/Loss": 2.014449119567871, "Pretrain/Loss (Raw)": 1.8011817932128906, "Pretrain/Step": 8626, "Pretrain/Step Time": 8.452732956036925} +{"Pretrain/Learning Rate": 3.0040309796350123e-05, "Pretrain/Loss": 2.0129036903381348, "Pretrain/Loss (Raw)": 1.8214668035507202, "Pretrain/Step": 8627, "Pretrain/Step Time": 8.44999548047781} +{"Pretrain/Learning Rate": 3.0036151730536855e-05, "Pretrain/Loss": 2.0133795738220215, "Pretrain/Loss (Raw)": 1.9762779474258423, "Pretrain/Step": 8628, "Pretrain/Step Time": 8.447404131293297} +{"Pretrain/Learning Rate": 3.003199351950971e-05, "Pretrain/Loss": 2.014063596725464, "Pretrain/Loss (Raw)": 2.108668088912964, "Pretrain/Step": 8629, "Pretrain/Step Time": 8.448272716253996} +{"Pretrain/Learning Rate": 3.002783516338857e-05, "Pretrain/Loss": 2.0138933658599854, "Pretrain/Loss (Raw)": 1.9427295923233032, "Pretrain/Step": 8630, "Pretrain/Step Time": 8.453279312700033} +{"Pretrain/Learning Rate": 3.002367666229335e-05, "Pretrain/Loss": 2.014780044555664, "Pretrain/Loss (Raw)": 1.912233829498291, "Pretrain/Step": 8631, "Pretrain/Step Time": 8.44752687215805} +{"Pretrain/Learning Rate": 3.001951801634395e-05, "Pretrain/Loss": 2.0165774822235107, "Pretrain/Loss (Raw)": 2.286417007446289, "Pretrain/Step": 8632, "Pretrain/Step Time": 8.451315449550748} +{"Pretrain/Learning Rate": 3.001535922566029e-05, "Pretrain/Loss": 2.0178165435791016, "Pretrain/Loss (Raw)": 2.1049447059631348, "Pretrain/Step": 8633, "Pretrain/Step Time": 8.44826283864677} +{"Pretrain/Learning Rate": 3.0011200290362286e-05, "Pretrain/Loss": 2.017305374145508, "Pretrain/Loss (Raw)": 1.9132553339004517, "Pretrain/Step": 8634, "Pretrain/Step Time": 8.450032379478216} +{"Pretrain/Learning Rate": 3.0007041210569848e-05, "Pretrain/Loss": 2.0164296627044678, "Pretrain/Loss (Raw)": 1.9626299142837524, "Pretrain/Step": 8635, "Pretrain/Step Time": 8.448893329128623} +{"Pretrain/Learning Rate": 3.000288198640291e-05, "Pretrain/Loss": 2.017239570617676, "Pretrain/Loss (Raw)": 1.9574666023254395, "Pretrain/Step": 8636, "Pretrain/Step Time": 8.455245910212398} +{"Pretrain/Learning Rate": 2.9998722617981396e-05, "Pretrain/Loss": 2.0157549381256104, "Pretrain/Loss (Raw)": 1.9427871704101562, "Pretrain/Step": 8637, "Pretrain/Step Time": 8.454757479950786} +{"Pretrain/Learning Rate": 2.999456310542524e-05, "Pretrain/Loss": 2.0170910358428955, "Pretrain/Loss (Raw)": 2.207599639892578, "Pretrain/Step": 8638, "Pretrain/Step Time": 8.455726604908705} +{"Pretrain/Learning Rate": 2.9990403448854375e-05, "Pretrain/Loss": 2.01648211479187, "Pretrain/Loss (Raw)": 1.998815894126892, "Pretrain/Step": 8639, "Pretrain/Step Time": 8.453966626897454} +{"Pretrain/Learning Rate": 2.9986243648388744e-05, "Pretrain/Loss": 2.0162136554718018, "Pretrain/Loss (Raw)": 2.046002149581909, "Pretrain/Step": 8640, "Pretrain/Step Time": 8.45257087238133} +{"Pretrain/Learning Rate": 2.99820837041483e-05, "Pretrain/Loss": 2.014343738555908, "Pretrain/Loss (Raw)": 1.8810021877288818, "Pretrain/Step": 8641, "Pretrain/Step Time": 8.45062005519867} +{"Pretrain/Learning Rate": 2.997792361625298e-05, "Pretrain/Loss": 2.013997793197632, "Pretrain/Loss (Raw)": 2.101816177368164, "Pretrain/Step": 8642, "Pretrain/Step Time": 8.449574632570148} +{"Pretrain/Learning Rate": 2.9973763384822734e-05, "Pretrain/Loss": 2.0173749923706055, "Pretrain/Loss (Raw)": 2.0550949573516846, "Pretrain/Step": 8643, "Pretrain/Step Time": 8.455709232017398} +{"Pretrain/Learning Rate": 2.9969603009977537e-05, "Pretrain/Loss": 2.0148074626922607, "Pretrain/Loss (Raw)": 1.8062412738800049, "Pretrain/Step": 8644, "Pretrain/Step Time": 8.45380524545908} +{"Pretrain/Learning Rate": 2.9965442491837342e-05, "Pretrain/Loss": 2.013169050216675, "Pretrain/Loss (Raw)": 1.8339447975158691, "Pretrain/Step": 8645, "Pretrain/Step Time": 8.451976891607046} +{"Pretrain/Learning Rate": 2.996128183052211e-05, "Pretrain/Loss": 2.0131545066833496, "Pretrain/Loss (Raw)": 1.932221531867981, "Pretrain/Step": 8646, "Pretrain/Step Time": 8.449167985469103} +{"Pretrain/Learning Rate": 2.995712102615181e-05, "Pretrain/Loss": 2.013589382171631, "Pretrain/Loss (Raw)": 2.034874200820923, "Pretrain/Step": 8647, "Pretrain/Step Time": 8.450365766882896} +{"Pretrain/Learning Rate": 2.995296007884642e-05, "Pretrain/Loss": 2.015172004699707, "Pretrain/Loss (Raw)": 2.042137622833252, "Pretrain/Step": 8648, "Pretrain/Step Time": 8.452363954856992} +{"Pretrain/Learning Rate": 2.9948798988725918e-05, "Pretrain/Loss": 2.015373468399048, "Pretrain/Loss (Raw)": 1.8821959495544434, "Pretrain/Step": 8649, "Pretrain/Step Time": 8.448873467743397} +{"Pretrain/Learning Rate": 2.9944637755910294e-05, "Pretrain/Loss": 2.015359878540039, "Pretrain/Loss (Raw)": 2.4769794940948486, "Pretrain/Step": 8650, "Pretrain/Step Time": 8.44976456090808} +{"Pretrain/Learning Rate": 2.9940476380519516e-05, "Pretrain/Loss": 2.0165798664093018, "Pretrain/Loss (Raw)": 2.049129009246826, "Pretrain/Step": 8651, "Pretrain/Step Time": 8.450424594804645} +{"Pretrain/Learning Rate": 2.9936314862673592e-05, "Pretrain/Loss": 2.0154402256011963, "Pretrain/Loss (Raw)": 1.907147765159607, "Pretrain/Step": 8652, "Pretrain/Step Time": 8.453465955331922} +{"Pretrain/Learning Rate": 2.9932153202492502e-05, "Pretrain/Loss": 2.016909122467041, "Pretrain/Loss (Raw)": 2.073558807373047, "Pretrain/Step": 8653, "Pretrain/Step Time": 8.45268072001636} +{"Pretrain/Learning Rate": 2.9927991400096257e-05, "Pretrain/Loss": 2.0195398330688477, "Pretrain/Loss (Raw)": 2.0090739727020264, "Pretrain/Step": 8654, "Pretrain/Step Time": 8.450678378343582} +{"Pretrain/Learning Rate": 2.9923829455604852e-05, "Pretrain/Loss": 2.0214943885803223, "Pretrain/Loss (Raw)": 2.2582526206970215, "Pretrain/Step": 8655, "Pretrain/Step Time": 8.451268156990409} +{"Pretrain/Learning Rate": 2.9919667369138294e-05, "Pretrain/Loss": 2.0222837924957275, "Pretrain/Loss (Raw)": 2.0706138610839844, "Pretrain/Step": 8656, "Pretrain/Step Time": 8.450821304693818} +{"Pretrain/Learning Rate": 2.9915505140816597e-05, "Pretrain/Loss": 2.0195207595825195, "Pretrain/Loss (Raw)": 1.796436071395874, "Pretrain/Step": 8657, "Pretrain/Step Time": 8.451438648626208} +{"Pretrain/Learning Rate": 2.9911342770759776e-05, "Pretrain/Loss": 2.0199332237243652, "Pretrain/Loss (Raw)": 2.1574182510375977, "Pretrain/Step": 8658, "Pretrain/Step Time": 8.453409621492028} +{"Pretrain/Learning Rate": 2.9907180259087842e-05, "Pretrain/Loss": 2.0210657119750977, "Pretrain/Loss (Raw)": 1.9623113870620728, "Pretrain/Step": 8659, "Pretrain/Step Time": 8.447241796180606} +{"Pretrain/Learning Rate": 2.9903017605920836e-05, "Pretrain/Loss": 2.0220022201538086, "Pretrain/Loss (Raw)": 2.0965335369110107, "Pretrain/Step": 8660, "Pretrain/Step Time": 8.448950044810772} +{"Pretrain/Learning Rate": 2.989885481137877e-05, "Pretrain/Loss": 2.0225024223327637, "Pretrain/Loss (Raw)": 2.048367500305176, "Pretrain/Step": 8661, "Pretrain/Step Time": 8.44977030903101} +{"Pretrain/Learning Rate": 2.989469187558167e-05, "Pretrain/Loss": 2.022660493850708, "Pretrain/Loss (Raw)": 2.0720131397247314, "Pretrain/Step": 8662, "Pretrain/Step Time": 8.445211090147495} +{"Pretrain/Learning Rate": 2.9890528798649586e-05, "Pretrain/Loss": 2.021603584289551, "Pretrain/Loss (Raw)": 1.8596254587173462, "Pretrain/Step": 8663, "Pretrain/Step Time": 8.447371132671833} +{"Pretrain/Learning Rate": 2.9886365580702553e-05, "Pretrain/Loss": 2.0220823287963867, "Pretrain/Loss (Raw)": 2.14340877532959, "Pretrain/Step": 8664, "Pretrain/Step Time": 8.44723092019558} +{"Pretrain/Learning Rate": 2.9882202221860618e-05, "Pretrain/Loss": 2.02296781539917, "Pretrain/Loss (Raw)": 1.9045474529266357, "Pretrain/Step": 8665, "Pretrain/Step Time": 8.447627814486623} +{"Pretrain/Learning Rate": 2.9878038722243816e-05, "Pretrain/Loss": 2.023923397064209, "Pretrain/Loss (Raw)": 2.125561475753784, "Pretrain/Step": 8666, "Pretrain/Step Time": 8.453296383842826} +{"Pretrain/Learning Rate": 2.9873875081972214e-05, "Pretrain/Loss": 2.023742914199829, "Pretrain/Loss (Raw)": 1.9737262725830078, "Pretrain/Step": 8667, "Pretrain/Step Time": 8.4495016541332} +{"Pretrain/Learning Rate": 2.9869711301165847e-05, "Pretrain/Loss": 2.0223612785339355, "Pretrain/Loss (Raw)": 1.9990465641021729, "Pretrain/Step": 8668, "Pretrain/Step Time": 8.455071048811078} +{"Pretrain/Learning Rate": 2.9865547379944796e-05, "Pretrain/Loss": 2.0219545364379883, "Pretrain/Loss (Raw)": 2.2184603214263916, "Pretrain/Step": 8669, "Pretrain/Step Time": 8.45578409358859} +{"Pretrain/Learning Rate": 2.9861383318429116e-05, "Pretrain/Loss": 2.0220155715942383, "Pretrain/Loss (Raw)": 2.1012215614318848, "Pretrain/Step": 8670, "Pretrain/Step Time": 8.457138793542981} +{"Pretrain/Learning Rate": 2.985721911673888e-05, "Pretrain/Loss": 2.023167133331299, "Pretrain/Loss (Raw)": 2.1163487434387207, "Pretrain/Step": 8671, "Pretrain/Step Time": 8.451550088822842} +{"Pretrain/Learning Rate": 2.9853054774994145e-05, "Pretrain/Loss": 2.0222721099853516, "Pretrain/Loss (Raw)": 1.9096990823745728, "Pretrain/Step": 8672, "Pretrain/Step Time": 8.45540265366435} +{"Pretrain/Learning Rate": 2.9848890293315e-05, "Pretrain/Loss": 2.0224087238311768, "Pretrain/Loss (Raw)": 2.0704658031463623, "Pretrain/Step": 8673, "Pretrain/Step Time": 8.455783944576979} +{"Pretrain/Learning Rate": 2.9844725671821523e-05, "Pretrain/Loss": 2.0203723907470703, "Pretrain/Loss (Raw)": 1.9774155616760254, "Pretrain/Step": 8674, "Pretrain/Step Time": 8.458055943250656} +{"Pretrain/Learning Rate": 2.9840560910633792e-05, "Pretrain/Loss": 2.0183892250061035, "Pretrain/Loss (Raw)": 1.8732997179031372, "Pretrain/Step": 8675, "Pretrain/Step Time": 8.456227196380496} +{"Pretrain/Learning Rate": 2.98363960098719e-05, "Pretrain/Loss": 2.0186469554901123, "Pretrain/Loss (Raw)": 2.242424488067627, "Pretrain/Step": 8676, "Pretrain/Step Time": 8.457387084141374} +{"Pretrain/Learning Rate": 2.983223096965595e-05, "Pretrain/Loss": 2.0170037746429443, "Pretrain/Loss (Raw)": 2.0325076580047607, "Pretrain/Step": 8677, "Pretrain/Step Time": 8.461034817621112} +{"Pretrain/Learning Rate": 2.982806579010602e-05, "Pretrain/Loss": 2.023777484893799, "Pretrain/Loss (Raw)": 2.2261271476745605, "Pretrain/Step": 8678, "Pretrain/Step Time": 8.459574868902564} +{"Pretrain/Learning Rate": 2.9823900471342208e-05, "Pretrain/Loss": 2.0267069339752197, "Pretrain/Loss (Raw)": 2.060692310333252, "Pretrain/Step": 8679, "Pretrain/Step Time": 8.45573479309678} +{"Pretrain/Learning Rate": 2.9819735013484633e-05, "Pretrain/Loss": 2.0253782272338867, "Pretrain/Loss (Raw)": 1.8707729578018188, "Pretrain/Step": 8680, "Pretrain/Step Time": 8.455063264817} +{"Pretrain/Learning Rate": 2.98155694166534e-05, "Pretrain/Loss": 2.025559663772583, "Pretrain/Loss (Raw)": 1.923514485359192, "Pretrain/Step": 8681, "Pretrain/Step Time": 8.45310678333044} +{"Pretrain/Learning Rate": 2.9811403680968613e-05, "Pretrain/Loss": 2.026594877243042, "Pretrain/Loss (Raw)": 2.0802454948425293, "Pretrain/Step": 8682, "Pretrain/Step Time": 8.45648861117661} +{"Pretrain/Learning Rate": 2.9807237806550396e-05, "Pretrain/Loss": 2.028653860092163, "Pretrain/Loss (Raw)": 2.289172410964966, "Pretrain/Step": 8683, "Pretrain/Step Time": 8.452548809349537} +{"Pretrain/Learning Rate": 2.980307179351886e-05, "Pretrain/Loss": 2.02885103225708, "Pretrain/Loss (Raw)": 2.0029940605163574, "Pretrain/Step": 8684, "Pretrain/Step Time": 8.447838911786675} +{"Pretrain/Learning Rate": 2.979890564199414e-05, "Pretrain/Loss": 2.0286831855773926, "Pretrain/Loss (Raw)": 2.038111925125122, "Pretrain/Step": 8685, "Pretrain/Step Time": 8.45501821860671} +{"Pretrain/Learning Rate": 2.9794739352096358e-05, "Pretrain/Loss": 2.0295605659484863, "Pretrain/Loss (Raw)": 2.27561092376709, "Pretrain/Step": 8686, "Pretrain/Step Time": 8.455777643248439} +{"Pretrain/Learning Rate": 2.979057292394565e-05, "Pretrain/Loss": 2.029515504837036, "Pretrain/Loss (Raw)": 2.06449294090271, "Pretrain/Step": 8687, "Pretrain/Step Time": 8.451342018321157} +{"Pretrain/Learning Rate": 2.9786406357662145e-05, "Pretrain/Loss": 2.029500722885132, "Pretrain/Loss (Raw)": 1.9911185503005981, "Pretrain/Step": 8688, "Pretrain/Step Time": 8.452722925692797} +{"Pretrain/Learning Rate": 2.9782239653365983e-05, "Pretrain/Loss": 2.0321760177612305, "Pretrain/Loss (Raw)": 1.9748682975769043, "Pretrain/Step": 8689, "Pretrain/Step Time": 8.454523658379912} +{"Pretrain/Learning Rate": 2.9778072811177316e-05, "Pretrain/Loss": 2.033250331878662, "Pretrain/Loss (Raw)": 2.048304557800293, "Pretrain/Step": 8690, "Pretrain/Step Time": 8.4549790173769} +{"Pretrain/Learning Rate": 2.9773905831216287e-05, "Pretrain/Loss": 2.0320370197296143, "Pretrain/Loss (Raw)": 1.9600309133529663, "Pretrain/Step": 8691, "Pretrain/Step Time": 8.452553613111377} +{"Pretrain/Learning Rate": 2.9769738713603057e-05, "Pretrain/Loss": 2.0315029621124268, "Pretrain/Loss (Raw)": 2.064101457595825, "Pretrain/Step": 8692, "Pretrain/Step Time": 8.453065481036901} +{"Pretrain/Learning Rate": 2.9765571458457764e-05, "Pretrain/Loss": 2.0329437255859375, "Pretrain/Loss (Raw)": 1.9464192390441895, "Pretrain/Step": 8693, "Pretrain/Step Time": 8.450106294825673} +{"Pretrain/Learning Rate": 2.9761404065900576e-05, "Pretrain/Loss": 2.03263258934021, "Pretrain/Loss (Raw)": 2.1072566509246826, "Pretrain/Step": 8694, "Pretrain/Step Time": 8.449149930849671} +{"Pretrain/Learning Rate": 2.9757236536051664e-05, "Pretrain/Loss": 2.0323305130004883, "Pretrain/Loss (Raw)": 2.0973739624023438, "Pretrain/Step": 8695, "Pretrain/Step Time": 8.442697562277317} +{"Pretrain/Learning Rate": 2.9753068869031186e-05, "Pretrain/Loss": 2.031296730041504, "Pretrain/Loss (Raw)": 1.8631389141082764, "Pretrain/Step": 8696, "Pretrain/Step Time": 8.445783270522952} +{"Pretrain/Learning Rate": 2.974890106495932e-05, "Pretrain/Loss": 2.033404588699341, "Pretrain/Loss (Raw)": 2.1351850032806396, "Pretrain/Step": 8697, "Pretrain/Step Time": 8.445536205545068} +{"Pretrain/Learning Rate": 2.9744733123956242e-05, "Pretrain/Loss": 2.032210350036621, "Pretrain/Loss (Raw)": 1.9204541444778442, "Pretrain/Step": 8698, "Pretrain/Step Time": 8.445258544757962} +{"Pretrain/Learning Rate": 2.974056504614213e-05, "Pretrain/Loss": 2.0332694053649902, "Pretrain/Loss (Raw)": 2.117075204849243, "Pretrain/Step": 8699, "Pretrain/Step Time": 8.444750420749187} +{"Pretrain/Learning Rate": 2.973639683163716e-05, "Pretrain/Loss": 2.034851551055908, "Pretrain/Loss (Raw)": 2.050802707672119, "Pretrain/Step": 8700, "Pretrain/Step Time": 8.443937610834837} +{"Pretrain/Learning Rate": 2.9732228480561523e-05, "Pretrain/Loss": 2.0337915420532227, "Pretrain/Loss (Raw)": 2.0456314086914062, "Pretrain/Step": 8701, "Pretrain/Step Time": 8.441907973960042} +{"Pretrain/Learning Rate": 2.972805999303543e-05, "Pretrain/Loss": 2.033780097961426, "Pretrain/Loss (Raw)": 1.8960579633712769, "Pretrain/Step": 8702, "Pretrain/Step Time": 8.450180869549513} +{"Pretrain/Learning Rate": 2.9723891369179046e-05, "Pretrain/Loss": 2.034924030303955, "Pretrain/Loss (Raw)": 2.2049663066864014, "Pretrain/Step": 8703, "Pretrain/Step Time": 8.451168652623892} +{"Pretrain/Learning Rate": 2.9719722609112586e-05, "Pretrain/Loss": 2.0345025062561035, "Pretrain/Loss (Raw)": 1.9119594097137451, "Pretrain/Step": 8704, "Pretrain/Step Time": 8.443151647225022} +{"Pretrain/Learning Rate": 2.9715553712956257e-05, "Pretrain/Loss": 2.0349464416503906, "Pretrain/Loss (Raw)": 2.0824923515319824, "Pretrain/Step": 8705, "Pretrain/Step Time": 8.447317466139793} +{"Pretrain/Learning Rate": 2.9711384680830258e-05, "Pretrain/Loss": 2.0363144874572754, "Pretrain/Loss (Raw)": 2.1610121726989746, "Pretrain/Step": 8706, "Pretrain/Step Time": 8.444942723959684} +{"Pretrain/Learning Rate": 2.9707215512854807e-05, "Pretrain/Loss": 2.0380356311798096, "Pretrain/Loss (Raw)": 2.3445491790771484, "Pretrain/Step": 8707, "Pretrain/Step Time": 8.44445487856865} +{"Pretrain/Learning Rate": 2.9703046209150117e-05, "Pretrain/Loss": 2.0372776985168457, "Pretrain/Loss (Raw)": 1.9756773710250854, "Pretrain/Step": 8708, "Pretrain/Step Time": 8.448891250416636} +{"Pretrain/Learning Rate": 2.9698876769836403e-05, "Pretrain/Loss": 2.0340819358825684, "Pretrain/Loss (Raw)": 1.6497999429702759, "Pretrain/Step": 8709, "Pretrain/Step Time": 8.45105086825788} +{"Pretrain/Learning Rate": 2.9694707195033884e-05, "Pretrain/Loss": 2.035567045211792, "Pretrain/Loss (Raw)": 2.0629091262817383, "Pretrain/Step": 8710, "Pretrain/Step Time": 8.441047932952642} +{"Pretrain/Learning Rate": 2.9690537484862795e-05, "Pretrain/Loss": 2.0348124504089355, "Pretrain/Loss (Raw)": 1.945650339126587, "Pretrain/Step": 8711, "Pretrain/Step Time": 8.442720575258136} +{"Pretrain/Learning Rate": 2.9686367639443363e-05, "Pretrain/Loss": 2.0361030101776123, "Pretrain/Loss (Raw)": 1.9634888172149658, "Pretrain/Step": 8712, "Pretrain/Step Time": 8.448497937992215} +{"Pretrain/Learning Rate": 2.9682197658895827e-05, "Pretrain/Loss": 2.0370373725891113, "Pretrain/Loss (Raw)": 2.0613856315612793, "Pretrain/Step": 8713, "Pretrain/Step Time": 8.44624031893909} +{"Pretrain/Learning Rate": 2.967802754334042e-05, "Pretrain/Loss": 2.0345072746276855, "Pretrain/Loss (Raw)": 1.7941035032272339, "Pretrain/Step": 8714, "Pretrain/Step Time": 8.44529377296567} +{"Pretrain/Learning Rate": 2.967385729289739e-05, "Pretrain/Loss": 2.0360796451568604, "Pretrain/Loss (Raw)": 2.0695765018463135, "Pretrain/Step": 8715, "Pretrain/Step Time": 8.447641694918275} +{"Pretrain/Learning Rate": 2.966968690768697e-05, "Pretrain/Loss": 2.0318856239318848, "Pretrain/Loss (Raw)": 1.8169442415237427, "Pretrain/Step": 8716, "Pretrain/Step Time": 8.449588557705283} +{"Pretrain/Learning Rate": 2.9665516387829427e-05, "Pretrain/Loss": 2.0319669246673584, "Pretrain/Loss (Raw)": 1.9729174375534058, "Pretrain/Step": 8717, "Pretrain/Step Time": 8.446269882842898} +{"Pretrain/Learning Rate": 2.9661345733445012e-05, "Pretrain/Loss": 2.030909538269043, "Pretrain/Loss (Raw)": 1.963361144065857, "Pretrain/Step": 8718, "Pretrain/Step Time": 8.450116693973541} +{"Pretrain/Learning Rate": 2.9657174944653976e-05, "Pretrain/Loss": 2.0290937423706055, "Pretrain/Loss (Raw)": 1.9228875637054443, "Pretrain/Step": 8719, "Pretrain/Step Time": 8.451619766652584} +{"Pretrain/Learning Rate": 2.9653004021576582e-05, "Pretrain/Loss": 2.0289065837860107, "Pretrain/Loss (Raw)": 1.9432148933410645, "Pretrain/Step": 8720, "Pretrain/Step Time": 8.455446043983102} +{"Pretrain/Learning Rate": 2.9648832964333096e-05, "Pretrain/Loss": 2.028841972351074, "Pretrain/Loss (Raw)": 1.8369306325912476, "Pretrain/Step": 8721, "Pretrain/Step Time": 8.450980415567756} +{"Pretrain/Learning Rate": 2.964466177304379e-05, "Pretrain/Loss": 2.028749465942383, "Pretrain/Loss (Raw)": 1.965729832649231, "Pretrain/Step": 8722, "Pretrain/Step Time": 8.453846218064427} +{"Pretrain/Learning Rate": 2.9640490447828933e-05, "Pretrain/Loss": 2.028566598892212, "Pretrain/Loss (Raw)": 1.9761234521865845, "Pretrain/Step": 8723, "Pretrain/Step Time": 8.45633034966886} +{"Pretrain/Learning Rate": 2.9636318988808816e-05, "Pretrain/Loss": 2.0282983779907227, "Pretrain/Loss (Raw)": 1.930803894996643, "Pretrain/Step": 8724, "Pretrain/Step Time": 8.454034863039851} +{"Pretrain/Learning Rate": 2.9632147396103698e-05, "Pretrain/Loss": 2.025892496109009, "Pretrain/Loss (Raw)": 1.8365830183029175, "Pretrain/Step": 8725, "Pretrain/Step Time": 8.4580600541085} +{"Pretrain/Learning Rate": 2.9627975669833878e-05, "Pretrain/Loss": 2.026599168777466, "Pretrain/Loss (Raw)": 2.038351535797119, "Pretrain/Step": 8726, "Pretrain/Step Time": 8.460725853219628} +{"Pretrain/Learning Rate": 2.9623803810119645e-05, "Pretrain/Loss": 2.026233434677124, "Pretrain/Loss (Raw)": 2.0366766452789307, "Pretrain/Step": 8727, "Pretrain/Step Time": 8.45358913205564} +{"Pretrain/Learning Rate": 2.9619631817081284e-05, "Pretrain/Loss": 2.026548385620117, "Pretrain/Loss (Raw)": 1.9552171230316162, "Pretrain/Step": 8728, "Pretrain/Step Time": 8.453660774976015} +{"Pretrain/Learning Rate": 2.9615459690839102e-05, "Pretrain/Loss": 2.026341676712036, "Pretrain/Loss (Raw)": 1.9825420379638672, "Pretrain/Step": 8729, "Pretrain/Step Time": 8.455328725278378} +{"Pretrain/Learning Rate": 2.961128743151339e-05, "Pretrain/Loss": 2.0248258113861084, "Pretrain/Loss (Raw)": 1.8883483409881592, "Pretrain/Step": 8730, "Pretrain/Step Time": 8.454483242705464} +{"Pretrain/Learning Rate": 2.960711503922446e-05, "Pretrain/Loss": 2.0233688354492188, "Pretrain/Loss (Raw)": 1.985507845878601, "Pretrain/Step": 8731, "Pretrain/Step Time": 8.455734580755234} +{"Pretrain/Learning Rate": 2.9602942514092606e-05, "Pretrain/Loss": 2.0235092639923096, "Pretrain/Loss (Raw)": 2.1165952682495117, "Pretrain/Step": 8732, "Pretrain/Step Time": 8.45726079493761} +{"Pretrain/Learning Rate": 2.9598769856238156e-05, "Pretrain/Loss": 2.024411916732788, "Pretrain/Loss (Raw)": 2.0583016872406006, "Pretrain/Step": 8733, "Pretrain/Step Time": 8.450703909620643} +{"Pretrain/Learning Rate": 2.959459706578142e-05, "Pretrain/Loss": 2.0244641304016113, "Pretrain/Loss (Raw)": 1.9515522718429565, "Pretrain/Step": 8734, "Pretrain/Step Time": 8.455474469810724} +{"Pretrain/Learning Rate": 2.9590424142842714e-05, "Pretrain/Loss": 2.024174451828003, "Pretrain/Loss (Raw)": 2.0306105613708496, "Pretrain/Step": 8735, "Pretrain/Step Time": 8.450035814195871} +{"Pretrain/Learning Rate": 2.9586251087542367e-05, "Pretrain/Loss": 2.0247387886047363, "Pretrain/Loss (Raw)": 2.02352237701416, "Pretrain/Step": 8736, "Pretrain/Step Time": 8.449310634285212} +{"Pretrain/Learning Rate": 2.95820779000007e-05, "Pretrain/Loss": 2.0237128734588623, "Pretrain/Loss (Raw)": 1.9274483919143677, "Pretrain/Step": 8737, "Pretrain/Step Time": 8.448979757726192} +{"Pretrain/Learning Rate": 2.9577904580338045e-05, "Pretrain/Loss": 2.0235533714294434, "Pretrain/Loss (Raw)": 1.906619668006897, "Pretrain/Step": 8738, "Pretrain/Step Time": 8.452644307166338} +{"Pretrain/Learning Rate": 2.9573731128674746e-05, "Pretrain/Loss": 2.0227696895599365, "Pretrain/Loss (Raw)": 1.832457184791565, "Pretrain/Step": 8739, "Pretrain/Step Time": 8.454419799149036} +{"Pretrain/Learning Rate": 2.9569557545131128e-05, "Pretrain/Loss": 2.022552967071533, "Pretrain/Loss (Raw)": 2.06274151802063, "Pretrain/Step": 8740, "Pretrain/Step Time": 8.457462912425399} +{"Pretrain/Learning Rate": 2.9565383829827543e-05, "Pretrain/Loss": 2.022425651550293, "Pretrain/Loss (Raw)": 2.0684866905212402, "Pretrain/Step": 8741, "Pretrain/Step Time": 8.458188284188509} +{"Pretrain/Learning Rate": 2.956120998288433e-05, "Pretrain/Loss": 2.021500825881958, "Pretrain/Loss (Raw)": 1.9424049854278564, "Pretrain/Step": 8742, "Pretrain/Step Time": 8.456236811354756} +{"Pretrain/Learning Rate": 2.955703600442184e-05, "Pretrain/Loss": 2.0214321613311768, "Pretrain/Loss (Raw)": 1.9435784816741943, "Pretrain/Step": 8743, "Pretrain/Step Time": 8.457084657624364} +{"Pretrain/Learning Rate": 2.9552861894560436e-05, "Pretrain/Loss": 2.019287347793579, "Pretrain/Loss (Raw)": 1.9884847402572632, "Pretrain/Step": 8744, "Pretrain/Step Time": 8.455994449555874} +{"Pretrain/Learning Rate": 2.9548687653420472e-05, "Pretrain/Loss": 2.019991874694824, "Pretrain/Loss (Raw)": 2.1237857341766357, "Pretrain/Step": 8745, "Pretrain/Step Time": 8.458316395059228} +{"Pretrain/Learning Rate": 2.95445132811223e-05, "Pretrain/Loss": 2.0196642875671387, "Pretrain/Loss (Raw)": 2.048762798309326, "Pretrain/Step": 8746, "Pretrain/Step Time": 8.462071716785431} +{"Pretrain/Learning Rate": 2.9540338777786286e-05, "Pretrain/Loss": 2.019198179244995, "Pretrain/Loss (Raw)": 2.0585551261901855, "Pretrain/Step": 8747, "Pretrain/Step Time": 8.459818355739117} +{"Pretrain/Learning Rate": 2.9536164143532814e-05, "Pretrain/Loss": 2.0194573402404785, "Pretrain/Loss (Raw)": 2.071211814880371, "Pretrain/Step": 8748, "Pretrain/Step Time": 8.460406763479114} +{"Pretrain/Learning Rate": 2.953198937848224e-05, "Pretrain/Loss": 2.0196831226348877, "Pretrain/Loss (Raw)": 1.9973331689834595, "Pretrain/Step": 8749, "Pretrain/Step Time": 8.461508015170693} +{"Pretrain/Learning Rate": 2.952781448275495e-05, "Pretrain/Loss": 2.0162646770477295, "Pretrain/Loss (Raw)": 1.5003734827041626, "Pretrain/Step": 8750, "Pretrain/Step Time": 8.465347964316607} +{"Pretrain/Learning Rate": 2.952363945647133e-05, "Pretrain/Loss": 2.0120067596435547, "Pretrain/Loss (Raw)": 1.9286423921585083, "Pretrain/Step": 8751, "Pretrain/Step Time": 8.472059024497867} +{"Pretrain/Learning Rate": 2.9519464299751742e-05, "Pretrain/Loss": 2.011399507522583, "Pretrain/Loss (Raw)": 2.148115396499634, "Pretrain/Step": 8752, "Pretrain/Step Time": 8.465737048536539} +{"Pretrain/Learning Rate": 2.9515289012716592e-05, "Pretrain/Loss": 2.0086326599121094, "Pretrain/Loss (Raw)": 1.968520164489746, "Pretrain/Step": 8753, "Pretrain/Step Time": 8.464279601350427} +{"Pretrain/Learning Rate": 2.951111359548626e-05, "Pretrain/Loss": 2.0099408626556396, "Pretrain/Loss (Raw)": 1.9686423540115356, "Pretrain/Step": 8754, "Pretrain/Step Time": 8.461415246129036} +{"Pretrain/Learning Rate": 2.9506938048181153e-05, "Pretrain/Loss": 2.0109100341796875, "Pretrain/Loss (Raw)": 1.9455066919326782, "Pretrain/Step": 8755, "Pretrain/Step Time": 8.463929193094373} +{"Pretrain/Learning Rate": 2.950276237092167e-05, "Pretrain/Loss": 2.010951280593872, "Pretrain/Loss (Raw)": 1.9815754890441895, "Pretrain/Step": 8756, "Pretrain/Step Time": 8.46415799856186} +{"Pretrain/Learning Rate": 2.94985865638282e-05, "Pretrain/Loss": 2.011045455932617, "Pretrain/Loss (Raw)": 2.1207075119018555, "Pretrain/Step": 8757, "Pretrain/Step Time": 8.463181499391794} +{"Pretrain/Learning Rate": 2.9494410627021165e-05, "Pretrain/Loss": 2.012070417404175, "Pretrain/Loss (Raw)": 2.073920488357544, "Pretrain/Step": 8758, "Pretrain/Step Time": 8.463015481829643} +{"Pretrain/Learning Rate": 2.949023456062096e-05, "Pretrain/Loss": 2.0120418071746826, "Pretrain/Loss (Raw)": 1.9085872173309326, "Pretrain/Step": 8759, "Pretrain/Step Time": 8.460762862116098} +{"Pretrain/Learning Rate": 2.948605836474801e-05, "Pretrain/Loss": 2.0109877586364746, "Pretrain/Loss (Raw)": 2.1514852046966553, "Pretrain/Step": 8760, "Pretrain/Step Time": 8.45524189248681} +{"Pretrain/Learning Rate": 2.9481882039522734e-05, "Pretrain/Loss": 2.01202654838562, "Pretrain/Loss (Raw)": 2.2379305362701416, "Pretrain/Step": 8761, "Pretrain/Step Time": 8.45852455869317} +{"Pretrain/Learning Rate": 2.9477705585065546e-05, "Pretrain/Loss": 2.0132827758789062, "Pretrain/Loss (Raw)": 2.074044942855835, "Pretrain/Step": 8762, "Pretrain/Step Time": 8.462411154061556} +{"Pretrain/Learning Rate": 2.9473529001496867e-05, "Pretrain/Loss": 2.0129401683807373, "Pretrain/Loss (Raw)": 1.9187663793563843, "Pretrain/Step": 8763, "Pretrain/Step Time": 8.462327832356095} +{"Pretrain/Learning Rate": 2.946935228893714e-05, "Pretrain/Loss": 2.012209892272949, "Pretrain/Loss (Raw)": 1.8640155792236328, "Pretrain/Step": 8764, "Pretrain/Step Time": 8.45476646721363} +{"Pretrain/Learning Rate": 2.9465175447506787e-05, "Pretrain/Loss": 2.0132923126220703, "Pretrain/Loss (Raw)": 2.08132004737854, "Pretrain/Step": 8765, "Pretrain/Step Time": 8.45800220221281} +{"Pretrain/Learning Rate": 2.9460998477326257e-05, "Pretrain/Loss": 2.0129799842834473, "Pretrain/Loss (Raw)": 2.1676173210144043, "Pretrain/Step": 8766, "Pretrain/Step Time": 8.458754377439618} +{"Pretrain/Learning Rate": 2.945682137851597e-05, "Pretrain/Loss": 2.0126330852508545, "Pretrain/Loss (Raw)": 1.9544141292572021, "Pretrain/Step": 8767, "Pretrain/Step Time": 8.463682344183326} +{"Pretrain/Learning Rate": 2.9452644151196384e-05, "Pretrain/Loss": 2.0149312019348145, "Pretrain/Loss (Raw)": 2.3401498794555664, "Pretrain/Step": 8768, "Pretrain/Step Time": 8.463262917473912} +{"Pretrain/Learning Rate": 2.9448466795487944e-05, "Pretrain/Loss": 2.0170536041259766, "Pretrain/Loss (Raw)": 2.1526734828948975, "Pretrain/Step": 8769, "Pretrain/Step Time": 8.459274251013994} +{"Pretrain/Learning Rate": 2.9444289311511096e-05, "Pretrain/Loss": 2.0152571201324463, "Pretrain/Loss (Raw)": 1.8718819618225098, "Pretrain/Step": 8770, "Pretrain/Step Time": 8.462874103337526} +{"Pretrain/Learning Rate": 2.944011169938631e-05, "Pretrain/Loss": 2.014850616455078, "Pretrain/Loss (Raw)": 2.003068447113037, "Pretrain/Step": 8771, "Pretrain/Step Time": 8.456984609365463} +{"Pretrain/Learning Rate": 2.943593395923402e-05, "Pretrain/Loss": 2.017292022705078, "Pretrain/Loss (Raw)": 2.118743896484375, "Pretrain/Step": 8772, "Pretrain/Step Time": 8.456498634070158} +{"Pretrain/Learning Rate": 2.9431756091174706e-05, "Pretrain/Loss": 2.019239902496338, "Pretrain/Loss (Raw)": 2.083249568939209, "Pretrain/Step": 8773, "Pretrain/Step Time": 8.456552345305681} +{"Pretrain/Learning Rate": 2.9427578095328827e-05, "Pretrain/Loss": 2.019923686981201, "Pretrain/Loss (Raw)": 2.0197417736053467, "Pretrain/Step": 8774, "Pretrain/Step Time": 8.453654166311026} +{"Pretrain/Learning Rate": 2.9423399971816856e-05, "Pretrain/Loss": 2.0186409950256348, "Pretrain/Loss (Raw)": 1.870698094367981, "Pretrain/Step": 8775, "Pretrain/Step Time": 8.458340169861913} +{"Pretrain/Learning Rate": 2.9419221720759266e-05, "Pretrain/Loss": 2.0177724361419678, "Pretrain/Loss (Raw)": 1.9309709072113037, "Pretrain/Step": 8776, "Pretrain/Step Time": 8.459998365491629} +{"Pretrain/Learning Rate": 2.9415043342276537e-05, "Pretrain/Loss": 2.020002841949463, "Pretrain/Loss (Raw)": 2.1676666736602783, "Pretrain/Step": 8777, "Pretrain/Step Time": 8.460736496374011} +{"Pretrain/Learning Rate": 2.9410864836489144e-05, "Pretrain/Loss": 2.0162882804870605, "Pretrain/Loss (Raw)": 2.001519203186035, "Pretrain/Step": 8778, "Pretrain/Step Time": 8.459796268492937} +{"Pretrain/Learning Rate": 2.940668620351757e-05, "Pretrain/Loss": 2.016233205795288, "Pretrain/Loss (Raw)": 2.042081594467163, "Pretrain/Step": 8779, "Pretrain/Step Time": 8.461201418191195} +{"Pretrain/Learning Rate": 2.94025074434823e-05, "Pretrain/Loss": 2.0156497955322266, "Pretrain/Loss (Raw)": 1.8324685096740723, "Pretrain/Step": 8780, "Pretrain/Step Time": 8.457398312166333} +{"Pretrain/Learning Rate": 2.939832855650384e-05, "Pretrain/Loss": 2.0163474082946777, "Pretrain/Loss (Raw)": 2.1628456115722656, "Pretrain/Step": 8781, "Pretrain/Step Time": 8.457049461081624} +{"Pretrain/Learning Rate": 2.939414954270268e-05, "Pretrain/Loss": 2.01694393157959, "Pretrain/Loss (Raw)": 2.085447072982788, "Pretrain/Step": 8782, "Pretrain/Step Time": 8.457479557022452} +{"Pretrain/Learning Rate": 2.9389970402199307e-05, "Pretrain/Loss": 2.014918327331543, "Pretrain/Loss (Raw)": 1.9989858865737915, "Pretrain/Step": 8783, "Pretrain/Step Time": 8.464435366913676} +{"Pretrain/Learning Rate": 2.9385791135114238e-05, "Pretrain/Loss": 2.019031524658203, "Pretrain/Loss (Raw)": 2.5971028804779053, "Pretrain/Step": 8784, "Pretrain/Step Time": 8.466335844248533} +{"Pretrain/Learning Rate": 2.938161174156797e-05, "Pretrain/Loss": 2.0211269855499268, "Pretrain/Loss (Raw)": 2.0646352767944336, "Pretrain/Step": 8785, "Pretrain/Step Time": 8.464019244536757} +{"Pretrain/Learning Rate": 2.9377432221681016e-05, "Pretrain/Loss": 2.0199337005615234, "Pretrain/Loss (Raw)": 2.0047123432159424, "Pretrain/Step": 8786, "Pretrain/Step Time": 8.463016023859382} +{"Pretrain/Learning Rate": 2.9373252575573895e-05, "Pretrain/Loss": 2.0219366550445557, "Pretrain/Loss (Raw)": 2.2186665534973145, "Pretrain/Step": 8787, "Pretrain/Step Time": 8.466856759041548} +{"Pretrain/Learning Rate": 2.9369072803367115e-05, "Pretrain/Loss": 2.0233092308044434, "Pretrain/Loss (Raw)": 2.2722182273864746, "Pretrain/Step": 8788, "Pretrain/Step Time": 8.465085035189986} +{"Pretrain/Learning Rate": 2.9364892905181195e-05, "Pretrain/Loss": 2.0222220420837402, "Pretrain/Loss (Raw)": 1.9092066287994385, "Pretrain/Step": 8789, "Pretrain/Step Time": 8.466270947828889} +{"Pretrain/Learning Rate": 2.9360712881136677e-05, "Pretrain/Loss": 2.021918296813965, "Pretrain/Loss (Raw)": 2.033148765563965, "Pretrain/Step": 8790, "Pretrain/Step Time": 8.466244565322995} +{"Pretrain/Learning Rate": 2.9356532731354064e-05, "Pretrain/Loss": 2.022305488586426, "Pretrain/Loss (Raw)": 1.9091846942901611, "Pretrain/Step": 8791, "Pretrain/Step Time": 8.464810224249959} +{"Pretrain/Learning Rate": 2.9352352455953915e-05, "Pretrain/Loss": 2.0211048126220703, "Pretrain/Loss (Raw)": 1.9897434711456299, "Pretrain/Step": 8792, "Pretrain/Step Time": 8.464240234345198} +{"Pretrain/Learning Rate": 2.934817205505675e-05, "Pretrain/Loss": 2.0223302841186523, "Pretrain/Loss (Raw)": 2.0613648891448975, "Pretrain/Step": 8793, "Pretrain/Step Time": 8.461318431422114} +{"Pretrain/Learning Rate": 2.93439915287831e-05, "Pretrain/Loss": 2.021094560623169, "Pretrain/Loss (Raw)": 1.9674088954925537, "Pretrain/Step": 8794, "Pretrain/Step Time": 8.464793238788843} +{"Pretrain/Learning Rate": 2.933981087725352e-05, "Pretrain/Loss": 2.0231120586395264, "Pretrain/Loss (Raw)": 2.231950521469116, "Pretrain/Step": 8795, "Pretrain/Step Time": 8.466250574216247} +{"Pretrain/Learning Rate": 2.933563010058855e-05, "Pretrain/Loss": 2.0241146087646484, "Pretrain/Loss (Raw)": 2.1273770332336426, "Pretrain/Step": 8796, "Pretrain/Step Time": 8.46044752560556} +{"Pretrain/Learning Rate": 2.9331449198908746e-05, "Pretrain/Loss": 2.022115707397461, "Pretrain/Loss (Raw)": 1.9626319408416748, "Pretrain/Step": 8797, "Pretrain/Step Time": 8.460078364238143} +{"Pretrain/Learning Rate": 2.932726817233466e-05, "Pretrain/Loss": 2.0220088958740234, "Pretrain/Loss (Raw)": 2.087536334991455, "Pretrain/Step": 8798, "Pretrain/Step Time": 8.462770611047745} +{"Pretrain/Learning Rate": 2.932308702098684e-05, "Pretrain/Loss": 2.0229134559631348, "Pretrain/Loss (Raw)": 2.23213791847229, "Pretrain/Step": 8799, "Pretrain/Step Time": 8.464375976473093} +{"Pretrain/Learning Rate": 2.931890574498586e-05, "Pretrain/Loss": 2.0245327949523926, "Pretrain/Loss (Raw)": 2.116964340209961, "Pretrain/Step": 8800, "Pretrain/Step Time": 8.46795785240829} +{"Pretrain/Learning Rate": 2.931472434445227e-05, "Pretrain/Loss": 2.0238571166992188, "Pretrain/Loss (Raw)": 1.9839506149291992, "Pretrain/Step": 8801, "Pretrain/Step Time": 8.46588247641921} +{"Pretrain/Learning Rate": 2.9310542819506648e-05, "Pretrain/Loss": 2.0250601768493652, "Pretrain/Loss (Raw)": 2.1314468383789062, "Pretrain/Step": 8802, "Pretrain/Step Time": 8.466867826879025} +{"Pretrain/Learning Rate": 2.9306361170269568e-05, "Pretrain/Loss": 2.025937795639038, "Pretrain/Loss (Raw)": 1.985622525215149, "Pretrain/Step": 8803, "Pretrain/Step Time": 8.466567495837808} +{"Pretrain/Learning Rate": 2.9302179396861595e-05, "Pretrain/Loss": 2.02608060836792, "Pretrain/Loss (Raw)": 2.260695219039917, "Pretrain/Step": 8804, "Pretrain/Step Time": 8.465861493721604} +{"Pretrain/Learning Rate": 2.9297997499403312e-05, "Pretrain/Loss": 2.0263428688049316, "Pretrain/Loss (Raw)": 2.0660572052001953, "Pretrain/Step": 8805, "Pretrain/Step Time": 8.461212236434221} +{"Pretrain/Learning Rate": 2.92938154780153e-05, "Pretrain/Loss": 2.0241479873657227, "Pretrain/Loss (Raw)": 1.94520902633667, "Pretrain/Step": 8806, "Pretrain/Step Time": 8.46604316867888} +{"Pretrain/Learning Rate": 2.9289633332818146e-05, "Pretrain/Loss": 2.0219178199768066, "Pretrain/Loss (Raw)": 1.7752158641815186, "Pretrain/Step": 8807, "Pretrain/Step Time": 8.46570291556418} +{"Pretrain/Learning Rate": 2.928545106393244e-05, "Pretrain/Loss": 2.0232596397399902, "Pretrain/Loss (Raw)": 2.0425338745117188, "Pretrain/Step": 8808, "Pretrain/Step Time": 8.46435832977295} +{"Pretrain/Learning Rate": 2.928126867147878e-05, "Pretrain/Loss": 2.022808790206909, "Pretrain/Loss (Raw)": 1.8658076524734497, "Pretrain/Step": 8809, "Pretrain/Step Time": 8.46714018471539} +{"Pretrain/Learning Rate": 2.9277086155577743e-05, "Pretrain/Loss": 2.0243170261383057, "Pretrain/Loss (Raw)": 2.2733066082000732, "Pretrain/Step": 8810, "Pretrain/Step Time": 8.465608179569244} +{"Pretrain/Learning Rate": 2.9272903516349947e-05, "Pretrain/Loss": 2.02108097076416, "Pretrain/Loss (Raw)": 1.8749622106552124, "Pretrain/Step": 8811, "Pretrain/Step Time": 8.473893415182829} +{"Pretrain/Learning Rate": 2.926872075391599e-05, "Pretrain/Loss": 2.0203323364257812, "Pretrain/Loss (Raw)": 1.9071444272994995, "Pretrain/Step": 8812, "Pretrain/Step Time": 8.473490059375763} +{"Pretrain/Learning Rate": 2.926453786839648e-05, "Pretrain/Loss": 2.019498109817505, "Pretrain/Loss (Raw)": 1.931349515914917, "Pretrain/Step": 8813, "Pretrain/Step Time": 8.467514554038644} +{"Pretrain/Learning Rate": 2.9260354859912032e-05, "Pretrain/Loss": 2.017195701599121, "Pretrain/Loss (Raw)": 1.9809257984161377, "Pretrain/Step": 8814, "Pretrain/Step Time": 8.470860248431563} +{"Pretrain/Learning Rate": 2.9256171728583254e-05, "Pretrain/Loss": 2.015531539916992, "Pretrain/Loss (Raw)": 1.851475715637207, "Pretrain/Step": 8815, "Pretrain/Step Time": 8.474081745371222} +{"Pretrain/Learning Rate": 2.9251988474530755e-05, "Pretrain/Loss": 2.0153648853302, "Pretrain/Loss (Raw)": 1.9697844982147217, "Pretrain/Step": 8816, "Pretrain/Step Time": 8.474991230294108} +{"Pretrain/Learning Rate": 2.9247805097875174e-05, "Pretrain/Loss": 2.016011953353882, "Pretrain/Loss (Raw)": 2.0576632022857666, "Pretrain/Step": 8817, "Pretrain/Step Time": 8.473732376471162} +{"Pretrain/Learning Rate": 2.9243621598737124e-05, "Pretrain/Loss": 2.0156655311584473, "Pretrain/Loss (Raw)": 2.0039899349212646, "Pretrain/Step": 8818, "Pretrain/Step Time": 8.473970871418715} +{"Pretrain/Learning Rate": 2.9239437977237244e-05, "Pretrain/Loss": 2.0154805183410645, "Pretrain/Loss (Raw)": 1.9363218545913696, "Pretrain/Step": 8819, "Pretrain/Step Time": 8.47423785738647} +{"Pretrain/Learning Rate": 2.923525423349615e-05, "Pretrain/Loss": 2.016690492630005, "Pretrain/Loss (Raw)": 2.2189881801605225, "Pretrain/Step": 8820, "Pretrain/Step Time": 8.474687373265624} +{"Pretrain/Learning Rate": 2.9231070367634488e-05, "Pretrain/Loss": 2.0182600021362305, "Pretrain/Loss (Raw)": 2.147311210632324, "Pretrain/Step": 8821, "Pretrain/Step Time": 8.479057379066944} +{"Pretrain/Learning Rate": 2.9226886379772895e-05, "Pretrain/Loss": 2.0180373191833496, "Pretrain/Loss (Raw)": 2.0787670612335205, "Pretrain/Step": 8822, "Pretrain/Step Time": 8.478439902886748} +{"Pretrain/Learning Rate": 2.922270227003201e-05, "Pretrain/Loss": 2.0158233642578125, "Pretrain/Loss (Raw)": 1.8139601945877075, "Pretrain/Step": 8823, "Pretrain/Step Time": 8.479064170271158} +{"Pretrain/Learning Rate": 2.9218518038532495e-05, "Pretrain/Loss": 2.0149307250976562, "Pretrain/Loss (Raw)": 1.7488858699798584, "Pretrain/Step": 8824, "Pretrain/Step Time": 8.478860093280673} +{"Pretrain/Learning Rate": 2.9214333685394974e-05, "Pretrain/Loss": 2.0122311115264893, "Pretrain/Loss (Raw)": 1.7896533012390137, "Pretrain/Step": 8825, "Pretrain/Step Time": 8.47517684288323} +{"Pretrain/Learning Rate": 2.921014921074011e-05, "Pretrain/Loss": 2.0126900672912598, "Pretrain/Loss (Raw)": 1.9791803359985352, "Pretrain/Step": 8826, "Pretrain/Step Time": 8.473425913602114} +{"Pretrain/Learning Rate": 2.920596461468857e-05, "Pretrain/Loss": 2.0135085582733154, "Pretrain/Loss (Raw)": 2.2218618392944336, "Pretrain/Step": 8827, "Pretrain/Step Time": 8.480442721396685} +{"Pretrain/Learning Rate": 2.9201779897360997e-05, "Pretrain/Loss": 2.012274742126465, "Pretrain/Loss (Raw)": 1.8928792476654053, "Pretrain/Step": 8828, "Pretrain/Step Time": 8.478276012465358} +{"Pretrain/Learning Rate": 2.919759505887807e-05, "Pretrain/Loss": 2.0123727321624756, "Pretrain/Loss (Raw)": 2.0581581592559814, "Pretrain/Step": 8829, "Pretrain/Step Time": 8.478155827149749} +{"Pretrain/Learning Rate": 2.9193410099360446e-05, "Pretrain/Loss": 2.0133676528930664, "Pretrain/Loss (Raw)": 2.023444175720215, "Pretrain/Step": 8830, "Pretrain/Step Time": 8.471162980422378} +{"Pretrain/Learning Rate": 2.9189225018928794e-05, "Pretrain/Loss": 2.010800361633301, "Pretrain/Loss (Raw)": 1.8763139247894287, "Pretrain/Step": 8831, "Pretrain/Step Time": 8.477762833237648} +{"Pretrain/Learning Rate": 2.9185039817703797e-05, "Pretrain/Loss": 2.014573097229004, "Pretrain/Loss (Raw)": 2.3948888778686523, "Pretrain/Step": 8832, "Pretrain/Step Time": 8.478777207434177} +{"Pretrain/Learning Rate": 2.9180854495806126e-05, "Pretrain/Loss": 2.0150351524353027, "Pretrain/Loss (Raw)": 2.1416449546813965, "Pretrain/Step": 8833, "Pretrain/Step Time": 8.4803383089602} +{"Pretrain/Learning Rate": 2.9176669053356465e-05, "Pretrain/Loss": 2.0124149322509766, "Pretrain/Loss (Raw)": 1.825617790222168, "Pretrain/Step": 8834, "Pretrain/Step Time": 8.478881653398275} +{"Pretrain/Learning Rate": 2.9172483490475498e-05, "Pretrain/Loss": 2.0100932121276855, "Pretrain/Loss (Raw)": 2.0473415851593018, "Pretrain/Step": 8835, "Pretrain/Step Time": 8.486916977912188} +{"Pretrain/Learning Rate": 2.9168297807283905e-05, "Pretrain/Loss": 2.0093436241149902, "Pretrain/Loss (Raw)": 1.8797526359558105, "Pretrain/Step": 8836, "Pretrain/Step Time": 8.481604466214776} +{"Pretrain/Learning Rate": 2.9164112003902383e-05, "Pretrain/Loss": 2.0118801593780518, "Pretrain/Loss (Raw)": 1.9744675159454346, "Pretrain/Step": 8837, "Pretrain/Step Time": 8.483821319416165} +{"Pretrain/Learning Rate": 2.9159926080451626e-05, "Pretrain/Loss": 2.0113883018493652, "Pretrain/Loss (Raw)": 1.9999384880065918, "Pretrain/Step": 8838, "Pretrain/Step Time": 8.486859824508429} +{"Pretrain/Learning Rate": 2.9155740037052337e-05, "Pretrain/Loss": 2.011307716369629, "Pretrain/Loss (Raw)": 1.9353370666503906, "Pretrain/Step": 8839, "Pretrain/Step Time": 8.484356738626957} +{"Pretrain/Learning Rate": 2.915155387382521e-05, "Pretrain/Loss": 2.0101938247680664, "Pretrain/Loss (Raw)": 1.8209131956100464, "Pretrain/Step": 8840, "Pretrain/Step Time": 8.48167810216546} +{"Pretrain/Learning Rate": 2.914736759089096e-05, "Pretrain/Loss": 2.0104994773864746, "Pretrain/Loss (Raw)": 2.1005373001098633, "Pretrain/Step": 8841, "Pretrain/Step Time": 8.484720816835761} +{"Pretrain/Learning Rate": 2.914318118837029e-05, "Pretrain/Loss": 2.0112643241882324, "Pretrain/Loss (Raw)": 1.8919923305511475, "Pretrain/Step": 8842, "Pretrain/Step Time": 8.48822877369821} +{"Pretrain/Learning Rate": 2.91389946663839e-05, "Pretrain/Loss": 2.010810136795044, "Pretrain/Loss (Raw)": 2.0114378929138184, "Pretrain/Step": 8843, "Pretrain/Step Time": 8.483647629618645} +{"Pretrain/Learning Rate": 2.9134808025052524e-05, "Pretrain/Loss": 2.01365065574646, "Pretrain/Loss (Raw)": 2.1805336475372314, "Pretrain/Step": 8844, "Pretrain/Step Time": 8.480957075953484} +{"Pretrain/Learning Rate": 2.9130621264496872e-05, "Pretrain/Loss": 2.013801336288452, "Pretrain/Loss (Raw)": 1.9921989440917969, "Pretrain/Step": 8845, "Pretrain/Step Time": 8.48329059407115} +{"Pretrain/Learning Rate": 2.912643438483767e-05, "Pretrain/Loss": 2.015277862548828, "Pretrain/Loss (Raw)": 2.1523633003234863, "Pretrain/Step": 8846, "Pretrain/Step Time": 8.476190885528922} +{"Pretrain/Learning Rate": 2.912224738619564e-05, "Pretrain/Loss": 2.0157742500305176, "Pretrain/Loss (Raw)": 1.9864327907562256, "Pretrain/Step": 8847, "Pretrain/Step Time": 8.47872600145638} +{"Pretrain/Learning Rate": 2.911806026869151e-05, "Pretrain/Loss": 2.017517566680908, "Pretrain/Loss (Raw)": 2.1663362979888916, "Pretrain/Step": 8848, "Pretrain/Step Time": 8.47834387049079} +{"Pretrain/Learning Rate": 2.9113873032446016e-05, "Pretrain/Loss": 2.019360303878784, "Pretrain/Loss (Raw)": 2.0728373527526855, "Pretrain/Step": 8849, "Pretrain/Step Time": 8.481321828439832} +{"Pretrain/Learning Rate": 2.9109685677579895e-05, "Pretrain/Loss": 2.0199708938598633, "Pretrain/Loss (Raw)": 2.0438339710235596, "Pretrain/Step": 8850, "Pretrain/Step Time": 8.480709390714765} +{"Pretrain/Learning Rate": 2.910549820421389e-05, "Pretrain/Loss": 2.0211730003356934, "Pretrain/Loss (Raw)": 2.1299970149993896, "Pretrain/Step": 8851, "Pretrain/Step Time": 8.483819095417857} +{"Pretrain/Learning Rate": 2.910131061246873e-05, "Pretrain/Loss": 2.02323842048645, "Pretrain/Loss (Raw)": 2.195207357406616, "Pretrain/Step": 8852, "Pretrain/Step Time": 8.484002474695444} +{"Pretrain/Learning Rate": 2.9097122902465175e-05, "Pretrain/Loss": 2.0255656242370605, "Pretrain/Loss (Raw)": 2.1344709396362305, "Pretrain/Step": 8853, "Pretrain/Step Time": 8.483635880053043} +{"Pretrain/Learning Rate": 2.9092935074323963e-05, "Pretrain/Loss": 2.026362657546997, "Pretrain/Loss (Raw)": 2.1403632164001465, "Pretrain/Step": 8854, "Pretrain/Step Time": 8.483283136039972} +{"Pretrain/Learning Rate": 2.9088747128165856e-05, "Pretrain/Loss": 2.0264806747436523, "Pretrain/Loss (Raw)": 2.0517725944519043, "Pretrain/Step": 8855, "Pretrain/Step Time": 8.485711926594377} +{"Pretrain/Learning Rate": 2.9084559064111616e-05, "Pretrain/Loss": 2.02775239944458, "Pretrain/Loss (Raw)": 2.1180267333984375, "Pretrain/Step": 8856, "Pretrain/Step Time": 8.487381404265761} +{"Pretrain/Learning Rate": 2.908037088228198e-05, "Pretrain/Loss": 2.026597499847412, "Pretrain/Loss (Raw)": 1.8346925973892212, "Pretrain/Step": 8857, "Pretrain/Step Time": 8.482985500246286} +{"Pretrain/Learning Rate": 2.9076182582797738e-05, "Pretrain/Loss": 2.0284500122070312, "Pretrain/Loss (Raw)": 2.125448226928711, "Pretrain/Step": 8858, "Pretrain/Step Time": 8.485904777422547} +{"Pretrain/Learning Rate": 2.907199416577964e-05, "Pretrain/Loss": 2.024411201477051, "Pretrain/Loss (Raw)": 1.4685750007629395, "Pretrain/Step": 8859, "Pretrain/Step Time": 8.486334783956409} +{"Pretrain/Learning Rate": 2.906780563134846e-05, "Pretrain/Loss": 2.0239858627319336, "Pretrain/Loss (Raw)": 2.062157392501831, "Pretrain/Step": 8860, "Pretrain/Step Time": 8.486298440024257} +{"Pretrain/Learning Rate": 2.906361697962498e-05, "Pretrain/Loss": 2.0238566398620605, "Pretrain/Loss (Raw)": 2.0417511463165283, "Pretrain/Step": 8861, "Pretrain/Step Time": 8.48637836240232} +{"Pretrain/Learning Rate": 2.905942821072996e-05, "Pretrain/Loss": 2.0224928855895996, "Pretrain/Loss (Raw)": 1.7769954204559326, "Pretrain/Step": 8862, "Pretrain/Step Time": 8.482472201809287} +{"Pretrain/Learning Rate": 2.9055239324784188e-05, "Pretrain/Loss": 2.0214555263519287, "Pretrain/Loss (Raw)": 1.8978201150894165, "Pretrain/Step": 8863, "Pretrain/Step Time": 8.483293389901519} +{"Pretrain/Learning Rate": 2.9051050321908458e-05, "Pretrain/Loss": 2.0219080448150635, "Pretrain/Loss (Raw)": 2.0814332962036133, "Pretrain/Step": 8864, "Pretrain/Step Time": 8.482798798009753} +{"Pretrain/Learning Rate": 2.904686120222354e-05, "Pretrain/Loss": 2.021209239959717, "Pretrain/Loss (Raw)": 1.8380346298217773, "Pretrain/Step": 8865, "Pretrain/Step Time": 8.484365360811353} +{"Pretrain/Learning Rate": 2.904267196585024e-05, "Pretrain/Loss": 2.022793769836426, "Pretrain/Loss (Raw)": 2.1094138622283936, "Pretrain/Step": 8866, "Pretrain/Step Time": 8.484812112525105} +{"Pretrain/Learning Rate": 2.9038482612909335e-05, "Pretrain/Loss": 2.0221972465515137, "Pretrain/Loss (Raw)": 1.7561057806015015, "Pretrain/Step": 8867, "Pretrain/Step Time": 8.47880713827908} +{"Pretrain/Learning Rate": 2.9034293143521634e-05, "Pretrain/Loss": 2.021597385406494, "Pretrain/Loss (Raw)": 1.9859620332717896, "Pretrain/Step": 8868, "Pretrain/Step Time": 8.489402070641518} +{"Pretrain/Learning Rate": 2.9030103557807937e-05, "Pretrain/Loss": 2.021481990814209, "Pretrain/Loss (Raw)": 2.0537331104278564, "Pretrain/Step": 8869, "Pretrain/Step Time": 8.48503608815372} +{"Pretrain/Learning Rate": 2.902591385588904e-05, "Pretrain/Loss": 2.0229732990264893, "Pretrain/Loss (Raw)": 2.1332736015319824, "Pretrain/Step": 8870, "Pretrain/Step Time": 8.486824743449688} +{"Pretrain/Learning Rate": 2.902172403788576e-05, "Pretrain/Loss": 2.023437738418579, "Pretrain/Loss (Raw)": 2.0030157566070557, "Pretrain/Step": 8871, "Pretrain/Step Time": 8.484698565676808} +{"Pretrain/Learning Rate": 2.90175341039189e-05, "Pretrain/Loss": 2.024993896484375, "Pretrain/Loss (Raw)": 2.187664270401001, "Pretrain/Step": 8872, "Pretrain/Step Time": 8.486138083040714} +{"Pretrain/Learning Rate": 2.9013344054109277e-05, "Pretrain/Loss": 2.02439546585083, "Pretrain/Loss (Raw)": 2.0472095012664795, "Pretrain/Step": 8873, "Pretrain/Step Time": 8.485628098249435} +{"Pretrain/Learning Rate": 2.9009153888577706e-05, "Pretrain/Loss": 2.023935317993164, "Pretrain/Loss (Raw)": 1.9898608922958374, "Pretrain/Step": 8874, "Pretrain/Step Time": 8.481123501434922} +{"Pretrain/Learning Rate": 2.9004963607445006e-05, "Pretrain/Loss": 2.0246052742004395, "Pretrain/Loss (Raw)": 2.1443114280700684, "Pretrain/Step": 8875, "Pretrain/Step Time": 8.480171259492636} +{"Pretrain/Learning Rate": 2.900077321083201e-05, "Pretrain/Loss": 2.025345802307129, "Pretrain/Loss (Raw)": 2.1659836769104004, "Pretrain/Step": 8876, "Pretrain/Step Time": 8.484194405376911} +{"Pretrain/Learning Rate": 2.8996582698859536e-05, "Pretrain/Loss": 2.025787353515625, "Pretrain/Loss (Raw)": 2.0538554191589355, "Pretrain/Step": 8877, "Pretrain/Step Time": 8.48093318939209} +{"Pretrain/Learning Rate": 2.899239207164842e-05, "Pretrain/Loss": 2.028959274291992, "Pretrain/Loss (Raw)": 1.9063984155654907, "Pretrain/Step": 8878, "Pretrain/Step Time": 8.47701677121222} +{"Pretrain/Learning Rate": 2.8988201329319492e-05, "Pretrain/Loss": 2.029656410217285, "Pretrain/Loss (Raw)": 2.0178792476654053, "Pretrain/Step": 8879, "Pretrain/Step Time": 8.471141247078776} +{"Pretrain/Learning Rate": 2.898401047199359e-05, "Pretrain/Loss": 2.029154062271118, "Pretrain/Loss (Raw)": 2.0837931632995605, "Pretrain/Step": 8880, "Pretrain/Step Time": 8.471797823905945} +{"Pretrain/Learning Rate": 2.897981949979155e-05, "Pretrain/Loss": 2.027209758758545, "Pretrain/Loss (Raw)": 1.7196636199951172, "Pretrain/Step": 8881, "Pretrain/Step Time": 8.473662639036775} +{"Pretrain/Learning Rate": 2.897562841283422e-05, "Pretrain/Loss": 2.0278756618499756, "Pretrain/Loss (Raw)": 2.0538785457611084, "Pretrain/Step": 8882, "Pretrain/Step Time": 8.473066905513406} +{"Pretrain/Learning Rate": 2.8971437211242458e-05, "Pretrain/Loss": 2.0281548500061035, "Pretrain/Loss (Raw)": 1.9812225103378296, "Pretrain/Step": 8883, "Pretrain/Step Time": 8.474292278289795} +{"Pretrain/Learning Rate": 2.8967245895137096e-05, "Pretrain/Loss": 2.028205633163452, "Pretrain/Loss (Raw)": 1.9880868196487427, "Pretrain/Step": 8884, "Pretrain/Step Time": 8.477384008467197} +{"Pretrain/Learning Rate": 2.8963054464638993e-05, "Pretrain/Loss": 2.0262928009033203, "Pretrain/Loss (Raw)": 1.8758591413497925, "Pretrain/Step": 8885, "Pretrain/Step Time": 8.475897153839469} +{"Pretrain/Learning Rate": 2.8958862919869013e-05, "Pretrain/Loss": 2.0261411666870117, "Pretrain/Loss (Raw)": 2.0545027256011963, "Pretrain/Step": 8886, "Pretrain/Step Time": 8.4736810605973} +{"Pretrain/Learning Rate": 2.8954671260948008e-05, "Pretrain/Loss": 2.027195930480957, "Pretrain/Loss (Raw)": 2.043614387512207, "Pretrain/Step": 8887, "Pretrain/Step Time": 8.475807381793857} +{"Pretrain/Learning Rate": 2.8950479487996853e-05, "Pretrain/Loss": 2.023782253265381, "Pretrain/Loss (Raw)": 1.714530110359192, "Pretrain/Step": 8888, "Pretrain/Step Time": 8.476138204336166} +{"Pretrain/Learning Rate": 2.89462876011364e-05, "Pretrain/Loss": 2.0227231979370117, "Pretrain/Loss (Raw)": 2.1023764610290527, "Pretrain/Step": 8889, "Pretrain/Step Time": 8.474698383361101} +{"Pretrain/Learning Rate": 2.8942095600487523e-05, "Pretrain/Loss": 2.0217247009277344, "Pretrain/Loss (Raw)": 1.946232795715332, "Pretrain/Step": 8890, "Pretrain/Step Time": 8.468149611726403} +{"Pretrain/Learning Rate": 2.8937903486171102e-05, "Pretrain/Loss": 2.023365020751953, "Pretrain/Loss (Raw)": 2.128713607788086, "Pretrain/Step": 8891, "Pretrain/Step Time": 8.470279168337584} +{"Pretrain/Learning Rate": 2.893371125830801e-05, "Pretrain/Loss": 2.0256900787353516, "Pretrain/Loss (Raw)": 2.1616322994232178, "Pretrain/Step": 8892, "Pretrain/Step Time": 8.474471231922507} +{"Pretrain/Learning Rate": 2.8929518917019133e-05, "Pretrain/Loss": 2.0251688957214355, "Pretrain/Loss (Raw)": 2.014589786529541, "Pretrain/Step": 8893, "Pretrain/Step Time": 8.471941344439983} +{"Pretrain/Learning Rate": 2.892532646242534e-05, "Pretrain/Loss": 2.026210308074951, "Pretrain/Loss (Raw)": 2.3009495735168457, "Pretrain/Step": 8894, "Pretrain/Step Time": 8.468656733632088} +{"Pretrain/Learning Rate": 2.892113389464753e-05, "Pretrain/Loss": 2.0270752906799316, "Pretrain/Loss (Raw)": 2.0651540756225586, "Pretrain/Step": 8895, "Pretrain/Step Time": 8.465918051078916} +{"Pretrain/Learning Rate": 2.8916941213806582e-05, "Pretrain/Loss": 2.024914503097534, "Pretrain/Loss (Raw)": 2.0635273456573486, "Pretrain/Step": 8896, "Pretrain/Step Time": 8.469817137345672} +{"Pretrain/Learning Rate": 2.89127484200234e-05, "Pretrain/Loss": 2.0241732597351074, "Pretrain/Loss (Raw)": 2.057812213897705, "Pretrain/Step": 8897, "Pretrain/Step Time": 8.477001750841737} +{"Pretrain/Learning Rate": 2.8908555513418877e-05, "Pretrain/Loss": 2.023686408996582, "Pretrain/Loss (Raw)": 1.8095510005950928, "Pretrain/Step": 8898, "Pretrain/Step Time": 8.478069085627794} +{"Pretrain/Learning Rate": 2.8904362494113912e-05, "Pretrain/Loss": 2.0225720405578613, "Pretrain/Loss (Raw)": 1.8604321479797363, "Pretrain/Step": 8899, "Pretrain/Step Time": 8.482380906119943} +{"Pretrain/Learning Rate": 2.89001693622294e-05, "Pretrain/Loss": 2.022825241088867, "Pretrain/Loss (Raw)": 2.151136636734009, "Pretrain/Step": 8900, "Pretrain/Step Time": 8.480292553082108} +{"Pretrain/Learning Rate": 2.8895976117886258e-05, "Pretrain/Loss": 2.020543336868286, "Pretrain/Loss (Raw)": 1.7911709547042847, "Pretrain/Step": 8901, "Pretrain/Step Time": 8.483495688065886} +{"Pretrain/Learning Rate": 2.8891782761205387e-05, "Pretrain/Loss": 2.0199153423309326, "Pretrain/Loss (Raw)": 1.9393576383590698, "Pretrain/Step": 8902, "Pretrain/Step Time": 8.488974008709192} +{"Pretrain/Learning Rate": 2.8887589292307717e-05, "Pretrain/Loss": 2.021512508392334, "Pretrain/Loss (Raw)": 2.075172185897827, "Pretrain/Step": 8903, "Pretrain/Step Time": 8.481757033616304} +{"Pretrain/Learning Rate": 2.8883395711314137e-05, "Pretrain/Loss": 2.021458148956299, "Pretrain/Loss (Raw)": 1.9240000247955322, "Pretrain/Step": 8904, "Pretrain/Step Time": 8.479929748922586} +{"Pretrain/Learning Rate": 2.8879202018345587e-05, "Pretrain/Loss": 2.0196170806884766, "Pretrain/Loss (Raw)": 1.9320194721221924, "Pretrain/Step": 8905, "Pretrain/Step Time": 8.481070306152105} +{"Pretrain/Learning Rate": 2.8875008213522975e-05, "Pretrain/Loss": 2.018159866333008, "Pretrain/Loss (Raw)": 1.814980149269104, "Pretrain/Step": 8906, "Pretrain/Step Time": 8.481621455401182} +{"Pretrain/Learning Rate": 2.887081429696723e-05, "Pretrain/Loss": 2.0189900398254395, "Pretrain/Loss (Raw)": 2.1483561992645264, "Pretrain/Step": 8907, "Pretrain/Step Time": 8.476714849472046} +{"Pretrain/Learning Rate": 2.8866620268799293e-05, "Pretrain/Loss": 2.019620895385742, "Pretrain/Loss (Raw)": 1.9132091999053955, "Pretrain/Step": 8908, "Pretrain/Step Time": 8.479796763509512} +{"Pretrain/Learning Rate": 2.8862426129140084e-05, "Pretrain/Loss": 2.016169786453247, "Pretrain/Loss (Raw)": 1.7210922241210938, "Pretrain/Step": 8909, "Pretrain/Step Time": 8.481753202155232} +{"Pretrain/Learning Rate": 2.885823187811054e-05, "Pretrain/Loss": 2.015730381011963, "Pretrain/Loss (Raw)": 2.0292038917541504, "Pretrain/Step": 8910, "Pretrain/Step Time": 8.487425250932574} +{"Pretrain/Learning Rate": 2.8854037515831596e-05, "Pretrain/Loss": 2.0168991088867188, "Pretrain/Loss (Raw)": 2.1485915184020996, "Pretrain/Step": 8911, "Pretrain/Step Time": 8.478970168158412} +{"Pretrain/Learning Rate": 2.88498430424242e-05, "Pretrain/Loss": 2.0135579109191895, "Pretrain/Loss (Raw)": 2.1694352626800537, "Pretrain/Step": 8912, "Pretrain/Step Time": 8.480421006679535} +{"Pretrain/Learning Rate": 2.884564845800929e-05, "Pretrain/Loss": 2.0137062072753906, "Pretrain/Loss (Raw)": 2.0836181640625, "Pretrain/Step": 8913, "Pretrain/Step Time": 8.481182897463441} +{"Pretrain/Learning Rate": 2.8841453762707825e-05, "Pretrain/Loss": 2.0135021209716797, "Pretrain/Loss (Raw)": 1.9785969257354736, "Pretrain/Step": 8914, "Pretrain/Step Time": 8.482268726453185} +{"Pretrain/Learning Rate": 2.8837258956640746e-05, "Pretrain/Loss": 2.0115528106689453, "Pretrain/Loss (Raw)": 1.9691418409347534, "Pretrain/Step": 8915, "Pretrain/Step Time": 8.487316105514765} +{"Pretrain/Learning Rate": 2.883306403992901e-05, "Pretrain/Loss": 2.0100207328796387, "Pretrain/Loss (Raw)": 2.0760979652404785, "Pretrain/Step": 8916, "Pretrain/Step Time": 8.491550447419286} +{"Pretrain/Learning Rate": 2.882886901269357e-05, "Pretrain/Loss": 2.009981155395508, "Pretrain/Loss (Raw)": 1.9041603803634644, "Pretrain/Step": 8917, "Pretrain/Step Time": 8.487105689942837} +{"Pretrain/Learning Rate": 2.8824673875055397e-05, "Pretrain/Loss": 2.0108983516693115, "Pretrain/Loss (Raw)": 2.1505348682403564, "Pretrain/Step": 8918, "Pretrain/Step Time": 8.4909996856004} +{"Pretrain/Learning Rate": 2.8820478627135448e-05, "Pretrain/Loss": 2.0117459297180176, "Pretrain/Loss (Raw)": 2.017698049545288, "Pretrain/Step": 8919, "Pretrain/Step Time": 8.490983286872506} +{"Pretrain/Learning Rate": 2.8816283269054694e-05, "Pretrain/Loss": 2.0112810134887695, "Pretrain/Loss (Raw)": 1.9302082061767578, "Pretrain/Step": 8920, "Pretrain/Step Time": 8.490391789004207} +{"Pretrain/Learning Rate": 2.88120878009341e-05, "Pretrain/Loss": 2.011216640472412, "Pretrain/Loss (Raw)": 2.0531394481658936, "Pretrain/Step": 8921, "Pretrain/Step Time": 8.49273013882339} +{"Pretrain/Learning Rate": 2.880789222289464e-05, "Pretrain/Loss": 2.0136804580688477, "Pretrain/Loss (Raw)": 2.2827773094177246, "Pretrain/Step": 8922, "Pretrain/Step Time": 8.484021181240678} +{"Pretrain/Learning Rate": 2.8803696535057288e-05, "Pretrain/Loss": 2.010608673095703, "Pretrain/Loss (Raw)": 1.8387600183486938, "Pretrain/Step": 8923, "Pretrain/Step Time": 8.482660494744778} +{"Pretrain/Learning Rate": 2.8799500737543033e-05, "Pretrain/Loss": 2.0113768577575684, "Pretrain/Loss (Raw)": 2.2256906032562256, "Pretrain/Step": 8924, "Pretrain/Step Time": 8.483283264562488} +{"Pretrain/Learning Rate": 2.8795304830472856e-05, "Pretrain/Loss": 2.012105941772461, "Pretrain/Loss (Raw)": 2.055969715118408, "Pretrain/Step": 8925, "Pretrain/Step Time": 8.483753206208348} +{"Pretrain/Learning Rate": 2.8791108813967733e-05, "Pretrain/Loss": 2.0102648735046387, "Pretrain/Loss (Raw)": 1.8518871068954468, "Pretrain/Step": 8926, "Pretrain/Step Time": 8.481825534254313} +{"Pretrain/Learning Rate": 2.878691268814866e-05, "Pretrain/Loss": 2.0067172050476074, "Pretrain/Loss (Raw)": 1.778030514717102, "Pretrain/Step": 8927, "Pretrain/Step Time": 8.482459634542465} +{"Pretrain/Learning Rate": 2.878271645313663e-05, "Pretrain/Loss": 2.006725549697876, "Pretrain/Loss (Raw)": 2.1180214881896973, "Pretrain/Step": 8928, "Pretrain/Step Time": 8.47623285278678} +{"Pretrain/Learning Rate": 2.8778520109052643e-05, "Pretrain/Loss": 2.0070371627807617, "Pretrain/Loss (Raw)": 2.023831844329834, "Pretrain/Step": 8929, "Pretrain/Step Time": 8.479311591014266} +{"Pretrain/Learning Rate": 2.8774323656017686e-05, "Pretrain/Loss": 2.0070033073425293, "Pretrain/Loss (Raw)": 2.1271159648895264, "Pretrain/Step": 8930, "Pretrain/Step Time": 8.474788112565875} +{"Pretrain/Learning Rate": 2.8770127094152772e-05, "Pretrain/Loss": 2.0069336891174316, "Pretrain/Loss (Raw)": 1.9767353534698486, "Pretrain/Step": 8931, "Pretrain/Step Time": 8.477030577138066} +{"Pretrain/Learning Rate": 2.8765930423578897e-05, "Pretrain/Loss": 2.0062880516052246, "Pretrain/Loss (Raw)": 2.1780378818511963, "Pretrain/Step": 8932, "Pretrain/Step Time": 8.483119830489159} +{"Pretrain/Learning Rate": 2.8761733644417076e-05, "Pretrain/Loss": 2.0060524940490723, "Pretrain/Loss (Raw)": 2.0358972549438477, "Pretrain/Step": 8933, "Pretrain/Step Time": 8.482622183859348} +{"Pretrain/Learning Rate": 2.875753675678831e-05, "Pretrain/Loss": 2.0060083866119385, "Pretrain/Loss (Raw)": 1.939579963684082, "Pretrain/Step": 8934, "Pretrain/Step Time": 8.479102559387684} +{"Pretrain/Learning Rate": 2.8753339760813634e-05, "Pretrain/Loss": 2.0086472034454346, "Pretrain/Loss (Raw)": 2.1129872798919678, "Pretrain/Step": 8935, "Pretrain/Step Time": 8.479742471128702} +{"Pretrain/Learning Rate": 2.8749142656614042e-05, "Pretrain/Loss": 2.0078611373901367, "Pretrain/Loss (Raw)": 1.9419044256210327, "Pretrain/Step": 8936, "Pretrain/Step Time": 8.482330344617367} +{"Pretrain/Learning Rate": 2.8744945444310566e-05, "Pretrain/Loss": 2.006530284881592, "Pretrain/Loss (Raw)": 1.6954805850982666, "Pretrain/Step": 8937, "Pretrain/Step Time": 8.482114676386118} +{"Pretrain/Learning Rate": 2.874074812402423e-05, "Pretrain/Loss": 2.0058748722076416, "Pretrain/Loss (Raw)": 2.189392566680908, "Pretrain/Step": 8938, "Pretrain/Step Time": 8.483909884467721} +{"Pretrain/Learning Rate": 2.8736550695876054e-05, "Pretrain/Loss": 2.0056354999542236, "Pretrain/Loss (Raw)": 1.8443297147750854, "Pretrain/Step": 8939, "Pretrain/Step Time": 8.478125622496009} +{"Pretrain/Learning Rate": 2.873235315998708e-05, "Pretrain/Loss": 2.0077831745147705, "Pretrain/Loss (Raw)": 2.182028293609619, "Pretrain/Step": 8940, "Pretrain/Step Time": 8.47767337411642} +{"Pretrain/Learning Rate": 2.8728155516478334e-05, "Pretrain/Loss": 2.0073187351226807, "Pretrain/Loss (Raw)": 1.871920108795166, "Pretrain/Step": 8941, "Pretrain/Step Time": 8.474676214158535} +{"Pretrain/Learning Rate": 2.8723957765470844e-05, "Pretrain/Loss": 2.0081627368927, "Pretrain/Loss (Raw)": 2.088953971862793, "Pretrain/Step": 8942, "Pretrain/Step Time": 8.47491928935051} +{"Pretrain/Learning Rate": 2.871975990708566e-05, "Pretrain/Loss": 2.0094094276428223, "Pretrain/Loss (Raw)": 2.011063575744629, "Pretrain/Step": 8943, "Pretrain/Step Time": 8.472861122339964} +{"Pretrain/Learning Rate": 2.8715561941443826e-05, "Pretrain/Loss": 2.010136127471924, "Pretrain/Loss (Raw)": 2.062809467315674, "Pretrain/Step": 8944, "Pretrain/Step Time": 8.470062775537372} +{"Pretrain/Learning Rate": 2.8711363868666375e-05, "Pretrain/Loss": 2.0099544525146484, "Pretrain/Loss (Raw)": 2.0343799591064453, "Pretrain/Step": 8945, "Pretrain/Step Time": 8.467019872739911} +{"Pretrain/Learning Rate": 2.8707165688874372e-05, "Pretrain/Loss": 2.008636713027954, "Pretrain/Loss (Raw)": 1.8353278636932373, "Pretrain/Step": 8946, "Pretrain/Step Time": 8.4648167360574} +{"Pretrain/Learning Rate": 2.870296740218885e-05, "Pretrain/Loss": 2.0085816383361816, "Pretrain/Loss (Raw)": 1.9292680025100708, "Pretrain/Step": 8947, "Pretrain/Step Time": 8.462956875562668} +{"Pretrain/Learning Rate": 2.869876900873088e-05, "Pretrain/Loss": 2.0080490112304688, "Pretrain/Loss (Raw)": 2.150819778442383, "Pretrain/Step": 8948, "Pretrain/Step Time": 8.470015352591872} +{"Pretrain/Learning Rate": 2.869457050862151e-05, "Pretrain/Loss": 2.0066487789154053, "Pretrain/Loss (Raw)": 1.9680649042129517, "Pretrain/Step": 8949, "Pretrain/Step Time": 8.469797112047672} +{"Pretrain/Learning Rate": 2.8690371901981804e-05, "Pretrain/Loss": 2.005833387374878, "Pretrain/Loss (Raw)": 1.974401831626892, "Pretrain/Step": 8950, "Pretrain/Step Time": 8.471607025712729} +{"Pretrain/Learning Rate": 2.8686173188932836e-05, "Pretrain/Loss": 2.009075403213501, "Pretrain/Loss (Raw)": 2.2289459705352783, "Pretrain/Step": 8951, "Pretrain/Step Time": 8.47357857041061} +{"Pretrain/Learning Rate": 2.868197436959565e-05, "Pretrain/Loss": 2.012007236480713, "Pretrain/Loss (Raw)": 2.124173879623413, "Pretrain/Step": 8952, "Pretrain/Step Time": 8.469805540516973} +{"Pretrain/Learning Rate": 2.867777544409133e-05, "Pretrain/Loss": 2.0124688148498535, "Pretrain/Loss (Raw)": 1.8487200736999512, "Pretrain/Step": 8953, "Pretrain/Step Time": 8.472186105325818} +{"Pretrain/Learning Rate": 2.8673576412540953e-05, "Pretrain/Loss": 2.0151994228363037, "Pretrain/Loss (Raw)": 2.328700542449951, "Pretrain/Step": 8954, "Pretrain/Step Time": 8.474685257300735} +{"Pretrain/Learning Rate": 2.8669377275065585e-05, "Pretrain/Loss": 2.0138659477233887, "Pretrain/Loss (Raw)": 2.051179885864258, "Pretrain/Step": 8955, "Pretrain/Step Time": 8.471742672845721} +{"Pretrain/Learning Rate": 2.8665178031786315e-05, "Pretrain/Loss": 2.014641761779785, "Pretrain/Loss (Raw)": 1.9921752214431763, "Pretrain/Step": 8956, "Pretrain/Step Time": 8.470816822722554} +{"Pretrain/Learning Rate": 2.8660978682824218e-05, "Pretrain/Loss": 2.0134358406066895, "Pretrain/Loss (Raw)": 1.9037871360778809, "Pretrain/Step": 8957, "Pretrain/Step Time": 8.47145914286375} +{"Pretrain/Learning Rate": 2.865677922830038e-05, "Pretrain/Loss": 2.01188325881958, "Pretrain/Loss (Raw)": 1.8247045278549194, "Pretrain/Step": 8958, "Pretrain/Step Time": 8.471699139103293} +{"Pretrain/Learning Rate": 2.8652579668335887e-05, "Pretrain/Loss": 2.012600898742676, "Pretrain/Loss (Raw)": 1.9681978225708008, "Pretrain/Step": 8959, "Pretrain/Step Time": 8.464545080438256} +{"Pretrain/Learning Rate": 2.864838000305184e-05, "Pretrain/Loss": 2.010099172592163, "Pretrain/Loss (Raw)": 2.0746777057647705, "Pretrain/Step": 8960, "Pretrain/Step Time": 8.467919457703829} +{"Pretrain/Learning Rate": 2.864418023256933e-05, "Pretrain/Loss": 2.008842706680298, "Pretrain/Loss (Raw)": 1.9808076620101929, "Pretrain/Step": 8961, "Pretrain/Step Time": 8.464749250560999} +{"Pretrain/Learning Rate": 2.8639980357009455e-05, "Pretrain/Loss": 2.009453296661377, "Pretrain/Loss (Raw)": 1.9037742614746094, "Pretrain/Step": 8962, "Pretrain/Step Time": 8.464694002643228} +{"Pretrain/Learning Rate": 2.8635780376493304e-05, "Pretrain/Loss": 2.0072832107543945, "Pretrain/Loss (Raw)": 1.7695430517196655, "Pretrain/Step": 8963, "Pretrain/Step Time": 8.461723830550909} +{"Pretrain/Learning Rate": 2.863158029114199e-05, "Pretrain/Loss": 2.0098111629486084, "Pretrain/Loss (Raw)": 2.203371524810791, "Pretrain/Step": 8964, "Pretrain/Step Time": 8.462037865072489} +{"Pretrain/Learning Rate": 2.8627380101076616e-05, "Pretrain/Loss": 2.01185941696167, "Pretrain/Loss (Raw)": 2.236621618270874, "Pretrain/Step": 8965, "Pretrain/Step Time": 8.460946749895811} +{"Pretrain/Learning Rate": 2.86231798064183e-05, "Pretrain/Loss": 2.010932445526123, "Pretrain/Loss (Raw)": 1.8813062906265259, "Pretrain/Step": 8966, "Pretrain/Step Time": 8.464456243440509} +{"Pretrain/Learning Rate": 2.861897940728815e-05, "Pretrain/Loss": 2.0118250846862793, "Pretrain/Loss (Raw)": 2.0495810508728027, "Pretrain/Step": 8967, "Pretrain/Step Time": 8.462145740166306} +{"Pretrain/Learning Rate": 2.861477890380727e-05, "Pretrain/Loss": 2.014622688293457, "Pretrain/Loss (Raw)": 2.178992509841919, "Pretrain/Step": 8968, "Pretrain/Step Time": 8.462803572416306} +{"Pretrain/Learning Rate": 2.8610578296096796e-05, "Pretrain/Loss": 2.0143542289733887, "Pretrain/Loss (Raw)": 2.066162347793579, "Pretrain/Step": 8969, "Pretrain/Step Time": 8.456878898665309} +{"Pretrain/Learning Rate": 2.860637758427784e-05, "Pretrain/Loss": 2.014691114425659, "Pretrain/Loss (Raw)": 1.9351457357406616, "Pretrain/Step": 8970, "Pretrain/Step Time": 8.45573553815484} +{"Pretrain/Learning Rate": 2.860217676847153e-05, "Pretrain/Loss": 2.014601469039917, "Pretrain/Loss (Raw)": 1.9999711513519287, "Pretrain/Step": 8971, "Pretrain/Step Time": 8.458470806479454} +{"Pretrain/Learning Rate": 2.8597975848798992e-05, "Pretrain/Loss": 2.013388156890869, "Pretrain/Loss (Raw)": 2.025200366973877, "Pretrain/Step": 8972, "Pretrain/Step Time": 8.459700629115105} +{"Pretrain/Learning Rate": 2.8593774825381358e-05, "Pretrain/Loss": 2.0119550228118896, "Pretrain/Loss (Raw)": 1.8087559938430786, "Pretrain/Step": 8973, "Pretrain/Step Time": 8.458006029948592} +{"Pretrain/Learning Rate": 2.8589573698339757e-05, "Pretrain/Loss": 2.010861873626709, "Pretrain/Loss (Raw)": 2.012441635131836, "Pretrain/Step": 8974, "Pretrain/Step Time": 8.46012426353991} +{"Pretrain/Learning Rate": 2.858537246779533e-05, "Pretrain/Loss": 2.0088820457458496, "Pretrain/Loss (Raw)": 1.7330503463745117, "Pretrain/Step": 8975, "Pretrain/Step Time": 8.460499877110124} +{"Pretrain/Learning Rate": 2.858117113386921e-05, "Pretrain/Loss": 2.0080583095550537, "Pretrain/Loss (Raw)": 2.0608842372894287, "Pretrain/Step": 8976, "Pretrain/Step Time": 8.458957927301526} +{"Pretrain/Learning Rate": 2.8576969696682556e-05, "Pretrain/Loss": 2.008209228515625, "Pretrain/Loss (Raw)": 2.0921316146850586, "Pretrain/Step": 8977, "Pretrain/Step Time": 8.458187479525805} +{"Pretrain/Learning Rate": 2.8572768156356493e-05, "Pretrain/Loss": 2.007068395614624, "Pretrain/Loss (Raw)": 1.897818684577942, "Pretrain/Step": 8978, "Pretrain/Step Time": 8.456602295860648} +{"Pretrain/Learning Rate": 2.8568566513012186e-05, "Pretrain/Loss": 2.0076277256011963, "Pretrain/Loss (Raw)": 2.2015769481658936, "Pretrain/Step": 8979, "Pretrain/Step Time": 8.45270549505949} +{"Pretrain/Learning Rate": 2.8564364766770774e-05, "Pretrain/Loss": 2.0032267570495605, "Pretrain/Loss (Raw)": 1.6319153308868408, "Pretrain/Step": 8980, "Pretrain/Step Time": 8.456306375563145} +{"Pretrain/Learning Rate": 2.856016291775342e-05, "Pretrain/Loss": 2.002121925354004, "Pretrain/Loss (Raw)": 1.9930258989334106, "Pretrain/Step": 8981, "Pretrain/Step Time": 8.456469118595123} +{"Pretrain/Learning Rate": 2.8555960966081273e-05, "Pretrain/Loss": 2.0014243125915527, "Pretrain/Loss (Raw)": 2.0510802268981934, "Pretrain/Step": 8982, "Pretrain/Step Time": 8.45455033890903} +{"Pretrain/Learning Rate": 2.855175891187551e-05, "Pretrain/Loss": 2.000406503677368, "Pretrain/Loss (Raw)": 1.9215128421783447, "Pretrain/Step": 8983, "Pretrain/Step Time": 8.453481445088983} +{"Pretrain/Learning Rate": 2.854755675525727e-05, "Pretrain/Loss": 1.9999053478240967, "Pretrain/Loss (Raw)": 2.0538463592529297, "Pretrain/Step": 8984, "Pretrain/Step Time": 8.452591912820935} +{"Pretrain/Learning Rate": 2.8543354496347734e-05, "Pretrain/Loss": 2.0003461837768555, "Pretrain/Loss (Raw)": 1.8911219835281372, "Pretrain/Step": 8985, "Pretrain/Step Time": 8.45199647732079} +{"Pretrain/Learning Rate": 2.853915213526807e-05, "Pretrain/Loss": 1.9987609386444092, "Pretrain/Loss (Raw)": 1.922551155090332, "Pretrain/Step": 8986, "Pretrain/Step Time": 8.452018907293677} +{"Pretrain/Learning Rate": 2.8534949672139455e-05, "Pretrain/Loss": 2.004457473754883, "Pretrain/Loss (Raw)": 2.1977245807647705, "Pretrain/Step": 8987, "Pretrain/Step Time": 8.44970945827663} +{"Pretrain/Learning Rate": 2.8530747107083057e-05, "Pretrain/Loss": 2.003650188446045, "Pretrain/Loss (Raw)": 1.958832025527954, "Pretrain/Step": 8988, "Pretrain/Step Time": 8.44877534918487} +{"Pretrain/Learning Rate": 2.8526544440220047e-05, "Pretrain/Loss": 2.005023717880249, "Pretrain/Loss (Raw)": 2.2175636291503906, "Pretrain/Step": 8989, "Pretrain/Step Time": 8.44976532831788} +{"Pretrain/Learning Rate": 2.852234167167162e-05, "Pretrain/Loss": 2.007019519805908, "Pretrain/Loss (Raw)": 2.032440185546875, "Pretrain/Step": 8990, "Pretrain/Step Time": 8.450111012905836} +{"Pretrain/Learning Rate": 2.851813880155895e-05, "Pretrain/Loss": 2.007420778274536, "Pretrain/Loss (Raw)": 1.9491972923278809, "Pretrain/Step": 8991, "Pretrain/Step Time": 8.449465189129114} +{"Pretrain/Learning Rate": 2.851393583000323e-05, "Pretrain/Loss": 2.0072884559631348, "Pretrain/Loss (Raw)": 2.064514636993408, "Pretrain/Step": 8992, "Pretrain/Step Time": 8.450569238513708} +{"Pretrain/Learning Rate": 2.8509732757125658e-05, "Pretrain/Loss": 2.0077571868896484, "Pretrain/Loss (Raw)": 1.897995114326477, "Pretrain/Step": 8993, "Pretrain/Step Time": 8.447413111105561} +{"Pretrain/Learning Rate": 2.8505529583047404e-05, "Pretrain/Loss": 2.00717830657959, "Pretrain/Loss (Raw)": 2.0353238582611084, "Pretrain/Step": 8994, "Pretrain/Step Time": 8.446887636557221} +{"Pretrain/Learning Rate": 2.8501326307889675e-05, "Pretrain/Loss": 2.009490489959717, "Pretrain/Loss (Raw)": 2.052063465118408, "Pretrain/Step": 8995, "Pretrain/Step Time": 8.447397043928504} +{"Pretrain/Learning Rate": 2.8497122931773673e-05, "Pretrain/Loss": 2.0094661712646484, "Pretrain/Loss (Raw)": 1.9828660488128662, "Pretrain/Step": 8996, "Pretrain/Step Time": 8.439606642350554} +{"Pretrain/Learning Rate": 2.84929194548206e-05, "Pretrain/Loss": 2.00862455368042, "Pretrain/Loss (Raw)": 1.9459986686706543, "Pretrain/Step": 8997, "Pretrain/Step Time": 8.449226787313819} +{"Pretrain/Learning Rate": 2.8488715877151655e-05, "Pretrain/Loss": 2.0078582763671875, "Pretrain/Loss (Raw)": 2.0352060794830322, "Pretrain/Step": 8998, "Pretrain/Step Time": 8.447345780208707} +{"Pretrain/Learning Rate": 2.8484512198888046e-05, "Pretrain/Loss": 2.009422540664673, "Pretrain/Loss (Raw)": 2.2032382488250732, "Pretrain/Step": 8999, "Pretrain/Step Time": 8.449833776801825} +{"Pretrain/Learning Rate": 2.8480308420150982e-05, "Pretrain/Loss": 2.008329153060913, "Pretrain/Loss (Raw)": 2.047691583633423, "Pretrain/Step": 9000, "Pretrain/Step Time": 8.449221067130566} +{"Pretrain/Learning Rate": 2.8476104541061676e-05, "Pretrain/Loss": 2.010769844055176, "Pretrain/Loss (Raw)": 2.3596439361572266, "Pretrain/Step": 9001, "Pretrain/Step Time": 8.449106166139245} +{"Pretrain/Learning Rate": 2.847190056174135e-05, "Pretrain/Loss": 2.010741949081421, "Pretrain/Loss (Raw)": 1.9862791299819946, "Pretrain/Step": 9002, "Pretrain/Step Time": 8.447229366749525} +{"Pretrain/Learning Rate": 2.8467696482311224e-05, "Pretrain/Loss": 2.0095057487487793, "Pretrain/Loss (Raw)": 1.9860942363739014, "Pretrain/Step": 9003, "Pretrain/Step Time": 8.449399013072252} +{"Pretrain/Learning Rate": 2.8463492302892515e-05, "Pretrain/Loss": 2.0096588134765625, "Pretrain/Loss (Raw)": 2.1855309009552, "Pretrain/Step": 9004, "Pretrain/Step Time": 8.442150870338082} +{"Pretrain/Learning Rate": 2.845928802360644e-05, "Pretrain/Loss": 2.0127804279327393, "Pretrain/Loss (Raw)": 2.4534568786621094, "Pretrain/Step": 9005, "Pretrain/Step Time": 8.444654155522585} +{"Pretrain/Learning Rate": 2.8455083644574232e-05, "Pretrain/Loss": 2.013601064682007, "Pretrain/Loss (Raw)": 2.0114247798919678, "Pretrain/Step": 9006, "Pretrain/Step Time": 8.444235499948263} +{"Pretrain/Learning Rate": 2.8450879165917127e-05, "Pretrain/Loss": 2.014125347137451, "Pretrain/Loss (Raw)": 2.084967613220215, "Pretrain/Step": 9007, "Pretrain/Step Time": 8.44503876939416} +{"Pretrain/Learning Rate": 2.844667458775635e-05, "Pretrain/Loss": 2.0134201049804688, "Pretrain/Loss (Raw)": 1.9935328960418701, "Pretrain/Step": 9008, "Pretrain/Step Time": 8.445959953591228} +{"Pretrain/Learning Rate": 2.8442469910213144e-05, "Pretrain/Loss": 2.01511549949646, "Pretrain/Loss (Raw)": 1.9366945028305054, "Pretrain/Step": 9009, "Pretrain/Step Time": 8.444564208388329} +{"Pretrain/Learning Rate": 2.843826513340875e-05, "Pretrain/Loss": 2.015389919281006, "Pretrain/Loss (Raw)": 2.08899188041687, "Pretrain/Step": 9010, "Pretrain/Step Time": 8.446467822417617} +{"Pretrain/Learning Rate": 2.8434060257464402e-05, "Pretrain/Loss": 2.0156900882720947, "Pretrain/Loss (Raw)": 2.019641399383545, "Pretrain/Step": 9011, "Pretrain/Step Time": 8.43989452905953} +{"Pretrain/Learning Rate": 2.8429855282501338e-05, "Pretrain/Loss": 2.0160679817199707, "Pretrain/Loss (Raw)": 2.036470413208008, "Pretrain/Step": 9012, "Pretrain/Step Time": 8.435566172003746} +{"Pretrain/Learning Rate": 2.8425650208640825e-05, "Pretrain/Loss": 2.0176353454589844, "Pretrain/Loss (Raw)": 2.0764551162719727, "Pretrain/Step": 9013, "Pretrain/Step Time": 8.44665402173996} +{"Pretrain/Learning Rate": 2.8421445036004096e-05, "Pretrain/Loss": 2.0180931091308594, "Pretrain/Loss (Raw)": 2.1131107807159424, "Pretrain/Step": 9014, "Pretrain/Step Time": 8.44535681605339} +{"Pretrain/Learning Rate": 2.8417239764712424e-05, "Pretrain/Loss": 2.017148017883301, "Pretrain/Loss (Raw)": 1.922661542892456, "Pretrain/Step": 9015, "Pretrain/Step Time": 8.444745535030961} +{"Pretrain/Learning Rate": 2.8413034394887038e-05, "Pretrain/Loss": 2.0202832221984863, "Pretrain/Loss (Raw)": 2.115812063217163, "Pretrain/Step": 9016, "Pretrain/Step Time": 8.449778089299798} +{"Pretrain/Learning Rate": 2.8408828926649218e-05, "Pretrain/Loss": 2.0179014205932617, "Pretrain/Loss (Raw)": 1.7975413799285889, "Pretrain/Step": 9017, "Pretrain/Step Time": 8.448185661807656} +{"Pretrain/Learning Rate": 2.8404623360120213e-05, "Pretrain/Loss": 2.0188074111938477, "Pretrain/Loss (Raw)": 2.062166213989258, "Pretrain/Step": 9018, "Pretrain/Step Time": 8.449024613946676} +{"Pretrain/Learning Rate": 2.84004176954213e-05, "Pretrain/Loss": 2.016106128692627, "Pretrain/Loss (Raw)": 1.7829526662826538, "Pretrain/Step": 9019, "Pretrain/Step Time": 8.44988945685327} +{"Pretrain/Learning Rate": 2.8396211932673742e-05, "Pretrain/Loss": 2.014284133911133, "Pretrain/Loss (Raw)": 1.9284124374389648, "Pretrain/Step": 9020, "Pretrain/Step Time": 8.446011325344443} +{"Pretrain/Learning Rate": 2.83920060719988e-05, "Pretrain/Loss": 2.0125789642333984, "Pretrain/Loss (Raw)": 1.7963309288024902, "Pretrain/Step": 9021, "Pretrain/Step Time": 8.443439396098256} +{"Pretrain/Learning Rate": 2.838780011351776e-05, "Pretrain/Loss": 2.0110538005828857, "Pretrain/Loss (Raw)": 2.1057374477386475, "Pretrain/Step": 9022, "Pretrain/Step Time": 8.44235742278397} +{"Pretrain/Learning Rate": 2.8383594057351887e-05, "Pretrain/Loss": 2.0105693340301514, "Pretrain/Loss (Raw)": 2.0031380653381348, "Pretrain/Step": 9023, "Pretrain/Step Time": 8.442181387916207} +{"Pretrain/Learning Rate": 2.837938790362247e-05, "Pretrain/Loss": 2.009446859359741, "Pretrain/Loss (Raw)": 1.9198640584945679, "Pretrain/Step": 9024, "Pretrain/Step Time": 8.442077910527587} +{"Pretrain/Learning Rate": 2.8375181652450784e-05, "Pretrain/Loss": 2.0069432258605957, "Pretrain/Loss (Raw)": 1.7373416423797607, "Pretrain/Step": 9025, "Pretrain/Step Time": 8.438717775046825} +{"Pretrain/Learning Rate": 2.8370975303958107e-05, "Pretrain/Loss": 2.0101265907287598, "Pretrain/Loss (Raw)": 2.2169973850250244, "Pretrain/Step": 9026, "Pretrain/Step Time": 8.434443108737469} +{"Pretrain/Learning Rate": 2.8366768858265743e-05, "Pretrain/Loss": 2.0111255645751953, "Pretrain/Loss (Raw)": 1.9883219003677368, "Pretrain/Step": 9027, "Pretrain/Step Time": 8.430118260905147} +{"Pretrain/Learning Rate": 2.8362562315494966e-05, "Pretrain/Loss": 2.0105085372924805, "Pretrain/Loss (Raw)": 2.072148323059082, "Pretrain/Step": 9028, "Pretrain/Step Time": 8.430491307750344} +{"Pretrain/Learning Rate": 2.835835567576708e-05, "Pretrain/Loss": 2.0103907585144043, "Pretrain/Loss (Raw)": 1.7760937213897705, "Pretrain/Step": 9029, "Pretrain/Step Time": 8.42909374833107} +{"Pretrain/Learning Rate": 2.8354148939203374e-05, "Pretrain/Loss": 2.011237144470215, "Pretrain/Loss (Raw)": 2.0476858615875244, "Pretrain/Step": 9030, "Pretrain/Step Time": 8.428279310464859} +{"Pretrain/Learning Rate": 2.8349942105925142e-05, "Pretrain/Loss": 2.0097146034240723, "Pretrain/Loss (Raw)": 1.8803377151489258, "Pretrain/Step": 9031, "Pretrain/Step Time": 8.431350914761424} +{"Pretrain/Learning Rate": 2.8345735176053702e-05, "Pretrain/Loss": 2.011549472808838, "Pretrain/Loss (Raw)": 2.1588642597198486, "Pretrain/Step": 9032, "Pretrain/Step Time": 8.432148955762386} +{"Pretrain/Learning Rate": 2.8341528149710332e-05, "Pretrain/Loss": 2.009692668914795, "Pretrain/Loss (Raw)": 1.6942949295043945, "Pretrain/Step": 9033, "Pretrain/Step Time": 8.432467386126518} +{"Pretrain/Learning Rate": 2.8337321027016368e-05, "Pretrain/Loss": 2.01192569732666, "Pretrain/Loss (Raw)": 2.1008379459381104, "Pretrain/Step": 9034, "Pretrain/Step Time": 8.430658558383584} +{"Pretrain/Learning Rate": 2.8333113808093098e-05, "Pretrain/Loss": 2.0122056007385254, "Pretrain/Loss (Raw)": 2.184169054031372, "Pretrain/Step": 9035, "Pretrain/Step Time": 8.429484810680151} +{"Pretrain/Learning Rate": 2.832890649306184e-05, "Pretrain/Loss": 2.012533187866211, "Pretrain/Loss (Raw)": 1.955164909362793, "Pretrain/Step": 9036, "Pretrain/Step Time": 8.428383465856314} +{"Pretrain/Learning Rate": 2.8324699082043913e-05, "Pretrain/Loss": 2.0150816440582275, "Pretrain/Loss (Raw)": 2.0472779273986816, "Pretrain/Step": 9037, "Pretrain/Step Time": 8.425307404249907} +{"Pretrain/Learning Rate": 2.832049157516063e-05, "Pretrain/Loss": 2.0149240493774414, "Pretrain/Loss (Raw)": 2.0090439319610596, "Pretrain/Step": 9038, "Pretrain/Step Time": 8.426887679845095} +{"Pretrain/Learning Rate": 2.8316283972533315e-05, "Pretrain/Loss": 2.0131702423095703, "Pretrain/Loss (Raw)": 1.9241132736206055, "Pretrain/Step": 9039, "Pretrain/Step Time": 8.430967366322875} +{"Pretrain/Learning Rate": 2.831207627428329e-05, "Pretrain/Loss": 2.0134525299072266, "Pretrain/Loss (Raw)": 2.2055680751800537, "Pretrain/Step": 9040, "Pretrain/Step Time": 8.426038092002273} +{"Pretrain/Learning Rate": 2.830786848053188e-05, "Pretrain/Loss": 2.017202854156494, "Pretrain/Loss (Raw)": 2.563633680343628, "Pretrain/Step": 9041, "Pretrain/Step Time": 8.427122885361314} +{"Pretrain/Learning Rate": 2.830366059140041e-05, "Pretrain/Loss": 2.018089771270752, "Pretrain/Loss (Raw)": 2.0921308994293213, "Pretrain/Step": 9042, "Pretrain/Step Time": 8.427541490644217} +{"Pretrain/Learning Rate": 2.8299452607010218e-05, "Pretrain/Loss": 2.016599655151367, "Pretrain/Loss (Raw)": 1.778415322303772, "Pretrain/Step": 9043, "Pretrain/Step Time": 8.417573096230626} +{"Pretrain/Learning Rate": 2.8295244527482633e-05, "Pretrain/Loss": 2.0169711112976074, "Pretrain/Loss (Raw)": 2.123621940612793, "Pretrain/Step": 9044, "Pretrain/Step Time": 8.414351617917418} +{"Pretrain/Learning Rate": 2.8291036352939004e-05, "Pretrain/Loss": 2.0179378986358643, "Pretrain/Loss (Raw)": 2.0279269218444824, "Pretrain/Step": 9045, "Pretrain/Step Time": 8.41701766103506} +{"Pretrain/Learning Rate": 2.8286828083500662e-05, "Pretrain/Loss": 2.017361640930176, "Pretrain/Loss (Raw)": 2.0767810344696045, "Pretrain/Step": 9046, "Pretrain/Step Time": 8.417705532163382} +{"Pretrain/Learning Rate": 2.8282619719288945e-05, "Pretrain/Loss": 2.0166893005371094, "Pretrain/Loss (Raw)": 1.9316165447235107, "Pretrain/Step": 9047, "Pretrain/Step Time": 8.416081631556153} +{"Pretrain/Learning Rate": 2.8278411260425196e-05, "Pretrain/Loss": 2.0183801651000977, "Pretrain/Loss (Raw)": 2.1466541290283203, "Pretrain/Step": 9048, "Pretrain/Step Time": 8.417150750756264} +{"Pretrain/Learning Rate": 2.8274202707030778e-05, "Pretrain/Loss": 2.0196194648742676, "Pretrain/Loss (Raw)": 2.2117786407470703, "Pretrain/Step": 9049, "Pretrain/Step Time": 8.416544530540705} +{"Pretrain/Learning Rate": 2.826999405922703e-05, "Pretrain/Loss": 2.0169315338134766, "Pretrain/Loss (Raw)": 1.938698649406433, "Pretrain/Step": 9050, "Pretrain/Step Time": 8.418708143755794} +{"Pretrain/Learning Rate": 2.8265785317135307e-05, "Pretrain/Loss": 2.017761707305908, "Pretrain/Loss (Raw)": 1.9450491666793823, "Pretrain/Step": 9051, "Pretrain/Step Time": 8.422345362603664} +{"Pretrain/Learning Rate": 2.8261576480876974e-05, "Pretrain/Loss": 2.0160775184631348, "Pretrain/Loss (Raw)": 2.0101261138916016, "Pretrain/Step": 9052, "Pretrain/Step Time": 8.4220099914819} +{"Pretrain/Learning Rate": 2.8257367550573372e-05, "Pretrain/Loss": 2.0156612396240234, "Pretrain/Loss (Raw)": 2.0026471614837646, "Pretrain/Step": 9053, "Pretrain/Step Time": 8.420378329232335} +{"Pretrain/Learning Rate": 2.825315852634588e-05, "Pretrain/Loss": 2.018390417098999, "Pretrain/Loss (Raw)": 2.2012388706207275, "Pretrain/Step": 9054, "Pretrain/Step Time": 8.420336766168475} +{"Pretrain/Learning Rate": 2.824894940831585e-05, "Pretrain/Loss": 2.02133846282959, "Pretrain/Loss (Raw)": 2.155369758605957, "Pretrain/Step": 9055, "Pretrain/Step Time": 8.421978330239654} +{"Pretrain/Learning Rate": 2.824474019660466e-05, "Pretrain/Loss": 2.0209758281707764, "Pretrain/Loss (Raw)": 2.0716135501861572, "Pretrain/Step": 9056, "Pretrain/Step Time": 8.421507211402059} +{"Pretrain/Learning Rate": 2.8240530891333672e-05, "Pretrain/Loss": 2.0209732055664062, "Pretrain/Loss (Raw)": 2.0235071182250977, "Pretrain/Step": 9057, "Pretrain/Step Time": 8.42272623628378} +{"Pretrain/Learning Rate": 2.8236321492624255e-05, "Pretrain/Loss": 2.020723342895508, "Pretrain/Loss (Raw)": 2.0951144695281982, "Pretrain/Step": 9058, "Pretrain/Step Time": 8.424562280997634} +{"Pretrain/Learning Rate": 2.8232112000597795e-05, "Pretrain/Loss": 2.021090030670166, "Pretrain/Loss (Raw)": 2.023655891418457, "Pretrain/Step": 9059, "Pretrain/Step Time": 8.421824591234326} +{"Pretrain/Learning Rate": 2.8227902415375664e-05, "Pretrain/Loss": 2.019418716430664, "Pretrain/Loss (Raw)": 1.9641510248184204, "Pretrain/Step": 9060, "Pretrain/Step Time": 8.415059307590127} +{"Pretrain/Learning Rate": 2.822369273707923e-05, "Pretrain/Loss": 2.020008087158203, "Pretrain/Loss (Raw)": 2.1113216876983643, "Pretrain/Step": 9061, "Pretrain/Step Time": 8.414341107010841} +{"Pretrain/Learning Rate": 2.8219482965829908e-05, "Pretrain/Loss": 2.0204944610595703, "Pretrain/Loss (Raw)": 2.0018255710601807, "Pretrain/Step": 9062, "Pretrain/Step Time": 8.418704830110073} +{"Pretrain/Learning Rate": 2.8215273101749057e-05, "Pretrain/Loss": 2.020535945892334, "Pretrain/Loss (Raw)": 2.118324041366577, "Pretrain/Step": 9063, "Pretrain/Step Time": 8.426513263955712} +{"Pretrain/Learning Rate": 2.8211063144958068e-05, "Pretrain/Loss": 2.0204122066497803, "Pretrain/Loss (Raw)": 1.9260454177856445, "Pretrain/Step": 9064, "Pretrain/Step Time": 8.422977739945054} +{"Pretrain/Learning Rate": 2.8206853095578338e-05, "Pretrain/Loss": 2.023944854736328, "Pretrain/Loss (Raw)": 2.147684097290039, "Pretrain/Step": 9065, "Pretrain/Step Time": 8.420384492725134} +{"Pretrain/Learning Rate": 2.8202642953731263e-05, "Pretrain/Loss": 2.022427558898926, "Pretrain/Loss (Raw)": 1.995118260383606, "Pretrain/Step": 9066, "Pretrain/Step Time": 8.418795879930258} +{"Pretrain/Learning Rate": 2.8198432719538238e-05, "Pretrain/Loss": 2.0240230560302734, "Pretrain/Loss (Raw)": 2.0485587120056152, "Pretrain/Step": 9067, "Pretrain/Step Time": 8.418626725673676} +{"Pretrain/Learning Rate": 2.8194222393120658e-05, "Pretrain/Loss": 2.0232346057891846, "Pretrain/Loss (Raw)": 2.0811336040496826, "Pretrain/Step": 9068, "Pretrain/Step Time": 8.420230310410261} +{"Pretrain/Learning Rate": 2.8190011974599924e-05, "Pretrain/Loss": 2.023966073989868, "Pretrain/Loss (Raw)": 1.965558648109436, "Pretrain/Step": 9069, "Pretrain/Step Time": 8.422237645834684} +{"Pretrain/Learning Rate": 2.818580146409744e-05, "Pretrain/Loss": 2.025075912475586, "Pretrain/Loss (Raw)": 2.2309799194335938, "Pretrain/Step": 9070, "Pretrain/Step Time": 8.415169712156057} +{"Pretrain/Learning Rate": 2.8181590861734624e-05, "Pretrain/Loss": 2.0252737998962402, "Pretrain/Loss (Raw)": 2.036428689956665, "Pretrain/Step": 9071, "Pretrain/Step Time": 8.41788101196289} +{"Pretrain/Learning Rate": 2.8177380167632876e-05, "Pretrain/Loss": 2.0249035358428955, "Pretrain/Loss (Raw)": 2.0154004096984863, "Pretrain/Step": 9072, "Pretrain/Step Time": 8.41574764251709} +{"Pretrain/Learning Rate": 2.8173169381913612e-05, "Pretrain/Loss": 2.02402400970459, "Pretrain/Loss (Raw)": 1.9218106269836426, "Pretrain/Step": 9073, "Pretrain/Step Time": 8.424606589600444} +{"Pretrain/Learning Rate": 2.8168958504698245e-05, "Pretrain/Loss": 2.023379325866699, "Pretrain/Loss (Raw)": 1.7528016567230225, "Pretrain/Step": 9074, "Pretrain/Step Time": 8.42351384460926} +{"Pretrain/Learning Rate": 2.8164747536108193e-05, "Pretrain/Loss": 2.023991584777832, "Pretrain/Loss (Raw)": 2.007641077041626, "Pretrain/Step": 9075, "Pretrain/Step Time": 8.426469745114446} +{"Pretrain/Learning Rate": 2.8160536476264875e-05, "Pretrain/Loss": 2.0217578411102295, "Pretrain/Loss (Raw)": 1.8648895025253296, "Pretrain/Step": 9076, "Pretrain/Step Time": 8.42103179357946} +{"Pretrain/Learning Rate": 2.8156325325289717e-05, "Pretrain/Loss": 2.023898124694824, "Pretrain/Loss (Raw)": 2.242018699645996, "Pretrain/Step": 9077, "Pretrain/Step Time": 8.419516876339912} +{"Pretrain/Learning Rate": 2.8152114083304148e-05, "Pretrain/Loss": 2.0238990783691406, "Pretrain/Loss (Raw)": 1.974515676498413, "Pretrain/Step": 9078, "Pretrain/Step Time": 8.421711023896933} +{"Pretrain/Learning Rate": 2.814790275042959e-05, "Pretrain/Loss": 2.022653579711914, "Pretrain/Loss (Raw)": 2.0695271492004395, "Pretrain/Step": 9079, "Pretrain/Step Time": 8.421842662617564} +{"Pretrain/Learning Rate": 2.8143691326787468e-05, "Pretrain/Loss": 2.021852970123291, "Pretrain/Loss (Raw)": 2.021709680557251, "Pretrain/Step": 9080, "Pretrain/Step Time": 8.430418668314815} +{"Pretrain/Learning Rate": 2.813947981249923e-05, "Pretrain/Loss": 2.0201125144958496, "Pretrain/Loss (Raw)": 1.625964641571045, "Pretrain/Step": 9081, "Pretrain/Step Time": 8.428997540846467} +{"Pretrain/Learning Rate": 2.8135268207686306e-05, "Pretrain/Loss": 2.0169167518615723, "Pretrain/Loss (Raw)": 1.919592261314392, "Pretrain/Step": 9082, "Pretrain/Step Time": 8.427171625196934} +{"Pretrain/Learning Rate": 2.8131056512470134e-05, "Pretrain/Loss": 2.016970634460449, "Pretrain/Loss (Raw)": 2.0580763816833496, "Pretrain/Step": 9083, "Pretrain/Step Time": 8.427281295880675} +{"Pretrain/Learning Rate": 2.8126844726972146e-05, "Pretrain/Loss": 2.0168299674987793, "Pretrain/Loss (Raw)": 1.974184274673462, "Pretrain/Step": 9084, "Pretrain/Step Time": 8.427985969930887} +{"Pretrain/Learning Rate": 2.8122632851313803e-05, "Pretrain/Loss": 2.0189995765686035, "Pretrain/Loss (Raw)": 2.1815197467803955, "Pretrain/Step": 9085, "Pretrain/Step Time": 8.428800521418452} +{"Pretrain/Learning Rate": 2.8118420885616538e-05, "Pretrain/Loss": 2.020867109298706, "Pretrain/Loss (Raw)": 2.0637166500091553, "Pretrain/Step": 9086, "Pretrain/Step Time": 8.426463931798935} +{"Pretrain/Learning Rate": 2.811420883000181e-05, "Pretrain/Loss": 2.02075457572937, "Pretrain/Loss (Raw)": 1.9538151025772095, "Pretrain/Step": 9087, "Pretrain/Step Time": 8.430912144482136} +{"Pretrain/Learning Rate": 2.8109996684591062e-05, "Pretrain/Loss": 2.0193610191345215, "Pretrain/Loss (Raw)": 1.896329641342163, "Pretrain/Step": 9088, "Pretrain/Step Time": 8.427090644836426} +{"Pretrain/Learning Rate": 2.8105784449505756e-05, "Pretrain/Loss": 2.0196757316589355, "Pretrain/Loss (Raw)": 2.021045446395874, "Pretrain/Step": 9089, "Pretrain/Step Time": 8.43038084357977} +{"Pretrain/Learning Rate": 2.8101572124867336e-05, "Pretrain/Loss": 2.0191328525543213, "Pretrain/Loss (Raw)": 1.8342819213867188, "Pretrain/Step": 9090, "Pretrain/Step Time": 8.428576463833451} +{"Pretrain/Learning Rate": 2.8097359710797277e-05, "Pretrain/Loss": 2.020524263381958, "Pretrain/Loss (Raw)": 1.9476765394210815, "Pretrain/Step": 9091, "Pretrain/Step Time": 8.424996107816696} +{"Pretrain/Learning Rate": 2.809314720741703e-05, "Pretrain/Loss": 2.019155502319336, "Pretrain/Loss (Raw)": 2.0281410217285156, "Pretrain/Step": 9092, "Pretrain/Step Time": 8.4279268309474} +{"Pretrain/Learning Rate": 2.8088934614848068e-05, "Pretrain/Loss": 2.016101121902466, "Pretrain/Loss (Raw)": 1.8456699848175049, "Pretrain/Step": 9093, "Pretrain/Step Time": 8.426246197894216} +{"Pretrain/Learning Rate": 2.8084721933211854e-05, "Pretrain/Loss": 2.0151636600494385, "Pretrain/Loss (Raw)": 1.7613136768341064, "Pretrain/Step": 9094, "Pretrain/Step Time": 8.422495318576694} +{"Pretrain/Learning Rate": 2.808050916262986e-05, "Pretrain/Loss": 2.014711380004883, "Pretrain/Loss (Raw)": 1.9916943311691284, "Pretrain/Step": 9095, "Pretrain/Step Time": 8.425644567236304} +{"Pretrain/Learning Rate": 2.8076296303223548e-05, "Pretrain/Loss": 2.0155084133148193, "Pretrain/Loss (Raw)": 2.2810115814208984, "Pretrain/Step": 9096, "Pretrain/Step Time": 8.425252744928002} +{"Pretrain/Learning Rate": 2.8072083355114404e-05, "Pretrain/Loss": 2.0154571533203125, "Pretrain/Loss (Raw)": 2.059622287750244, "Pretrain/Step": 9097, "Pretrain/Step Time": 8.429213294759393} +{"Pretrain/Learning Rate": 2.80678703184239e-05, "Pretrain/Loss": 2.0164968967437744, "Pretrain/Loss (Raw)": 2.0681917667388916, "Pretrain/Step": 9098, "Pretrain/Step Time": 8.433111729100347} +{"Pretrain/Learning Rate": 2.8063657193273528e-05, "Pretrain/Loss": 2.017357349395752, "Pretrain/Loss (Raw)": 2.110112190246582, "Pretrain/Step": 9099, "Pretrain/Step Time": 8.427563136443496} +{"Pretrain/Learning Rate": 2.805944397978475e-05, "Pretrain/Loss": 2.0175652503967285, "Pretrain/Loss (Raw)": 2.051837205886841, "Pretrain/Step": 9100, "Pretrain/Step Time": 8.427730003371835} +{"Pretrain/Learning Rate": 2.8055230678079064e-05, "Pretrain/Loss": 2.019763469696045, "Pretrain/Loss (Raw)": 2.090106964111328, "Pretrain/Step": 9101, "Pretrain/Step Time": 8.425151415169239} +{"Pretrain/Learning Rate": 2.805101728827796e-05, "Pretrain/Loss": 2.020029306411743, "Pretrain/Loss (Raw)": 2.046492099761963, "Pretrain/Step": 9102, "Pretrain/Step Time": 8.426627380773425} +{"Pretrain/Learning Rate": 2.8046803810502915e-05, "Pretrain/Loss": 2.020268440246582, "Pretrain/Loss (Raw)": 1.7636380195617676, "Pretrain/Step": 9103, "Pretrain/Step Time": 8.423853270709515} +{"Pretrain/Learning Rate": 2.8042590244875437e-05, "Pretrain/Loss": 2.021671772003174, "Pretrain/Loss (Raw)": 2.2405169010162354, "Pretrain/Step": 9104, "Pretrain/Step Time": 8.42433512583375} +{"Pretrain/Learning Rate": 2.8038376591517012e-05, "Pretrain/Loss": 2.02024245262146, "Pretrain/Loss (Raw)": 1.9091987609863281, "Pretrain/Step": 9105, "Pretrain/Step Time": 8.428541334345937} +{"Pretrain/Learning Rate": 2.803416285054914e-05, "Pretrain/Loss": 2.01710844039917, "Pretrain/Loss (Raw)": 1.4966295957565308, "Pretrain/Step": 9106, "Pretrain/Step Time": 8.42983459495008} +{"Pretrain/Learning Rate": 2.802994902209332e-05, "Pretrain/Loss": 2.01633620262146, "Pretrain/Loss (Raw)": 2.102749824523926, "Pretrain/Step": 9107, "Pretrain/Step Time": 8.428586900234222} +{"Pretrain/Learning Rate": 2.8025735106271055e-05, "Pretrain/Loss": 2.0220556259155273, "Pretrain/Loss (Raw)": 2.363992929458618, "Pretrain/Step": 9108, "Pretrain/Step Time": 8.426463210955262} +{"Pretrain/Learning Rate": 2.8021521103203853e-05, "Pretrain/Loss": 2.0219264030456543, "Pretrain/Loss (Raw)": 1.976500391960144, "Pretrain/Step": 9109, "Pretrain/Step Time": 8.424641916528344} +{"Pretrain/Learning Rate": 2.801730701301322e-05, "Pretrain/Loss": 2.021121025085449, "Pretrain/Loss (Raw)": 1.9479875564575195, "Pretrain/Step": 9110, "Pretrain/Step Time": 8.427341977134347} +{"Pretrain/Learning Rate": 2.801309283582067e-05, "Pretrain/Loss": 2.0256805419921875, "Pretrain/Loss (Raw)": 2.5051376819610596, "Pretrain/Step": 9111, "Pretrain/Step Time": 8.42707877419889} +{"Pretrain/Learning Rate": 2.8008878571747706e-05, "Pretrain/Loss": 2.0262014865875244, "Pretrain/Loss (Raw)": 2.1205103397369385, "Pretrain/Step": 9112, "Pretrain/Step Time": 8.43111271969974} +{"Pretrain/Learning Rate": 2.800466422091585e-05, "Pretrain/Loss": 2.027144193649292, "Pretrain/Loss (Raw)": 2.0118134021759033, "Pretrain/Step": 9113, "Pretrain/Step Time": 8.433153724297881} +{"Pretrain/Learning Rate": 2.800044978344662e-05, "Pretrain/Loss": 2.0274860858917236, "Pretrain/Loss (Raw)": 1.9662944078445435, "Pretrain/Step": 9114, "Pretrain/Step Time": 8.430793950334191} +{"Pretrain/Learning Rate": 2.7996235259461544e-05, "Pretrain/Loss": 2.024871349334717, "Pretrain/Loss (Raw)": 1.8630443811416626, "Pretrain/Step": 9115, "Pretrain/Step Time": 8.432835921645164} +{"Pretrain/Learning Rate": 2.799202064908213e-05, "Pretrain/Loss": 2.0252737998962402, "Pretrain/Loss (Raw)": 2.0103344917297363, "Pretrain/Step": 9116, "Pretrain/Step Time": 8.433301439508796} +{"Pretrain/Learning Rate": 2.7987805952429908e-05, "Pretrain/Loss": 2.0217952728271484, "Pretrain/Loss (Raw)": 1.7723065614700317, "Pretrain/Step": 9117, "Pretrain/Step Time": 8.432977885007858} +{"Pretrain/Learning Rate": 2.7983591169626404e-05, "Pretrain/Loss": 2.020803928375244, "Pretrain/Loss (Raw)": 1.9055842161178589, "Pretrain/Step": 9118, "Pretrain/Step Time": 8.431256925687194} +{"Pretrain/Learning Rate": 2.797937630079316e-05, "Pretrain/Loss": 2.0203299522399902, "Pretrain/Loss (Raw)": 1.8884832859039307, "Pretrain/Step": 9119, "Pretrain/Step Time": 8.436122292652726} +{"Pretrain/Learning Rate": 2.7975161346051698e-05, "Pretrain/Loss": 2.0198373794555664, "Pretrain/Loss (Raw)": 2.0014843940734863, "Pretrain/Step": 9120, "Pretrain/Step Time": 8.437692064791918} +{"Pretrain/Learning Rate": 2.7970946305523553e-05, "Pretrain/Loss": 2.0213088989257812, "Pretrain/Loss (Raw)": 2.086373805999756, "Pretrain/Step": 9121, "Pretrain/Step Time": 8.438465256243944} +{"Pretrain/Learning Rate": 2.7966731179330267e-05, "Pretrain/Loss": 2.020529270172119, "Pretrain/Loss (Raw)": 1.9355159997940063, "Pretrain/Step": 9122, "Pretrain/Step Time": 8.436254119500518} +{"Pretrain/Learning Rate": 2.7962515967593383e-05, "Pretrain/Loss": 2.021328926086426, "Pretrain/Loss (Raw)": 2.1544034481048584, "Pretrain/Step": 9123, "Pretrain/Step Time": 8.438541308045387} +{"Pretrain/Learning Rate": 2.7958300670434434e-05, "Pretrain/Loss": 2.0224108695983887, "Pretrain/Loss (Raw)": 2.1213667392730713, "Pretrain/Step": 9124, "Pretrain/Step Time": 8.439813915640116} +{"Pretrain/Learning Rate": 2.795408528797498e-05, "Pretrain/Loss": 2.0210931301116943, "Pretrain/Loss (Raw)": 1.7773131132125854, "Pretrain/Step": 9125, "Pretrain/Step Time": 8.433984806761146} +{"Pretrain/Learning Rate": 2.794986982033655e-05, "Pretrain/Loss": 2.021061420440674, "Pretrain/Loss (Raw)": 2.031165361404419, "Pretrain/Step": 9126, "Pretrain/Step Time": 8.435084879398346} +{"Pretrain/Learning Rate": 2.7945654267640704e-05, "Pretrain/Loss": 2.0199785232543945, "Pretrain/Loss (Raw)": 2.0646274089813232, "Pretrain/Step": 9127, "Pretrain/Step Time": 8.433433717116714} +{"Pretrain/Learning Rate": 2.794143863000899e-05, "Pretrain/Loss": 2.019432783126831, "Pretrain/Loss (Raw)": 1.9778236150741577, "Pretrain/Step": 9128, "Pretrain/Step Time": 8.431147387251258} +{"Pretrain/Learning Rate": 2.7937222907562983e-05, "Pretrain/Loss": 2.0175845623016357, "Pretrain/Loss (Raw)": 2.1230833530426025, "Pretrain/Step": 9129, "Pretrain/Step Time": 8.430936586111784} +{"Pretrain/Learning Rate": 2.7933007100424214e-05, "Pretrain/Loss": 2.016918659210205, "Pretrain/Loss (Raw)": 1.9010450839996338, "Pretrain/Step": 9130, "Pretrain/Step Time": 8.433333676308393} +{"Pretrain/Learning Rate": 2.7928791208714256e-05, "Pretrain/Loss": 2.017753839492798, "Pretrain/Loss (Raw)": 2.092996597290039, "Pretrain/Step": 9131, "Pretrain/Step Time": 8.431743642315269} +{"Pretrain/Learning Rate": 2.7924575232554663e-05, "Pretrain/Loss": 2.0170607566833496, "Pretrain/Loss (Raw)": 2.0967936515808105, "Pretrain/Step": 9132, "Pretrain/Step Time": 8.431054934859276} +{"Pretrain/Learning Rate": 2.7920359172067e-05, "Pretrain/Loss": 2.0119853019714355, "Pretrain/Loss (Raw)": 1.8037999868392944, "Pretrain/Step": 9133, "Pretrain/Step Time": 8.43582952581346} +{"Pretrain/Learning Rate": 2.791614302737284e-05, "Pretrain/Loss": 2.0122737884521484, "Pretrain/Loss (Raw)": 2.0483787059783936, "Pretrain/Step": 9134, "Pretrain/Step Time": 8.43664950504899} +{"Pretrain/Learning Rate": 2.7911926798593763e-05, "Pretrain/Loss": 2.0114731788635254, "Pretrain/Loss (Raw)": 1.9824758768081665, "Pretrain/Step": 9135, "Pretrain/Step Time": 8.434432925656438} +{"Pretrain/Learning Rate": 2.7907710485851323e-05, "Pretrain/Loss": 2.01015567779541, "Pretrain/Loss (Raw)": 1.8249057531356812, "Pretrain/Step": 9136, "Pretrain/Step Time": 8.434864033013582} +{"Pretrain/Learning Rate": 2.7903494089267103e-05, "Pretrain/Loss": 2.01045560836792, "Pretrain/Loss (Raw)": 1.9750611782073975, "Pretrain/Step": 9137, "Pretrain/Step Time": 8.438741132616997} +{"Pretrain/Learning Rate": 2.7899277608962675e-05, "Pretrain/Loss": 2.0090556144714355, "Pretrain/Loss (Raw)": 1.9097943305969238, "Pretrain/Step": 9138, "Pretrain/Step Time": 8.438268285244703} +{"Pretrain/Learning Rate": 2.7895061045059622e-05, "Pretrain/Loss": 2.0098507404327393, "Pretrain/Loss (Raw)": 2.121431350708008, "Pretrain/Step": 9139, "Pretrain/Step Time": 8.43875502049923} +{"Pretrain/Learning Rate": 2.7890844397679524e-05, "Pretrain/Loss": 2.0101380348205566, "Pretrain/Loss (Raw)": 2.0732359886169434, "Pretrain/Step": 9140, "Pretrain/Step Time": 8.43901357613504} +{"Pretrain/Learning Rate": 2.7886627666943967e-05, "Pretrain/Loss": 2.0107879638671875, "Pretrain/Loss (Raw)": 2.159640312194824, "Pretrain/Step": 9141, "Pretrain/Step Time": 8.434026220813394} +{"Pretrain/Learning Rate": 2.7882410852974538e-05, "Pretrain/Loss": 2.00946307182312, "Pretrain/Loss (Raw)": 1.9435216188430786, "Pretrain/Step": 9142, "Pretrain/Step Time": 8.434415632858872} +{"Pretrain/Learning Rate": 2.7878193955892816e-05, "Pretrain/Loss": 2.0127716064453125, "Pretrain/Loss (Raw)": 2.346165895462036, "Pretrain/Step": 9143, "Pretrain/Step Time": 8.442474467679858} +{"Pretrain/Learning Rate": 2.787397697582041e-05, "Pretrain/Loss": 2.012103796005249, "Pretrain/Loss (Raw)": 2.030341625213623, "Pretrain/Step": 9144, "Pretrain/Step Time": 8.435686575248837} +{"Pretrain/Learning Rate": 2.7869759912878896e-05, "Pretrain/Loss": 2.0139660835266113, "Pretrain/Loss (Raw)": 2.0358970165252686, "Pretrain/Step": 9145, "Pretrain/Step Time": 8.436764581128955} +{"Pretrain/Learning Rate": 2.7865542767189878e-05, "Pretrain/Loss": 2.014310836791992, "Pretrain/Loss (Raw)": 2.10629940032959, "Pretrain/Step": 9146, "Pretrain/Step Time": 8.441669635474682} +{"Pretrain/Learning Rate": 2.7861325538874967e-05, "Pretrain/Loss": 2.0154128074645996, "Pretrain/Loss (Raw)": 1.9240010976791382, "Pretrain/Step": 9147, "Pretrain/Step Time": 8.440009849146008} +{"Pretrain/Learning Rate": 2.785710822805574e-05, "Pretrain/Loss": 2.0164573192596436, "Pretrain/Loss (Raw)": 2.0621261596679688, "Pretrain/Step": 9148, "Pretrain/Step Time": 8.439995247870684} +{"Pretrain/Learning Rate": 2.785289083485381e-05, "Pretrain/Loss": 2.0174474716186523, "Pretrain/Loss (Raw)": 1.923062801361084, "Pretrain/Step": 9149, "Pretrain/Step Time": 8.445691609755158} +{"Pretrain/Learning Rate": 2.7848673359390787e-05, "Pretrain/Loss": 2.016667604446411, "Pretrain/Loss (Raw)": 2.0059282779693604, "Pretrain/Step": 9150, "Pretrain/Step Time": 8.446195902302861} +{"Pretrain/Learning Rate": 2.7844455801788277e-05, "Pretrain/Loss": 2.0156705379486084, "Pretrain/Loss (Raw)": 1.8754959106445312, "Pretrain/Step": 9151, "Pretrain/Step Time": 8.444894295185804} +{"Pretrain/Learning Rate": 2.7840238162167892e-05, "Pretrain/Loss": 2.0156216621398926, "Pretrain/Loss (Raw)": 1.9136463403701782, "Pretrain/Step": 9152, "Pretrain/Step Time": 8.442330999299884} +{"Pretrain/Learning Rate": 2.7836020440651232e-05, "Pretrain/Loss": 2.016862630844116, "Pretrain/Loss (Raw)": 1.8961409330368042, "Pretrain/Step": 9153, "Pretrain/Step Time": 8.440946595743299} +{"Pretrain/Learning Rate": 2.783180263735993e-05, "Pretrain/Loss": 2.0149052143096924, "Pretrain/Loss (Raw)": 1.966468095779419, "Pretrain/Step": 9154, "Pretrain/Step Time": 8.441965078935027} +{"Pretrain/Learning Rate": 2.7827584752415593e-05, "Pretrain/Loss": 2.0147738456726074, "Pretrain/Loss (Raw)": 1.971511960029602, "Pretrain/Step": 9155, "Pretrain/Step Time": 8.4404532071203} +{"Pretrain/Learning Rate": 2.782336678593984e-05, "Pretrain/Loss": 2.0139808654785156, "Pretrain/Loss (Raw)": 1.9706580638885498, "Pretrain/Step": 9156, "Pretrain/Step Time": 8.441435607150197} +{"Pretrain/Learning Rate": 2.7819148738054306e-05, "Pretrain/Loss": 2.0148203372955322, "Pretrain/Loss (Raw)": 1.8835206031799316, "Pretrain/Step": 9157, "Pretrain/Step Time": 8.441090682521462} +{"Pretrain/Learning Rate": 2.7814930608880597e-05, "Pretrain/Loss": 2.0144736766815186, "Pretrain/Loss (Raw)": 2.0032975673675537, "Pretrain/Step": 9158, "Pretrain/Step Time": 8.441094228997827} +{"Pretrain/Learning Rate": 2.781071239854035e-05, "Pretrain/Loss": 2.0157392024993896, "Pretrain/Loss (Raw)": 2.0423338413238525, "Pretrain/Step": 9159, "Pretrain/Step Time": 8.438368869945407} +{"Pretrain/Learning Rate": 2.780649410715519e-05, "Pretrain/Loss": 2.0139260292053223, "Pretrain/Loss (Raw)": 1.9267877340316772, "Pretrain/Step": 9160, "Pretrain/Step Time": 8.437459547072649} +{"Pretrain/Learning Rate": 2.7802275734846755e-05, "Pretrain/Loss": 2.0156161785125732, "Pretrain/Loss (Raw)": 1.910630464553833, "Pretrain/Step": 9161, "Pretrain/Step Time": 8.434674767777324} +{"Pretrain/Learning Rate": 2.7798057281736677e-05, "Pretrain/Loss": 2.010166645050049, "Pretrain/Loss (Raw)": 1.4033137559890747, "Pretrain/Step": 9162, "Pretrain/Step Time": 8.438771786168218} +{"Pretrain/Learning Rate": 2.7793838747946588e-05, "Pretrain/Loss": 2.007748603820801, "Pretrain/Loss (Raw)": 1.8746695518493652, "Pretrain/Step": 9163, "Pretrain/Step Time": 8.446077080443501} +{"Pretrain/Learning Rate": 2.778962013359812e-05, "Pretrain/Loss": 2.007744789123535, "Pretrain/Loss (Raw)": 1.9546476602554321, "Pretrain/Step": 9164, "Pretrain/Step Time": 8.446741908788681} +{"Pretrain/Learning Rate": 2.778540143881293e-05, "Pretrain/Loss": 2.010745048522949, "Pretrain/Loss (Raw)": 2.431319236755371, "Pretrain/Step": 9165, "Pretrain/Step Time": 8.44567179121077} +{"Pretrain/Learning Rate": 2.778118266371265e-05, "Pretrain/Loss": 2.0116968154907227, "Pretrain/Loss (Raw)": 2.1308791637420654, "Pretrain/Step": 9166, "Pretrain/Step Time": 8.438606217503548} +{"Pretrain/Learning Rate": 2.777696380841893e-05, "Pretrain/Loss": 2.0112221240997314, "Pretrain/Loss (Raw)": 1.8633345365524292, "Pretrain/Step": 9167, "Pretrain/Step Time": 8.436177445575595} +{"Pretrain/Learning Rate": 2.777274487305342e-05, "Pretrain/Loss": 2.0096912384033203, "Pretrain/Loss (Raw)": 2.0096521377563477, "Pretrain/Step": 9168, "Pretrain/Step Time": 8.439044654369354} +{"Pretrain/Learning Rate": 2.776852585773776e-05, "Pretrain/Loss": 2.0051584243774414, "Pretrain/Loss (Raw)": 1.9833931922912598, "Pretrain/Step": 9169, "Pretrain/Step Time": 8.436439184471965} +{"Pretrain/Learning Rate": 2.7764306762593613e-05, "Pretrain/Loss": 2.004650354385376, "Pretrain/Loss (Raw)": 2.0271172523498535, "Pretrain/Step": 9170, "Pretrain/Step Time": 8.435574827715755} +{"Pretrain/Learning Rate": 2.776008758774263e-05, "Pretrain/Loss": 2.005429744720459, "Pretrain/Loss (Raw)": 1.878169059753418, "Pretrain/Step": 9171, "Pretrain/Step Time": 8.438519097864628} +{"Pretrain/Learning Rate": 2.775586833330646e-05, "Pretrain/Loss": 2.004223108291626, "Pretrain/Loss (Raw)": 1.9691815376281738, "Pretrain/Step": 9172, "Pretrain/Step Time": 8.43722752481699} +{"Pretrain/Learning Rate": 2.7751648999406777e-05, "Pretrain/Loss": 2.004955768585205, "Pretrain/Loss (Raw)": 2.121673583984375, "Pretrain/Step": 9173, "Pretrain/Step Time": 8.44229213707149} +{"Pretrain/Learning Rate": 2.774742958616523e-05, "Pretrain/Loss": 2.0038580894470215, "Pretrain/Loss (Raw)": 1.9363069534301758, "Pretrain/Step": 9174, "Pretrain/Step Time": 8.442467469722033} +{"Pretrain/Learning Rate": 2.7743210093703494e-05, "Pretrain/Loss": 2.003986358642578, "Pretrain/Loss (Raw)": 1.9480185508728027, "Pretrain/Step": 9175, "Pretrain/Step Time": 8.44335213303566} +{"Pretrain/Learning Rate": 2.773899052214322e-05, "Pretrain/Loss": 2.003044366836548, "Pretrain/Loss (Raw)": 2.026093006134033, "Pretrain/Step": 9176, "Pretrain/Step Time": 8.443907326087356} +{"Pretrain/Learning Rate": 2.7734770871606087e-05, "Pretrain/Loss": 2.0022644996643066, "Pretrain/Loss (Raw)": 2.111940860748291, "Pretrain/Step": 9177, "Pretrain/Step Time": 8.442596271634102} +{"Pretrain/Learning Rate": 2.7730551142213767e-05, "Pretrain/Loss": 2.0024423599243164, "Pretrain/Loss (Raw)": 1.9614601135253906, "Pretrain/Step": 9178, "Pretrain/Step Time": 8.44270339794457} +{"Pretrain/Learning Rate": 2.7726331334087928e-05, "Pretrain/Loss": 2.0028085708618164, "Pretrain/Loss (Raw)": 1.9919439554214478, "Pretrain/Step": 9179, "Pretrain/Step Time": 8.44145186059177} +{"Pretrain/Learning Rate": 2.7722111447350253e-05, "Pretrain/Loss": 2.00746488571167, "Pretrain/Loss (Raw)": 2.6061158180236816, "Pretrain/Step": 9180, "Pretrain/Step Time": 8.446052942425013} +{"Pretrain/Learning Rate": 2.7717891482122405e-05, "Pretrain/Loss": 2.0079116821289062, "Pretrain/Loss (Raw)": 2.059861183166504, "Pretrain/Step": 9181, "Pretrain/Step Time": 8.44847759976983} +{"Pretrain/Learning Rate": 2.7713671438526073e-05, "Pretrain/Loss": 2.00717830657959, "Pretrain/Loss (Raw)": 2.10736083984375, "Pretrain/Step": 9182, "Pretrain/Step Time": 8.446638390421867} +{"Pretrain/Learning Rate": 2.7709451316682938e-05, "Pretrain/Loss": 2.006831645965576, "Pretrain/Loss (Raw)": 2.1109769344329834, "Pretrain/Step": 9183, "Pretrain/Step Time": 8.443145677447319} +{"Pretrain/Learning Rate": 2.770523111671469e-05, "Pretrain/Loss": 2.005732536315918, "Pretrain/Loss (Raw)": 1.9309427738189697, "Pretrain/Step": 9184, "Pretrain/Step Time": 8.443849621340632} +{"Pretrain/Learning Rate": 2.7701010838743007e-05, "Pretrain/Loss": 2.006925344467163, "Pretrain/Loss (Raw)": 2.1761794090270996, "Pretrain/Step": 9185, "Pretrain/Step Time": 8.44136375375092} +{"Pretrain/Learning Rate": 2.7696790482889578e-05, "Pretrain/Loss": 2.0075571537017822, "Pretrain/Loss (Raw)": 2.175992012023926, "Pretrain/Step": 9186, "Pretrain/Step Time": 8.439392423257232} +{"Pretrain/Learning Rate": 2.7692570049276095e-05, "Pretrain/Loss": 2.006596803665161, "Pretrain/Loss (Raw)": 1.900739073753357, "Pretrain/Step": 9187, "Pretrain/Step Time": 8.440129432827234} +{"Pretrain/Learning Rate": 2.7688349538024257e-05, "Pretrain/Loss": 2.006798267364502, "Pretrain/Loss (Raw)": 1.989933729171753, "Pretrain/Step": 9188, "Pretrain/Step Time": 8.443640986457467} +{"Pretrain/Learning Rate": 2.768412894925576e-05, "Pretrain/Loss": 2.0069875717163086, "Pretrain/Loss (Raw)": 2.1355621814727783, "Pretrain/Step": 9189, "Pretrain/Step Time": 8.444398883730173} +{"Pretrain/Learning Rate": 2.7679908283092286e-05, "Pretrain/Loss": 2.0050230026245117, "Pretrain/Loss (Raw)": 1.7503533363342285, "Pretrain/Step": 9190, "Pretrain/Step Time": 8.444240586832166} +{"Pretrain/Learning Rate": 2.7675687539655554e-05, "Pretrain/Loss": 2.0025999546051025, "Pretrain/Loss (Raw)": 1.8081578016281128, "Pretrain/Step": 9191, "Pretrain/Step Time": 8.437209352850914} +{"Pretrain/Learning Rate": 2.7671466719067253e-05, "Pretrain/Loss": 2.003499984741211, "Pretrain/Loss (Raw)": 2.0412847995758057, "Pretrain/Step": 9192, "Pretrain/Step Time": 8.435074327513576} +{"Pretrain/Learning Rate": 2.7667245821449094e-05, "Pretrain/Loss": 2.001707077026367, "Pretrain/Loss (Raw)": 1.9181468486785889, "Pretrain/Step": 9193, "Pretrain/Step Time": 8.43729467689991} +{"Pretrain/Learning Rate": 2.7663024846922787e-05, "Pretrain/Loss": 2.0023128986358643, "Pretrain/Loss (Raw)": 2.072675943374634, "Pretrain/Step": 9194, "Pretrain/Step Time": 8.438616881147027} +{"Pretrain/Learning Rate": 2.7658803795610026e-05, "Pretrain/Loss": 2.0039262771606445, "Pretrain/Loss (Raw)": 2.2550737857818604, "Pretrain/Step": 9195, "Pretrain/Step Time": 8.440110484138131} +{"Pretrain/Learning Rate": 2.765458266763254e-05, "Pretrain/Loss": 2.0021443367004395, "Pretrain/Loss (Raw)": 1.8530378341674805, "Pretrain/Step": 9196, "Pretrain/Step Time": 8.44069872610271} +{"Pretrain/Learning Rate": 2.765036146311203e-05, "Pretrain/Loss": 2.001741409301758, "Pretrain/Loss (Raw)": 1.9139840602874756, "Pretrain/Step": 9197, "Pretrain/Step Time": 8.443988231942058} +{"Pretrain/Learning Rate": 2.7646140182170216e-05, "Pretrain/Loss": 2.000107526779175, "Pretrain/Loss (Raw)": 2.0218472480773926, "Pretrain/Step": 9198, "Pretrain/Step Time": 8.448311917483807} +{"Pretrain/Learning Rate": 2.764191882492882e-05, "Pretrain/Loss": 1.9999496936798096, "Pretrain/Loss (Raw)": 2.0162291526794434, "Pretrain/Step": 9199, "Pretrain/Step Time": 8.4436518792063} +{"Pretrain/Learning Rate": 2.7637697391509555e-05, "Pretrain/Loss": 2.000239372253418, "Pretrain/Loss (Raw)": 2.0524885654449463, "Pretrain/Step": 9200, "Pretrain/Step Time": 8.448418702930212} +{"Pretrain/Learning Rate": 2.7633475882034145e-05, "Pretrain/Loss": 2.001223564147949, "Pretrain/Loss (Raw)": 2.0477728843688965, "Pretrain/Step": 9201, "Pretrain/Step Time": 8.440671062096953} +{"Pretrain/Learning Rate": 2.7629254296624308e-05, "Pretrain/Loss": 2.002042531967163, "Pretrain/Loss (Raw)": 1.8576314449310303, "Pretrain/Step": 9202, "Pretrain/Step Time": 8.442111862823367} +{"Pretrain/Learning Rate": 2.762503263540178e-05, "Pretrain/Loss": 2.0029549598693848, "Pretrain/Loss (Raw)": 2.1244306564331055, "Pretrain/Step": 9203, "Pretrain/Step Time": 8.441171117126942} +{"Pretrain/Learning Rate": 2.762081089848829e-05, "Pretrain/Loss": 2.0040817260742188, "Pretrain/Loss (Raw)": 2.009150981903076, "Pretrain/Step": 9204, "Pretrain/Step Time": 8.439348209649324} +{"Pretrain/Learning Rate": 2.7616589086005566e-05, "Pretrain/Loss": 2.003692388534546, "Pretrain/Loss (Raw)": 2.192159414291382, "Pretrain/Step": 9205, "Pretrain/Step Time": 8.440047279000282} +{"Pretrain/Learning Rate": 2.7612367198075334e-05, "Pretrain/Loss": 2.0044097900390625, "Pretrain/Loss (Raw)": 2.0663340091705322, "Pretrain/Step": 9206, "Pretrain/Step Time": 8.436150653287768} +{"Pretrain/Learning Rate": 2.760814523481934e-05, "Pretrain/Loss": 2.003713846206665, "Pretrain/Loss (Raw)": 1.9804589748382568, "Pretrain/Step": 9207, "Pretrain/Step Time": 8.437587482854724} +{"Pretrain/Learning Rate": 2.7603923196359315e-05, "Pretrain/Loss": 2.003709316253662, "Pretrain/Loss (Raw)": 2.0211191177368164, "Pretrain/Step": 9208, "Pretrain/Step Time": 8.430367546156049} +{"Pretrain/Learning Rate": 2.7599701082817e-05, "Pretrain/Loss": 2.0073890686035156, "Pretrain/Loss (Raw)": 2.0969812870025635, "Pretrain/Step": 9209, "Pretrain/Step Time": 8.430185316130519} +{"Pretrain/Learning Rate": 2.759547889431414e-05, "Pretrain/Loss": 2.009471893310547, "Pretrain/Loss (Raw)": 2.1861937046051025, "Pretrain/Step": 9210, "Pretrain/Step Time": 8.431186811998487} +{"Pretrain/Learning Rate": 2.759125663097248e-05, "Pretrain/Loss": 2.008327007293701, "Pretrain/Loss (Raw)": 1.9115407466888428, "Pretrain/Step": 9211, "Pretrain/Step Time": 8.428274592384696} +{"Pretrain/Learning Rate": 2.758703429291375e-05, "Pretrain/Loss": 2.008751153945923, "Pretrain/Loss (Raw)": 2.0284533500671387, "Pretrain/Step": 9212, "Pretrain/Step Time": 8.427535811439157} +{"Pretrain/Learning Rate": 2.7582811880259725e-05, "Pretrain/Loss": 2.0051076412200928, "Pretrain/Loss (Raw)": 1.7151670455932617, "Pretrain/Step": 9213, "Pretrain/Step Time": 8.42942899465561} +{"Pretrain/Learning Rate": 2.7578589393132125e-05, "Pretrain/Loss": 2.005908966064453, "Pretrain/Loss (Raw)": 2.166259288787842, "Pretrain/Step": 9214, "Pretrain/Step Time": 8.4287148155272} +{"Pretrain/Learning Rate": 2.7574366831652725e-05, "Pretrain/Loss": 2.0048882961273193, "Pretrain/Loss (Raw)": 1.8231757879257202, "Pretrain/Step": 9215, "Pretrain/Step Time": 8.429540861397982} +{"Pretrain/Learning Rate": 2.7570144195943277e-05, "Pretrain/Loss": 2.006453037261963, "Pretrain/Loss (Raw)": 2.0966594219207764, "Pretrain/Step": 9216, "Pretrain/Step Time": 8.430667512118816} +{"Pretrain/Learning Rate": 2.7565921486125524e-05, "Pretrain/Loss": 2.0056023597717285, "Pretrain/Loss (Raw)": 1.912134051322937, "Pretrain/Step": 9217, "Pretrain/Step Time": 8.426422780379653} +{"Pretrain/Learning Rate": 2.7561698702321236e-05, "Pretrain/Loss": 2.005500078201294, "Pretrain/Loss (Raw)": 1.8211740255355835, "Pretrain/Step": 9218, "Pretrain/Step Time": 8.429595828056335} +{"Pretrain/Learning Rate": 2.755747584465217e-05, "Pretrain/Loss": 2.005756139755249, "Pretrain/Loss (Raw)": 1.9804651737213135, "Pretrain/Step": 9219, "Pretrain/Step Time": 8.428174667060375} +{"Pretrain/Learning Rate": 2.755325291324009e-05, "Pretrain/Loss": 2.0058436393737793, "Pretrain/Loss (Raw)": 2.039315938949585, "Pretrain/Step": 9220, "Pretrain/Step Time": 8.428252087906003} +{"Pretrain/Learning Rate": 2.754902990820677e-05, "Pretrain/Loss": 2.006720542907715, "Pretrain/Loss (Raw)": 1.9579393863677979, "Pretrain/Step": 9221, "Pretrain/Step Time": 8.426422068849206} +{"Pretrain/Learning Rate": 2.7544806829673963e-05, "Pretrain/Loss": 2.01129412651062, "Pretrain/Loss (Raw)": 2.3467323780059814, "Pretrain/Step": 9222, "Pretrain/Step Time": 8.42856029421091} +{"Pretrain/Learning Rate": 2.7540583677763447e-05, "Pretrain/Loss": 2.0122504234313965, "Pretrain/Loss (Raw)": 2.114088296890259, "Pretrain/Step": 9223, "Pretrain/Step Time": 8.42976700887084} +{"Pretrain/Learning Rate": 2.7536360452596992e-05, "Pretrain/Loss": 2.010200262069702, "Pretrain/Loss (Raw)": 2.018605947494507, "Pretrain/Step": 9224, "Pretrain/Step Time": 8.431565746665001} +{"Pretrain/Learning Rate": 2.7532137154296374e-05, "Pretrain/Loss": 2.0101945400238037, "Pretrain/Loss (Raw)": 2.0588889122009277, "Pretrain/Step": 9225, "Pretrain/Step Time": 8.427635978907347} +{"Pretrain/Learning Rate": 2.7527913782983362e-05, "Pretrain/Loss": 2.0084452629089355, "Pretrain/Loss (Raw)": 1.8442699909210205, "Pretrain/Step": 9226, "Pretrain/Step Time": 8.42447367683053} +{"Pretrain/Learning Rate": 2.752369033877974e-05, "Pretrain/Loss": 2.0071911811828613, "Pretrain/Loss (Raw)": 1.9495885372161865, "Pretrain/Step": 9227, "Pretrain/Step Time": 8.424324525520205} +{"Pretrain/Learning Rate": 2.7519466821807283e-05, "Pretrain/Loss": 2.007265567779541, "Pretrain/Loss (Raw)": 2.06136155128479, "Pretrain/Step": 9228, "Pretrain/Step Time": 8.429914720356464} +{"Pretrain/Learning Rate": 2.7515243232187782e-05, "Pretrain/Loss": 2.006662368774414, "Pretrain/Loss (Raw)": 2.0129234790802, "Pretrain/Step": 9229, "Pretrain/Step Time": 8.43477514386177} +{"Pretrain/Learning Rate": 2.7511019570043006e-05, "Pretrain/Loss": 2.0048367977142334, "Pretrain/Loss (Raw)": 1.8127819299697876, "Pretrain/Step": 9230, "Pretrain/Step Time": 8.433423144742846} +{"Pretrain/Learning Rate": 2.7506795835494765e-05, "Pretrain/Loss": 2.0083775520324707, "Pretrain/Loss (Raw)": 2.2168567180633545, "Pretrain/Step": 9231, "Pretrain/Step Time": 8.431990124285221} +{"Pretrain/Learning Rate": 2.7502572028664825e-05, "Pretrain/Loss": 2.006256580352783, "Pretrain/Loss (Raw)": 1.9690521955490112, "Pretrain/Step": 9232, "Pretrain/Step Time": 8.434307251125574} +{"Pretrain/Learning Rate": 2.749834814967498e-05, "Pretrain/Loss": 2.0072789192199707, "Pretrain/Loss (Raw)": 2.0400726795196533, "Pretrain/Step": 9233, "Pretrain/Step Time": 8.42812000401318} +{"Pretrain/Learning Rate": 2.749412419864703e-05, "Pretrain/Loss": 2.010333776473999, "Pretrain/Loss (Raw)": 1.8876227140426636, "Pretrain/Step": 9234, "Pretrain/Step Time": 8.430841693654656} +{"Pretrain/Learning Rate": 2.748990017570277e-05, "Pretrain/Loss": 2.008814573287964, "Pretrain/Loss (Raw)": 1.90830659866333, "Pretrain/Step": 9235, "Pretrain/Step Time": 8.430989297106862} +{"Pretrain/Learning Rate": 2.7485676080964e-05, "Pretrain/Loss": 2.0063748359680176, "Pretrain/Loss (Raw)": 2.051713705062866, "Pretrain/Step": 9236, "Pretrain/Step Time": 8.429914059117436} +{"Pretrain/Learning Rate": 2.7481451914552502e-05, "Pretrain/Loss": 2.0058255195617676, "Pretrain/Loss (Raw)": 1.906184434890747, "Pretrain/Step": 9237, "Pretrain/Step Time": 8.432742865756154} +{"Pretrain/Learning Rate": 2.7477227676590093e-05, "Pretrain/Loss": 2.006352424621582, "Pretrain/Loss (Raw)": 2.0154356956481934, "Pretrain/Step": 9238, "Pretrain/Step Time": 8.42886702902615} +{"Pretrain/Learning Rate": 2.747300336719857e-05, "Pretrain/Loss": 2.0022361278533936, "Pretrain/Loss (Raw)": 1.9782485961914062, "Pretrain/Step": 9239, "Pretrain/Step Time": 8.433090614154935} +{"Pretrain/Learning Rate": 2.746877898649973e-05, "Pretrain/Loss": 2.002450704574585, "Pretrain/Loss (Raw)": 2.147966146469116, "Pretrain/Step": 9240, "Pretrain/Step Time": 8.428333438932896} +{"Pretrain/Learning Rate": 2.7464554534615394e-05, "Pretrain/Loss": 2.0008232593536377, "Pretrain/Loss (Raw)": 1.8035016059875488, "Pretrain/Step": 9241, "Pretrain/Step Time": 8.429041000083089} +{"Pretrain/Learning Rate": 2.7460330011667375e-05, "Pretrain/Loss": 2.0005483627319336, "Pretrain/Loss (Raw)": 1.9311095476150513, "Pretrain/Step": 9242, "Pretrain/Step Time": 8.429177299141884} +{"Pretrain/Learning Rate": 2.7456105417777463e-05, "Pretrain/Loss": 2.0020856857299805, "Pretrain/Loss (Raw)": 2.059826374053955, "Pretrain/Step": 9243, "Pretrain/Step Time": 8.428731756284833} +{"Pretrain/Learning Rate": 2.7451880753067482e-05, "Pretrain/Loss": 2.003187417984009, "Pretrain/Loss (Raw)": 2.1513490676879883, "Pretrain/Step": 9244, "Pretrain/Step Time": 8.429077396169305} +{"Pretrain/Learning Rate": 2.7447656017659252e-05, "Pretrain/Loss": 2.0049004554748535, "Pretrain/Loss (Raw)": 1.9915904998779297, "Pretrain/Step": 9245, "Pretrain/Step Time": 8.43426121585071} +{"Pretrain/Learning Rate": 2.7443431211674588e-05, "Pretrain/Loss": 2.0052883625030518, "Pretrain/Loss (Raw)": 1.955235481262207, "Pretrain/Step": 9246, "Pretrain/Step Time": 8.434075519442558} +{"Pretrain/Learning Rate": 2.7439206335235308e-05, "Pretrain/Loss": 2.005931854248047, "Pretrain/Loss (Raw)": 1.9708350896835327, "Pretrain/Step": 9247, "Pretrain/Step Time": 8.429619763046503} +{"Pretrain/Learning Rate": 2.7434981388463227e-05, "Pretrain/Loss": 2.004497528076172, "Pretrain/Loss (Raw)": 1.817901372909546, "Pretrain/Step": 9248, "Pretrain/Step Time": 8.431506788358092} +{"Pretrain/Learning Rate": 2.7430756371480175e-05, "Pretrain/Loss": 2.00268816947937, "Pretrain/Loss (Raw)": 1.8547710180282593, "Pretrain/Step": 9249, "Pretrain/Step Time": 8.431324863806367} +{"Pretrain/Learning Rate": 2.742653128440798e-05, "Pretrain/Loss": 2.004171371459961, "Pretrain/Loss (Raw)": 2.125371217727661, "Pretrain/Step": 9250, "Pretrain/Step Time": 8.431030029430985} +{"Pretrain/Learning Rate": 2.7422306127368463e-05, "Pretrain/Loss": 2.0039000511169434, "Pretrain/Loss (Raw)": 2.119673013687134, "Pretrain/Step": 9251, "Pretrain/Step Time": 8.434476094320416} +{"Pretrain/Learning Rate": 2.741808090048346e-05, "Pretrain/Loss": 2.0028023719787598, "Pretrain/Loss (Raw)": 1.9808744192123413, "Pretrain/Step": 9252, "Pretrain/Step Time": 8.428277710452676} +{"Pretrain/Learning Rate": 2.7413855603874798e-05, "Pretrain/Loss": 2.0048179626464844, "Pretrain/Loss (Raw)": 2.0353095531463623, "Pretrain/Step": 9253, "Pretrain/Step Time": 8.430147539824247} +{"Pretrain/Learning Rate": 2.7409630237664314e-05, "Pretrain/Loss": 2.0060179233551025, "Pretrain/Loss (Raw)": 2.18475079536438, "Pretrain/Step": 9254, "Pretrain/Step Time": 8.430172227323055} +{"Pretrain/Learning Rate": 2.7405404801973838e-05, "Pretrain/Loss": 2.006805896759033, "Pretrain/Loss (Raw)": 2.1654794216156006, "Pretrain/Step": 9255, "Pretrain/Step Time": 8.4334481600672} +{"Pretrain/Learning Rate": 2.740117929692521e-05, "Pretrain/Loss": 2.006610631942749, "Pretrain/Loss (Raw)": 1.9528270959854126, "Pretrain/Step": 9256, "Pretrain/Step Time": 8.440956192091107} +{"Pretrain/Learning Rate": 2.7396953722640267e-05, "Pretrain/Loss": 2.0060415267944336, "Pretrain/Loss (Raw)": 2.050253391265869, "Pretrain/Step": 9257, "Pretrain/Step Time": 8.439664898440242} +{"Pretrain/Learning Rate": 2.739272807924086e-05, "Pretrain/Loss": 2.0071983337402344, "Pretrain/Loss (Raw)": 2.049091339111328, "Pretrain/Step": 9258, "Pretrain/Step Time": 8.436001310124993} +{"Pretrain/Learning Rate": 2.7388502366848817e-05, "Pretrain/Loss": 2.0056240558624268, "Pretrain/Loss (Raw)": 1.8915131092071533, "Pretrain/Step": 9259, "Pretrain/Step Time": 8.438002889975905} +{"Pretrain/Learning Rate": 2.7384276585586e-05, "Pretrain/Loss": 2.0026698112487793, "Pretrain/Loss (Raw)": 1.7186392545700073, "Pretrain/Step": 9260, "Pretrain/Step Time": 8.440674785524607} +{"Pretrain/Learning Rate": 2.7380050735574242e-05, "Pretrain/Loss": 2.0046353340148926, "Pretrain/Loss (Raw)": 2.0553860664367676, "Pretrain/Step": 9261, "Pretrain/Step Time": 8.434139819815755} +{"Pretrain/Learning Rate": 2.7375824816935395e-05, "Pretrain/Loss": 2.005228042602539, "Pretrain/Loss (Raw)": 2.12424373626709, "Pretrain/Step": 9262, "Pretrain/Step Time": 8.433780299499631} +{"Pretrain/Learning Rate": 2.737159882979133e-05, "Pretrain/Loss": 2.0053093433380127, "Pretrain/Loss (Raw)": 1.9929015636444092, "Pretrain/Step": 9263, "Pretrain/Step Time": 8.438035929575562} +{"Pretrain/Learning Rate": 2.736737277426387e-05, "Pretrain/Loss": 2.0076422691345215, "Pretrain/Loss (Raw)": 2.1235435009002686, "Pretrain/Step": 9264, "Pretrain/Step Time": 8.438346967101097} +{"Pretrain/Learning Rate": 2.736314665047489e-05, "Pretrain/Loss": 2.0083374977111816, "Pretrain/Loss (Raw)": 2.0640270709991455, "Pretrain/Step": 9265, "Pretrain/Step Time": 8.434729909524322} +{"Pretrain/Learning Rate": 2.7358920458546244e-05, "Pretrain/Loss": 2.008047342300415, "Pretrain/Loss (Raw)": 1.8726599216461182, "Pretrain/Step": 9266, "Pretrain/Step Time": 8.43433327972889} +{"Pretrain/Learning Rate": 2.7354694198599784e-05, "Pretrain/Loss": 2.007305145263672, "Pretrain/Loss (Raw)": 2.0263848304748535, "Pretrain/Step": 9267, "Pretrain/Step Time": 8.435840211808681} +{"Pretrain/Learning Rate": 2.735046787075739e-05, "Pretrain/Loss": 2.0042285919189453, "Pretrain/Loss (Raw)": 1.6794490814208984, "Pretrain/Step": 9268, "Pretrain/Step Time": 8.436192564666271} +{"Pretrain/Learning Rate": 2.73462414751409e-05, "Pretrain/Loss": 2.0013020038604736, "Pretrain/Loss (Raw)": 1.7850648164749146, "Pretrain/Step": 9269, "Pretrain/Step Time": 8.432598430663347} +{"Pretrain/Learning Rate": 2.734201501187219e-05, "Pretrain/Loss": 2.0021512508392334, "Pretrain/Loss (Raw)": 2.052213191986084, "Pretrain/Step": 9270, "Pretrain/Step Time": 8.433858796954155} +{"Pretrain/Learning Rate": 2.7337788481073133e-05, "Pretrain/Loss": 1.998410940170288, "Pretrain/Loss (Raw)": 1.8674007654190063, "Pretrain/Step": 9271, "Pretrain/Step Time": 8.425196588039398} +{"Pretrain/Learning Rate": 2.7333561882865587e-05, "Pretrain/Loss": 1.9981153011322021, "Pretrain/Loss (Raw)": 1.9924994707107544, "Pretrain/Step": 9272, "Pretrain/Step Time": 8.426543103531003} +{"Pretrain/Learning Rate": 2.7329335217371445e-05, "Pretrain/Loss": 1.9993051290512085, "Pretrain/Loss (Raw)": 2.188199520111084, "Pretrain/Step": 9273, "Pretrain/Step Time": 8.433737767860293} +{"Pretrain/Learning Rate": 2.7325108484712546e-05, "Pretrain/Loss": 1.9982231855392456, "Pretrain/Loss (Raw)": 1.9678120613098145, "Pretrain/Step": 9274, "Pretrain/Step Time": 8.426952382549644} +{"Pretrain/Learning Rate": 2.732088168501079e-05, "Pretrain/Loss": 1.9984841346740723, "Pretrain/Loss (Raw)": 1.9573854207992554, "Pretrain/Step": 9275, "Pretrain/Step Time": 8.42739931307733} +{"Pretrain/Learning Rate": 2.7316654818388048e-05, "Pretrain/Loss": 1.997628927230835, "Pretrain/Loss (Raw)": 1.9526572227478027, "Pretrain/Step": 9276, "Pretrain/Step Time": 8.429107412695885} +{"Pretrain/Learning Rate": 2.7312427884966196e-05, "Pretrain/Loss": 1.9976779222488403, "Pretrain/Loss (Raw)": 1.9293572902679443, "Pretrain/Step": 9277, "Pretrain/Step Time": 8.424233701080084} +{"Pretrain/Learning Rate": 2.7308200884867114e-05, "Pretrain/Loss": 1.9977545738220215, "Pretrain/Loss (Raw)": 2.01574969291687, "Pretrain/Step": 9278, "Pretrain/Step Time": 8.424784673377872} +{"Pretrain/Learning Rate": 2.7303973818212693e-05, "Pretrain/Loss": 1.9990370273590088, "Pretrain/Loss (Raw)": 2.039628267288208, "Pretrain/Step": 9279, "Pretrain/Step Time": 8.429699376225471} +{"Pretrain/Learning Rate": 2.7299746685124806e-05, "Pretrain/Loss": 2.000455379486084, "Pretrain/Loss (Raw)": 2.095191717147827, "Pretrain/Step": 9280, "Pretrain/Step Time": 8.429521473124623} +{"Pretrain/Learning Rate": 2.7295519485725347e-05, "Pretrain/Loss": 2.0017483234405518, "Pretrain/Loss (Raw)": 2.0616390705108643, "Pretrain/Step": 9281, "Pretrain/Step Time": 8.431997615844011} +{"Pretrain/Learning Rate": 2.72912922201362e-05, "Pretrain/Loss": 2.0032730102539062, "Pretrain/Loss (Raw)": 2.1616294384002686, "Pretrain/Step": 9282, "Pretrain/Step Time": 8.430657047778368} +{"Pretrain/Learning Rate": 2.7287064888479252e-05, "Pretrain/Loss": 2.0040178298950195, "Pretrain/Loss (Raw)": 2.0668458938598633, "Pretrain/Step": 9283, "Pretrain/Step Time": 8.4342977758497} +{"Pretrain/Learning Rate": 2.7282837490876413e-05, "Pretrain/Loss": 2.0035035610198975, "Pretrain/Loss (Raw)": 1.904827356338501, "Pretrain/Step": 9284, "Pretrain/Step Time": 8.435386646538973} +{"Pretrain/Learning Rate": 2.7278610027449553e-05, "Pretrain/Loss": 2.0049116611480713, "Pretrain/Loss (Raw)": 2.0637638568878174, "Pretrain/Step": 9285, "Pretrain/Step Time": 8.431373899802566} +{"Pretrain/Learning Rate": 2.7274382498320584e-05, "Pretrain/Loss": 2.005202293395996, "Pretrain/Loss (Raw)": 2.040512800216675, "Pretrain/Step": 9286, "Pretrain/Step Time": 8.430446058511734} +{"Pretrain/Learning Rate": 2.7270154903611393e-05, "Pretrain/Loss": 2.0056722164154053, "Pretrain/Loss (Raw)": 2.102461099624634, "Pretrain/Step": 9287, "Pretrain/Step Time": 8.429421788081527} +{"Pretrain/Learning Rate": 2.7265927243443896e-05, "Pretrain/Loss": 2.005570888519287, "Pretrain/Loss (Raw)": 1.9138399362564087, "Pretrain/Step": 9288, "Pretrain/Step Time": 8.431682283058763} +{"Pretrain/Learning Rate": 2.726169951793998e-05, "Pretrain/Loss": 2.0067858695983887, "Pretrain/Loss (Raw)": 2.0661447048187256, "Pretrain/Step": 9289, "Pretrain/Step Time": 8.433772210031748} +{"Pretrain/Learning Rate": 2.725747172722155e-05, "Pretrain/Loss": 2.0141494274139404, "Pretrain/Loss (Raw)": 2.3458473682403564, "Pretrain/Step": 9290, "Pretrain/Step Time": 8.43127365782857} +{"Pretrain/Learning Rate": 2.7253243871410518e-05, "Pretrain/Loss": 2.0152101516723633, "Pretrain/Loss (Raw)": 2.010420083999634, "Pretrain/Step": 9291, "Pretrain/Step Time": 8.426159393042326} +{"Pretrain/Learning Rate": 2.7249015950628787e-05, "Pretrain/Loss": 2.013781785964966, "Pretrain/Loss (Raw)": 1.7718334197998047, "Pretrain/Step": 9292, "Pretrain/Step Time": 8.424003379419446} +{"Pretrain/Learning Rate": 2.7244787964998265e-05, "Pretrain/Loss": 2.0087523460388184, "Pretrain/Loss (Raw)": 1.7875584363937378, "Pretrain/Step": 9293, "Pretrain/Step Time": 8.423453832045197} +{"Pretrain/Learning Rate": 2.7240559914640867e-05, "Pretrain/Loss": 2.007676124572754, "Pretrain/Loss (Raw)": 1.9931269884109497, "Pretrain/Step": 9294, "Pretrain/Step Time": 8.428121861070395} +{"Pretrain/Learning Rate": 2.72363317996785e-05, "Pretrain/Loss": 2.009084463119507, "Pretrain/Loss (Raw)": 2.0435853004455566, "Pretrain/Step": 9295, "Pretrain/Step Time": 8.430406471714377} +{"Pretrain/Learning Rate": 2.723210362023308e-05, "Pretrain/Loss": 2.008368968963623, "Pretrain/Loss (Raw)": 1.9180738925933838, "Pretrain/Step": 9296, "Pretrain/Step Time": 8.431297121569514} +{"Pretrain/Learning Rate": 2.7227875376426533e-05, "Pretrain/Loss": 2.0086283683776855, "Pretrain/Loss (Raw)": 2.0166094303131104, "Pretrain/Step": 9297, "Pretrain/Step Time": 8.434051973745227} +{"Pretrain/Learning Rate": 2.7223647068380763e-05, "Pretrain/Loss": 2.0058512687683105, "Pretrain/Loss (Raw)": 1.6716276407241821, "Pretrain/Step": 9298, "Pretrain/Step Time": 8.433582397177815} +{"Pretrain/Learning Rate": 2.7219418696217703e-05, "Pretrain/Loss": 2.006037950515747, "Pretrain/Loss (Raw)": 1.9020682573318481, "Pretrain/Step": 9299, "Pretrain/Step Time": 8.434872990474105} +{"Pretrain/Learning Rate": 2.721519026005927e-05, "Pretrain/Loss": 2.005331516265869, "Pretrain/Loss (Raw)": 1.8787822723388672, "Pretrain/Step": 9300, "Pretrain/Step Time": 8.43838688544929} +{"Pretrain/Learning Rate": 2.721096176002738e-05, "Pretrain/Loss": 2.0060346126556396, "Pretrain/Loss (Raw)": 2.2116379737854004, "Pretrain/Step": 9301, "Pretrain/Step Time": 8.43535616621375} +{"Pretrain/Learning Rate": 2.7206733196243973e-05, "Pretrain/Loss": 2.0061235427856445, "Pretrain/Loss (Raw)": 1.9476909637451172, "Pretrain/Step": 9302, "Pretrain/Step Time": 8.429122135043144} +{"Pretrain/Learning Rate": 2.7202504568830966e-05, "Pretrain/Loss": 2.0063834190368652, "Pretrain/Loss (Raw)": 1.9812716245651245, "Pretrain/Step": 9303, "Pretrain/Step Time": 8.430218767374754} +{"Pretrain/Learning Rate": 2.7198275877910288e-05, "Pretrain/Loss": 2.006937026977539, "Pretrain/Loss (Raw)": 2.0969738960266113, "Pretrain/Step": 9304, "Pretrain/Step Time": 8.431323494762182} +{"Pretrain/Learning Rate": 2.719404712360389e-05, "Pretrain/Loss": 2.0051960945129395, "Pretrain/Loss (Raw)": 1.8890926837921143, "Pretrain/Step": 9305, "Pretrain/Step Time": 8.433189699426293} +{"Pretrain/Learning Rate": 2.7189818306033676e-05, "Pretrain/Loss": 2.0043511390686035, "Pretrain/Loss (Raw)": 1.8533306121826172, "Pretrain/Step": 9306, "Pretrain/Step Time": 8.431766355410218} +{"Pretrain/Learning Rate": 2.7185589425321602e-05, "Pretrain/Loss": 2.005539894104004, "Pretrain/Loss (Raw)": 2.1441104412078857, "Pretrain/Step": 9307, "Pretrain/Step Time": 8.432183492928743} +{"Pretrain/Learning Rate": 2.7181360481589592e-05, "Pretrain/Loss": 1.9993774890899658, "Pretrain/Loss (Raw)": 1.8173245191574097, "Pretrain/Step": 9308, "Pretrain/Step Time": 8.42906796373427} +{"Pretrain/Learning Rate": 2.7177131474959592e-05, "Pretrain/Loss": 1.998410940170288, "Pretrain/Loss (Raw)": 1.9361273050308228, "Pretrain/Step": 9309, "Pretrain/Step Time": 8.427135828882456} +{"Pretrain/Learning Rate": 2.717290240555354e-05, "Pretrain/Loss": 1.99659264087677, "Pretrain/Loss (Raw)": 1.8746193647384644, "Pretrain/Step": 9310, "Pretrain/Step Time": 8.432613760232925} +{"Pretrain/Learning Rate": 2.7168673273493385e-05, "Pretrain/Loss": 1.9955953359603882, "Pretrain/Loss (Raw)": 1.9833277463912964, "Pretrain/Step": 9311, "Pretrain/Step Time": 8.434911858290434} +{"Pretrain/Learning Rate": 2.716444407890106e-05, "Pretrain/Loss": 1.996216058731079, "Pretrain/Loss (Raw)": 2.0103936195373535, "Pretrain/Step": 9312, "Pretrain/Step Time": 8.433585576713085} +{"Pretrain/Learning Rate": 2.7160214821898518e-05, "Pretrain/Loss": 1.994980812072754, "Pretrain/Loss (Raw)": 2.0180587768554688, "Pretrain/Step": 9313, "Pretrain/Step Time": 8.434842854738235} +{"Pretrain/Learning Rate": 2.7155985502607702e-05, "Pretrain/Loss": 1.9936838150024414, "Pretrain/Loss (Raw)": 2.009979009628296, "Pretrain/Step": 9314, "Pretrain/Step Time": 8.434496497735381} +{"Pretrain/Learning Rate": 2.7151756121150563e-05, "Pretrain/Loss": 1.9940721988677979, "Pretrain/Loss (Raw)": 1.950452446937561, "Pretrain/Step": 9315, "Pretrain/Step Time": 8.43736313097179} +{"Pretrain/Learning Rate": 2.714752667764906e-05, "Pretrain/Loss": 1.9943022727966309, "Pretrain/Loss (Raw)": 2.019387722015381, "Pretrain/Step": 9316, "Pretrain/Step Time": 8.43821812979877} +{"Pretrain/Learning Rate": 2.714329717222513e-05, "Pretrain/Loss": 1.993786334991455, "Pretrain/Loss (Raw)": 2.0695090293884277, "Pretrain/Step": 9317, "Pretrain/Step Time": 8.437786540016532} +{"Pretrain/Learning Rate": 2.713906760500074e-05, "Pretrain/Loss": 1.9950271844863892, "Pretrain/Loss (Raw)": 1.9091979265213013, "Pretrain/Step": 9318, "Pretrain/Step Time": 8.435728378593922} +{"Pretrain/Learning Rate": 2.7134837976097842e-05, "Pretrain/Loss": 1.9965208768844604, "Pretrain/Loss (Raw)": 1.9993549585342407, "Pretrain/Step": 9319, "Pretrain/Step Time": 8.435726853087544} +{"Pretrain/Learning Rate": 2.7130608285638398e-05, "Pretrain/Loss": 1.9968430995941162, "Pretrain/Loss (Raw)": 2.082519769668579, "Pretrain/Step": 9320, "Pretrain/Step Time": 8.436838069930673} +{"Pretrain/Learning Rate": 2.7126378533744373e-05, "Pretrain/Loss": 1.997377872467041, "Pretrain/Loss (Raw)": 1.986582636833191, "Pretrain/Step": 9321, "Pretrain/Step Time": 8.438459919765592} +{"Pretrain/Learning Rate": 2.7122148720537715e-05, "Pretrain/Loss": 1.9988601207733154, "Pretrain/Loss (Raw)": 2.262420415878296, "Pretrain/Step": 9322, "Pretrain/Step Time": 8.439256377518177} +{"Pretrain/Learning Rate": 2.7117918846140394e-05, "Pretrain/Loss": 1.9975086450576782, "Pretrain/Loss (Raw)": 2.0820906162261963, "Pretrain/Step": 9323, "Pretrain/Step Time": 8.435439171269536} +{"Pretrain/Learning Rate": 2.711368891067438e-05, "Pretrain/Loss": 1.9995405673980713, "Pretrain/Loss (Raw)": 2.11311411857605, "Pretrain/Step": 9324, "Pretrain/Step Time": 8.436495481058955} +{"Pretrain/Learning Rate": 2.710945891426163e-05, "Pretrain/Loss": 1.9992969036102295, "Pretrain/Loss (Raw)": 1.8827860355377197, "Pretrain/Step": 9325, "Pretrain/Step Time": 8.43300668336451} +{"Pretrain/Learning Rate": 2.7105228857024127e-05, "Pretrain/Loss": 2.000460147857666, "Pretrain/Loss (Raw)": 2.170790672302246, "Pretrain/Step": 9326, "Pretrain/Step Time": 8.437768161296844} +{"Pretrain/Learning Rate": 2.7100998739083827e-05, "Pretrain/Loss": 1.9940166473388672, "Pretrain/Loss (Raw)": 1.1914242506027222, "Pretrain/Step": 9327, "Pretrain/Step Time": 8.44075707346201} +{"Pretrain/Learning Rate": 2.7096768560562712e-05, "Pretrain/Loss": 1.994457483291626, "Pretrain/Loss (Raw)": 2.10892653465271, "Pretrain/Step": 9328, "Pretrain/Step Time": 8.437645209953189} +{"Pretrain/Learning Rate": 2.7092538321582756e-05, "Pretrain/Loss": 1.9939312934875488, "Pretrain/Loss (Raw)": 1.9804021120071411, "Pretrain/Step": 9329, "Pretrain/Step Time": 8.442769760265946} +{"Pretrain/Learning Rate": 2.708830802226593e-05, "Pretrain/Loss": 1.9951210021972656, "Pretrain/Loss (Raw)": 2.009925365447998, "Pretrain/Step": 9330, "Pretrain/Step Time": 8.441100992262363} +{"Pretrain/Learning Rate": 2.708407766273422e-05, "Pretrain/Loss": 1.9929265975952148, "Pretrain/Loss (Raw)": 1.8435500860214233, "Pretrain/Step": 9331, "Pretrain/Step Time": 8.441308319568634} +{"Pretrain/Learning Rate": 2.707984724310959e-05, "Pretrain/Loss": 1.9927386045455933, "Pretrain/Loss (Raw)": 1.9850800037384033, "Pretrain/Step": 9332, "Pretrain/Step Time": 8.444938831031322} +{"Pretrain/Learning Rate": 2.7075616763514034e-05, "Pretrain/Loss": 1.9911584854125977, "Pretrain/Loss (Raw)": 1.9899040460586548, "Pretrain/Step": 9333, "Pretrain/Step Time": 8.44513158686459} +{"Pretrain/Learning Rate": 2.7071386224069533e-05, "Pretrain/Loss": 1.991542100906372, "Pretrain/Loss (Raw)": 2.1154556274414062, "Pretrain/Step": 9334, "Pretrain/Step Time": 8.445600347593427} +{"Pretrain/Learning Rate": 2.7067155624898073e-05, "Pretrain/Loss": 1.993076205253601, "Pretrain/Loss (Raw)": 2.1768171787261963, "Pretrain/Step": 9335, "Pretrain/Step Time": 8.444111656397581} +{"Pretrain/Learning Rate": 2.706292496612164e-05, "Pretrain/Loss": 1.992437720298767, "Pretrain/Loss (Raw)": 1.939375877380371, "Pretrain/Step": 9336, "Pretrain/Step Time": 8.4446612149477} +{"Pretrain/Learning Rate": 2.7058694247862216e-05, "Pretrain/Loss": 1.9899394512176514, "Pretrain/Loss (Raw)": 1.7771971225738525, "Pretrain/Step": 9337, "Pretrain/Step Time": 8.445062836632133} +{"Pretrain/Learning Rate": 2.705446347024179e-05, "Pretrain/Loss": 1.9872840642929077, "Pretrain/Loss (Raw)": 1.8463224172592163, "Pretrain/Step": 9338, "Pretrain/Step Time": 8.442592609673738} +{"Pretrain/Learning Rate": 2.7050232633382366e-05, "Pretrain/Loss": 1.9880750179290771, "Pretrain/Loss (Raw)": 2.012788772583008, "Pretrain/Step": 9339, "Pretrain/Step Time": 8.445937687531114} +{"Pretrain/Learning Rate": 2.704600173740593e-05, "Pretrain/Loss": 1.987870216369629, "Pretrain/Loss (Raw)": 2.0022244453430176, "Pretrain/Step": 9340, "Pretrain/Step Time": 8.446161048486829} +{"Pretrain/Learning Rate": 2.7041770782434468e-05, "Pretrain/Loss": 1.990852952003479, "Pretrain/Loss (Raw)": 2.096952438354492, "Pretrain/Step": 9341, "Pretrain/Step Time": 8.445191495120525} +{"Pretrain/Learning Rate": 2.7037539768589988e-05, "Pretrain/Loss": 1.9899237155914307, "Pretrain/Loss (Raw)": 2.0473456382751465, "Pretrain/Step": 9342, "Pretrain/Step Time": 8.448401940986514} +{"Pretrain/Learning Rate": 2.703330869599449e-05, "Pretrain/Loss": 1.9909523725509644, "Pretrain/Loss (Raw)": 1.9548269510269165, "Pretrain/Step": 9343, "Pretrain/Step Time": 8.444679545238614} +{"Pretrain/Learning Rate": 2.7029077564769967e-05, "Pretrain/Loss": 1.993009090423584, "Pretrain/Loss (Raw)": 2.359929323196411, "Pretrain/Step": 9344, "Pretrain/Step Time": 8.444656731560826} +{"Pretrain/Learning Rate": 2.702484637503842e-05, "Pretrain/Loss": 1.992116093635559, "Pretrain/Loss (Raw)": 1.7978132963180542, "Pretrain/Step": 9345, "Pretrain/Step Time": 8.443865122273564} +{"Pretrain/Learning Rate": 2.7020615126921854e-05, "Pretrain/Loss": 1.9931271076202393, "Pretrain/Loss (Raw)": 1.9506044387817383, "Pretrain/Step": 9346, "Pretrain/Step Time": 8.445083290338516} +{"Pretrain/Learning Rate": 2.7016383820542278e-05, "Pretrain/Loss": 1.9916024208068848, "Pretrain/Loss (Raw)": 1.7852857112884521, "Pretrain/Step": 9347, "Pretrain/Step Time": 8.445643495768309} +{"Pretrain/Learning Rate": 2.70121524560217e-05, "Pretrain/Loss": 1.991229772567749, "Pretrain/Loss (Raw)": 1.9916150569915771, "Pretrain/Step": 9348, "Pretrain/Step Time": 8.445020576938987} +{"Pretrain/Learning Rate": 2.7007921033482118e-05, "Pretrain/Loss": 1.9902634620666504, "Pretrain/Loss (Raw)": 1.8342453241348267, "Pretrain/Step": 9349, "Pretrain/Step Time": 8.448717035353184} +{"Pretrain/Learning Rate": 2.700368955304555e-05, "Pretrain/Loss": 1.990781545639038, "Pretrain/Loss (Raw)": 2.4130752086639404, "Pretrain/Step": 9350, "Pretrain/Step Time": 8.443968137726188} +{"Pretrain/Learning Rate": 2.6999458014834006e-05, "Pretrain/Loss": 1.9879344701766968, "Pretrain/Loss (Raw)": 1.749644160270691, "Pretrain/Step": 9351, "Pretrain/Step Time": 8.442054811865091} +{"Pretrain/Learning Rate": 2.69952264189695e-05, "Pretrain/Loss": 1.9832448959350586, "Pretrain/Loss (Raw)": 1.4183334112167358, "Pretrain/Step": 9352, "Pretrain/Step Time": 8.440706353634596} +{"Pretrain/Learning Rate": 2.6990994765574053e-05, "Pretrain/Loss": 1.9835216999053955, "Pretrain/Loss (Raw)": 2.0943305492401123, "Pretrain/Step": 9353, "Pretrain/Step Time": 8.445321129634976} +{"Pretrain/Learning Rate": 2.6986763054769665e-05, "Pretrain/Loss": 1.9844568967819214, "Pretrain/Loss (Raw)": 1.9639703035354614, "Pretrain/Step": 9354, "Pretrain/Step Time": 8.443675899878144} +{"Pretrain/Learning Rate": 2.6982531286678368e-05, "Pretrain/Loss": 1.9860228300094604, "Pretrain/Loss (Raw)": 2.150031328201294, "Pretrain/Step": 9355, "Pretrain/Step Time": 8.44876592233777} +{"Pretrain/Learning Rate": 2.697829946142218e-05, "Pretrain/Loss": 1.987032175064087, "Pretrain/Loss (Raw)": 2.190542697906494, "Pretrain/Step": 9356, "Pretrain/Step Time": 8.442789712920785} +{"Pretrain/Learning Rate": 2.697406757912312e-05, "Pretrain/Loss": 1.9862780570983887, "Pretrain/Loss (Raw)": 1.9164180755615234, "Pretrain/Step": 9357, "Pretrain/Step Time": 8.440507298335433} +{"Pretrain/Learning Rate": 2.6969835639903217e-05, "Pretrain/Loss": 1.9876068830490112, "Pretrain/Loss (Raw)": 1.9828675985336304, "Pretrain/Step": 9358, "Pretrain/Step Time": 8.445088371634483} +{"Pretrain/Learning Rate": 2.6965603643884492e-05, "Pretrain/Loss": 1.9844465255737305, "Pretrain/Loss (Raw)": 1.8123258352279663, "Pretrain/Step": 9359, "Pretrain/Step Time": 8.444553723558784} +{"Pretrain/Learning Rate": 2.6961371591188966e-05, "Pretrain/Loss": 1.983818769454956, "Pretrain/Loss (Raw)": 1.8887079954147339, "Pretrain/Step": 9360, "Pretrain/Step Time": 8.440533552318811} +{"Pretrain/Learning Rate": 2.6957139481938677e-05, "Pretrain/Loss": 1.9841068983078003, "Pretrain/Loss (Raw)": 2.0769402980804443, "Pretrain/Step": 9361, "Pretrain/Step Time": 8.441412139683962} +{"Pretrain/Learning Rate": 2.6952907316255648e-05, "Pretrain/Loss": 1.9842462539672852, "Pretrain/Loss (Raw)": 1.9054592847824097, "Pretrain/Step": 9362, "Pretrain/Step Time": 8.438356285914779} +{"Pretrain/Learning Rate": 2.6948675094261923e-05, "Pretrain/Loss": 1.985274314880371, "Pretrain/Loss (Raw)": 2.0398974418640137, "Pretrain/Step": 9363, "Pretrain/Step Time": 8.439928887411952} +{"Pretrain/Learning Rate": 2.6944442816079518e-05, "Pretrain/Loss": 1.9841707944869995, "Pretrain/Loss (Raw)": 1.9104628562927246, "Pretrain/Step": 9364, "Pretrain/Step Time": 8.439249204471707} +{"Pretrain/Learning Rate": 2.6940210481830475e-05, "Pretrain/Loss": 1.984731912612915, "Pretrain/Loss (Raw)": 1.9780163764953613, "Pretrain/Step": 9365, "Pretrain/Step Time": 8.440367316827178} +{"Pretrain/Learning Rate": 2.6935978091636826e-05, "Pretrain/Loss": 1.9840291738510132, "Pretrain/Loss (Raw)": 1.9254871606826782, "Pretrain/Step": 9366, "Pretrain/Step Time": 8.441449349746108} +{"Pretrain/Learning Rate": 2.6931745645620616e-05, "Pretrain/Loss": 1.9837322235107422, "Pretrain/Loss (Raw)": 1.9402304887771606, "Pretrain/Step": 9367, "Pretrain/Step Time": 8.439469577744603} +{"Pretrain/Learning Rate": 2.6927513143903893e-05, "Pretrain/Loss": 1.9797158241271973, "Pretrain/Loss (Raw)": 1.633864402770996, "Pretrain/Step": 9368, "Pretrain/Step Time": 8.440191637724638} +{"Pretrain/Learning Rate": 2.6923280586608672e-05, "Pretrain/Loss": 1.9815043210983276, "Pretrain/Loss (Raw)": 2.0324313640594482, "Pretrain/Step": 9369, "Pretrain/Step Time": 8.439429610967636} +{"Pretrain/Learning Rate": 2.691904797385702e-05, "Pretrain/Loss": 1.9826977252960205, "Pretrain/Loss (Raw)": 2.083869218826294, "Pretrain/Step": 9370, "Pretrain/Step Time": 8.441132176667452} +{"Pretrain/Learning Rate": 2.691481530577097e-05, "Pretrain/Loss": 1.9825100898742676, "Pretrain/Loss (Raw)": 2.0358049869537354, "Pretrain/Step": 9371, "Pretrain/Step Time": 8.447176517918706} +{"Pretrain/Learning Rate": 2.6910582582472564e-05, "Pretrain/Loss": 1.9817733764648438, "Pretrain/Loss (Raw)": 2.057041645050049, "Pretrain/Step": 9372, "Pretrain/Step Time": 8.443686926737428} +{"Pretrain/Learning Rate": 2.6906349804083868e-05, "Pretrain/Loss": 1.9805669784545898, "Pretrain/Loss (Raw)": 1.8371893167495728, "Pretrain/Step": 9373, "Pretrain/Step Time": 8.440821008756757} +{"Pretrain/Learning Rate": 2.6902116970726915e-05, "Pretrain/Loss": 1.9797970056533813, "Pretrain/Loss (Raw)": 1.8566780090332031, "Pretrain/Step": 9374, "Pretrain/Step Time": 8.443606251850724} +{"Pretrain/Learning Rate": 2.6897884082523762e-05, "Pretrain/Loss": 1.9808590412139893, "Pretrain/Loss (Raw)": 2.106760263442993, "Pretrain/Step": 9375, "Pretrain/Step Time": 8.448238510638475} +{"Pretrain/Learning Rate": 2.6893651139596453e-05, "Pretrain/Loss": 1.9826356172561646, "Pretrain/Loss (Raw)": 2.0453169345855713, "Pretrain/Step": 9376, "Pretrain/Step Time": 8.442566690966487} +{"Pretrain/Learning Rate": 2.6889418142067046e-05, "Pretrain/Loss": 1.9830834865570068, "Pretrain/Loss (Raw)": 1.9120895862579346, "Pretrain/Step": 9377, "Pretrain/Step Time": 8.442623691633344} +{"Pretrain/Learning Rate": 2.6885185090057607e-05, "Pretrain/Loss": 1.9825376272201538, "Pretrain/Loss (Raw)": 2.055504560470581, "Pretrain/Step": 9378, "Pretrain/Step Time": 8.441699724644423} +{"Pretrain/Learning Rate": 2.688095198369019e-05, "Pretrain/Loss": 1.9815125465393066, "Pretrain/Loss (Raw)": 1.9884748458862305, "Pretrain/Step": 9379, "Pretrain/Step Time": 8.43751578591764} +{"Pretrain/Learning Rate": 2.6876718823086837e-05, "Pretrain/Loss": 1.9804325103759766, "Pretrain/Loss (Raw)": 1.8426182270050049, "Pretrain/Step": 9380, "Pretrain/Step Time": 8.441356502473354} +{"Pretrain/Learning Rate": 2.687248560836963e-05, "Pretrain/Loss": 1.9813940525054932, "Pretrain/Loss (Raw)": 2.1583995819091797, "Pretrain/Step": 9381, "Pretrain/Step Time": 8.438842564821243} +{"Pretrain/Learning Rate": 2.686825233966061e-05, "Pretrain/Loss": 1.978563666343689, "Pretrain/Loss (Raw)": 1.8224543333053589, "Pretrain/Step": 9382, "Pretrain/Step Time": 8.437132148072124} +{"Pretrain/Learning Rate": 2.6864019017081854e-05, "Pretrain/Loss": 1.978310227394104, "Pretrain/Loss (Raw)": 2.1330409049987793, "Pretrain/Step": 9383, "Pretrain/Step Time": 8.43437989614904} +{"Pretrain/Learning Rate": 2.6859785640755426e-05, "Pretrain/Loss": 1.9771636724472046, "Pretrain/Loss (Raw)": 1.8060697317123413, "Pretrain/Step": 9384, "Pretrain/Step Time": 8.429672077298164} +{"Pretrain/Learning Rate": 2.6855552210803393e-05, "Pretrain/Loss": 1.9755699634552002, "Pretrain/Loss (Raw)": 1.8462483882904053, "Pretrain/Step": 9385, "Pretrain/Step Time": 8.43347817286849} +{"Pretrain/Learning Rate": 2.6851318727347813e-05, "Pretrain/Loss": 1.9754741191864014, "Pretrain/Loss (Raw)": 2.036837100982666, "Pretrain/Step": 9386, "Pretrain/Step Time": 8.434838389977813} +{"Pretrain/Learning Rate": 2.684708519051077e-05, "Pretrain/Loss": 1.9777883291244507, "Pretrain/Loss (Raw)": 2.18772292137146, "Pretrain/Step": 9387, "Pretrain/Step Time": 8.432726241648197} +{"Pretrain/Learning Rate": 2.6842851600414313e-05, "Pretrain/Loss": 1.9792506694793701, "Pretrain/Loss (Raw)": 1.9058395624160767, "Pretrain/Step": 9388, "Pretrain/Step Time": 8.429883232340217} +{"Pretrain/Learning Rate": 2.6838617957180547e-05, "Pretrain/Loss": 1.977150321006775, "Pretrain/Loss (Raw)": 1.7865220308303833, "Pretrain/Step": 9389, "Pretrain/Step Time": 8.432254457846284} +{"Pretrain/Learning Rate": 2.6834384260931523e-05, "Pretrain/Loss": 1.9829570055007935, "Pretrain/Loss (Raw)": 2.8675010204315186, "Pretrain/Step": 9390, "Pretrain/Step Time": 8.43691523000598} +{"Pretrain/Learning Rate": 2.6830150511789314e-05, "Pretrain/Loss": 1.9820983409881592, "Pretrain/Loss (Raw)": 1.882991909980774, "Pretrain/Step": 9391, "Pretrain/Step Time": 8.43646639212966} +{"Pretrain/Learning Rate": 2.6825916709876013e-05, "Pretrain/Loss": 1.9822057485580444, "Pretrain/Loss (Raw)": 2.137284755706787, "Pretrain/Step": 9392, "Pretrain/Step Time": 8.4333067368716} +{"Pretrain/Learning Rate": 2.6821682855313685e-05, "Pretrain/Loss": 1.9826935529708862, "Pretrain/Loss (Raw)": 2.126474380493164, "Pretrain/Step": 9393, "Pretrain/Step Time": 8.43448187969625} +{"Pretrain/Learning Rate": 2.6817448948224422e-05, "Pretrain/Loss": 1.9841525554656982, "Pretrain/Loss (Raw)": 2.0594229698181152, "Pretrain/Step": 9394, "Pretrain/Step Time": 8.435196358710527} +{"Pretrain/Learning Rate": 2.68132149887303e-05, "Pretrain/Loss": 1.9845434427261353, "Pretrain/Loss (Raw)": 2.0764050483703613, "Pretrain/Step": 9395, "Pretrain/Step Time": 8.432431980967522} +{"Pretrain/Learning Rate": 2.68089809769534e-05, "Pretrain/Loss": 1.985274076461792, "Pretrain/Loss (Raw)": 1.7729740142822266, "Pretrain/Step": 9396, "Pretrain/Step Time": 8.432831140235066} +{"Pretrain/Learning Rate": 2.6804746913015804e-05, "Pretrain/Loss": 1.9883428812026978, "Pretrain/Loss (Raw)": 2.1778764724731445, "Pretrain/Step": 9397, "Pretrain/Step Time": 8.44024750776589} +{"Pretrain/Learning Rate": 2.6800512797039607e-05, "Pretrain/Loss": 1.9872643947601318, "Pretrain/Loss (Raw)": 1.9141554832458496, "Pretrain/Step": 9398, "Pretrain/Step Time": 8.439625792205334} +{"Pretrain/Learning Rate": 2.6796278629146894e-05, "Pretrain/Loss": 1.988030195236206, "Pretrain/Loss (Raw)": 1.9654241800308228, "Pretrain/Step": 9399, "Pretrain/Step Time": 8.437816767022014} +{"Pretrain/Learning Rate": 2.6792044409459756e-05, "Pretrain/Loss": 1.988110065460205, "Pretrain/Loss (Raw)": 2.002737522125244, "Pretrain/Step": 9400, "Pretrain/Step Time": 8.438127875328064} +{"Pretrain/Learning Rate": 2.6787810138100277e-05, "Pretrain/Loss": 1.9874200820922852, "Pretrain/Loss (Raw)": 2.099868059158325, "Pretrain/Step": 9401, "Pretrain/Step Time": 8.432098992168903} +{"Pretrain/Learning Rate": 2.6783575815190553e-05, "Pretrain/Loss": 1.9876625537872314, "Pretrain/Loss (Raw)": 1.998844861984253, "Pretrain/Step": 9402, "Pretrain/Step Time": 8.435508282855153} +{"Pretrain/Learning Rate": 2.677934144085267e-05, "Pretrain/Loss": 1.9898229837417603, "Pretrain/Loss (Raw)": 2.2339301109313965, "Pretrain/Step": 9403, "Pretrain/Step Time": 8.433502905070782} +{"Pretrain/Learning Rate": 2.6775107015208744e-05, "Pretrain/Loss": 1.9907476902008057, "Pretrain/Loss (Raw)": 2.071040153503418, "Pretrain/Step": 9404, "Pretrain/Step Time": 8.435029437765479} +{"Pretrain/Learning Rate": 2.6770872538380855e-05, "Pretrain/Loss": 1.9911487102508545, "Pretrain/Loss (Raw)": 1.980663537979126, "Pretrain/Step": 9405, "Pretrain/Step Time": 8.435889203101397} +{"Pretrain/Learning Rate": 2.6766638010491102e-05, "Pretrain/Loss": 1.9906563758850098, "Pretrain/Loss (Raw)": 1.9527273178100586, "Pretrain/Step": 9406, "Pretrain/Step Time": 8.434869630262256} +{"Pretrain/Learning Rate": 2.6762403431661588e-05, "Pretrain/Loss": 1.9904391765594482, "Pretrain/Loss (Raw)": 2.011833429336548, "Pretrain/Step": 9407, "Pretrain/Step Time": 8.432730194181204} +{"Pretrain/Learning Rate": 2.675816880201441e-05, "Pretrain/Loss": 1.989713191986084, "Pretrain/Loss (Raw)": 2.0022616386413574, "Pretrain/Step": 9408, "Pretrain/Step Time": 8.430022723972797} +{"Pretrain/Learning Rate": 2.675393412167168e-05, "Pretrain/Loss": 1.9893662929534912, "Pretrain/Loss (Raw)": 2.017239570617676, "Pretrain/Step": 9409, "Pretrain/Step Time": 8.427063543349504} +{"Pretrain/Learning Rate": 2.674969939075549e-05, "Pretrain/Loss": 1.9890797138214111, "Pretrain/Loss (Raw)": 2.124962568283081, "Pretrain/Step": 9410, "Pretrain/Step Time": 8.429455000907183} +{"Pretrain/Learning Rate": 2.674546460938796e-05, "Pretrain/Loss": 1.9901551008224487, "Pretrain/Loss (Raw)": 2.204475164413452, "Pretrain/Step": 9411, "Pretrain/Step Time": 8.4260786306113} +{"Pretrain/Learning Rate": 2.6741229777691185e-05, "Pretrain/Loss": 1.9912829399108887, "Pretrain/Loss (Raw)": 2.049194812774658, "Pretrain/Step": 9412, "Pretrain/Step Time": 8.42658681422472} +{"Pretrain/Learning Rate": 2.6736994895787275e-05, "Pretrain/Loss": 1.9921720027923584, "Pretrain/Loss (Raw)": 2.177562713623047, "Pretrain/Step": 9413, "Pretrain/Step Time": 8.429126305505633} +{"Pretrain/Learning Rate": 2.6732759963798344e-05, "Pretrain/Loss": 1.9924824237823486, "Pretrain/Loss (Raw)": 2.0802459716796875, "Pretrain/Step": 9414, "Pretrain/Step Time": 8.428110176697373} +{"Pretrain/Learning Rate": 2.6728524981846493e-05, "Pretrain/Loss": 1.9917221069335938, "Pretrain/Loss (Raw)": 2.005140542984009, "Pretrain/Step": 9415, "Pretrain/Step Time": 8.42994267679751} +{"Pretrain/Learning Rate": 2.6724289950053855e-05, "Pretrain/Loss": 1.992769479751587, "Pretrain/Loss (Raw)": 2.047891139984131, "Pretrain/Step": 9416, "Pretrain/Step Time": 8.426287332549691} +{"Pretrain/Learning Rate": 2.672005486854253e-05, "Pretrain/Loss": 1.9924039840698242, "Pretrain/Loss (Raw)": 2.0193841457366943, "Pretrain/Step": 9417, "Pretrain/Step Time": 8.422731548547745} +{"Pretrain/Learning Rate": 2.6715819737434627e-05, "Pretrain/Loss": 1.988438606262207, "Pretrain/Loss (Raw)": 1.8382691144943237, "Pretrain/Step": 9418, "Pretrain/Step Time": 8.424030425027013} +{"Pretrain/Learning Rate": 2.671158455685227e-05, "Pretrain/Loss": 1.9887510538101196, "Pretrain/Loss (Raw)": 2.050412893295288, "Pretrain/Step": 9419, "Pretrain/Step Time": 8.427296731621027} +{"Pretrain/Learning Rate": 2.6707349326917585e-05, "Pretrain/Loss": 1.9905192852020264, "Pretrain/Loss (Raw)": 1.998177409172058, "Pretrain/Step": 9420, "Pretrain/Step Time": 8.428181067109108} +{"Pretrain/Learning Rate": 2.6703114047752692e-05, "Pretrain/Loss": 1.9929637908935547, "Pretrain/Loss (Raw)": 2.1004374027252197, "Pretrain/Step": 9421, "Pretrain/Step Time": 8.428122039884329} +{"Pretrain/Learning Rate": 2.66988787194797e-05, "Pretrain/Loss": 1.9926719665527344, "Pretrain/Loss (Raw)": 1.9557965993881226, "Pretrain/Step": 9422, "Pretrain/Step Time": 8.430087441578507} +{"Pretrain/Learning Rate": 2.6694643342220733e-05, "Pretrain/Loss": 1.9927124977111816, "Pretrain/Loss (Raw)": 2.048762083053589, "Pretrain/Step": 9423, "Pretrain/Step Time": 8.428031941875815} +{"Pretrain/Learning Rate": 2.6690407916097927e-05, "Pretrain/Loss": 1.992795467376709, "Pretrain/Loss (Raw)": 1.9286892414093018, "Pretrain/Step": 9424, "Pretrain/Step Time": 8.426421968266368} +{"Pretrain/Learning Rate": 2.6686172441233396e-05, "Pretrain/Loss": 1.9928526878356934, "Pretrain/Loss (Raw)": 2.0239484310150146, "Pretrain/Step": 9425, "Pretrain/Step Time": 8.424089692533016} +{"Pretrain/Learning Rate": 2.6681936917749273e-05, "Pretrain/Loss": 1.9948084354400635, "Pretrain/Loss (Raw)": 1.9219520092010498, "Pretrain/Step": 9426, "Pretrain/Step Time": 8.42265809699893} +{"Pretrain/Learning Rate": 2.6677701345767692e-05, "Pretrain/Loss": 1.9942348003387451, "Pretrain/Loss (Raw)": 1.828629970550537, "Pretrain/Step": 9427, "Pretrain/Step Time": 8.41935720667243} +{"Pretrain/Learning Rate": 2.667346572541076e-05, "Pretrain/Loss": 1.994339108467102, "Pretrain/Loss (Raw)": 1.8921445608139038, "Pretrain/Step": 9428, "Pretrain/Step Time": 8.421398874372244} +{"Pretrain/Learning Rate": 2.6669230056800638e-05, "Pretrain/Loss": 1.9890586137771606, "Pretrain/Loss (Raw)": 1.5357332229614258, "Pretrain/Step": 9429, "Pretrain/Step Time": 8.418791618198156} +{"Pretrain/Learning Rate": 2.6664994340059435e-05, "Pretrain/Loss": 1.9913755655288696, "Pretrain/Loss (Raw)": 2.244259834289551, "Pretrain/Step": 9430, "Pretrain/Step Time": 8.427066484466195} +{"Pretrain/Learning Rate": 2.666075857530929e-05, "Pretrain/Loss": 1.993382453918457, "Pretrain/Loss (Raw)": 2.23815655708313, "Pretrain/Step": 9431, "Pretrain/Step Time": 8.426024874672294} +{"Pretrain/Learning Rate": 2.6656522762672353e-05, "Pretrain/Loss": 1.99312424659729, "Pretrain/Loss (Raw)": 2.063922166824341, "Pretrain/Step": 9432, "Pretrain/Step Time": 8.42086029611528} +{"Pretrain/Learning Rate": 2.6652286902270745e-05, "Pretrain/Loss": 1.9954853057861328, "Pretrain/Loss (Raw)": 2.1913137435913086, "Pretrain/Step": 9433, "Pretrain/Step Time": 8.42043399065733} +{"Pretrain/Learning Rate": 2.664805099422661e-05, "Pretrain/Loss": 1.9982699155807495, "Pretrain/Loss (Raw)": 2.209754705429077, "Pretrain/Step": 9434, "Pretrain/Step Time": 8.421789769083261} +{"Pretrain/Learning Rate": 2.6643815038662085e-05, "Pretrain/Loss": 1.9979228973388672, "Pretrain/Loss (Raw)": 2.099693536758423, "Pretrain/Step": 9435, "Pretrain/Step Time": 8.423432655632496} +{"Pretrain/Learning Rate": 2.6639579035699312e-05, "Pretrain/Loss": 2.0000195503234863, "Pretrain/Loss (Raw)": 2.0856995582580566, "Pretrain/Step": 9436, "Pretrain/Step Time": 8.422879159450531} +{"Pretrain/Learning Rate": 2.663534298546044e-05, "Pretrain/Loss": 2.0012829303741455, "Pretrain/Loss (Raw)": 2.0978291034698486, "Pretrain/Step": 9437, "Pretrain/Step Time": 8.421912448480725} +{"Pretrain/Learning Rate": 2.6631106888067597e-05, "Pretrain/Loss": 2.0011916160583496, "Pretrain/Loss (Raw)": 1.8629519939422607, "Pretrain/Step": 9438, "Pretrain/Step Time": 8.419778248295188} +{"Pretrain/Learning Rate": 2.662687074364294e-05, "Pretrain/Loss": 2.0011677742004395, "Pretrain/Loss (Raw)": 1.9802563190460205, "Pretrain/Step": 9439, "Pretrain/Step Time": 8.41701740771532} +{"Pretrain/Learning Rate": 2.662263455230861e-05, "Pretrain/Loss": 2.0025227069854736, "Pretrain/Loss (Raw)": 2.1838343143463135, "Pretrain/Step": 9440, "Pretrain/Step Time": 8.423390721902251} +{"Pretrain/Learning Rate": 2.661839831418676e-05, "Pretrain/Loss": 2.0030951499938965, "Pretrain/Loss (Raw)": 2.091346263885498, "Pretrain/Step": 9441, "Pretrain/Step Time": 8.421044057235122} +{"Pretrain/Learning Rate": 2.661416202939953e-05, "Pretrain/Loss": 2.0032804012298584, "Pretrain/Loss (Raw)": 2.033679246902466, "Pretrain/Step": 9442, "Pretrain/Step Time": 8.42249989695847} +{"Pretrain/Learning Rate": 2.6609925698069084e-05, "Pretrain/Loss": 2.0057830810546875, "Pretrain/Loss (Raw)": 2.2707643508911133, "Pretrain/Step": 9443, "Pretrain/Step Time": 8.422489512711763} +{"Pretrain/Learning Rate": 2.6605689320317562e-05, "Pretrain/Loss": 2.004794120788574, "Pretrain/Loss (Raw)": 1.8928319215774536, "Pretrain/Step": 9444, "Pretrain/Step Time": 8.420079050585628} +{"Pretrain/Learning Rate": 2.6601452896267115e-05, "Pretrain/Loss": 2.005545139312744, "Pretrain/Loss (Raw)": 2.1656267642974854, "Pretrain/Step": 9445, "Pretrain/Step Time": 8.420305129140615} +{"Pretrain/Learning Rate": 2.6597216426039907e-05, "Pretrain/Loss": 2.0057384967803955, "Pretrain/Loss (Raw)": 1.9339407682418823, "Pretrain/Step": 9446, "Pretrain/Step Time": 8.420526280999184} +{"Pretrain/Learning Rate": 2.6592979909758092e-05, "Pretrain/Loss": 2.005357265472412, "Pretrain/Loss (Raw)": 1.950566291809082, "Pretrain/Step": 9447, "Pretrain/Step Time": 8.420671546831727} +{"Pretrain/Learning Rate": 2.6588743347543825e-05, "Pretrain/Loss": 2.0050299167633057, "Pretrain/Loss (Raw)": 2.0406157970428467, "Pretrain/Step": 9448, "Pretrain/Step Time": 8.41924124211073} +{"Pretrain/Learning Rate": 2.658450673951926e-05, "Pretrain/Loss": 2.004962205886841, "Pretrain/Loss (Raw)": 1.9779168367385864, "Pretrain/Step": 9449, "Pretrain/Step Time": 8.419448517262936} +{"Pretrain/Learning Rate": 2.6580270085806557e-05, "Pretrain/Loss": 2.004063129425049, "Pretrain/Loss (Raw)": 2.147324800491333, "Pretrain/Step": 9450, "Pretrain/Step Time": 8.413989713415504} +{"Pretrain/Learning Rate": 2.657603338652788e-05, "Pretrain/Loss": 2.0027027130126953, "Pretrain/Loss (Raw)": 1.9079545736312866, "Pretrain/Step": 9451, "Pretrain/Step Time": 8.415410643443465} +{"Pretrain/Learning Rate": 2.6571796641805396e-05, "Pretrain/Loss": 2.001938819885254, "Pretrain/Loss (Raw)": 2.0153677463531494, "Pretrain/Step": 9452, "Pretrain/Step Time": 8.422403682023287} +{"Pretrain/Learning Rate": 2.656755985176127e-05, "Pretrain/Loss": 2.003236770629883, "Pretrain/Loss (Raw)": 2.0489234924316406, "Pretrain/Step": 9453, "Pretrain/Step Time": 8.423080990090966} +{"Pretrain/Learning Rate": 2.656332301651765e-05, "Pretrain/Loss": 2.002293825149536, "Pretrain/Loss (Raw)": 2.0500898361206055, "Pretrain/Step": 9454, "Pretrain/Step Time": 8.412655035033822} +{"Pretrain/Learning Rate": 2.6559086136196714e-05, "Pretrain/Loss": 2.0079727172851562, "Pretrain/Loss (Raw)": 1.9183008670806885, "Pretrain/Step": 9455, "Pretrain/Step Time": 8.415017688646913} +{"Pretrain/Learning Rate": 2.6554849210920636e-05, "Pretrain/Loss": 2.007874011993408, "Pretrain/Loss (Raw)": 2.096328020095825, "Pretrain/Step": 9456, "Pretrain/Step Time": 8.417737098410726} +{"Pretrain/Learning Rate": 2.6550612240811568e-05, "Pretrain/Loss": 2.009533405303955, "Pretrain/Loss (Raw)": 2.192800760269165, "Pretrain/Step": 9457, "Pretrain/Step Time": 8.416102582588792} +{"Pretrain/Learning Rate": 2.65463752259917e-05, "Pretrain/Loss": 2.0110011100769043, "Pretrain/Loss (Raw)": 2.1977601051330566, "Pretrain/Step": 9458, "Pretrain/Step Time": 8.415940033271909} +{"Pretrain/Learning Rate": 2.654213816658318e-05, "Pretrain/Loss": 2.011815309524536, "Pretrain/Loss (Raw)": 1.947769284248352, "Pretrain/Step": 9459, "Pretrain/Step Time": 8.416171476244926} +{"Pretrain/Learning Rate": 2.65379010627082e-05, "Pretrain/Loss": 2.0122714042663574, "Pretrain/Loss (Raw)": 2.0434610843658447, "Pretrain/Step": 9460, "Pretrain/Step Time": 8.415806537494063} +{"Pretrain/Learning Rate": 2.6533663914488922e-05, "Pretrain/Loss": 2.0128910541534424, "Pretrain/Loss (Raw)": 2.0692334175109863, "Pretrain/Step": 9461, "Pretrain/Step Time": 8.414922930300236} +{"Pretrain/Learning Rate": 2.652942672204753e-05, "Pretrain/Loss": 2.0130348205566406, "Pretrain/Loss (Raw)": 2.13385272026062, "Pretrain/Step": 9462, "Pretrain/Step Time": 8.416781784966588} +{"Pretrain/Learning Rate": 2.6525189485506202e-05, "Pretrain/Loss": 2.008972644805908, "Pretrain/Loss (Raw)": 1.6568471193313599, "Pretrain/Step": 9463, "Pretrain/Step Time": 8.416318910196424} +{"Pretrain/Learning Rate": 2.6520952204987104e-05, "Pretrain/Loss": 2.0104258060455322, "Pretrain/Loss (Raw)": 2.1253890991210938, "Pretrain/Step": 9464, "Pretrain/Step Time": 8.417843854054809} +{"Pretrain/Learning Rate": 2.651671488061242e-05, "Pretrain/Loss": 2.010180711746216, "Pretrain/Loss (Raw)": 1.7458230257034302, "Pretrain/Step": 9465, "Pretrain/Step Time": 8.41713435202837} +{"Pretrain/Learning Rate": 2.6512477512504337e-05, "Pretrain/Loss": 2.0109524726867676, "Pretrain/Loss (Raw)": 1.9451290369033813, "Pretrain/Step": 9466, "Pretrain/Step Time": 8.424749705940485} +{"Pretrain/Learning Rate": 2.6508240100785026e-05, "Pretrain/Loss": 2.009666919708252, "Pretrain/Loss (Raw)": 1.8481948375701904, "Pretrain/Step": 9467, "Pretrain/Step Time": 8.422765552997589} +{"Pretrain/Learning Rate": 2.6504002645576675e-05, "Pretrain/Loss": 2.008582592010498, "Pretrain/Loss (Raw)": 1.8634792566299438, "Pretrain/Step": 9468, "Pretrain/Step Time": 8.423057496547699} +{"Pretrain/Learning Rate": 2.6499765147001478e-05, "Pretrain/Loss": 2.0085601806640625, "Pretrain/Loss (Raw)": 2.0940611362457275, "Pretrain/Step": 9469, "Pretrain/Step Time": 8.430573346093297} +{"Pretrain/Learning Rate": 2.6495527605181603e-05, "Pretrain/Loss": 2.009456157684326, "Pretrain/Loss (Raw)": 2.1620349884033203, "Pretrain/Step": 9470, "Pretrain/Step Time": 8.428709464147687} +{"Pretrain/Learning Rate": 2.649129002023924e-05, "Pretrain/Loss": 2.010948657989502, "Pretrain/Loss (Raw)": 2.1458740234375, "Pretrain/Step": 9471, "Pretrain/Step Time": 8.426428824663162} +{"Pretrain/Learning Rate": 2.648705239229658e-05, "Pretrain/Loss": 2.0084280967712402, "Pretrain/Loss (Raw)": 2.037280797958374, "Pretrain/Step": 9472, "Pretrain/Step Time": 8.429222172126174} +{"Pretrain/Learning Rate": 2.648281472147582e-05, "Pretrain/Loss": 2.0078787803649902, "Pretrain/Loss (Raw)": 1.727521538734436, "Pretrain/Step": 9473, "Pretrain/Step Time": 8.42868865467608} +{"Pretrain/Learning Rate": 2.6478577007899136e-05, "Pretrain/Loss": 2.008488655090332, "Pretrain/Loss (Raw)": 2.0286407470703125, "Pretrain/Step": 9474, "Pretrain/Step Time": 8.426239872351289} +{"Pretrain/Learning Rate": 2.6474339251688734e-05, "Pretrain/Loss": 2.0096616744995117, "Pretrain/Loss (Raw)": 1.9354571104049683, "Pretrain/Step": 9475, "Pretrain/Step Time": 8.426631981506944} +{"Pretrain/Learning Rate": 2.6470101452966788e-05, "Pretrain/Loss": 2.0081899166107178, "Pretrain/Loss (Raw)": 1.8032186031341553, "Pretrain/Step": 9476, "Pretrain/Step Time": 8.427224520593882} +{"Pretrain/Learning Rate": 2.6465863611855512e-05, "Pretrain/Loss": 2.009129047393799, "Pretrain/Loss (Raw)": 1.9544525146484375, "Pretrain/Step": 9477, "Pretrain/Step Time": 8.426232606172562} +{"Pretrain/Learning Rate": 2.6461625728477086e-05, "Pretrain/Loss": 2.0069656372070312, "Pretrain/Loss (Raw)": 2.1361546516418457, "Pretrain/Step": 9478, "Pretrain/Step Time": 8.432552929967642} +{"Pretrain/Learning Rate": 2.6457387802953715e-05, "Pretrain/Loss": 2.005364179611206, "Pretrain/Loss (Raw)": 1.5446665287017822, "Pretrain/Step": 9479, "Pretrain/Step Time": 8.432195166125894} +{"Pretrain/Learning Rate": 2.64531498354076e-05, "Pretrain/Loss": 2.0101640224456787, "Pretrain/Loss (Raw)": 2.0327165126800537, "Pretrain/Step": 9480, "Pretrain/Step Time": 8.43066742643714} +{"Pretrain/Learning Rate": 2.6448911825960926e-05, "Pretrain/Loss": 2.0104684829711914, "Pretrain/Loss (Raw)": 2.1332905292510986, "Pretrain/Step": 9481, "Pretrain/Step Time": 8.429094653576612} +{"Pretrain/Learning Rate": 2.6444673774735908e-05, "Pretrain/Loss": 2.0101637840270996, "Pretrain/Loss (Raw)": 1.9249720573425293, "Pretrain/Step": 9482, "Pretrain/Step Time": 8.431494161486626} +{"Pretrain/Learning Rate": 2.644043568185473e-05, "Pretrain/Loss": 2.010542869567871, "Pretrain/Loss (Raw)": 2.198531150817871, "Pretrain/Step": 9483, "Pretrain/Step Time": 8.427650608122349} +{"Pretrain/Learning Rate": 2.643619754743961e-05, "Pretrain/Loss": 2.0105462074279785, "Pretrain/Loss (Raw)": 2.1909942626953125, "Pretrain/Step": 9484, "Pretrain/Step Time": 8.430531974881887} +{"Pretrain/Learning Rate": 2.6431959371612753e-05, "Pretrain/Loss": 2.0120458602905273, "Pretrain/Loss (Raw)": 2.1083617210388184, "Pretrain/Step": 9485, "Pretrain/Step Time": 8.432275107130408} +{"Pretrain/Learning Rate": 2.6427721154496348e-05, "Pretrain/Loss": 2.0124616622924805, "Pretrain/Loss (Raw)": 2.0361151695251465, "Pretrain/Step": 9486, "Pretrain/Step Time": 8.43114111199975} +{"Pretrain/Learning Rate": 2.6423482896212615e-05, "Pretrain/Loss": 2.0136404037475586, "Pretrain/Loss (Raw)": 1.9631928205490112, "Pretrain/Step": 9487, "Pretrain/Step Time": 8.431269969791174} +{"Pretrain/Learning Rate": 2.641924459688375e-05, "Pretrain/Loss": 2.01579213142395, "Pretrain/Loss (Raw)": 2.1641345024108887, "Pretrain/Step": 9488, "Pretrain/Step Time": 8.441636178642511} +{"Pretrain/Learning Rate": 2.641500625663197e-05, "Pretrain/Loss": 2.0131709575653076, "Pretrain/Loss (Raw)": 1.7414127588272095, "Pretrain/Step": 9489, "Pretrain/Step Time": 8.443881995975971} +{"Pretrain/Learning Rate": 2.641076787557949e-05, "Pretrain/Loss": 2.014345645904541, "Pretrain/Loss (Raw)": 2.0558512210845947, "Pretrain/Step": 9490, "Pretrain/Step Time": 8.444970725104213} +{"Pretrain/Learning Rate": 2.6406529453848505e-05, "Pretrain/Loss": 2.0127880573272705, "Pretrain/Loss (Raw)": 1.8405051231384277, "Pretrain/Step": 9491, "Pretrain/Step Time": 8.444242779165506} +{"Pretrain/Learning Rate": 2.6402290991561236e-05, "Pretrain/Loss": 2.012805461883545, "Pretrain/Loss (Raw)": 1.912672996520996, "Pretrain/Step": 9492, "Pretrain/Step Time": 8.444843290373683} +{"Pretrain/Learning Rate": 2.639805248883989e-05, "Pretrain/Loss": 2.012446880340576, "Pretrain/Loss (Raw)": 1.9321446418762207, "Pretrain/Step": 9493, "Pretrain/Step Time": 8.438092006370425} +{"Pretrain/Learning Rate": 2.639381394580669e-05, "Pretrain/Loss": 2.0098562240600586, "Pretrain/Loss (Raw)": 1.593888759613037, "Pretrain/Step": 9494, "Pretrain/Step Time": 8.449550358578563} +{"Pretrain/Learning Rate": 2.638957536258385e-05, "Pretrain/Loss": 2.0089340209960938, "Pretrain/Loss (Raw)": 1.8221805095672607, "Pretrain/Step": 9495, "Pretrain/Step Time": 8.45040919445455} +{"Pretrain/Learning Rate": 2.638533673929358e-05, "Pretrain/Loss": 2.0114169120788574, "Pretrain/Loss (Raw)": 1.951683521270752, "Pretrain/Step": 9496, "Pretrain/Step Time": 8.449934303760529} +{"Pretrain/Learning Rate": 2.638109807605811e-05, "Pretrain/Loss": 2.0110015869140625, "Pretrain/Loss (Raw)": 1.9792416095733643, "Pretrain/Step": 9497, "Pretrain/Step Time": 8.448231665417552} +{"Pretrain/Learning Rate": 2.637685937299964e-05, "Pretrain/Loss": 2.010467767715454, "Pretrain/Loss (Raw)": 2.0155603885650635, "Pretrain/Step": 9498, "Pretrain/Step Time": 8.446807395666838} +{"Pretrain/Learning Rate": 2.63726206302404e-05, "Pretrain/Loss": 2.0102486610412598, "Pretrain/Loss (Raw)": 2.0077145099639893, "Pretrain/Step": 9499, "Pretrain/Step Time": 8.444743137806654} +{"Pretrain/Learning Rate": 2.6368381847902624e-05, "Pretrain/Loss": 2.010620594024658, "Pretrain/Loss (Raw)": 2.1047074794769287, "Pretrain/Step": 9500, "Pretrain/Step Time": 8.445661194622517} +{"Pretrain/Learning Rate": 2.6364143026108518e-05, "Pretrain/Loss": 2.011415481567383, "Pretrain/Loss (Raw)": 1.9389307498931885, "Pretrain/Step": 9501, "Pretrain/Step Time": 8.451343476772308} +{"Pretrain/Learning Rate": 2.6359904164980303e-05, "Pretrain/Loss": 2.011894941329956, "Pretrain/Loss (Raw)": 1.918046236038208, "Pretrain/Step": 9502, "Pretrain/Step Time": 8.449261652305722} +{"Pretrain/Learning Rate": 2.635566526464021e-05, "Pretrain/Loss": 2.0123627185821533, "Pretrain/Loss (Raw)": 2.1666107177734375, "Pretrain/Step": 9503, "Pretrain/Step Time": 8.446243811398745} +{"Pretrain/Learning Rate": 2.635142632521047e-05, "Pretrain/Loss": 2.010128974914551, "Pretrain/Loss (Raw)": 1.7594083547592163, "Pretrain/Step": 9504, "Pretrain/Step Time": 8.4465251583606} +{"Pretrain/Learning Rate": 2.6347187346813305e-05, "Pretrain/Loss": 2.0120253562927246, "Pretrain/Loss (Raw)": 2.1548171043395996, "Pretrain/Step": 9505, "Pretrain/Step Time": 8.448748525232077} +{"Pretrain/Learning Rate": 2.6342948329570944e-05, "Pretrain/Loss": 2.014258861541748, "Pretrain/Loss (Raw)": 2.341398000717163, "Pretrain/Step": 9506, "Pretrain/Step Time": 8.448365783318877} +{"Pretrain/Learning Rate": 2.6338709273605605e-05, "Pretrain/Loss": 2.0141775608062744, "Pretrain/Loss (Raw)": 1.9780771732330322, "Pretrain/Step": 9507, "Pretrain/Step Time": 8.451683904975653} +{"Pretrain/Learning Rate": 2.6334470179039537e-05, "Pretrain/Loss": 2.016361951828003, "Pretrain/Loss (Raw)": 2.1222214698791504, "Pretrain/Step": 9508, "Pretrain/Step Time": 8.450555235147476} +{"Pretrain/Learning Rate": 2.6330231045994962e-05, "Pretrain/Loss": 2.0164055824279785, "Pretrain/Loss (Raw)": 2.164003849029541, "Pretrain/Step": 9509, "Pretrain/Step Time": 8.452008418738842} +{"Pretrain/Learning Rate": 2.632599187459411e-05, "Pretrain/Loss": 2.0180444717407227, "Pretrain/Loss (Raw)": 2.0322108268737793, "Pretrain/Step": 9510, "Pretrain/Step Time": 8.454240007326007} +{"Pretrain/Learning Rate": 2.6321752664959215e-05, "Pretrain/Loss": 2.0174448490142822, "Pretrain/Loss (Raw)": 2.056304693222046, "Pretrain/Step": 9511, "Pretrain/Step Time": 8.45735857449472} +{"Pretrain/Learning Rate": 2.6317513417212518e-05, "Pretrain/Loss": 2.018136501312256, "Pretrain/Loss (Raw)": 1.8946051597595215, "Pretrain/Step": 9512, "Pretrain/Step Time": 8.458276484161615} +{"Pretrain/Learning Rate": 2.6313274131476244e-05, "Pretrain/Loss": 2.017702341079712, "Pretrain/Loss (Raw)": 1.7906579971313477, "Pretrain/Step": 9513, "Pretrain/Step Time": 8.456507390365005} +{"Pretrain/Learning Rate": 2.630903480787264e-05, "Pretrain/Loss": 2.0193257331848145, "Pretrain/Loss (Raw)": 2.2446365356445312, "Pretrain/Step": 9514, "Pretrain/Step Time": 8.455888632684946} +{"Pretrain/Learning Rate": 2.6304795446523937e-05, "Pretrain/Loss": 2.018432140350342, "Pretrain/Loss (Raw)": 2.0733041763305664, "Pretrain/Step": 9515, "Pretrain/Step Time": 8.45877007395029} +{"Pretrain/Learning Rate": 2.6300556047552382e-05, "Pretrain/Loss": 2.017383098602295, "Pretrain/Loss (Raw)": 1.771586298942566, "Pretrain/Step": 9516, "Pretrain/Step Time": 8.46069036051631} +{"Pretrain/Learning Rate": 2.6296316611080212e-05, "Pretrain/Loss": 2.0186972618103027, "Pretrain/Loss (Raw)": 1.9547427892684937, "Pretrain/Step": 9517, "Pretrain/Step Time": 8.458196189254522} +{"Pretrain/Learning Rate": 2.6292077137229663e-05, "Pretrain/Loss": 2.011741876602173, "Pretrain/Loss (Raw)": 1.9772059917449951, "Pretrain/Step": 9518, "Pretrain/Step Time": 8.463379837572575} +{"Pretrain/Learning Rate": 2.628783762612298e-05, "Pretrain/Loss": 2.0116755962371826, "Pretrain/Loss (Raw)": 1.8745086193084717, "Pretrain/Step": 9519, "Pretrain/Step Time": 8.457820298150182} +{"Pretrain/Learning Rate": 2.6283598077882404e-05, "Pretrain/Loss": 2.0107076168060303, "Pretrain/Loss (Raw)": 2.013380527496338, "Pretrain/Step": 9520, "Pretrain/Step Time": 8.460832482203841} +{"Pretrain/Learning Rate": 2.6279358492630184e-05, "Pretrain/Loss": 2.0098133087158203, "Pretrain/Loss (Raw)": 2.012010097503662, "Pretrain/Step": 9521, "Pretrain/Step Time": 8.457943841814995} +{"Pretrain/Learning Rate": 2.6275118870488575e-05, "Pretrain/Loss": 2.0095748901367188, "Pretrain/Loss (Raw)": 2.0288872718811035, "Pretrain/Step": 9522, "Pretrain/Step Time": 8.456319427117705} +{"Pretrain/Learning Rate": 2.6270879211579796e-05, "Pretrain/Loss": 2.007704257965088, "Pretrain/Loss (Raw)": 1.8369767665863037, "Pretrain/Step": 9523, "Pretrain/Step Time": 8.457316065207124} +{"Pretrain/Learning Rate": 2.626663951602612e-05, "Pretrain/Loss": 2.008226156234741, "Pretrain/Loss (Raw)": 1.8397799730300903, "Pretrain/Step": 9524, "Pretrain/Step Time": 8.460154300555587} +{"Pretrain/Learning Rate": 2.626239978394978e-05, "Pretrain/Loss": 2.0067272186279297, "Pretrain/Loss (Raw)": 1.9860032796859741, "Pretrain/Step": 9525, "Pretrain/Step Time": 8.452367162331939} +{"Pretrain/Learning Rate": 2.6258160015473038e-05, "Pretrain/Loss": 2.0068821907043457, "Pretrain/Loss (Raw)": 1.9340102672576904, "Pretrain/Step": 9526, "Pretrain/Step Time": 8.456502137705684} +{"Pretrain/Learning Rate": 2.6253920210718142e-05, "Pretrain/Loss": 2.008983612060547, "Pretrain/Loss (Raw)": 2.234421968460083, "Pretrain/Step": 9527, "Pretrain/Step Time": 8.461467429995537} +{"Pretrain/Learning Rate": 2.6249680369807333e-05, "Pretrain/Loss": 2.008664131164551, "Pretrain/Loss (Raw)": 1.9617990255355835, "Pretrain/Step": 9528, "Pretrain/Step Time": 8.46295946650207} +{"Pretrain/Learning Rate": 2.6245440492862872e-05, "Pretrain/Loss": 2.0072150230407715, "Pretrain/Loss (Raw)": 1.9144014120101929, "Pretrain/Step": 9529, "Pretrain/Step Time": 8.461829800158739} +{"Pretrain/Learning Rate": 2.6241200580007012e-05, "Pretrain/Loss": 2.0079843997955322, "Pretrain/Loss (Raw)": 2.0973236560821533, "Pretrain/Step": 9530, "Pretrain/Step Time": 8.459428194910288} +{"Pretrain/Learning Rate": 2.623696063136201e-05, "Pretrain/Loss": 2.0060739517211914, "Pretrain/Loss (Raw)": 1.9893687963485718, "Pretrain/Step": 9531, "Pretrain/Step Time": 8.462022967636585} +{"Pretrain/Learning Rate": 2.623272064705013e-05, "Pretrain/Loss": 2.0068893432617188, "Pretrain/Loss (Raw)": 2.1754276752471924, "Pretrain/Step": 9532, "Pretrain/Step Time": 8.462079379707575} +{"Pretrain/Learning Rate": 2.622848062719361e-05, "Pretrain/Loss": 2.007521390914917, "Pretrain/Loss (Raw)": 2.0615787506103516, "Pretrain/Step": 9533, "Pretrain/Step Time": 8.46359041146934} +{"Pretrain/Learning Rate": 2.6224240571914716e-05, "Pretrain/Loss": 2.0087695121765137, "Pretrain/Loss (Raw)": 2.1124484539031982, "Pretrain/Step": 9534, "Pretrain/Step Time": 8.467870011925697} +{"Pretrain/Learning Rate": 2.6220000481335705e-05, "Pretrain/Loss": 2.0103416442871094, "Pretrain/Loss (Raw)": 2.213078498840332, "Pretrain/Step": 9535, "Pretrain/Step Time": 8.464505104348063} +{"Pretrain/Learning Rate": 2.6215760355578845e-05, "Pretrain/Loss": 2.0111846923828125, "Pretrain/Loss (Raw)": 2.1101956367492676, "Pretrain/Step": 9536, "Pretrain/Step Time": 8.466816721484065} +{"Pretrain/Learning Rate": 2.62115201947664e-05, "Pretrain/Loss": 2.0115811824798584, "Pretrain/Loss (Raw)": 2.067965030670166, "Pretrain/Step": 9537, "Pretrain/Step Time": 8.472527055069804} +{"Pretrain/Learning Rate": 2.620727999902061e-05, "Pretrain/Loss": 2.0099191665649414, "Pretrain/Loss (Raw)": 1.9122240543365479, "Pretrain/Step": 9538, "Pretrain/Step Time": 8.470728125423193} +{"Pretrain/Learning Rate": 2.6203039768463756e-05, "Pretrain/Loss": 2.0082881450653076, "Pretrain/Loss (Raw)": 1.9957228899002075, "Pretrain/Step": 9539, "Pretrain/Step Time": 8.47209445387125} +{"Pretrain/Learning Rate": 2.61987995032181e-05, "Pretrain/Loss": 2.0081095695495605, "Pretrain/Loss (Raw)": 2.0263147354125977, "Pretrain/Step": 9540, "Pretrain/Step Time": 8.469448532909155} +{"Pretrain/Learning Rate": 2.6194559203405905e-05, "Pretrain/Loss": 2.0057811737060547, "Pretrain/Loss (Raw)": 1.87954580783844, "Pretrain/Step": 9541, "Pretrain/Step Time": 8.469461593776941} +{"Pretrain/Learning Rate": 2.619031886914944e-05, "Pretrain/Loss": 2.005990743637085, "Pretrain/Loss (Raw)": 2.107067346572876, "Pretrain/Step": 9542, "Pretrain/Step Time": 8.471817921847105} +{"Pretrain/Learning Rate": 2.6186078500570972e-05, "Pretrain/Loss": 2.0060019493103027, "Pretrain/Loss (Raw)": 2.0065982341766357, "Pretrain/Step": 9543, "Pretrain/Step Time": 8.473305394873023} +{"Pretrain/Learning Rate": 2.618183809779276e-05, "Pretrain/Loss": 2.004790782928467, "Pretrain/Loss (Raw)": 1.8928595781326294, "Pretrain/Step": 9544, "Pretrain/Step Time": 8.473410662263632} +{"Pretrain/Learning Rate": 2.617759766093708e-05, "Pretrain/Loss": 2.0043981075286865, "Pretrain/Loss (Raw)": 1.969109296798706, "Pretrain/Step": 9545, "Pretrain/Step Time": 8.473925804719329} +{"Pretrain/Learning Rate": 2.6173357190126206e-05, "Pretrain/Loss": 2.0081372261047363, "Pretrain/Loss (Raw)": 2.3168892860412598, "Pretrain/Step": 9546, "Pretrain/Step Time": 8.472397623583674} +{"Pretrain/Learning Rate": 2.61691166854824e-05, "Pretrain/Loss": 2.0061323642730713, "Pretrain/Loss (Raw)": 1.7937724590301514, "Pretrain/Step": 9547, "Pretrain/Step Time": 8.472969261929393} +{"Pretrain/Learning Rate": 2.6164876147127948e-05, "Pretrain/Loss": 2.006988763809204, "Pretrain/Loss (Raw)": 2.107797145843506, "Pretrain/Step": 9548, "Pretrain/Step Time": 8.471016628667712} +{"Pretrain/Learning Rate": 2.6160635575185106e-05, "Pretrain/Loss": 2.0060524940490723, "Pretrain/Loss (Raw)": 1.9805911779403687, "Pretrain/Step": 9549, "Pretrain/Step Time": 8.472045017406344} +{"Pretrain/Learning Rate": 2.615639496977616e-05, "Pretrain/Loss": 2.005523204803467, "Pretrain/Loss (Raw)": 1.8880351781845093, "Pretrain/Step": 9550, "Pretrain/Step Time": 8.46619163453579} +{"Pretrain/Learning Rate": 2.615215433102337e-05, "Pretrain/Loss": 2.003969192504883, "Pretrain/Loss (Raw)": 1.8498541116714478, "Pretrain/Step": 9551, "Pretrain/Step Time": 8.473701428622007} +{"Pretrain/Learning Rate": 2.6147913659049028e-05, "Pretrain/Loss": 2.0009756088256836, "Pretrain/Loss (Raw)": 1.5455451011657715, "Pretrain/Step": 9552, "Pretrain/Step Time": 8.477578366175294} +{"Pretrain/Learning Rate": 2.6143672953975406e-05, "Pretrain/Loss": 2.001584768295288, "Pretrain/Loss (Raw)": 2.1018927097320557, "Pretrain/Step": 9553, "Pretrain/Step Time": 8.482840046286583} +{"Pretrain/Learning Rate": 2.6139432215924785e-05, "Pretrain/Loss": 2.0023539066314697, "Pretrain/Loss (Raw)": 2.0204248428344727, "Pretrain/Step": 9554, "Pretrain/Step Time": 8.483273774385452} +{"Pretrain/Learning Rate": 2.613519144501943e-05, "Pretrain/Loss": 2.004171848297119, "Pretrain/Loss (Raw)": 2.0613198280334473, "Pretrain/Step": 9555, "Pretrain/Step Time": 8.483648834750056} +{"Pretrain/Learning Rate": 2.6130950641381636e-05, "Pretrain/Loss": 2.0053181648254395, "Pretrain/Loss (Raw)": 2.0388600826263428, "Pretrain/Step": 9556, "Pretrain/Step Time": 8.481081077829003} +{"Pretrain/Learning Rate": 2.6126709805133676e-05, "Pretrain/Loss": 2.008007049560547, "Pretrain/Loss (Raw)": 1.8799189329147339, "Pretrain/Step": 9557, "Pretrain/Step Time": 8.479286694899201} +{"Pretrain/Learning Rate": 2.6122468936397832e-05, "Pretrain/Loss": 2.006197929382324, "Pretrain/Loss (Raw)": 2.012683391571045, "Pretrain/Step": 9558, "Pretrain/Step Time": 8.477811969816685} +{"Pretrain/Learning Rate": 2.6118228035296388e-05, "Pretrain/Loss": 2.005354404449463, "Pretrain/Loss (Raw)": 2.1302125453948975, "Pretrain/Step": 9559, "Pretrain/Step Time": 8.479914512485266} +{"Pretrain/Learning Rate": 2.6113987101951625e-05, "Pretrain/Loss": 2.006702423095703, "Pretrain/Loss (Raw)": 2.236449718475342, "Pretrain/Step": 9560, "Pretrain/Step Time": 8.481276692822576} +{"Pretrain/Learning Rate": 2.6109746136485828e-05, "Pretrain/Loss": 2.005859375, "Pretrain/Loss (Raw)": 2.083421468734741, "Pretrain/Step": 9561, "Pretrain/Step Time": 8.480073859915137} +{"Pretrain/Learning Rate": 2.610550513902129e-05, "Pretrain/Loss": 2.0036020278930664, "Pretrain/Loss (Raw)": 1.9208208322525024, "Pretrain/Step": 9562, "Pretrain/Step Time": 8.477122757583857} +{"Pretrain/Learning Rate": 2.6101264109680286e-05, "Pretrain/Loss": 2.004197597503662, "Pretrain/Loss (Raw)": 2.1759228706359863, "Pretrain/Step": 9563, "Pretrain/Step Time": 8.476079268381} +{"Pretrain/Learning Rate": 2.6097023048585113e-05, "Pretrain/Loss": 2.004207134246826, "Pretrain/Loss (Raw)": 2.0868980884552, "Pretrain/Step": 9564, "Pretrain/Step Time": 8.479201920330524} +{"Pretrain/Learning Rate": 2.6092781955858046e-05, "Pretrain/Loss": 2.003119468688965, "Pretrain/Loss (Raw)": 1.9586232900619507, "Pretrain/Step": 9565, "Pretrain/Step Time": 8.481718698516488} +{"Pretrain/Learning Rate": 2.6088540831621388e-05, "Pretrain/Loss": 2.0039572715759277, "Pretrain/Loss (Raw)": 1.9701753854751587, "Pretrain/Step": 9566, "Pretrain/Step Time": 8.47826444171369} +{"Pretrain/Learning Rate": 2.608429967599742e-05, "Pretrain/Loss": 2.0055789947509766, "Pretrain/Loss (Raw)": 2.18782639503479, "Pretrain/Step": 9567, "Pretrain/Step Time": 8.484103068709373} +{"Pretrain/Learning Rate": 2.6080058489108435e-05, "Pretrain/Loss": 2.002901554107666, "Pretrain/Loss (Raw)": 1.8411377668380737, "Pretrain/Step": 9568, "Pretrain/Step Time": 8.47779631987214} +{"Pretrain/Learning Rate": 2.6075817271076725e-05, "Pretrain/Loss": 2.0013785362243652, "Pretrain/Loss (Raw)": 1.8964028358459473, "Pretrain/Step": 9569, "Pretrain/Step Time": 8.482336746528745} +{"Pretrain/Learning Rate": 2.6071576022024585e-05, "Pretrain/Loss": 1.9989498853683472, "Pretrain/Loss (Raw)": 1.7228106260299683, "Pretrain/Step": 9570, "Pretrain/Step Time": 8.481673199683428} +{"Pretrain/Learning Rate": 2.60673347420743e-05, "Pretrain/Loss": 1.997859239578247, "Pretrain/Loss (Raw)": 2.1311514377593994, "Pretrain/Step": 9571, "Pretrain/Step Time": 8.481129053980112} +{"Pretrain/Learning Rate": 2.6063093431348173e-05, "Pretrain/Loss": 1.9998841285705566, "Pretrain/Loss (Raw)": 2.1520373821258545, "Pretrain/Step": 9572, "Pretrain/Step Time": 8.479650296270847} +{"Pretrain/Learning Rate": 2.6058852089968493e-05, "Pretrain/Loss": 2.000274181365967, "Pretrain/Loss (Raw)": 2.2155492305755615, "Pretrain/Step": 9573, "Pretrain/Step Time": 8.47947945818305} +{"Pretrain/Learning Rate": 2.6054610718057565e-05, "Pretrain/Loss": 2.000412940979004, "Pretrain/Loss (Raw)": 1.9516971111297607, "Pretrain/Step": 9574, "Pretrain/Step Time": 8.482432648539543} +{"Pretrain/Learning Rate": 2.6050369315737683e-05, "Pretrain/Loss": 2.0012426376342773, "Pretrain/Loss (Raw)": 2.0567543506622314, "Pretrain/Step": 9575, "Pretrain/Step Time": 8.486500468105078} +{"Pretrain/Learning Rate": 2.6046127883131132e-05, "Pretrain/Loss": 2.000678062438965, "Pretrain/Loss (Raw)": 1.968346357345581, "Pretrain/Step": 9576, "Pretrain/Step Time": 8.489933738484979} +{"Pretrain/Learning Rate": 2.604188642036023e-05, "Pretrain/Loss": 2.0018653869628906, "Pretrain/Loss (Raw)": 2.1299076080322266, "Pretrain/Step": 9577, "Pretrain/Step Time": 8.483650540933013} +{"Pretrain/Learning Rate": 2.603764492754726e-05, "Pretrain/Loss": 2.0004806518554688, "Pretrain/Loss (Raw)": 1.9700783491134644, "Pretrain/Step": 9578, "Pretrain/Step Time": 8.490647347643971} +{"Pretrain/Learning Rate": 2.6033403404814537e-05, "Pretrain/Loss": 2.0012130737304688, "Pretrain/Loss (Raw)": 2.0017194747924805, "Pretrain/Step": 9579, "Pretrain/Step Time": 8.491918815299869} +{"Pretrain/Learning Rate": 2.6029161852284356e-05, "Pretrain/Loss": 2.0016582012176514, "Pretrain/Loss (Raw)": 2.0723228454589844, "Pretrain/Step": 9580, "Pretrain/Step Time": 8.482183346524835} +{"Pretrain/Learning Rate": 2.6024920270079013e-05, "Pretrain/Loss": 2.000509738922119, "Pretrain/Loss (Raw)": 1.9019426107406616, "Pretrain/Step": 9581, "Pretrain/Step Time": 8.488584650680423} +{"Pretrain/Learning Rate": 2.602067865832082e-05, "Pretrain/Loss": 2.0005743503570557, "Pretrain/Loss (Raw)": 2.0583417415618896, "Pretrain/Step": 9582, "Pretrain/Step Time": 8.490144550800323} +{"Pretrain/Learning Rate": 2.6016437017132073e-05, "Pretrain/Loss": 2.001756429672241, "Pretrain/Loss (Raw)": 2.069615602493286, "Pretrain/Step": 9583, "Pretrain/Step Time": 8.491767460480332} +{"Pretrain/Learning Rate": 2.6012195346635082e-05, "Pretrain/Loss": 1.9988033771514893, "Pretrain/Loss (Raw)": 1.7183364629745483, "Pretrain/Step": 9584, "Pretrain/Step Time": 8.492004673928022} +{"Pretrain/Learning Rate": 2.600795364695216e-05, "Pretrain/Loss": 1.997154712677002, "Pretrain/Loss (Raw)": 1.981774926185608, "Pretrain/Step": 9585, "Pretrain/Step Time": 8.488066151738167} +{"Pretrain/Learning Rate": 2.60037119182056e-05, "Pretrain/Loss": 1.9960110187530518, "Pretrain/Loss (Raw)": 2.0513556003570557, "Pretrain/Step": 9586, "Pretrain/Step Time": 8.489974426105618} +{"Pretrain/Learning Rate": 2.599947016051771e-05, "Pretrain/Loss": 1.9983088970184326, "Pretrain/Loss (Raw)": 2.241898775100708, "Pretrain/Step": 9587, "Pretrain/Step Time": 8.491532215848565} +{"Pretrain/Learning Rate": 2.5995228374010804e-05, "Pretrain/Loss": 1.9967286586761475, "Pretrain/Loss (Raw)": 1.8412004709243774, "Pretrain/Step": 9588, "Pretrain/Step Time": 8.491300279274583} +{"Pretrain/Learning Rate": 2.599098655880719e-05, "Pretrain/Loss": 1.9973986148834229, "Pretrain/Loss (Raw)": 2.1549744606018066, "Pretrain/Step": 9589, "Pretrain/Step Time": 8.490789666771889} +{"Pretrain/Learning Rate": 2.598674471502918e-05, "Pretrain/Loss": 1.9968289136886597, "Pretrain/Loss (Raw)": 2.0609397888183594, "Pretrain/Step": 9590, "Pretrain/Step Time": 8.487042604014277} +{"Pretrain/Learning Rate": 2.5982502842799083e-05, "Pretrain/Loss": 1.998944878578186, "Pretrain/Loss (Raw)": 1.927692174911499, "Pretrain/Step": 9591, "Pretrain/Step Time": 8.492119977250695} +{"Pretrain/Learning Rate": 2.5978260942239212e-05, "Pretrain/Loss": 1.9972935914993286, "Pretrain/Loss (Raw)": 1.9140191078186035, "Pretrain/Step": 9592, "Pretrain/Step Time": 8.489168154075742} +{"Pretrain/Learning Rate": 2.5974019013471867e-05, "Pretrain/Loss": 1.9990142583847046, "Pretrain/Loss (Raw)": 1.9660712480545044, "Pretrain/Step": 9593, "Pretrain/Step Time": 8.499550325796008} +{"Pretrain/Learning Rate": 2.5969777056619376e-05, "Pretrain/Loss": 2.000441074371338, "Pretrain/Loss (Raw)": 2.127748489379883, "Pretrain/Step": 9594, "Pretrain/Step Time": 8.494737198576331} +{"Pretrain/Learning Rate": 2.5965535071804043e-05, "Pretrain/Loss": 2.003753900527954, "Pretrain/Loss (Raw)": 2.2722384929656982, "Pretrain/Step": 9595, "Pretrain/Step Time": 8.49466285482049} +{"Pretrain/Learning Rate": 2.5961293059148195e-05, "Pretrain/Loss": 2.0037612915039062, "Pretrain/Loss (Raw)": 1.8644320964813232, "Pretrain/Step": 9596, "Pretrain/Step Time": 8.495117757469416} +{"Pretrain/Learning Rate": 2.595705101877413e-05, "Pretrain/Loss": 2.002349376678467, "Pretrain/Loss (Raw)": 1.9133347272872925, "Pretrain/Step": 9597, "Pretrain/Step Time": 8.48826351761818} +{"Pretrain/Learning Rate": 2.5952808950804175e-05, "Pretrain/Loss": 2.0026676654815674, "Pretrain/Loss (Raw)": 2.2027769088745117, "Pretrain/Step": 9598, "Pretrain/Step Time": 8.48727192543447} +{"Pretrain/Learning Rate": 2.594856685536065e-05, "Pretrain/Loss": 2.0005173683166504, "Pretrain/Loss (Raw)": 1.8706430196762085, "Pretrain/Step": 9599, "Pretrain/Step Time": 8.49332644045353} +{"Pretrain/Learning Rate": 2.5944324732565867e-05, "Pretrain/Loss": 2.0002565383911133, "Pretrain/Loss (Raw)": 2.00388240814209, "Pretrain/Step": 9600, "Pretrain/Step Time": 8.487994730472565} +{"Pretrain/Learning Rate": 2.5940082582542146e-05, "Pretrain/Loss": 2.0036730766296387, "Pretrain/Loss (Raw)": 2.164848566055298, "Pretrain/Step": 9601, "Pretrain/Step Time": 8.489435750991106} +{"Pretrain/Learning Rate": 2.5935840405411804e-05, "Pretrain/Loss": 2.0044546127319336, "Pretrain/Loss (Raw)": 2.128648042678833, "Pretrain/Step": 9602, "Pretrain/Step Time": 8.492936747148633} +{"Pretrain/Learning Rate": 2.5931598201297165e-05, "Pretrain/Loss": 2.00504732131958, "Pretrain/Loss (Raw)": 2.011364221572876, "Pretrain/Step": 9603, "Pretrain/Step Time": 8.495189236477017} +{"Pretrain/Learning Rate": 2.592735597032055e-05, "Pretrain/Loss": 2.006772756576538, "Pretrain/Loss (Raw)": 2.024068593978882, "Pretrain/Step": 9604, "Pretrain/Step Time": 8.491598702967167} +{"Pretrain/Learning Rate": 2.5923113712604273e-05, "Pretrain/Loss": 2.006680488586426, "Pretrain/Loss (Raw)": 1.942624807357788, "Pretrain/Step": 9605, "Pretrain/Step Time": 8.487756421789527} +{"Pretrain/Learning Rate": 2.591887142827067e-05, "Pretrain/Loss": 2.008173704147339, "Pretrain/Loss (Raw)": 2.32729434967041, "Pretrain/Step": 9606, "Pretrain/Step Time": 8.483035739511251} +{"Pretrain/Learning Rate": 2.5914629117442057e-05, "Pretrain/Loss": 2.0118966102600098, "Pretrain/Loss (Raw)": 2.021177053451538, "Pretrain/Step": 9607, "Pretrain/Step Time": 8.484990235418081} +{"Pretrain/Learning Rate": 2.5910386780240757e-05, "Pretrain/Loss": 2.012652635574341, "Pretrain/Loss (Raw)": 2.1295175552368164, "Pretrain/Step": 9608, "Pretrain/Step Time": 8.48584078811109} +{"Pretrain/Learning Rate": 2.5906144416789097e-05, "Pretrain/Loss": 2.0111119747161865, "Pretrain/Loss (Raw)": 1.936065673828125, "Pretrain/Step": 9609, "Pretrain/Step Time": 8.486303187906742} +{"Pretrain/Learning Rate": 2.5901902027209398e-05, "Pretrain/Loss": 2.0119121074676514, "Pretrain/Loss (Raw)": 2.027409076690674, "Pretrain/Step": 9610, "Pretrain/Step Time": 8.486029095947742} +{"Pretrain/Learning Rate": 2.589765961162399e-05, "Pretrain/Loss": 2.009086847305298, "Pretrain/Loss (Raw)": 1.8368748426437378, "Pretrain/Step": 9611, "Pretrain/Step Time": 8.486238522455096} +{"Pretrain/Learning Rate": 2.5893417170155206e-05, "Pretrain/Loss": 2.008561134338379, "Pretrain/Loss (Raw)": 2.1237406730651855, "Pretrain/Step": 9612, "Pretrain/Step Time": 8.488879900425673} +{"Pretrain/Learning Rate": 2.5889174702925363e-05, "Pretrain/Loss": 2.0077896118164062, "Pretrain/Loss (Raw)": 2.0095837116241455, "Pretrain/Step": 9613, "Pretrain/Step Time": 8.491730265319347} +{"Pretrain/Learning Rate": 2.5884932210056796e-05, "Pretrain/Loss": 2.0074493885040283, "Pretrain/Loss (Raw)": 1.9925668239593506, "Pretrain/Step": 9614, "Pretrain/Step Time": 8.486470501869917} +{"Pretrain/Learning Rate": 2.588068969167183e-05, "Pretrain/Loss": 2.0067009925842285, "Pretrain/Loss (Raw)": 1.867401361465454, "Pretrain/Step": 9615, "Pretrain/Step Time": 8.491352746263146} +{"Pretrain/Learning Rate": 2.5876447147892797e-05, "Pretrain/Loss": 2.007321834564209, "Pretrain/Loss (Raw)": 2.2435851097106934, "Pretrain/Step": 9616, "Pretrain/Step Time": 8.482561636716127} +{"Pretrain/Learning Rate": 2.587220457884203e-05, "Pretrain/Loss": 2.007850408554077, "Pretrain/Loss (Raw)": 1.809074878692627, "Pretrain/Step": 9617, "Pretrain/Step Time": 8.483588747680187} +{"Pretrain/Learning Rate": 2.586796198464186e-05, "Pretrain/Loss": 2.0092434883117676, "Pretrain/Loss (Raw)": 2.2341670989990234, "Pretrain/Step": 9618, "Pretrain/Step Time": 8.482338845729828} +{"Pretrain/Learning Rate": 2.5863719365414618e-05, "Pretrain/Loss": 2.0102787017822266, "Pretrain/Loss (Raw)": 1.9730167388916016, "Pretrain/Step": 9619, "Pretrain/Step Time": 8.480730017647147} +{"Pretrain/Learning Rate": 2.5859476721282632e-05, "Pretrain/Loss": 2.014491558074951, "Pretrain/Loss (Raw)": 2.451932191848755, "Pretrain/Step": 9620, "Pretrain/Step Time": 8.482989527285099} +{"Pretrain/Learning Rate": 2.5855234052368245e-05, "Pretrain/Loss": 2.0156092643737793, "Pretrain/Loss (Raw)": 2.0752108097076416, "Pretrain/Step": 9621, "Pretrain/Step Time": 8.481976110488176} +{"Pretrain/Learning Rate": 2.585099135879379e-05, "Pretrain/Loss": 2.0173354148864746, "Pretrain/Loss (Raw)": 1.8148225545883179, "Pretrain/Step": 9622, "Pretrain/Step Time": 8.471353482455015} +{"Pretrain/Learning Rate": 2.5846748640681595e-05, "Pretrain/Loss": 2.0192513465881348, "Pretrain/Loss (Raw)": 2.0674185752868652, "Pretrain/Step": 9623, "Pretrain/Step Time": 8.468690730631351} +{"Pretrain/Learning Rate": 2.5842505898154e-05, "Pretrain/Loss": 2.0197973251342773, "Pretrain/Loss (Raw)": 2.021603584289551, "Pretrain/Step": 9624, "Pretrain/Step Time": 8.473980356007814} +{"Pretrain/Learning Rate": 2.583826313133334e-05, "Pretrain/Loss": 2.019850492477417, "Pretrain/Loss (Raw)": 1.986016035079956, "Pretrain/Step": 9625, "Pretrain/Step Time": 8.474261036142707} +{"Pretrain/Learning Rate": 2.5834020340341953e-05, "Pretrain/Loss": 2.020639657974243, "Pretrain/Loss (Raw)": 2.1165714263916016, "Pretrain/Step": 9626, "Pretrain/Step Time": 8.474667405709624} +{"Pretrain/Learning Rate": 2.5829777525302185e-05, "Pretrain/Loss": 2.019880533218384, "Pretrain/Loss (Raw)": 1.910554051399231, "Pretrain/Step": 9627, "Pretrain/Step Time": 8.470411993563175} +{"Pretrain/Learning Rate": 2.5825534686336362e-05, "Pretrain/Loss": 2.018252372741699, "Pretrain/Loss (Raw)": 1.8963242769241333, "Pretrain/Step": 9628, "Pretrain/Step Time": 8.475497804582119} +{"Pretrain/Learning Rate": 2.582129182356683e-05, "Pretrain/Loss": 2.021124839782715, "Pretrain/Loss (Raw)": 2.3065552711486816, "Pretrain/Step": 9629, "Pretrain/Step Time": 8.468316929414868} +{"Pretrain/Learning Rate": 2.5817048937115923e-05, "Pretrain/Loss": 2.0196642875671387, "Pretrain/Loss (Raw)": 1.7311054468154907, "Pretrain/Step": 9630, "Pretrain/Step Time": 8.471218544989824} +{"Pretrain/Learning Rate": 2.5812806027105984e-05, "Pretrain/Loss": 2.0174317359924316, "Pretrain/Loss (Raw)": 1.8808492422103882, "Pretrain/Step": 9631, "Pretrain/Step Time": 8.466777674853802} +{"Pretrain/Learning Rate": 2.5808563093659365e-05, "Pretrain/Loss": 2.0201077461242676, "Pretrain/Loss (Raw)": 2.101945161819458, "Pretrain/Step": 9632, "Pretrain/Step Time": 8.474208349362016} +{"Pretrain/Learning Rate": 2.5804320136898398e-05, "Pretrain/Loss": 2.0196571350097656, "Pretrain/Loss (Raw)": 2.0971262454986572, "Pretrain/Step": 9633, "Pretrain/Step Time": 8.470993269234896} +{"Pretrain/Learning Rate": 2.5800077156945425e-05, "Pretrain/Loss": 2.0198616981506348, "Pretrain/Loss (Raw)": 2.3676042556762695, "Pretrain/Step": 9634, "Pretrain/Step Time": 8.475808549672365} +{"Pretrain/Learning Rate": 2.5795834153922787e-05, "Pretrain/Loss": 2.01954984664917, "Pretrain/Loss (Raw)": 1.938162922859192, "Pretrain/Step": 9635, "Pretrain/Step Time": 8.472496638074517} +{"Pretrain/Learning Rate": 2.5791591127952835e-05, "Pretrain/Loss": 2.018914222717285, "Pretrain/Loss (Raw)": 2.040850877761841, "Pretrain/Step": 9636, "Pretrain/Step Time": 8.47316519729793} +{"Pretrain/Learning Rate": 2.5787348079157906e-05, "Pretrain/Loss": 2.0167531967163086, "Pretrain/Loss (Raw)": 1.8873907327651978, "Pretrain/Step": 9637, "Pretrain/Step Time": 8.468622563406825} +{"Pretrain/Learning Rate": 2.5783105007660364e-05, "Pretrain/Loss": 2.0162572860717773, "Pretrain/Loss (Raw)": 1.9687353372573853, "Pretrain/Step": 9638, "Pretrain/Step Time": 8.466990543529391} +{"Pretrain/Learning Rate": 2.577886191358253e-05, "Pretrain/Loss": 2.0161936283111572, "Pretrain/Loss (Raw)": 2.048166275024414, "Pretrain/Step": 9639, "Pretrain/Step Time": 8.463780101388693} +{"Pretrain/Learning Rate": 2.5774618797046763e-05, "Pretrain/Loss": 2.017163038253784, "Pretrain/Loss (Raw)": 2.0186870098114014, "Pretrain/Step": 9640, "Pretrain/Step Time": 8.463679203763604} +{"Pretrain/Learning Rate": 2.577037565817541e-05, "Pretrain/Loss": 2.0194523334503174, "Pretrain/Loss (Raw)": 2.083686113357544, "Pretrain/Step": 9641, "Pretrain/Step Time": 8.465194387361407} +{"Pretrain/Learning Rate": 2.5766132497090817e-05, "Pretrain/Loss": 2.0182435512542725, "Pretrain/Loss (Raw)": 2.089900255203247, "Pretrain/Step": 9642, "Pretrain/Step Time": 8.465453499928117} +{"Pretrain/Learning Rate": 2.576188931391533e-05, "Pretrain/Loss": 2.0164895057678223, "Pretrain/Loss (Raw)": 1.8488049507141113, "Pretrain/Step": 9643, "Pretrain/Step Time": 8.465139597654343} +{"Pretrain/Learning Rate": 2.575764610877131e-05, "Pretrain/Loss": 2.019080638885498, "Pretrain/Loss (Raw)": 2.1032516956329346, "Pretrain/Step": 9644, "Pretrain/Step Time": 8.467204248532653} +{"Pretrain/Learning Rate": 2.5753402881781097e-05, "Pretrain/Loss": 2.019833564758301, "Pretrain/Loss (Raw)": 2.051117181777954, "Pretrain/Step": 9645, "Pretrain/Step Time": 8.467821823433042} +{"Pretrain/Learning Rate": 2.574915963306704e-05, "Pretrain/Loss": 2.020328998565674, "Pretrain/Loss (Raw)": 2.040590286254883, "Pretrain/Step": 9646, "Pretrain/Step Time": 8.459264615550637} +{"Pretrain/Learning Rate": 2.574491636275149e-05, "Pretrain/Loss": 2.0204203128814697, "Pretrain/Loss (Raw)": 1.886220097541809, "Pretrain/Step": 9647, "Pretrain/Step Time": 8.463423928245902} +{"Pretrain/Learning Rate": 2.5740673070956806e-05, "Pretrain/Loss": 2.0202291011810303, "Pretrain/Loss (Raw)": 1.988908290863037, "Pretrain/Step": 9648, "Pretrain/Step Time": 8.462950572371483} +{"Pretrain/Learning Rate": 2.573642975780534e-05, "Pretrain/Loss": 2.0201492309570312, "Pretrain/Loss (Raw)": 2.001781463623047, "Pretrain/Step": 9649, "Pretrain/Step Time": 8.464922789484262} +{"Pretrain/Learning Rate": 2.5732186423419437e-05, "Pretrain/Loss": 2.0195443630218506, "Pretrain/Loss (Raw)": 1.9514580965042114, "Pretrain/Step": 9650, "Pretrain/Step Time": 8.466373493894935} +{"Pretrain/Learning Rate": 2.572794306792145e-05, "Pretrain/Loss": 2.0200893878936768, "Pretrain/Loss (Raw)": 1.9067387580871582, "Pretrain/Step": 9651, "Pretrain/Step Time": 8.466299230232835} +{"Pretrain/Learning Rate": 2.5723699691433743e-05, "Pretrain/Loss": 2.0215377807617188, "Pretrain/Loss (Raw)": 2.025158166885376, "Pretrain/Step": 9652, "Pretrain/Step Time": 8.46635545603931} +{"Pretrain/Learning Rate": 2.5719456294078665e-05, "Pretrain/Loss": 2.022646903991699, "Pretrain/Loss (Raw)": 2.127976179122925, "Pretrain/Step": 9653, "Pretrain/Step Time": 8.469665490090847} +{"Pretrain/Learning Rate": 2.5715212875978577e-05, "Pretrain/Loss": 2.019932508468628, "Pretrain/Loss (Raw)": 1.5865817070007324, "Pretrain/Step": 9654, "Pretrain/Step Time": 8.46268785186112} +{"Pretrain/Learning Rate": 2.5710969437255823e-05, "Pretrain/Loss": 2.019613265991211, "Pretrain/Loss (Raw)": 2.193587064743042, "Pretrain/Step": 9655, "Pretrain/Step Time": 8.458298414945602} +{"Pretrain/Learning Rate": 2.570672597803277e-05, "Pretrain/Loss": 2.0190658569335938, "Pretrain/Loss (Raw)": 1.891688346862793, "Pretrain/Step": 9656, "Pretrain/Step Time": 8.457737999036908} +{"Pretrain/Learning Rate": 2.5702482498431768e-05, "Pretrain/Loss": 2.0210916996002197, "Pretrain/Loss (Raw)": 2.1737186908721924, "Pretrain/Step": 9657, "Pretrain/Step Time": 8.460141882300377} +{"Pretrain/Learning Rate": 2.5698238998575176e-05, "Pretrain/Loss": 2.0205254554748535, "Pretrain/Loss (Raw)": 2.02484393119812, "Pretrain/Step": 9658, "Pretrain/Step Time": 8.46216326765716} +{"Pretrain/Learning Rate": 2.5693995478585363e-05, "Pretrain/Loss": 2.0202219486236572, "Pretrain/Loss (Raw)": 1.9505316019058228, "Pretrain/Step": 9659, "Pretrain/Step Time": 8.46404866501689} +{"Pretrain/Learning Rate": 2.5689751938584678e-05, "Pretrain/Loss": 2.0218658447265625, "Pretrain/Loss (Raw)": 2.385821580886841, "Pretrain/Step": 9660, "Pretrain/Step Time": 8.463452877476811} +{"Pretrain/Learning Rate": 2.5685508378695476e-05, "Pretrain/Loss": 2.0219788551330566, "Pretrain/Loss (Raw)": 2.0760767459869385, "Pretrain/Step": 9661, "Pretrain/Step Time": 8.45942240767181} +{"Pretrain/Learning Rate": 2.5681264799040127e-05, "Pretrain/Loss": 2.0217323303222656, "Pretrain/Loss (Raw)": 2.0808682441711426, "Pretrain/Step": 9662, "Pretrain/Step Time": 8.45480466261506} +{"Pretrain/Learning Rate": 2.5677021199740986e-05, "Pretrain/Loss": 2.018925905227661, "Pretrain/Loss (Raw)": 1.8538695573806763, "Pretrain/Step": 9663, "Pretrain/Step Time": 8.46186981536448} +{"Pretrain/Learning Rate": 2.567277758092042e-05, "Pretrain/Loss": 2.017613649368286, "Pretrain/Loss (Raw)": 1.9422301054000854, "Pretrain/Step": 9664, "Pretrain/Step Time": 8.462544031441212} +{"Pretrain/Learning Rate": 2.5668533942700786e-05, "Pretrain/Loss": 2.016841411590576, "Pretrain/Loss (Raw)": 1.969120740890503, "Pretrain/Step": 9665, "Pretrain/Step Time": 8.456447573378682} +{"Pretrain/Learning Rate": 2.5664290285204447e-05, "Pretrain/Loss": 2.0174272060394287, "Pretrain/Loss (Raw)": 1.9871882200241089, "Pretrain/Step": 9666, "Pretrain/Step Time": 8.455685524269938} +{"Pretrain/Learning Rate": 2.5660046608553763e-05, "Pretrain/Loss": 2.0187835693359375, "Pretrain/Loss (Raw)": 2.16935658454895, "Pretrain/Step": 9667, "Pretrain/Step Time": 8.457286505028605} +{"Pretrain/Learning Rate": 2.5655802912871095e-05, "Pretrain/Loss": 2.0190958976745605, "Pretrain/Loss (Raw)": 2.066276788711548, "Pretrain/Step": 9668, "Pretrain/Step Time": 8.460314011201262} +{"Pretrain/Learning Rate": 2.5651559198278824e-05, "Pretrain/Loss": 2.0187008380889893, "Pretrain/Loss (Raw)": 1.8289774656295776, "Pretrain/Step": 9669, "Pretrain/Step Time": 8.458184245973825} +{"Pretrain/Learning Rate": 2.5647315464899297e-05, "Pretrain/Loss": 2.0169506072998047, "Pretrain/Loss (Raw)": 1.8830420970916748, "Pretrain/Step": 9670, "Pretrain/Step Time": 8.458973424509168} +{"Pretrain/Learning Rate": 2.5643071712854888e-05, "Pretrain/Loss": 2.014599323272705, "Pretrain/Loss (Raw)": 1.7056583166122437, "Pretrain/Step": 9671, "Pretrain/Step Time": 8.461647627875209} +{"Pretrain/Learning Rate": 2.5638827942267958e-05, "Pretrain/Loss": 2.014514446258545, "Pretrain/Loss (Raw)": 1.8819814920425415, "Pretrain/Step": 9672, "Pretrain/Step Time": 8.461153386160731} +{"Pretrain/Learning Rate": 2.563458415326087e-05, "Pretrain/Loss": 2.0132434368133545, "Pretrain/Loss (Raw)": 1.8064074516296387, "Pretrain/Step": 9673, "Pretrain/Step Time": 8.463087951764464} +{"Pretrain/Learning Rate": 2.5630340345956e-05, "Pretrain/Loss": 2.0121188163757324, "Pretrain/Loss (Raw)": 2.1729576587677, "Pretrain/Step": 9674, "Pretrain/Step Time": 8.463545048609376} +{"Pretrain/Learning Rate": 2.5626096520475713e-05, "Pretrain/Loss": 2.0139987468719482, "Pretrain/Loss (Raw)": 2.0344021320343018, "Pretrain/Step": 9675, "Pretrain/Step Time": 8.46052754111588} +{"Pretrain/Learning Rate": 2.5621852676942377e-05, "Pretrain/Loss": 2.013195753097534, "Pretrain/Loss (Raw)": 2.0049960613250732, "Pretrain/Step": 9676, "Pretrain/Step Time": 8.467051077634096} +{"Pretrain/Learning Rate": 2.5617608815478343e-05, "Pretrain/Loss": 2.013711452484131, "Pretrain/Loss (Raw)": 2.0465891361236572, "Pretrain/Step": 9677, "Pretrain/Step Time": 8.472128169611096} +{"Pretrain/Learning Rate": 2.5613364936206004e-05, "Pretrain/Loss": 2.0142323970794678, "Pretrain/Loss (Raw)": 1.9547303915023804, "Pretrain/Step": 9678, "Pretrain/Step Time": 8.472246507182717} +{"Pretrain/Learning Rate": 2.5609121039247718e-05, "Pretrain/Loss": 2.01523494720459, "Pretrain/Loss (Raw)": 1.9782090187072754, "Pretrain/Step": 9679, "Pretrain/Step Time": 8.46803392842412} +{"Pretrain/Learning Rate": 2.5604877124725855e-05, "Pretrain/Loss": 2.0206117630004883, "Pretrain/Loss (Raw)": 2.2337379455566406, "Pretrain/Step": 9680, "Pretrain/Step Time": 8.466813750565052} +{"Pretrain/Learning Rate": 2.560063319276279e-05, "Pretrain/Loss": 2.0211777687072754, "Pretrain/Loss (Raw)": 2.1743619441986084, "Pretrain/Step": 9681, "Pretrain/Step Time": 8.46161449700594} +{"Pretrain/Learning Rate": 2.559638924348089e-05, "Pretrain/Loss": 2.020350694656372, "Pretrain/Loss (Raw)": 1.9145548343658447, "Pretrain/Step": 9682, "Pretrain/Step Time": 8.459724262356758} +{"Pretrain/Learning Rate": 2.5592145277002523e-05, "Pretrain/Loss": 2.020385265350342, "Pretrain/Loss (Raw)": 2.065723180770874, "Pretrain/Step": 9683, "Pretrain/Step Time": 8.464863628149033} +{"Pretrain/Learning Rate": 2.558790129345006e-05, "Pretrain/Loss": 2.0186104774475098, "Pretrain/Loss (Raw)": 1.811676263809204, "Pretrain/Step": 9684, "Pretrain/Step Time": 8.461868731305003} +{"Pretrain/Learning Rate": 2.5583657292945883e-05, "Pretrain/Loss": 2.0186119079589844, "Pretrain/Loss (Raw)": 1.8801103830337524, "Pretrain/Step": 9685, "Pretrain/Step Time": 8.46333652921021} +{"Pretrain/Learning Rate": 2.5579413275612368e-05, "Pretrain/Loss": 2.017707347869873, "Pretrain/Loss (Raw)": 1.8969428539276123, "Pretrain/Step": 9686, "Pretrain/Step Time": 8.46150565892458} +{"Pretrain/Learning Rate": 2.5575169241571873e-05, "Pretrain/Loss": 2.017566442489624, "Pretrain/Loss (Raw)": 2.1121649742126465, "Pretrain/Step": 9687, "Pretrain/Step Time": 8.459293784573674} +{"Pretrain/Learning Rate": 2.557092519094677e-05, "Pretrain/Loss": 2.0133585929870605, "Pretrain/Loss (Raw)": 1.6978403329849243, "Pretrain/Step": 9688, "Pretrain/Step Time": 8.462913412600756} +{"Pretrain/Learning Rate": 2.5566681123859448e-05, "Pretrain/Loss": 2.0129547119140625, "Pretrain/Loss (Raw)": 2.0317134857177734, "Pretrain/Step": 9689, "Pretrain/Step Time": 8.461193474009633} +{"Pretrain/Learning Rate": 2.556243704043228e-05, "Pretrain/Loss": 2.013247489929199, "Pretrain/Loss (Raw)": 1.9582878351211548, "Pretrain/Step": 9690, "Pretrain/Step Time": 8.46831819601357} +{"Pretrain/Learning Rate": 2.5558192940787633e-05, "Pretrain/Loss": 2.0127604007720947, "Pretrain/Loss (Raw)": 2.113598108291626, "Pretrain/Step": 9691, "Pretrain/Step Time": 8.46790681220591} +{"Pretrain/Learning Rate": 2.5553948825047886e-05, "Pretrain/Loss": 2.012216567993164, "Pretrain/Loss (Raw)": 2.017279863357544, "Pretrain/Step": 9692, "Pretrain/Step Time": 8.465889109298587} +{"Pretrain/Learning Rate": 2.5549704693335412e-05, "Pretrain/Loss": 2.0116934776306152, "Pretrain/Loss (Raw)": 1.8916618824005127, "Pretrain/Step": 9693, "Pretrain/Step Time": 8.463895086199045} +{"Pretrain/Learning Rate": 2.5545460545772593e-05, "Pretrain/Loss": 2.010911226272583, "Pretrain/Loss (Raw)": 1.8700661659240723, "Pretrain/Step": 9694, "Pretrain/Step Time": 8.469115538522601} +{"Pretrain/Learning Rate": 2.5541216382481802e-05, "Pretrain/Loss": 2.0120716094970703, "Pretrain/Loss (Raw)": 2.3363771438598633, "Pretrain/Step": 9695, "Pretrain/Step Time": 8.465350108221173} +{"Pretrain/Learning Rate": 2.5536972203585426e-05, "Pretrain/Loss": 2.0127782821655273, "Pretrain/Loss (Raw)": 1.931536078453064, "Pretrain/Step": 9696, "Pretrain/Step Time": 8.469344159588218} +{"Pretrain/Learning Rate": 2.5532728009205825e-05, "Pretrain/Loss": 2.0139918327331543, "Pretrain/Loss (Raw)": 2.0517592430114746, "Pretrain/Step": 9697, "Pretrain/Step Time": 8.466679153963923} +{"Pretrain/Learning Rate": 2.552848379946539e-05, "Pretrain/Loss": 2.0164153575897217, "Pretrain/Loss (Raw)": 2.033026933670044, "Pretrain/Step": 9698, "Pretrain/Step Time": 8.467595636844635} +{"Pretrain/Learning Rate": 2.5524239574486502e-05, "Pretrain/Loss": 2.015887975692749, "Pretrain/Loss (Raw)": 2.063642978668213, "Pretrain/Step": 9699, "Pretrain/Step Time": 8.463672509416938} +{"Pretrain/Learning Rate": 2.5519995334391527e-05, "Pretrain/Loss": 2.0146474838256836, "Pretrain/Loss (Raw)": 1.9932383298873901, "Pretrain/Step": 9700, "Pretrain/Step Time": 8.467578859999776} +{"Pretrain/Learning Rate": 2.5515751079302863e-05, "Pretrain/Loss": 2.0114798545837402, "Pretrain/Loss (Raw)": 1.8101001977920532, "Pretrain/Step": 9701, "Pretrain/Step Time": 8.465032616630197} +{"Pretrain/Learning Rate": 2.551150680934288e-05, "Pretrain/Loss": 2.012641668319702, "Pretrain/Loss (Raw)": 2.1004159450531006, "Pretrain/Step": 9702, "Pretrain/Step Time": 8.460447084158659} +{"Pretrain/Learning Rate": 2.550726252463395e-05, "Pretrain/Loss": 2.011939287185669, "Pretrain/Loss (Raw)": 1.9668712615966797, "Pretrain/Step": 9703, "Pretrain/Step Time": 8.455720257014036} +{"Pretrain/Learning Rate": 2.5503018225298464e-05, "Pretrain/Loss": 2.0116000175476074, "Pretrain/Loss (Raw)": 1.9248985052108765, "Pretrain/Step": 9704, "Pretrain/Step Time": 8.455607848241925} +{"Pretrain/Learning Rate": 2.5498773911458805e-05, "Pretrain/Loss": 2.011549234390259, "Pretrain/Loss (Raw)": 2.12341046333313, "Pretrain/Step": 9705, "Pretrain/Step Time": 8.460082542151213} +{"Pretrain/Learning Rate": 2.5494529583237357e-05, "Pretrain/Loss": 2.0130577087402344, "Pretrain/Loss (Raw)": 2.1631600856781006, "Pretrain/Step": 9706, "Pretrain/Step Time": 8.457552084699273} +{"Pretrain/Learning Rate": 2.549028524075649e-05, "Pretrain/Loss": 2.015660285949707, "Pretrain/Loss (Raw)": 2.3348493576049805, "Pretrain/Step": 9707, "Pretrain/Step Time": 8.453221458941698} +{"Pretrain/Learning Rate": 2.5486040884138597e-05, "Pretrain/Loss": 2.013000965118408, "Pretrain/Loss (Raw)": 1.7319071292877197, "Pretrain/Step": 9708, "Pretrain/Step Time": 8.45582959242165} +{"Pretrain/Learning Rate": 2.548179651350605e-05, "Pretrain/Loss": 2.01434326171875, "Pretrain/Loss (Raw)": 2.0737497806549072, "Pretrain/Step": 9709, "Pretrain/Step Time": 8.449781840667129} +{"Pretrain/Learning Rate": 2.5477552128981248e-05, "Pretrain/Loss": 2.0131497383117676, "Pretrain/Loss (Raw)": 1.9056050777435303, "Pretrain/Step": 9710, "Pretrain/Step Time": 8.455588785931468} +{"Pretrain/Learning Rate": 2.5473307730686563e-05, "Pretrain/Loss": 2.0137417316436768, "Pretrain/Loss (Raw)": 2.1454060077667236, "Pretrain/Step": 9711, "Pretrain/Step Time": 8.452607264742255} +{"Pretrain/Learning Rate": 2.5469063318744392e-05, "Pretrain/Loss": 2.015702724456787, "Pretrain/Loss (Raw)": 1.9693396091461182, "Pretrain/Step": 9712, "Pretrain/Step Time": 8.449813490733504} +{"Pretrain/Learning Rate": 2.5464818893277104e-05, "Pretrain/Loss": 2.017012596130371, "Pretrain/Loss (Raw)": 2.1494388580322266, "Pretrain/Step": 9713, "Pretrain/Step Time": 8.453429171815515} +{"Pretrain/Learning Rate": 2.5460574454407088e-05, "Pretrain/Loss": 2.0157828330993652, "Pretrain/Loss (Raw)": 1.8939441442489624, "Pretrain/Step": 9714, "Pretrain/Step Time": 8.460965497419238} +{"Pretrain/Learning Rate": 2.5456330002256734e-05, "Pretrain/Loss": 2.013408660888672, "Pretrain/Loss (Raw)": 1.9379887580871582, "Pretrain/Step": 9715, "Pretrain/Step Time": 8.458432829007506} +{"Pretrain/Learning Rate": 2.5452085536948428e-05, "Pretrain/Loss": 2.0170204639434814, "Pretrain/Loss (Raw)": 2.303510904312134, "Pretrain/Step": 9716, "Pretrain/Step Time": 8.453163025900722} +{"Pretrain/Learning Rate": 2.544784105860456e-05, "Pretrain/Loss": 2.015246868133545, "Pretrain/Loss (Raw)": 1.927971601486206, "Pretrain/Step": 9717, "Pretrain/Step Time": 8.453527592122555} +{"Pretrain/Learning Rate": 2.544359656734751e-05, "Pretrain/Loss": 2.014516830444336, "Pretrain/Loss (Raw)": 1.9674814939498901, "Pretrain/Step": 9718, "Pretrain/Step Time": 8.453904634341598} +{"Pretrain/Learning Rate": 2.543935206329966e-05, "Pretrain/Loss": 2.0157694816589355, "Pretrain/Loss (Raw)": 2.0880608558654785, "Pretrain/Step": 9719, "Pretrain/Step Time": 8.450350729748607} +{"Pretrain/Learning Rate": 2.5435107546583404e-05, "Pretrain/Loss": 2.01694917678833, "Pretrain/Loss (Raw)": 2.0649828910827637, "Pretrain/Step": 9720, "Pretrain/Step Time": 8.450406482443213} +{"Pretrain/Learning Rate": 2.543086301732113e-05, "Pretrain/Loss": 2.0174498558044434, "Pretrain/Loss (Raw)": 2.030174732208252, "Pretrain/Step": 9721, "Pretrain/Step Time": 8.443219255656004} +{"Pretrain/Learning Rate": 2.5426618475635218e-05, "Pretrain/Loss": 2.0164711475372314, "Pretrain/Loss (Raw)": 2.002455234527588, "Pretrain/Step": 9722, "Pretrain/Step Time": 8.448193605989218} +{"Pretrain/Learning Rate": 2.5422373921648068e-05, "Pretrain/Loss": 2.0149521827697754, "Pretrain/Loss (Raw)": 2.077829599380493, "Pretrain/Step": 9723, "Pretrain/Step Time": 8.444677682593465} +{"Pretrain/Learning Rate": 2.5418129355482068e-05, "Pretrain/Loss": 2.0171360969543457, "Pretrain/Loss (Raw)": 2.1439528465270996, "Pretrain/Step": 9724, "Pretrain/Step Time": 8.442826852202415} +{"Pretrain/Learning Rate": 2.5413884777259594e-05, "Pretrain/Loss": 2.017906904220581, "Pretrain/Loss (Raw)": 2.011993169784546, "Pretrain/Step": 9725, "Pretrain/Step Time": 8.445648608729243} +{"Pretrain/Learning Rate": 2.5409640187103047e-05, "Pretrain/Loss": 2.0154216289520264, "Pretrain/Loss (Raw)": 1.884683609008789, "Pretrain/Step": 9726, "Pretrain/Step Time": 8.445451794192195} +{"Pretrain/Learning Rate": 2.5405395585134817e-05, "Pretrain/Loss": 2.0185627937316895, "Pretrain/Loss (Raw)": 2.2727365493774414, "Pretrain/Step": 9727, "Pretrain/Step Time": 8.445434167981148} +{"Pretrain/Learning Rate": 2.5401150971477293e-05, "Pretrain/Loss": 2.0196876525878906, "Pretrain/Loss (Raw)": 2.147862195968628, "Pretrain/Step": 9728, "Pretrain/Step Time": 8.446581175550818} +{"Pretrain/Learning Rate": 2.539690634625286e-05, "Pretrain/Loss": 2.0198843479156494, "Pretrain/Loss (Raw)": 2.189998149871826, "Pretrain/Step": 9729, "Pretrain/Step Time": 8.44821210950613} +{"Pretrain/Learning Rate": 2.539266170958391e-05, "Pretrain/Loss": 2.0187573432922363, "Pretrain/Loss (Raw)": 1.9843785762786865, "Pretrain/Step": 9730, "Pretrain/Step Time": 8.447199258953333} +{"Pretrain/Learning Rate": 2.538841706159284e-05, "Pretrain/Loss": 2.0180046558380127, "Pretrain/Loss (Raw)": 1.9150387048721313, "Pretrain/Step": 9731, "Pretrain/Step Time": 8.447072878479958} +{"Pretrain/Learning Rate": 2.5384172402402033e-05, "Pretrain/Loss": 2.0170414447784424, "Pretrain/Loss (Raw)": 1.9007850885391235, "Pretrain/Step": 9732, "Pretrain/Step Time": 8.449020273983479} +{"Pretrain/Learning Rate": 2.5379927732133895e-05, "Pretrain/Loss": 2.0177600383758545, "Pretrain/Loss (Raw)": 2.0345919132232666, "Pretrain/Step": 9733, "Pretrain/Step Time": 8.44971933402121} +{"Pretrain/Learning Rate": 2.5375683050910802e-05, "Pretrain/Loss": 2.014646530151367, "Pretrain/Loss (Raw)": 1.9287437200546265, "Pretrain/Step": 9734, "Pretrain/Step Time": 8.451587479561567} +{"Pretrain/Learning Rate": 2.5371438358855154e-05, "Pretrain/Loss": 2.0154707431793213, "Pretrain/Loss (Raw)": 2.126708745956421, "Pretrain/Step": 9735, "Pretrain/Step Time": 8.449348650872707} +{"Pretrain/Learning Rate": 2.536719365608934e-05, "Pretrain/Loss": 2.0155832767486572, "Pretrain/Loss (Raw)": 2.1439168453216553, "Pretrain/Step": 9736, "Pretrain/Step Time": 8.450375650078058} +{"Pretrain/Learning Rate": 2.536294894273576e-05, "Pretrain/Loss": 2.011336326599121, "Pretrain/Loss (Raw)": 1.39246666431427, "Pretrain/Step": 9737, "Pretrain/Step Time": 8.450488116592169} +{"Pretrain/Learning Rate": 2.5358704218916806e-05, "Pretrain/Loss": 2.010059118270874, "Pretrain/Loss (Raw)": 1.8639088869094849, "Pretrain/Step": 9738, "Pretrain/Step Time": 8.451386453583837} +{"Pretrain/Learning Rate": 2.5354459484754862e-05, "Pretrain/Loss": 2.0120410919189453, "Pretrain/Loss (Raw)": 2.0905649662017822, "Pretrain/Step": 9739, "Pretrain/Step Time": 8.45251364260912} +{"Pretrain/Learning Rate": 2.535021474037233e-05, "Pretrain/Loss": 2.012765407562256, "Pretrain/Loss (Raw)": 2.2164735794067383, "Pretrain/Step": 9740, "Pretrain/Step Time": 8.448921300470829} +{"Pretrain/Learning Rate": 2.5345969985891605e-05, "Pretrain/Loss": 2.011723279953003, "Pretrain/Loss (Raw)": 1.8761674165725708, "Pretrain/Step": 9741, "Pretrain/Step Time": 8.443314600735903} +{"Pretrain/Learning Rate": 2.5341725221435077e-05, "Pretrain/Loss": 2.011427402496338, "Pretrain/Loss (Raw)": 1.9546918869018555, "Pretrain/Step": 9742, "Pretrain/Step Time": 8.445904348045588} +{"Pretrain/Learning Rate": 2.533748044712514e-05, "Pretrain/Loss": 2.010535955429077, "Pretrain/Loss (Raw)": 1.7533189058303833, "Pretrain/Step": 9743, "Pretrain/Step Time": 8.441810172051191} +{"Pretrain/Learning Rate": 2.5333235663084204e-05, "Pretrain/Loss": 2.009565830230713, "Pretrain/Loss (Raw)": 2.1194093227386475, "Pretrain/Step": 9744, "Pretrain/Step Time": 8.44097545184195} +{"Pretrain/Learning Rate": 2.5328990869434645e-05, "Pretrain/Loss": 2.0101542472839355, "Pretrain/Loss (Raw)": 1.8843871355056763, "Pretrain/Step": 9745, "Pretrain/Step Time": 8.44214466959238} +{"Pretrain/Learning Rate": 2.532474606629886e-05, "Pretrain/Loss": 2.006875514984131, "Pretrain/Loss (Raw)": 1.8144826889038086, "Pretrain/Step": 9746, "Pretrain/Step Time": 8.445327650755644} +{"Pretrain/Learning Rate": 2.5320501253799262e-05, "Pretrain/Loss": 2.0074024200439453, "Pretrain/Loss (Raw)": 2.0404791831970215, "Pretrain/Step": 9747, "Pretrain/Step Time": 8.446599112823606} +{"Pretrain/Learning Rate": 2.5316256432058228e-05, "Pretrain/Loss": 2.004833221435547, "Pretrain/Loss (Raw)": 2.1230785846710205, "Pretrain/Step": 9748, "Pretrain/Step Time": 8.446311747655272} +{"Pretrain/Learning Rate": 2.5312011601198173e-05, "Pretrain/Loss": 2.0040459632873535, "Pretrain/Loss (Raw)": 1.9744104146957397, "Pretrain/Step": 9749, "Pretrain/Step Time": 8.450128154829144} +{"Pretrain/Learning Rate": 2.5307766761341472e-05, "Pretrain/Loss": 2.007880926132202, "Pretrain/Loss (Raw)": 2.3057057857513428, "Pretrain/Step": 9750, "Pretrain/Step Time": 8.447507243603468} +{"Pretrain/Learning Rate": 2.530352191261054e-05, "Pretrain/Loss": 2.0072805881500244, "Pretrain/Loss (Raw)": 1.990580677986145, "Pretrain/Step": 9751, "Pretrain/Step Time": 8.45341657474637} +{"Pretrain/Learning Rate": 2.529927705512776e-05, "Pretrain/Loss": 2.0070137977600098, "Pretrain/Loss (Raw)": 1.9874569177627563, "Pretrain/Step": 9752, "Pretrain/Step Time": 8.447988012805581} +{"Pretrain/Learning Rate": 2.5295032189015543e-05, "Pretrain/Loss": 2.0058135986328125, "Pretrain/Loss (Raw)": 1.8324037790298462, "Pretrain/Step": 9753, "Pretrain/Step Time": 8.449435614049435} +{"Pretrain/Learning Rate": 2.5290787314396285e-05, "Pretrain/Loss": 2.0059690475463867, "Pretrain/Loss (Raw)": 2.1364638805389404, "Pretrain/Step": 9754, "Pretrain/Step Time": 8.453437177464366} +{"Pretrain/Learning Rate": 2.528654243139238e-05, "Pretrain/Loss": 2.0063400268554688, "Pretrain/Loss (Raw)": 1.9580128192901611, "Pretrain/Step": 9755, "Pretrain/Step Time": 8.452501904219389} +{"Pretrain/Learning Rate": 2.528229754012622e-05, "Pretrain/Loss": 2.006300210952759, "Pretrain/Loss (Raw)": 1.8912620544433594, "Pretrain/Step": 9756, "Pretrain/Step Time": 8.445939423516393} +{"Pretrain/Learning Rate": 2.5278052640720207e-05, "Pretrain/Loss": 2.0049524307250977, "Pretrain/Loss (Raw)": 2.134002447128296, "Pretrain/Step": 9757, "Pretrain/Step Time": 8.446099296212196} +{"Pretrain/Learning Rate": 2.5273807733296745e-05, "Pretrain/Loss": 2.007659673690796, "Pretrain/Loss (Raw)": 2.0776450634002686, "Pretrain/Step": 9758, "Pretrain/Step Time": 8.44364702515304} +{"Pretrain/Learning Rate": 2.526956281797824e-05, "Pretrain/Loss": 2.0086097717285156, "Pretrain/Loss (Raw)": 2.0024850368499756, "Pretrain/Step": 9759, "Pretrain/Step Time": 8.447561468929052} +{"Pretrain/Learning Rate": 2.5265317894887076e-05, "Pretrain/Loss": 2.0103893280029297, "Pretrain/Loss (Raw)": 2.329685926437378, "Pretrain/Step": 9760, "Pretrain/Step Time": 8.44185728020966} +{"Pretrain/Learning Rate": 2.5261072964145648e-05, "Pretrain/Loss": 2.009636878967285, "Pretrain/Loss (Raw)": 2.0008339881896973, "Pretrain/Step": 9761, "Pretrain/Step Time": 8.442820377647877} +{"Pretrain/Learning Rate": 2.5256828025876374e-05, "Pretrain/Loss": 2.0069854259490967, "Pretrain/Loss (Raw)": 2.0282111167907715, "Pretrain/Step": 9762, "Pretrain/Step Time": 8.441623598337173} +{"Pretrain/Learning Rate": 2.5252583080201643e-05, "Pretrain/Loss": 2.007979393005371, "Pretrain/Loss (Raw)": 2.0653676986694336, "Pretrain/Step": 9763, "Pretrain/Step Time": 8.443603111431003} +{"Pretrain/Learning Rate": 2.5248338127243855e-05, "Pretrain/Loss": 2.007100820541382, "Pretrain/Loss (Raw)": 1.9284292459487915, "Pretrain/Step": 9764, "Pretrain/Step Time": 8.441533643752337} +{"Pretrain/Learning Rate": 2.5244093167125417e-05, "Pretrain/Loss": 2.007481575012207, "Pretrain/Loss (Raw)": 1.9361207485198975, "Pretrain/Step": 9765, "Pretrain/Step Time": 8.444559818133712} +{"Pretrain/Learning Rate": 2.5239848199968717e-05, "Pretrain/Loss": 2.0077829360961914, "Pretrain/Loss (Raw)": 2.0073139667510986, "Pretrain/Step": 9766, "Pretrain/Step Time": 8.44484636373818} +{"Pretrain/Learning Rate": 2.5235603225896166e-05, "Pretrain/Loss": 2.0083959102630615, "Pretrain/Loss (Raw)": 2.126620054244995, "Pretrain/Step": 9767, "Pretrain/Step Time": 8.445871230214834} +{"Pretrain/Learning Rate": 2.523135824503016e-05, "Pretrain/Loss": 2.0088415145874023, "Pretrain/Loss (Raw)": 2.075716733932495, "Pretrain/Step": 9768, "Pretrain/Step Time": 8.44557448104024} +{"Pretrain/Learning Rate": 2.5227113257493107e-05, "Pretrain/Loss": 2.007578134536743, "Pretrain/Loss (Raw)": 1.9219818115234375, "Pretrain/Step": 9769, "Pretrain/Step Time": 8.44373419880867} +{"Pretrain/Learning Rate": 2.5222868263407407e-05, "Pretrain/Loss": 2.0063765048980713, "Pretrain/Loss (Raw)": 1.93608558177948, "Pretrain/Step": 9770, "Pretrain/Step Time": 8.44920557178557} +{"Pretrain/Learning Rate": 2.5218623262895448e-05, "Pretrain/Loss": 2.0089306831359863, "Pretrain/Loss (Raw)": 2.1757662296295166, "Pretrain/Step": 9771, "Pretrain/Step Time": 8.449454810470343} +{"Pretrain/Learning Rate": 2.5214378256079646e-05, "Pretrain/Loss": 2.0088396072387695, "Pretrain/Loss (Raw)": 2.0915987491607666, "Pretrain/Step": 9772, "Pretrain/Step Time": 8.445968372747302} +{"Pretrain/Learning Rate": 2.5210133243082394e-05, "Pretrain/Loss": 2.008213758468628, "Pretrain/Loss (Raw)": 1.9709725379943848, "Pretrain/Step": 9773, "Pretrain/Step Time": 8.444144943729043} +{"Pretrain/Learning Rate": 2.5205888224026102e-05, "Pretrain/Loss": 2.007763385772705, "Pretrain/Loss (Raw)": 1.9829318523406982, "Pretrain/Step": 9774, "Pretrain/Step Time": 8.443441128358245} +{"Pretrain/Learning Rate": 2.520164319903317e-05, "Pretrain/Loss": 2.0073297023773193, "Pretrain/Loss (Raw)": 1.83072829246521, "Pretrain/Step": 9775, "Pretrain/Step Time": 8.443584213033319} +{"Pretrain/Learning Rate": 2.5197398168226e-05, "Pretrain/Loss": 2.007791519165039, "Pretrain/Loss (Raw)": 2.0480124950408936, "Pretrain/Step": 9776, "Pretrain/Step Time": 8.44262284040451} +{"Pretrain/Learning Rate": 2.519315313172699e-05, "Pretrain/Loss": 2.009131908416748, "Pretrain/Loss (Raw)": 2.173380136489868, "Pretrain/Step": 9777, "Pretrain/Step Time": 8.440946096554399} +{"Pretrain/Learning Rate": 2.5188908089658543e-05, "Pretrain/Loss": 2.009885311126709, "Pretrain/Loss (Raw)": 2.047856330871582, "Pretrain/Step": 9778, "Pretrain/Step Time": 8.442427203059196} +{"Pretrain/Learning Rate": 2.5184663042143066e-05, "Pretrain/Loss": 2.0099830627441406, "Pretrain/Loss (Raw)": 1.9192558526992798, "Pretrain/Step": 9779, "Pretrain/Step Time": 8.444783264771104} +{"Pretrain/Learning Rate": 2.5180417989302956e-05, "Pretrain/Loss": 2.0109682083129883, "Pretrain/Loss (Raw)": 2.1513009071350098, "Pretrain/Step": 9780, "Pretrain/Step Time": 8.445398159325123} +{"Pretrain/Learning Rate": 2.5176172931260634e-05, "Pretrain/Loss": 2.0083625316619873, "Pretrain/Loss (Raw)": 1.7944217920303345, "Pretrain/Step": 9781, "Pretrain/Step Time": 8.444825172424316} +{"Pretrain/Learning Rate": 2.517192786813848e-05, "Pretrain/Loss": 2.0128564834594727, "Pretrain/Loss (Raw)": 2.161809206008911, "Pretrain/Step": 9782, "Pretrain/Step Time": 8.44650349393487} +{"Pretrain/Learning Rate": 2.5167682800058906e-05, "Pretrain/Loss": 2.0124154090881348, "Pretrain/Loss (Raw)": 2.137132406234741, "Pretrain/Step": 9783, "Pretrain/Step Time": 8.447207979857922} +{"Pretrain/Learning Rate": 2.516343772714432e-05, "Pretrain/Loss": 2.014063835144043, "Pretrain/Loss (Raw)": 2.1026861667633057, "Pretrain/Step": 9784, "Pretrain/Step Time": 8.448855023831129} +{"Pretrain/Learning Rate": 2.5159192649517115e-05, "Pretrain/Loss": 2.0124869346618652, "Pretrain/Loss (Raw)": 1.9718550443649292, "Pretrain/Step": 9785, "Pretrain/Step Time": 8.45131941512227} +{"Pretrain/Learning Rate": 2.5154947567299714e-05, "Pretrain/Loss": 2.01086688041687, "Pretrain/Loss (Raw)": 1.8174885511398315, "Pretrain/Step": 9786, "Pretrain/Step Time": 8.449605667963624} +{"Pretrain/Learning Rate": 2.5150702480614502e-05, "Pretrain/Loss": 2.011678695678711, "Pretrain/Loss (Raw)": 2.05444073677063, "Pretrain/Step": 9787, "Pretrain/Step Time": 8.444006156176329} +{"Pretrain/Learning Rate": 2.514645738958389e-05, "Pretrain/Loss": 2.0068860054016113, "Pretrain/Loss (Raw)": 1.7723592519760132, "Pretrain/Step": 9788, "Pretrain/Step Time": 8.444095112383366} +{"Pretrain/Learning Rate": 2.5142212294330282e-05, "Pretrain/Loss": 2.0067977905273438, "Pretrain/Loss (Raw)": 2.064800500869751, "Pretrain/Step": 9789, "Pretrain/Step Time": 8.4466452319175} +{"Pretrain/Learning Rate": 2.5137967194976087e-05, "Pretrain/Loss": 2.0066964626312256, "Pretrain/Loss (Raw)": 2.0678775310516357, "Pretrain/Step": 9790, "Pretrain/Step Time": 8.444498995319009} +{"Pretrain/Learning Rate": 2.5133722091643706e-05, "Pretrain/Loss": 2.005450963973999, "Pretrain/Loss (Raw)": 1.694448471069336, "Pretrain/Step": 9791, "Pretrain/Step Time": 8.437762193381786} +{"Pretrain/Learning Rate": 2.5129476984455537e-05, "Pretrain/Loss": 2.0055904388427734, "Pretrain/Loss (Raw)": 1.9600881338119507, "Pretrain/Step": 9792, "Pretrain/Step Time": 8.443147534504533} +{"Pretrain/Learning Rate": 2.5125231873533995e-05, "Pretrain/Loss": 2.0073904991149902, "Pretrain/Loss (Raw)": 2.1995513439178467, "Pretrain/Step": 9793, "Pretrain/Step Time": 8.444258382543921} +{"Pretrain/Learning Rate": 2.5120986759001474e-05, "Pretrain/Loss": 2.0111258029937744, "Pretrain/Loss (Raw)": 2.465261459350586, "Pretrain/Step": 9794, "Pretrain/Step Time": 8.44582881219685} +{"Pretrain/Learning Rate": 2.511674164098039e-05, "Pretrain/Loss": 2.0111517906188965, "Pretrain/Loss (Raw)": 2.172703504562378, "Pretrain/Step": 9795, "Pretrain/Step Time": 8.443778704851866} +{"Pretrain/Learning Rate": 2.5112496519593147e-05, "Pretrain/Loss": 2.0093846321105957, "Pretrain/Loss (Raw)": 1.8400954008102417, "Pretrain/Step": 9796, "Pretrain/Step Time": 8.443373210728168} +{"Pretrain/Learning Rate": 2.510825139496214e-05, "Pretrain/Loss": 2.010334014892578, "Pretrain/Loss (Raw)": 1.9504871368408203, "Pretrain/Step": 9797, "Pretrain/Step Time": 8.448731180280447} +{"Pretrain/Learning Rate": 2.510400626720978e-05, "Pretrain/Loss": 2.010152816772461, "Pretrain/Loss (Raw)": 1.8598402738571167, "Pretrain/Step": 9798, "Pretrain/Step Time": 8.445286365225911} +{"Pretrain/Learning Rate": 2.5099761136458478e-05, "Pretrain/Loss": 2.0141124725341797, "Pretrain/Loss (Raw)": 2.2125227451324463, "Pretrain/Step": 9799, "Pretrain/Step Time": 8.441451465710998} +{"Pretrain/Learning Rate": 2.5095516002830626e-05, "Pretrain/Loss": 2.015956401824951, "Pretrain/Loss (Raw)": 2.1179864406585693, "Pretrain/Step": 9800, "Pretrain/Step Time": 8.440118016675115} +{"Pretrain/Learning Rate": 2.5091270866448646e-05, "Pretrain/Loss": 2.0169076919555664, "Pretrain/Loss (Raw)": 1.9281718730926514, "Pretrain/Step": 9801, "Pretrain/Step Time": 8.442697301506996} +{"Pretrain/Learning Rate": 2.5087025727434938e-05, "Pretrain/Loss": 2.015718936920166, "Pretrain/Loss (Raw)": 2.020817756652832, "Pretrain/Step": 9802, "Pretrain/Step Time": 8.440495509654284} +{"Pretrain/Learning Rate": 2.5082780585911895e-05, "Pretrain/Loss": 2.01617431640625, "Pretrain/Loss (Raw)": 2.092696189880371, "Pretrain/Step": 9803, "Pretrain/Step Time": 8.44765566661954} +{"Pretrain/Learning Rate": 2.5078535442001934e-05, "Pretrain/Loss": 2.0144598484039307, "Pretrain/Loss (Raw)": 1.7855249643325806, "Pretrain/Step": 9804, "Pretrain/Step Time": 8.442608185112476} +{"Pretrain/Learning Rate": 2.5074290295827457e-05, "Pretrain/Loss": 2.0137414932250977, "Pretrain/Loss (Raw)": 1.9546434879302979, "Pretrain/Step": 9805, "Pretrain/Step Time": 8.43878809735179} +{"Pretrain/Learning Rate": 2.5070045147510874e-05, "Pretrain/Loss": 2.0140907764434814, "Pretrain/Loss (Raw)": 1.9994157552719116, "Pretrain/Step": 9806, "Pretrain/Step Time": 8.43950343504548} +{"Pretrain/Learning Rate": 2.506579999717459e-05, "Pretrain/Loss": 2.0153794288635254, "Pretrain/Loss (Raw)": 2.1431825160980225, "Pretrain/Step": 9807, "Pretrain/Step Time": 8.435887923464179} +{"Pretrain/Learning Rate": 2.506155484494101e-05, "Pretrain/Loss": 2.0138847827911377, "Pretrain/Loss (Raw)": 2.042410373687744, "Pretrain/Step": 9808, "Pretrain/Step Time": 8.440135605633259} +{"Pretrain/Learning Rate": 2.5057309690932533e-05, "Pretrain/Loss": 2.014260768890381, "Pretrain/Loss (Raw)": 2.2225019931793213, "Pretrain/Step": 9809, "Pretrain/Step Time": 8.439643746241927} +{"Pretrain/Learning Rate": 2.5053064535271575e-05, "Pretrain/Loss": 2.0147905349731445, "Pretrain/Loss (Raw)": 1.9823558330535889, "Pretrain/Step": 9810, "Pretrain/Step Time": 8.441983116790652} +{"Pretrain/Learning Rate": 2.504881937808054e-05, "Pretrain/Loss": 2.0136401653289795, "Pretrain/Loss (Raw)": 1.9184805154800415, "Pretrain/Step": 9811, "Pretrain/Step Time": 8.437989499419928} +{"Pretrain/Learning Rate": 2.5044574219481832e-05, "Pretrain/Loss": 2.0140490531921387, "Pretrain/Loss (Raw)": 1.8640018701553345, "Pretrain/Step": 9812, "Pretrain/Step Time": 8.439185228198767} +{"Pretrain/Learning Rate": 2.5040329059597862e-05, "Pretrain/Loss": 2.0159902572631836, "Pretrain/Loss (Raw)": 2.128591537475586, "Pretrain/Step": 9813, "Pretrain/Step Time": 8.440336341038346} +{"Pretrain/Learning Rate": 2.503608389855103e-05, "Pretrain/Loss": 2.017899990081787, "Pretrain/Loss (Raw)": 2.141374111175537, "Pretrain/Step": 9814, "Pretrain/Step Time": 8.443466734141111} +{"Pretrain/Learning Rate": 2.5031838736463743e-05, "Pretrain/Loss": 2.0186405181884766, "Pretrain/Loss (Raw)": 2.206979751586914, "Pretrain/Step": 9815, "Pretrain/Step Time": 8.440703483298421} +{"Pretrain/Learning Rate": 2.5027593573458403e-05, "Pretrain/Loss": 2.02115535736084, "Pretrain/Loss (Raw)": 2.019723892211914, "Pretrain/Step": 9816, "Pretrain/Step Time": 8.442334655672312} +{"Pretrain/Learning Rate": 2.5023348409657425e-05, "Pretrain/Loss": 2.0214993953704834, "Pretrain/Loss (Raw)": 2.0757570266723633, "Pretrain/Step": 9817, "Pretrain/Step Time": 8.443854732438922} +{"Pretrain/Learning Rate": 2.5019103245183218e-05, "Pretrain/Loss": 2.0214171409606934, "Pretrain/Loss (Raw)": 1.9477384090423584, "Pretrain/Step": 9818, "Pretrain/Step Time": 8.440122820436954} +{"Pretrain/Learning Rate": 2.5014858080158175e-05, "Pretrain/Loss": 2.0219058990478516, "Pretrain/Loss (Raw)": 2.176193952560425, "Pretrain/Step": 9819, "Pretrain/Step Time": 8.439211985096335} +{"Pretrain/Learning Rate": 2.5010612914704714e-05, "Pretrain/Loss": 2.020902633666992, "Pretrain/Loss (Raw)": 1.8888251781463623, "Pretrain/Step": 9820, "Pretrain/Step Time": 8.438658129423857} +{"Pretrain/Learning Rate": 2.5006367748945236e-05, "Pretrain/Loss": 2.0212242603302, "Pretrain/Loss (Raw)": 1.9328478574752808, "Pretrain/Step": 9821, "Pretrain/Step Time": 8.438801096752286} +{"Pretrain/Learning Rate": 2.5002122583002148e-05, "Pretrain/Loss": 2.0204033851623535, "Pretrain/Loss (Raw)": 1.764992594718933, "Pretrain/Step": 9822, "Pretrain/Step Time": 8.43241610378027} +{"Pretrain/Learning Rate": 2.4997877416997858e-05, "Pretrain/Loss": 2.0182456970214844, "Pretrain/Loss (Raw)": 2.0602102279663086, "Pretrain/Step": 9823, "Pretrain/Step Time": 8.436920199543238} +{"Pretrain/Learning Rate": 2.499363225105477e-05, "Pretrain/Loss": 2.01973295211792, "Pretrain/Loss (Raw)": 2.121915340423584, "Pretrain/Step": 9824, "Pretrain/Step Time": 8.436598181724548} +{"Pretrain/Learning Rate": 2.498938708529529e-05, "Pretrain/Loss": 2.0178558826446533, "Pretrain/Loss (Raw)": 1.8114837408065796, "Pretrain/Step": 9825, "Pretrain/Step Time": 8.441393850371242} +{"Pretrain/Learning Rate": 2.4985141919841827e-05, "Pretrain/Loss": 2.0188188552856445, "Pretrain/Loss (Raw)": 2.1562576293945312, "Pretrain/Step": 9826, "Pretrain/Step Time": 8.441434724256396} +{"Pretrain/Learning Rate": 2.4980896754816788e-05, "Pretrain/Loss": 2.0206785202026367, "Pretrain/Loss (Raw)": 2.301692008972168, "Pretrain/Step": 9827, "Pretrain/Step Time": 8.439815578982234} +{"Pretrain/Learning Rate": 2.497665159034258e-05, "Pretrain/Loss": 2.0213818550109863, "Pretrain/Loss (Raw)": 2.0832526683807373, "Pretrain/Step": 9828, "Pretrain/Step Time": 8.439092384651303} +{"Pretrain/Learning Rate": 2.4972406426541602e-05, "Pretrain/Loss": 2.023435592651367, "Pretrain/Loss (Raw)": 2.0729832649230957, "Pretrain/Step": 9829, "Pretrain/Step Time": 8.442980635911226} +{"Pretrain/Learning Rate": 2.4968161263536266e-05, "Pretrain/Loss": 2.0201823711395264, "Pretrain/Loss (Raw)": 1.6840211153030396, "Pretrain/Step": 9830, "Pretrain/Step Time": 8.44409603625536} +{"Pretrain/Learning Rate": 2.4963916101448977e-05, "Pretrain/Loss": 2.020169258117676, "Pretrain/Loss (Raw)": 1.965193748474121, "Pretrain/Step": 9831, "Pretrain/Step Time": 8.444702167063951} +{"Pretrain/Learning Rate": 2.495967094040214e-05, "Pretrain/Loss": 2.0227227210998535, "Pretrain/Loss (Raw)": 2.2517387866973877, "Pretrain/Step": 9832, "Pretrain/Step Time": 8.444830495864153} +{"Pretrain/Learning Rate": 2.4955425780518174e-05, "Pretrain/Loss": 2.0224006175994873, "Pretrain/Loss (Raw)": 2.0821797847747803, "Pretrain/Step": 9833, "Pretrain/Step Time": 8.44370786845684} +{"Pretrain/Learning Rate": 2.4951180621919465e-05, "Pretrain/Loss": 2.0202622413635254, "Pretrain/Loss (Raw)": 1.8894599676132202, "Pretrain/Step": 9834, "Pretrain/Step Time": 8.445791184902191} +{"Pretrain/Learning Rate": 2.4946935464728427e-05, "Pretrain/Loss": 2.0180554389953613, "Pretrain/Loss (Raw)": 2.052382469177246, "Pretrain/Step": 9835, "Pretrain/Step Time": 8.447933344170451} +{"Pretrain/Learning Rate": 2.494269030906747e-05, "Pretrain/Loss": 2.020956039428711, "Pretrain/Loss (Raw)": 2.1031641960144043, "Pretrain/Step": 9836, "Pretrain/Step Time": 8.447660313919187} +{"Pretrain/Learning Rate": 2.4938445155058995e-05, "Pretrain/Loss": 2.0215096473693848, "Pretrain/Loss (Raw)": 2.144615650177002, "Pretrain/Step": 9837, "Pretrain/Step Time": 8.445500811561942} +{"Pretrain/Learning Rate": 2.493420000282542e-05, "Pretrain/Loss": 2.0216007232666016, "Pretrain/Loss (Raw)": 1.9172340631484985, "Pretrain/Step": 9838, "Pretrain/Step Time": 8.440850434824824} +{"Pretrain/Learning Rate": 2.492995485248913e-05, "Pretrain/Loss": 2.0224204063415527, "Pretrain/Loss (Raw)": 2.250356912612915, "Pretrain/Step": 9839, "Pretrain/Step Time": 8.441472370177507} +{"Pretrain/Learning Rate": 2.492570970417255e-05, "Pretrain/Loss": 2.0220885276794434, "Pretrain/Loss (Raw)": 1.9268475770950317, "Pretrain/Step": 9840, "Pretrain/Step Time": 8.441560318693519} +{"Pretrain/Learning Rate": 2.4921464557998072e-05, "Pretrain/Loss": 2.0196759700775146, "Pretrain/Loss (Raw)": 1.8406496047973633, "Pretrain/Step": 9841, "Pretrain/Step Time": 8.443809933960438} +{"Pretrain/Learning Rate": 2.491721941408811e-05, "Pretrain/Loss": 2.020061492919922, "Pretrain/Loss (Raw)": 1.9432945251464844, "Pretrain/Step": 9842, "Pretrain/Step Time": 8.436526525765657} +{"Pretrain/Learning Rate": 2.491297427256507e-05, "Pretrain/Loss": 2.018512725830078, "Pretrain/Loss (Raw)": 1.73971688747406, "Pretrain/Step": 9843, "Pretrain/Step Time": 8.435699926689267} +{"Pretrain/Learning Rate": 2.490872913355136e-05, "Pretrain/Loss": 2.015148878097534, "Pretrain/Loss (Raw)": 1.8729549646377563, "Pretrain/Step": 9844, "Pretrain/Step Time": 8.439637366682291} +{"Pretrain/Learning Rate": 2.4904483997169373e-05, "Pretrain/Loss": 2.0151004791259766, "Pretrain/Loss (Raw)": 1.9217795133590698, "Pretrain/Step": 9845, "Pretrain/Step Time": 8.438940864056349} +{"Pretrain/Learning Rate": 2.4900238863541524e-05, "Pretrain/Loss": 2.0158345699310303, "Pretrain/Loss (Raw)": 2.0614237785339355, "Pretrain/Step": 9846, "Pretrain/Step Time": 8.444373972713947} +{"Pretrain/Learning Rate": 2.489599373279022e-05, "Pretrain/Loss": 2.0158610343933105, "Pretrain/Loss (Raw)": 2.0914430618286133, "Pretrain/Step": 9847, "Pretrain/Step Time": 8.441515738144517} +{"Pretrain/Learning Rate": 2.489174860503786e-05, "Pretrain/Loss": 2.0149025917053223, "Pretrain/Loss (Raw)": 1.942310094833374, "Pretrain/Step": 9848, "Pretrain/Step Time": 8.446036517620087} +{"Pretrain/Learning Rate": 2.488750348040686e-05, "Pretrain/Loss": 2.0130956172943115, "Pretrain/Loss (Raw)": 1.7989070415496826, "Pretrain/Step": 9849, "Pretrain/Step Time": 8.444434313103557} +{"Pretrain/Learning Rate": 2.488325835901961e-05, "Pretrain/Loss": 2.0128567218780518, "Pretrain/Loss (Raw)": 1.9718562364578247, "Pretrain/Step": 9850, "Pretrain/Step Time": 8.438915427774191} +{"Pretrain/Learning Rate": 2.4879013240998525e-05, "Pretrain/Loss": 2.0116758346557617, "Pretrain/Loss (Raw)": 1.9266570806503296, "Pretrain/Step": 9851, "Pretrain/Step Time": 8.443062348291278} +{"Pretrain/Learning Rate": 2.4874768126466007e-05, "Pretrain/Loss": 2.0088963508605957, "Pretrain/Loss (Raw)": 1.7881934642791748, "Pretrain/Step": 9852, "Pretrain/Step Time": 8.444588426500559} +{"Pretrain/Learning Rate": 2.4870523015544462e-05, "Pretrain/Loss": 2.00924015045166, "Pretrain/Loss (Raw)": 2.055995464324951, "Pretrain/Step": 9853, "Pretrain/Step Time": 8.440640369430184} +{"Pretrain/Learning Rate": 2.48662779083563e-05, "Pretrain/Loss": 2.0101521015167236, "Pretrain/Loss (Raw)": 2.001422643661499, "Pretrain/Step": 9854, "Pretrain/Step Time": 8.44464792497456} +{"Pretrain/Learning Rate": 2.4862032805023916e-05, "Pretrain/Loss": 2.007113456726074, "Pretrain/Loss (Raw)": 1.883774757385254, "Pretrain/Step": 9855, "Pretrain/Step Time": 8.43858034722507} +{"Pretrain/Learning Rate": 2.4857787705669717e-05, "Pretrain/Loss": 2.005802631378174, "Pretrain/Loss (Raw)": 1.9800958633422852, "Pretrain/Step": 9856, "Pretrain/Step Time": 8.43751803971827} +{"Pretrain/Learning Rate": 2.4853542610416113e-05, "Pretrain/Loss": 2.0063440799713135, "Pretrain/Loss (Raw)": 2.2593069076538086, "Pretrain/Step": 9857, "Pretrain/Step Time": 8.441602818667889} +{"Pretrain/Learning Rate": 2.4849297519385497e-05, "Pretrain/Loss": 2.0070087909698486, "Pretrain/Loss (Raw)": 2.069460153579712, "Pretrain/Step": 9858, "Pretrain/Step Time": 8.441841211169958} +{"Pretrain/Learning Rate": 2.4845052432700292e-05, "Pretrain/Loss": 2.0091071128845215, "Pretrain/Loss (Raw)": 2.1836202144622803, "Pretrain/Step": 9859, "Pretrain/Step Time": 8.4437798820436} +{"Pretrain/Learning Rate": 2.4840807350482884e-05, "Pretrain/Loss": 2.0083389282226562, "Pretrain/Loss (Raw)": 1.802452564239502, "Pretrain/Step": 9860, "Pretrain/Step Time": 8.441678244620562} +{"Pretrain/Learning Rate": 2.4836562272855684e-05, "Pretrain/Loss": 2.0098347663879395, "Pretrain/Loss (Raw)": 2.2260706424713135, "Pretrain/Step": 9861, "Pretrain/Step Time": 8.441179947927594} +{"Pretrain/Learning Rate": 2.4832317199941096e-05, "Pretrain/Loss": 2.009852409362793, "Pretrain/Loss (Raw)": 1.9309641122817993, "Pretrain/Step": 9862, "Pretrain/Step Time": 8.442653499543667} +{"Pretrain/Learning Rate": 2.4828072131861522e-05, "Pretrain/Loss": 2.007978677749634, "Pretrain/Loss (Raw)": 1.8869009017944336, "Pretrain/Step": 9863, "Pretrain/Step Time": 8.442477378994226} +{"Pretrain/Learning Rate": 2.4823827068739375e-05, "Pretrain/Loss": 2.00600528717041, "Pretrain/Loss (Raw)": 1.8913248777389526, "Pretrain/Step": 9864, "Pretrain/Step Time": 8.447403207421303} +{"Pretrain/Learning Rate": 2.481958201069705e-05, "Pretrain/Loss": 2.0096330642700195, "Pretrain/Loss (Raw)": 1.8568363189697266, "Pretrain/Step": 9865, "Pretrain/Step Time": 8.446170022711158} +{"Pretrain/Learning Rate": 2.4815336957856947e-05, "Pretrain/Loss": 2.012031316757202, "Pretrain/Loss (Raw)": 2.170865058898926, "Pretrain/Step": 9866, "Pretrain/Step Time": 8.44256249256432} +{"Pretrain/Learning Rate": 2.481109191034147e-05, "Pretrain/Loss": 2.012523651123047, "Pretrain/Loss (Raw)": 2.153571128845215, "Pretrain/Step": 9867, "Pretrain/Step Time": 8.445163358002901} +{"Pretrain/Learning Rate": 2.4806846868273024e-05, "Pretrain/Loss": 2.010660409927368, "Pretrain/Loss (Raw)": 1.9779911041259766, "Pretrain/Step": 9868, "Pretrain/Step Time": 8.443978037685156} +{"Pretrain/Learning Rate": 2.4802601831774013e-05, "Pretrain/Loss": 2.012899398803711, "Pretrain/Loss (Raw)": 2.1627538204193115, "Pretrain/Step": 9869, "Pretrain/Step Time": 8.441018372774124} +{"Pretrain/Learning Rate": 2.4798356800966836e-05, "Pretrain/Loss": 2.0132529735565186, "Pretrain/Loss (Raw)": 1.999969482421875, "Pretrain/Step": 9870, "Pretrain/Step Time": 8.444536561146379} +{"Pretrain/Learning Rate": 2.4794111775973904e-05, "Pretrain/Loss": 2.016756534576416, "Pretrain/Loss (Raw)": 2.201758861541748, "Pretrain/Step": 9871, "Pretrain/Step Time": 8.446504456922412} +{"Pretrain/Learning Rate": 2.4789866756917615e-05, "Pretrain/Loss": 2.017198085784912, "Pretrain/Loss (Raw)": 2.1759541034698486, "Pretrain/Step": 9872, "Pretrain/Step Time": 8.449356812983751} +{"Pretrain/Learning Rate": 2.4785621743920363e-05, "Pretrain/Loss": 2.019399642944336, "Pretrain/Loss (Raw)": 2.166181802749634, "Pretrain/Step": 9873, "Pretrain/Step Time": 8.44750683940947} +{"Pretrain/Learning Rate": 2.478137673710456e-05, "Pretrain/Loss": 2.020817756652832, "Pretrain/Loss (Raw)": 1.9959924221038818, "Pretrain/Step": 9874, "Pretrain/Step Time": 8.443825542926788} +{"Pretrain/Learning Rate": 2.4777131736592606e-05, "Pretrain/Loss": 2.0218920707702637, "Pretrain/Loss (Raw)": 2.1779773235321045, "Pretrain/Step": 9875, "Pretrain/Step Time": 8.44558304734528} +{"Pretrain/Learning Rate": 2.47728867425069e-05, "Pretrain/Loss": 2.0212440490722656, "Pretrain/Loss (Raw)": 2.0401477813720703, "Pretrain/Step": 9876, "Pretrain/Step Time": 8.446439599618316} +{"Pretrain/Learning Rate": 2.476864175496985e-05, "Pretrain/Loss": 2.021786689758301, "Pretrain/Loss (Raw)": 2.0438523292541504, "Pretrain/Step": 9877, "Pretrain/Step Time": 8.444966856390238} +{"Pretrain/Learning Rate": 2.4764396774103846e-05, "Pretrain/Loss": 2.017509937286377, "Pretrain/Loss (Raw)": 1.7582772970199585, "Pretrain/Step": 9878, "Pretrain/Step Time": 8.445432901382446} +{"Pretrain/Learning Rate": 2.4760151800031296e-05, "Pretrain/Loss": 2.0178494453430176, "Pretrain/Loss (Raw)": 2.034055471420288, "Pretrain/Step": 9879, "Pretrain/Step Time": 8.450157646089792} +{"Pretrain/Learning Rate": 2.4755906832874596e-05, "Pretrain/Loss": 2.0204010009765625, "Pretrain/Loss (Raw)": 2.3140509128570557, "Pretrain/Step": 9880, "Pretrain/Step Time": 8.450402736663818} +{"Pretrain/Learning Rate": 2.4751661872756154e-05, "Pretrain/Loss": 2.0206785202026367, "Pretrain/Loss (Raw)": 1.867921233177185, "Pretrain/Step": 9881, "Pretrain/Step Time": 8.45369753614068} +{"Pretrain/Learning Rate": 2.4747416919798373e-05, "Pretrain/Loss": 2.0207438468933105, "Pretrain/Loss (Raw)": 2.1448538303375244, "Pretrain/Step": 9882, "Pretrain/Step Time": 8.448365792632103} +{"Pretrain/Learning Rate": 2.474317197412364e-05, "Pretrain/Loss": 2.0225253105163574, "Pretrain/Loss (Raw)": 2.186028003692627, "Pretrain/Step": 9883, "Pretrain/Step Time": 8.450206248089671} +{"Pretrain/Learning Rate": 2.4738927035854358e-05, "Pretrain/Loss": 2.0242180824279785, "Pretrain/Loss (Raw)": 2.1079084873199463, "Pretrain/Step": 9884, "Pretrain/Step Time": 8.44940554536879} +{"Pretrain/Learning Rate": 2.4734682105112936e-05, "Pretrain/Loss": 2.022462844848633, "Pretrain/Loss (Raw)": 1.9093340635299683, "Pretrain/Step": 9885, "Pretrain/Step Time": 8.456561436876655} +{"Pretrain/Learning Rate": 2.4730437182021767e-05, "Pretrain/Loss": 2.021773099899292, "Pretrain/Loss (Raw)": 1.9893901348114014, "Pretrain/Step": 9886, "Pretrain/Step Time": 8.455307122319937} +{"Pretrain/Learning Rate": 2.4726192266703257e-05, "Pretrain/Loss": 2.020631790161133, "Pretrain/Loss (Raw)": 1.8563915491104126, "Pretrain/Step": 9887, "Pretrain/Step Time": 8.463197389617562} +{"Pretrain/Learning Rate": 2.4721947359279795e-05, "Pretrain/Loss": 2.0178475379943848, "Pretrain/Loss (Raw)": 1.973319411277771, "Pretrain/Step": 9888, "Pretrain/Step Time": 8.458643836900592} +{"Pretrain/Learning Rate": 2.471770245987379e-05, "Pretrain/Loss": 2.017958879470825, "Pretrain/Loss (Raw)": 2.0150599479675293, "Pretrain/Step": 9889, "Pretrain/Step Time": 8.460846811532974} +{"Pretrain/Learning Rate": 2.471345756860763e-05, "Pretrain/Loss": 2.018540859222412, "Pretrain/Loss (Raw)": 2.1026880741119385, "Pretrain/Step": 9890, "Pretrain/Step Time": 8.455742366611958} +{"Pretrain/Learning Rate": 2.4709212685603717e-05, "Pretrain/Loss": 2.0181264877319336, "Pretrain/Loss (Raw)": 2.0123517513275146, "Pretrain/Step": 9891, "Pretrain/Step Time": 8.45642289146781} +{"Pretrain/Learning Rate": 2.470496781098446e-05, "Pretrain/Loss": 2.0180959701538086, "Pretrain/Loss (Raw)": 1.9244986772537231, "Pretrain/Step": 9892, "Pretrain/Step Time": 8.458206014707685} +{"Pretrain/Learning Rate": 2.470072294487224e-05, "Pretrain/Loss": 2.0188655853271484, "Pretrain/Loss (Raw)": 2.0346312522888184, "Pretrain/Step": 9893, "Pretrain/Step Time": 8.457806464284658} +{"Pretrain/Learning Rate": 2.4696478087389466e-05, "Pretrain/Loss": 2.0172080993652344, "Pretrain/Loss (Raw)": 1.7951828241348267, "Pretrain/Step": 9894, "Pretrain/Step Time": 8.45665149949491} +{"Pretrain/Learning Rate": 2.4692233238658534e-05, "Pretrain/Loss": 2.015687942504883, "Pretrain/Loss (Raw)": 1.9320460557937622, "Pretrain/Step": 9895, "Pretrain/Step Time": 8.46402077935636} +{"Pretrain/Learning Rate": 2.4687988398801833e-05, "Pretrain/Loss": 2.012500047683716, "Pretrain/Loss (Raw)": 1.6676673889160156, "Pretrain/Step": 9896, "Pretrain/Step Time": 8.463037021458149} +{"Pretrain/Learning Rate": 2.4683743567941778e-05, "Pretrain/Loss": 2.0133111476898193, "Pretrain/Loss (Raw)": 2.0257673263549805, "Pretrain/Step": 9897, "Pretrain/Step Time": 8.460769463330507} +{"Pretrain/Learning Rate": 2.4679498746200747e-05, "Pretrain/Loss": 2.014828681945801, "Pretrain/Loss (Raw)": 2.1303486824035645, "Pretrain/Step": 9898, "Pretrain/Step Time": 8.459622068330646} +{"Pretrain/Learning Rate": 2.4675253933701144e-05, "Pretrain/Loss": 2.015366315841675, "Pretrain/Loss (Raw)": 2.244586944580078, "Pretrain/Step": 9899, "Pretrain/Step Time": 8.456643400713801} +{"Pretrain/Learning Rate": 2.4671009130565364e-05, "Pretrain/Loss": 2.016845226287842, "Pretrain/Loss (Raw)": 2.2808678150177, "Pretrain/Step": 9900, "Pretrain/Step Time": 8.458260087296367} +{"Pretrain/Learning Rate": 2.4666764336915805e-05, "Pretrain/Loss": 2.0167012214660645, "Pretrain/Loss (Raw)": 1.9525741338729858, "Pretrain/Step": 9901, "Pretrain/Step Time": 8.46314232237637} +{"Pretrain/Learning Rate": 2.4662519552874863e-05, "Pretrain/Loss": 2.0164709091186523, "Pretrain/Loss (Raw)": 1.9534450769424438, "Pretrain/Step": 9902, "Pretrain/Step Time": 8.465851224958897} +{"Pretrain/Learning Rate": 2.465827477856493e-05, "Pretrain/Loss": 2.018207550048828, "Pretrain/Loss (Raw)": 2.0530214309692383, "Pretrain/Step": 9903, "Pretrain/Step Time": 8.46245887503028} +{"Pretrain/Learning Rate": 2.4654030014108405e-05, "Pretrain/Loss": 2.015842914581299, "Pretrain/Loss (Raw)": 1.7453263998031616, "Pretrain/Step": 9904, "Pretrain/Step Time": 8.462080208584666} +{"Pretrain/Learning Rate": 2.4649785259627675e-05, "Pretrain/Loss": 2.015408754348755, "Pretrain/Loss (Raw)": 2.1178078651428223, "Pretrain/Step": 9905, "Pretrain/Step Time": 8.464103750884533} +{"Pretrain/Learning Rate": 2.4645540515245143e-05, "Pretrain/Loss": 2.015349864959717, "Pretrain/Loss (Raw)": 2.04030442237854, "Pretrain/Step": 9906, "Pretrain/Step Time": 8.461978685110807} +{"Pretrain/Learning Rate": 2.4641295781083203e-05, "Pretrain/Loss": 2.0153555870056152, "Pretrain/Loss (Raw)": 1.9199987649917603, "Pretrain/Step": 9907, "Pretrain/Step Time": 8.457488112151623} +{"Pretrain/Learning Rate": 2.463705105726425e-05, "Pretrain/Loss": 2.014042377471924, "Pretrain/Loss (Raw)": 1.9832087755203247, "Pretrain/Step": 9908, "Pretrain/Step Time": 8.46465558744967} +{"Pretrain/Learning Rate": 2.4632806343910663e-05, "Pretrain/Loss": 2.017289400100708, "Pretrain/Loss (Raw)": 2.2100484371185303, "Pretrain/Step": 9909, "Pretrain/Step Time": 8.462964158505201} +{"Pretrain/Learning Rate": 2.4628561641144855e-05, "Pretrain/Loss": 2.0187430381774902, "Pretrain/Loss (Raw)": 2.3479011058807373, "Pretrain/Step": 9910, "Pretrain/Step Time": 8.464016074314713} +{"Pretrain/Learning Rate": 2.4624316949089204e-05, "Pretrain/Loss": 2.015955924987793, "Pretrain/Loss (Raw)": 1.780346155166626, "Pretrain/Step": 9911, "Pretrain/Step Time": 8.465975161641836} +{"Pretrain/Learning Rate": 2.462007226786611e-05, "Pretrain/Loss": 2.016538381576538, "Pretrain/Loss (Raw)": 2.17724871635437, "Pretrain/Step": 9912, "Pretrain/Step Time": 8.465369647368789} +{"Pretrain/Learning Rate": 2.461582759759797e-05, "Pretrain/Loss": 2.0174484252929688, "Pretrain/Loss (Raw)": 2.088343620300293, "Pretrain/Step": 9913, "Pretrain/Step Time": 8.460405452176929} +{"Pretrain/Learning Rate": 2.461158293840717e-05, "Pretrain/Loss": 2.018059730529785, "Pretrain/Loss (Raw)": 1.8957133293151855, "Pretrain/Step": 9914, "Pretrain/Step Time": 8.463221030309796} +{"Pretrain/Learning Rate": 2.4607338290416096e-05, "Pretrain/Loss": 2.0177550315856934, "Pretrain/Loss (Raw)": 2.01547908782959, "Pretrain/Step": 9915, "Pretrain/Step Time": 8.470312232151628} +{"Pretrain/Learning Rate": 2.4603093653747146e-05, "Pretrain/Loss": 2.0180201530456543, "Pretrain/Loss (Raw)": 1.8062485456466675, "Pretrain/Step": 9916, "Pretrain/Step Time": 8.46639634296298} +{"Pretrain/Learning Rate": 2.4598849028522713e-05, "Pretrain/Loss": 2.018704414367676, "Pretrain/Loss (Raw)": 2.1524157524108887, "Pretrain/Step": 9917, "Pretrain/Step Time": 8.465608207508922} +{"Pretrain/Learning Rate": 2.4594604414865192e-05, "Pretrain/Loss": 2.0186307430267334, "Pretrain/Loss (Raw)": 2.0584540367126465, "Pretrain/Step": 9918, "Pretrain/Step Time": 8.469257159158587} +{"Pretrain/Learning Rate": 2.4590359812896956e-05, "Pretrain/Loss": 2.02170467376709, "Pretrain/Loss (Raw)": 2.087877035140991, "Pretrain/Step": 9919, "Pretrain/Step Time": 8.471791256219149} +{"Pretrain/Learning Rate": 2.458611522274041e-05, "Pretrain/Loss": 2.021092653274536, "Pretrain/Loss (Raw)": 1.8817837238311768, "Pretrain/Step": 9920, "Pretrain/Step Time": 8.469604132696986} +{"Pretrain/Learning Rate": 2.458187064451794e-05, "Pretrain/Loss": 2.0184030532836914, "Pretrain/Loss (Raw)": 1.8552876710891724, "Pretrain/Step": 9921, "Pretrain/Step Time": 8.470302389934659} +{"Pretrain/Learning Rate": 2.4577626078351934e-05, "Pretrain/Loss": 2.013845443725586, "Pretrain/Loss (Raw)": 1.8818936347961426, "Pretrain/Step": 9922, "Pretrain/Step Time": 8.476246137171984} +{"Pretrain/Learning Rate": 2.4573381524364788e-05, "Pretrain/Loss": 2.012932538986206, "Pretrain/Loss (Raw)": 2.055830955505371, "Pretrain/Step": 9923, "Pretrain/Step Time": 8.475579041987658} +{"Pretrain/Learning Rate": 2.456913698267888e-05, "Pretrain/Loss": 2.013394594192505, "Pretrain/Loss (Raw)": 1.8992499113082886, "Pretrain/Step": 9924, "Pretrain/Step Time": 8.475524278357625} +{"Pretrain/Learning Rate": 2.4564892453416605e-05, "Pretrain/Loss": 2.0158510208129883, "Pretrain/Loss (Raw)": 2.26491379737854, "Pretrain/Step": 9925, "Pretrain/Step Time": 8.470473801717162} +{"Pretrain/Learning Rate": 2.4560647936700345e-05, "Pretrain/Loss": 2.0164713859558105, "Pretrain/Loss (Raw)": 1.939252257347107, "Pretrain/Step": 9926, "Pretrain/Step Time": 8.476550381630659} +{"Pretrain/Learning Rate": 2.4556403432652496e-05, "Pretrain/Loss": 2.0145840644836426, "Pretrain/Loss (Raw)": 1.970907211303711, "Pretrain/Step": 9927, "Pretrain/Step Time": 8.476184569299221} +{"Pretrain/Learning Rate": 2.4552158941395443e-05, "Pretrain/Loss": 2.01427960395813, "Pretrain/Loss (Raw)": 2.0790185928344727, "Pretrain/Step": 9928, "Pretrain/Step Time": 8.480398712679744} +{"Pretrain/Learning Rate": 2.454791446305157e-05, "Pretrain/Loss": 2.0120410919189453, "Pretrain/Loss (Raw)": 1.6416484117507935, "Pretrain/Step": 9929, "Pretrain/Step Time": 8.480268994346261} +{"Pretrain/Learning Rate": 2.4543669997743262e-05, "Pretrain/Loss": 2.0137033462524414, "Pretrain/Loss (Raw)": 2.233612537384033, "Pretrain/Step": 9930, "Pretrain/Step Time": 8.48320340178907} +{"Pretrain/Learning Rate": 2.4539425545592908e-05, "Pretrain/Loss": 2.0126705169677734, "Pretrain/Loss (Raw)": 1.9604907035827637, "Pretrain/Step": 9931, "Pretrain/Step Time": 8.476052919402719} +{"Pretrain/Learning Rate": 2.4535181106722895e-05, "Pretrain/Loss": 2.0147528648376465, "Pretrain/Loss (Raw)": 2.0520553588867188, "Pretrain/Step": 9932, "Pretrain/Step Time": 8.476145414635539} +{"Pretrain/Learning Rate": 2.4530936681255614e-05, "Pretrain/Loss": 2.013672351837158, "Pretrain/Loss (Raw)": 1.8163471221923828, "Pretrain/Step": 9933, "Pretrain/Step Time": 8.47436429001391} +{"Pretrain/Learning Rate": 2.4526692269313436e-05, "Pretrain/Loss": 2.015284299850464, "Pretrain/Loss (Raw)": 2.2057485580444336, "Pretrain/Step": 9934, "Pretrain/Step Time": 8.476575456559658} +{"Pretrain/Learning Rate": 2.452244787101875e-05, "Pretrain/Loss": 2.014418601989746, "Pretrain/Loss (Raw)": 2.0323774814605713, "Pretrain/Step": 9935, "Pretrain/Step Time": 8.478468101471663} +{"Pretrain/Learning Rate": 2.4518203486493946e-05, "Pretrain/Loss": 2.0152623653411865, "Pretrain/Loss (Raw)": 2.150390148162842, "Pretrain/Step": 9936, "Pretrain/Step Time": 8.470409551635385} +{"Pretrain/Learning Rate": 2.4513959115861406e-05, "Pretrain/Loss": 2.01279616355896, "Pretrain/Loss (Raw)": 1.906830072402954, "Pretrain/Step": 9937, "Pretrain/Step Time": 8.477095287293196} +{"Pretrain/Learning Rate": 2.4509714759243517e-05, "Pretrain/Loss": 2.010913133621216, "Pretrain/Loss (Raw)": 1.7413461208343506, "Pretrain/Step": 9938, "Pretrain/Step Time": 8.480565706267953} +{"Pretrain/Learning Rate": 2.450547041676265e-05, "Pretrain/Loss": 2.0115222930908203, "Pretrain/Loss (Raw)": 1.9964346885681152, "Pretrain/Step": 9939, "Pretrain/Step Time": 8.47991618141532} +{"Pretrain/Learning Rate": 2.4501226088541197e-05, "Pretrain/Loss": 2.0112290382385254, "Pretrain/Loss (Raw)": 1.826480507850647, "Pretrain/Step": 9940, "Pretrain/Step Time": 8.481212524697185} +{"Pretrain/Learning Rate": 2.4496981774701535e-05, "Pretrain/Loss": 2.0113120079040527, "Pretrain/Loss (Raw)": 2.139179229736328, "Pretrain/Step": 9941, "Pretrain/Step Time": 8.483221355825663} +{"Pretrain/Learning Rate": 2.4492737475366052e-05, "Pretrain/Loss": 2.0112054347991943, "Pretrain/Loss (Raw)": 2.127764940261841, "Pretrain/Step": 9942, "Pretrain/Step Time": 8.477948766201735} +{"Pretrain/Learning Rate": 2.4488493190657123e-05, "Pretrain/Loss": 2.0104122161865234, "Pretrain/Loss (Raw)": 2.105449676513672, "Pretrain/Step": 9943, "Pretrain/Step Time": 8.481104593724012} +{"Pretrain/Learning Rate": 2.448424892069714e-05, "Pretrain/Loss": 2.010605812072754, "Pretrain/Loss (Raw)": 2.0444998741149902, "Pretrain/Step": 9944, "Pretrain/Step Time": 8.484177470207214} +{"Pretrain/Learning Rate": 2.4480004665608472e-05, "Pretrain/Loss": 2.011533260345459, "Pretrain/Loss (Raw)": 2.1944739818573, "Pretrain/Step": 9945, "Pretrain/Step Time": 8.482341967523098} +{"Pretrain/Learning Rate": 2.44757604255135e-05, "Pretrain/Loss": 2.0128681659698486, "Pretrain/Loss (Raw)": 2.118597984313965, "Pretrain/Step": 9946, "Pretrain/Step Time": 8.489706538617611} +{"Pretrain/Learning Rate": 2.4471516200534608e-05, "Pretrain/Loss": 2.010878086090088, "Pretrain/Loss (Raw)": 1.9214540719985962, "Pretrain/Step": 9947, "Pretrain/Step Time": 8.490248726680875} +{"Pretrain/Learning Rate": 2.446727199079417e-05, "Pretrain/Loss": 2.01108980178833, "Pretrain/Loss (Raw)": 1.9159475564956665, "Pretrain/Step": 9948, "Pretrain/Step Time": 8.486877646297216} +{"Pretrain/Learning Rate": 2.4463027796414587e-05, "Pretrain/Loss": 2.0124406814575195, "Pretrain/Loss (Raw)": 2.105762004852295, "Pretrain/Step": 9949, "Pretrain/Step Time": 8.486940352246165} +{"Pretrain/Learning Rate": 2.4458783617518203e-05, "Pretrain/Loss": 2.015346050262451, "Pretrain/Loss (Raw)": 2.1368627548217773, "Pretrain/Step": 9950, "Pretrain/Step Time": 8.493076290935278} +{"Pretrain/Learning Rate": 2.445453945422742e-05, "Pretrain/Loss": 2.0137486457824707, "Pretrain/Loss (Raw)": 1.8557233810424805, "Pretrain/Step": 9951, "Pretrain/Step Time": 8.485422244295478} +{"Pretrain/Learning Rate": 2.4450295306664597e-05, "Pretrain/Loss": 2.0129644870758057, "Pretrain/Loss (Raw)": 2.0215625762939453, "Pretrain/Step": 9952, "Pretrain/Step Time": 8.483412766829133} +{"Pretrain/Learning Rate": 2.4446051174952127e-05, "Pretrain/Loss": 2.0152504444122314, "Pretrain/Loss (Raw)": 2.1040709018707275, "Pretrain/Step": 9953, "Pretrain/Step Time": 8.479379925876856} +{"Pretrain/Learning Rate": 2.4441807059212376e-05, "Pretrain/Loss": 2.014349937438965, "Pretrain/Loss (Raw)": 2.041013479232788, "Pretrain/Step": 9954, "Pretrain/Step Time": 8.476919433102012} +{"Pretrain/Learning Rate": 2.443756295956773e-05, "Pretrain/Loss": 2.0142338275909424, "Pretrain/Loss (Raw)": 2.2868242263793945, "Pretrain/Step": 9955, "Pretrain/Step Time": 8.483826495707035} +{"Pretrain/Learning Rate": 2.4433318876140558e-05, "Pretrain/Loss": 2.015167236328125, "Pretrain/Loss (Raw)": 2.2027156352996826, "Pretrain/Step": 9956, "Pretrain/Step Time": 8.481393292546272} +{"Pretrain/Learning Rate": 2.442907480905324e-05, "Pretrain/Loss": 2.0116896629333496, "Pretrain/Loss (Raw)": 1.6278619766235352, "Pretrain/Step": 9957, "Pretrain/Step Time": 8.479531090706587} +{"Pretrain/Learning Rate": 2.442483075842814e-05, "Pretrain/Loss": 2.013411283493042, "Pretrain/Loss (Raw)": 1.904412865638733, "Pretrain/Step": 9958, "Pretrain/Step Time": 8.480025054886937} +{"Pretrain/Learning Rate": 2.442058672438764e-05, "Pretrain/Loss": 2.013563632965088, "Pretrain/Loss (Raw)": 1.9846724271774292, "Pretrain/Step": 9959, "Pretrain/Step Time": 8.479457864537835} +{"Pretrain/Learning Rate": 2.441634270705412e-05, "Pretrain/Loss": 2.0113513469696045, "Pretrain/Loss (Raw)": 1.9685815572738647, "Pretrain/Step": 9960, "Pretrain/Step Time": 8.48189420439303} +{"Pretrain/Learning Rate": 2.4412098706549945e-05, "Pretrain/Loss": 2.0113730430603027, "Pretrain/Loss (Raw)": 2.0849194526672363, "Pretrain/Step": 9961, "Pretrain/Step Time": 8.48266488313675} +{"Pretrain/Learning Rate": 2.440785472299749e-05, "Pretrain/Loss": 2.0127980709075928, "Pretrain/Loss (Raw)": 2.0718994140625, "Pretrain/Step": 9962, "Pretrain/Step Time": 8.479928439483047} +{"Pretrain/Learning Rate": 2.440361075651912e-05, "Pretrain/Loss": 2.0109736919403076, "Pretrain/Loss (Raw)": 1.8188620805740356, "Pretrain/Step": 9963, "Pretrain/Step Time": 8.480829959735274} +{"Pretrain/Learning Rate": 2.439936680723722e-05, "Pretrain/Loss": 2.010904312133789, "Pretrain/Loss (Raw)": 2.0942747592926025, "Pretrain/Step": 9964, "Pretrain/Step Time": 8.48100683093071} +{"Pretrain/Learning Rate": 2.439512287527415e-05, "Pretrain/Loss": 2.0098700523376465, "Pretrain/Loss (Raw)": 2.012221336364746, "Pretrain/Step": 9965, "Pretrain/Step Time": 8.482241766527295} +{"Pretrain/Learning Rate": 2.4390878960752294e-05, "Pretrain/Loss": 2.012833833694458, "Pretrain/Loss (Raw)": 2.296595573425293, "Pretrain/Step": 9966, "Pretrain/Step Time": 8.484399799257517} +{"Pretrain/Learning Rate": 2.4386635063794006e-05, "Pretrain/Loss": 2.01073956489563, "Pretrain/Loss (Raw)": 1.9822907447814941, "Pretrain/Step": 9967, "Pretrain/Step Time": 8.483821319416165} +{"Pretrain/Learning Rate": 2.4382391184521663e-05, "Pretrain/Loss": 2.0124008655548096, "Pretrain/Loss (Raw)": 2.139503002166748, "Pretrain/Step": 9968, "Pretrain/Step Time": 8.488988377153873} +{"Pretrain/Learning Rate": 2.4378147323057636e-05, "Pretrain/Loss": 2.0140676498413086, "Pretrain/Loss (Raw)": 2.0539822578430176, "Pretrain/Step": 9969, "Pretrain/Step Time": 8.48455323278904} +{"Pretrain/Learning Rate": 2.4373903479524293e-05, "Pretrain/Loss": 2.0152931213378906, "Pretrain/Loss (Raw)": 2.1001806259155273, "Pretrain/Step": 9970, "Pretrain/Step Time": 8.48997000604868} +{"Pretrain/Learning Rate": 2.4369659654044008e-05, "Pretrain/Loss": 2.017610549926758, "Pretrain/Loss (Raw)": 2.036346912384033, "Pretrain/Step": 9971, "Pretrain/Step Time": 8.492205968126655} +{"Pretrain/Learning Rate": 2.436541584673914e-05, "Pretrain/Loss": 2.023434638977051, "Pretrain/Loss (Raw)": 2.6184158325195312, "Pretrain/Step": 9972, "Pretrain/Step Time": 8.488396372646093} +{"Pretrain/Learning Rate": 2.436117205773205e-05, "Pretrain/Loss": 2.0255467891693115, "Pretrain/Loss (Raw)": 2.1921420097351074, "Pretrain/Step": 9973, "Pretrain/Step Time": 8.488484788686037} +{"Pretrain/Learning Rate": 2.4356928287145118e-05, "Pretrain/Loss": 2.0247631072998047, "Pretrain/Loss (Raw)": 1.961125373840332, "Pretrain/Step": 9974, "Pretrain/Step Time": 8.483164610341191} +{"Pretrain/Learning Rate": 2.4352684535100706e-05, "Pretrain/Loss": 2.024179220199585, "Pretrain/Loss (Raw)": 2.0166964530944824, "Pretrain/Step": 9975, "Pretrain/Step Time": 8.485406253486872} +{"Pretrain/Learning Rate": 2.434844080172118e-05, "Pretrain/Loss": 2.0252838134765625, "Pretrain/Loss (Raw)": 2.0836780071258545, "Pretrain/Step": 9976, "Pretrain/Step Time": 8.48433649353683} +{"Pretrain/Learning Rate": 2.4344197087128907e-05, "Pretrain/Loss": 2.0262584686279297, "Pretrain/Loss (Raw)": 1.9236814975738525, "Pretrain/Step": 9977, "Pretrain/Step Time": 8.487107107415795} +{"Pretrain/Learning Rate": 2.4339953391446247e-05, "Pretrain/Loss": 2.0269711017608643, "Pretrain/Loss (Raw)": 2.0630762577056885, "Pretrain/Step": 9978, "Pretrain/Step Time": 8.484265075996518} +{"Pretrain/Learning Rate": 2.4335709714795562e-05, "Pretrain/Loss": 2.027092933654785, "Pretrain/Loss (Raw)": 1.9422433376312256, "Pretrain/Step": 9979, "Pretrain/Step Time": 8.48284182883799} +{"Pretrain/Learning Rate": 2.433146605729922e-05, "Pretrain/Loss": 2.0286684036254883, "Pretrain/Loss (Raw)": 1.9898720979690552, "Pretrain/Step": 9980, "Pretrain/Step Time": 8.485586985945702} +{"Pretrain/Learning Rate": 2.4327222419079583e-05, "Pretrain/Loss": 2.0284485816955566, "Pretrain/Loss (Raw)": 2.027843475341797, "Pretrain/Step": 9981, "Pretrain/Step Time": 8.48361562564969} +{"Pretrain/Learning Rate": 2.432297880025902e-05, "Pretrain/Loss": 2.0280377864837646, "Pretrain/Loss (Raw)": 1.9488401412963867, "Pretrain/Step": 9982, "Pretrain/Step Time": 8.483252637088299} +{"Pretrain/Learning Rate": 2.431873520095988e-05, "Pretrain/Loss": 2.026942729949951, "Pretrain/Loss (Raw)": 1.7436189651489258, "Pretrain/Step": 9983, "Pretrain/Step Time": 8.487170236185193} +{"Pretrain/Learning Rate": 2.4314491621304526e-05, "Pretrain/Loss": 2.027263641357422, "Pretrain/Loss (Raw)": 2.0211730003356934, "Pretrain/Step": 9984, "Pretrain/Step Time": 8.490990672260523} +{"Pretrain/Learning Rate": 2.431024806141533e-05, "Pretrain/Loss": 2.024144172668457, "Pretrain/Loss (Raw)": 1.8600093126296997, "Pretrain/Step": 9985, "Pretrain/Step Time": 8.484765507280827} +{"Pretrain/Learning Rate": 2.430600452141464e-05, "Pretrain/Loss": 2.0245203971862793, "Pretrain/Loss (Raw)": 2.1175832748413086, "Pretrain/Step": 9986, "Pretrain/Step Time": 8.483659744262695} +{"Pretrain/Learning Rate": 2.4301761001424826e-05, "Pretrain/Loss": 2.022836208343506, "Pretrain/Loss (Raw)": 1.968083143234253, "Pretrain/Step": 9987, "Pretrain/Step Time": 8.484969550743699} +{"Pretrain/Learning Rate": 2.429751750156824e-05, "Pretrain/Loss": 2.0232155323028564, "Pretrain/Loss (Raw)": 1.8510048389434814, "Pretrain/Step": 9988, "Pretrain/Step Time": 8.486021183431149} +{"Pretrain/Learning Rate": 2.429327402196724e-05, "Pretrain/Loss": 2.0212161540985107, "Pretrain/Loss (Raw)": 1.9701220989227295, "Pretrain/Step": 9989, "Pretrain/Step Time": 8.490685822442174} +{"Pretrain/Learning Rate": 2.4289030562744183e-05, "Pretrain/Loss": 2.0227723121643066, "Pretrain/Loss (Raw)": 2.1301872730255127, "Pretrain/Step": 9990, "Pretrain/Step Time": 8.486204851418734} +{"Pretrain/Learning Rate": 2.428478712402143e-05, "Pretrain/Loss": 2.0232653617858887, "Pretrain/Loss (Raw)": 1.9500229358673096, "Pretrain/Step": 9991, "Pretrain/Step Time": 8.4908857177943} +{"Pretrain/Learning Rate": 2.428054370592134e-05, "Pretrain/Loss": 2.024293899536133, "Pretrain/Loss (Raw)": 2.0229387283325195, "Pretrain/Step": 9992, "Pretrain/Step Time": 8.484825367107987} +{"Pretrain/Learning Rate": 2.427630030856626e-05, "Pretrain/Loss": 2.0249741077423096, "Pretrain/Loss (Raw)": 1.9438982009887695, "Pretrain/Step": 9993, "Pretrain/Step Time": 8.490058520808816} +{"Pretrain/Learning Rate": 2.4272056932078552e-05, "Pretrain/Loss": 2.021803855895996, "Pretrain/Loss (Raw)": 1.765082836151123, "Pretrain/Step": 9994, "Pretrain/Step Time": 8.490602374076843} +{"Pretrain/Learning Rate": 2.426781357658057e-05, "Pretrain/Loss": 2.020942211151123, "Pretrain/Loss (Raw)": 2.043281316757202, "Pretrain/Step": 9995, "Pretrain/Step Time": 8.48736771568656} +{"Pretrain/Learning Rate": 2.4263570242194662e-05, "Pretrain/Loss": 2.02067232131958, "Pretrain/Loss (Raw)": 1.9434467554092407, "Pretrain/Step": 9996, "Pretrain/Step Time": 8.494056731462479} +{"Pretrain/Learning Rate": 2.42593269290432e-05, "Pretrain/Loss": 2.0184435844421387, "Pretrain/Loss (Raw)": 1.8774710893630981, "Pretrain/Step": 9997, "Pretrain/Step Time": 8.497185796499252} +{"Pretrain/Learning Rate": 2.4255083637248512e-05, "Pretrain/Loss": 2.0175769329071045, "Pretrain/Loss (Raw)": 1.8890635967254639, "Pretrain/Step": 9998, "Pretrain/Step Time": 8.491919791325927} +{"Pretrain/Learning Rate": 2.4250840366932966e-05, "Pretrain/Loss": 2.015240430831909, "Pretrain/Loss (Raw)": 1.9026920795440674, "Pretrain/Step": 9999, "Pretrain/Step Time": 8.493254993110895} +{"Pretrain/Learning Rate": 2.424659711821891e-05, "Pretrain/Loss": 2.0136170387268066, "Pretrain/Loss (Raw)": 1.9681272506713867, "Pretrain/Step": 10000, "Pretrain/Step Time": 8.489873621612787} +{"Pretrain/Learning Rate": 2.4242353891228692e-05, "Pretrain/Loss": 2.0119504928588867, "Pretrain/Loss (Raw)": 1.9528517723083496, "Pretrain/Step": 10001, "Pretrain/Step Time": 9.556595668196678} +{"Pretrain/Learning Rate": 2.423811068608467e-05, "Pretrain/Loss": 2.013256072998047, "Pretrain/Loss (Raw)": 2.163123369216919, "Pretrain/Step": 10002, "Pretrain/Step Time": 9.55917226523161} +{"Pretrain/Learning Rate": 2.4233867502909192e-05, "Pretrain/Loss": 2.012648582458496, "Pretrain/Loss (Raw)": 2.1002230644226074, "Pretrain/Step": 10003, "Pretrain/Step Time": 9.557130493223667} +{"Pretrain/Learning Rate": 2.4229624341824596e-05, "Pretrain/Loss": 2.01177716255188, "Pretrain/Loss (Raw)": 1.9286078214645386, "Pretrain/Step": 10004, "Pretrain/Step Time": 9.557227795943618} +{"Pretrain/Learning Rate": 2.4225381202953243e-05, "Pretrain/Loss": 2.012590169906616, "Pretrain/Loss (Raw)": 2.147906541824341, "Pretrain/Step": 10005, "Pretrain/Step Time": 9.554949320852757} +{"Pretrain/Learning Rate": 2.4221138086417474e-05, "Pretrain/Loss": 2.014984607696533, "Pretrain/Loss (Raw)": 2.0647575855255127, "Pretrain/Step": 10006, "Pretrain/Step Time": 9.559614770114422} +{"Pretrain/Learning Rate": 2.4216894992339642e-05, "Pretrain/Loss": 2.0159683227539062, "Pretrain/Loss (Raw)": 2.159978151321411, "Pretrain/Step": 10007, "Pretrain/Step Time": 9.547618672251701} +{"Pretrain/Learning Rate": 2.4212651920842096e-05, "Pretrain/Loss": 2.0140700340270996, "Pretrain/Loss (Raw)": 2.071077585220337, "Pretrain/Step": 10008, "Pretrain/Step Time": 9.553708828985691} +{"Pretrain/Learning Rate": 2.420840887204717e-05, "Pretrain/Loss": 2.0176384449005127, "Pretrain/Loss (Raw)": 2.324693202972412, "Pretrain/Step": 10009, "Pretrain/Step Time": 9.549884608015418} +{"Pretrain/Learning Rate": 2.420416584607722e-05, "Pretrain/Loss": 2.016458034515381, "Pretrain/Loss (Raw)": 1.9937620162963867, "Pretrain/Step": 10010, "Pretrain/Step Time": 9.551113288849592} +{"Pretrain/Learning Rate": 2.419992284305458e-05, "Pretrain/Loss": 2.0143206119537354, "Pretrain/Loss (Raw)": 1.9124201536178589, "Pretrain/Step": 10011, "Pretrain/Step Time": 9.555205006152391} +{"Pretrain/Learning Rate": 2.4195679863101605e-05, "Pretrain/Loss": 2.015195369720459, "Pretrain/Loss (Raw)": 2.2198984622955322, "Pretrain/Step": 10012, "Pretrain/Step Time": 9.559378523379564} +{"Pretrain/Learning Rate": 2.4191436906340638e-05, "Pretrain/Loss": 2.0161991119384766, "Pretrain/Loss (Raw)": 2.037771463394165, "Pretrain/Step": 10013, "Pretrain/Step Time": 9.553465120494366} +{"Pretrain/Learning Rate": 2.4187193972894015e-05, "Pretrain/Loss": 2.016122579574585, "Pretrain/Loss (Raw)": 1.979628562927246, "Pretrain/Step": 10014, "Pretrain/Step Time": 9.555832237005234} +{"Pretrain/Learning Rate": 2.418295106288408e-05, "Pretrain/Loss": 2.012960910797119, "Pretrain/Loss (Raw)": 1.4516940116882324, "Pretrain/Step": 10015, "Pretrain/Step Time": 9.548427492380142} +{"Pretrain/Learning Rate": 2.4178708176433173e-05, "Pretrain/Loss": 2.0158157348632812, "Pretrain/Loss (Raw)": 2.3387322425842285, "Pretrain/Step": 10016, "Pretrain/Step Time": 9.550214115530252} +{"Pretrain/Learning Rate": 2.4174465313663637e-05, "Pretrain/Loss": 2.01505708694458, "Pretrain/Loss (Raw)": 1.9179449081420898, "Pretrain/Step": 10017, "Pretrain/Step Time": 9.549016125500202} +{"Pretrain/Learning Rate": 2.417022247469782e-05, "Pretrain/Loss": 2.0153281688690186, "Pretrain/Loss (Raw)": 2.1373848915100098, "Pretrain/Step": 10018, "Pretrain/Step Time": 9.553255001083016} +{"Pretrain/Learning Rate": 2.4165979659658046e-05, "Pretrain/Loss": 2.015385866165161, "Pretrain/Loss (Raw)": 2.019758701324463, "Pretrain/Step": 10019, "Pretrain/Step Time": 9.551909489557147} +{"Pretrain/Learning Rate": 2.4161736868666658e-05, "Pretrain/Loss": 2.015655994415283, "Pretrain/Loss (Raw)": 1.9590688943862915, "Pretrain/Step": 10020, "Pretrain/Step Time": 9.554498778656125} +{"Pretrain/Learning Rate": 2.4157494101846002e-05, "Pretrain/Loss": 2.0115604400634766, "Pretrain/Loss (Raw)": 1.5103758573532104, "Pretrain/Step": 10021, "Pretrain/Step Time": 9.553883641958237} +{"Pretrain/Learning Rate": 2.4153251359318404e-05, "Pretrain/Loss": 2.0128111839294434, "Pretrain/Loss (Raw)": 1.9552741050720215, "Pretrain/Step": 10022, "Pretrain/Step Time": 9.557229617610574} +{"Pretrain/Learning Rate": 2.4149008641206215e-05, "Pretrain/Loss": 2.0110902786254883, "Pretrain/Loss (Raw)": 1.7117912769317627, "Pretrain/Step": 10023, "Pretrain/Step Time": 9.548367081210017} +{"Pretrain/Learning Rate": 2.4144765947631758e-05, "Pretrain/Loss": 2.014000177383423, "Pretrain/Loss (Raw)": 2.0401294231414795, "Pretrain/Step": 10024, "Pretrain/Step Time": 9.55030250735581} +{"Pretrain/Learning Rate": 2.4140523278717367e-05, "Pretrain/Loss": 2.013913631439209, "Pretrain/Loss (Raw)": 2.0146775245666504, "Pretrain/Step": 10025, "Pretrain/Step Time": 9.555603535845876} +{"Pretrain/Learning Rate": 2.4136280634585385e-05, "Pretrain/Loss": 2.0133767127990723, "Pretrain/Loss (Raw)": 2.061641216278076, "Pretrain/Step": 10026, "Pretrain/Step Time": 9.548810789361596} +{"Pretrain/Learning Rate": 2.413203801535814e-05, "Pretrain/Loss": 2.011704921722412, "Pretrain/Loss (Raw)": 2.0306079387664795, "Pretrain/Step": 10027, "Pretrain/Step Time": 9.551867846399546} +{"Pretrain/Learning Rate": 2.4127795421157974e-05, "Pretrain/Loss": 2.011305809020996, "Pretrain/Loss (Raw)": 2.229771375656128, "Pretrain/Step": 10028, "Pretrain/Step Time": 9.554983654990792} +{"Pretrain/Learning Rate": 2.4123552852107206e-05, "Pretrain/Loss": 2.007957935333252, "Pretrain/Loss (Raw)": 1.524060845375061, "Pretrain/Step": 10029, "Pretrain/Step Time": 9.550878830254078} +{"Pretrain/Learning Rate": 2.4119310308328174e-05, "Pretrain/Loss": 2.0077974796295166, "Pretrain/Loss (Raw)": 1.9328975677490234, "Pretrain/Step": 10030, "Pretrain/Step Time": 9.550238562747836} +{"Pretrain/Learning Rate": 2.4115067789943206e-05, "Pretrain/Loss": 2.008150339126587, "Pretrain/Loss (Raw)": 2.0981862545013428, "Pretrain/Step": 10031, "Pretrain/Step Time": 9.549816824495792} +{"Pretrain/Learning Rate": 2.411082529707464e-05, "Pretrain/Loss": 2.010127067565918, "Pretrain/Loss (Raw)": 1.998326063156128, "Pretrain/Step": 10032, "Pretrain/Step Time": 9.553383307531476} +{"Pretrain/Learning Rate": 2.4106582829844807e-05, "Pretrain/Loss": 2.008188247680664, "Pretrain/Loss (Raw)": 1.869670033454895, "Pretrain/Step": 10033, "Pretrain/Step Time": 9.551440604031086} +{"Pretrain/Learning Rate": 2.4102340388376015e-05, "Pretrain/Loss": 2.007239580154419, "Pretrain/Loss (Raw)": 1.9188621044158936, "Pretrain/Step": 10034, "Pretrain/Step Time": 9.551028015092015} +{"Pretrain/Learning Rate": 2.4098097972790615e-05, "Pretrain/Loss": 2.007378101348877, "Pretrain/Loss (Raw)": 1.937737226486206, "Pretrain/Step": 10035, "Pretrain/Step Time": 9.558295089751482} +{"Pretrain/Learning Rate": 2.4093855583210916e-05, "Pretrain/Loss": 2.008979082107544, "Pretrain/Loss (Raw)": 2.1881396770477295, "Pretrain/Step": 10036, "Pretrain/Step Time": 9.549790242686868} +{"Pretrain/Learning Rate": 2.4089613219759252e-05, "Pretrain/Loss": 2.0071725845336914, "Pretrain/Loss (Raw)": 1.978818416595459, "Pretrain/Step": 10037, "Pretrain/Step Time": 9.547701429575682} +{"Pretrain/Learning Rate": 2.408537088255795e-05, "Pretrain/Loss": 2.005493640899658, "Pretrain/Loss (Raw)": 2.1329548358917236, "Pretrain/Step": 10038, "Pretrain/Step Time": 9.547222072258592} +{"Pretrain/Learning Rate": 2.4081128571729335e-05, "Pretrain/Loss": 2.006204843521118, "Pretrain/Loss (Raw)": 1.8714159727096558, "Pretrain/Step": 10039, "Pretrain/Step Time": 9.548524793237448} +{"Pretrain/Learning Rate": 2.407688628739573e-05, "Pretrain/Loss": 2.0049245357513428, "Pretrain/Loss (Raw)": 2.0133726596832275, "Pretrain/Step": 10040, "Pretrain/Step Time": 9.547762313857675} +{"Pretrain/Learning Rate": 2.4072644029679463e-05, "Pretrain/Loss": 2.0031213760375977, "Pretrain/Loss (Raw)": 1.8575434684753418, "Pretrain/Step": 10041, "Pretrain/Step Time": 9.547598639503121} +{"Pretrain/Learning Rate": 2.4068401798702844e-05, "Pretrain/Loss": 2.0045652389526367, "Pretrain/Loss (Raw)": 2.080509901046753, "Pretrain/Step": 10042, "Pretrain/Step Time": 9.546759687364101} +{"Pretrain/Learning Rate": 2.4064159594588205e-05, "Pretrain/Loss": 2.0051679611206055, "Pretrain/Loss (Raw)": 2.0926449298858643, "Pretrain/Step": 10043, "Pretrain/Step Time": 9.54104084894061} +{"Pretrain/Learning Rate": 2.4059917417457863e-05, "Pretrain/Loss": 2.0067808628082275, "Pretrain/Loss (Raw)": 2.012697696685791, "Pretrain/Step": 10044, "Pretrain/Step Time": 9.548489082604647} +{"Pretrain/Learning Rate": 2.4055675267434142e-05, "Pretrain/Loss": 2.0095582008361816, "Pretrain/Loss (Raw)": 2.507913112640381, "Pretrain/Step": 10045, "Pretrain/Step Time": 9.549367787316442} +{"Pretrain/Learning Rate": 2.405143314463936e-05, "Pretrain/Loss": 2.007869005203247, "Pretrain/Loss (Raw)": 1.8422322273254395, "Pretrain/Step": 10046, "Pretrain/Step Time": 9.550196167081594} +{"Pretrain/Learning Rate": 2.4047191049195834e-05, "Pretrain/Loss": 2.0085513591766357, "Pretrain/Loss (Raw)": 2.175208806991577, "Pretrain/Step": 10047, "Pretrain/Step Time": 9.54858423769474} +{"Pretrain/Learning Rate": 2.404294898122588e-05, "Pretrain/Loss": 2.008477210998535, "Pretrain/Loss (Raw)": 1.8723067045211792, "Pretrain/Step": 10048, "Pretrain/Step Time": 9.543249167501926} +{"Pretrain/Learning Rate": 2.4038706940851815e-05, "Pretrain/Loss": 2.0088772773742676, "Pretrain/Loss (Raw)": 1.9065110683441162, "Pretrain/Step": 10049, "Pretrain/Step Time": 9.542232271283865} +{"Pretrain/Learning Rate": 2.4034464928195963e-05, "Pretrain/Loss": 2.0097522735595703, "Pretrain/Loss (Raw)": 1.9938818216323853, "Pretrain/Step": 10050, "Pretrain/Step Time": 9.542138990014791} +{"Pretrain/Learning Rate": 2.4030222943380637e-05, "Pretrain/Loss": 2.0105538368225098, "Pretrain/Loss (Raw)": 2.158430576324463, "Pretrain/Step": 10051, "Pretrain/Step Time": 9.55125449411571} +{"Pretrain/Learning Rate": 2.4025980986528142e-05, "Pretrain/Loss": 2.0097193717956543, "Pretrain/Loss (Raw)": 1.7924370765686035, "Pretrain/Step": 10052, "Pretrain/Step Time": 9.551638707518578} +{"Pretrain/Learning Rate": 2.40217390577608e-05, "Pretrain/Loss": 2.0071675777435303, "Pretrain/Loss (Raw)": 1.9382659196853638, "Pretrain/Step": 10053, "Pretrain/Step Time": 9.555303560569882} +{"Pretrain/Learning Rate": 2.4017497157200923e-05, "Pretrain/Loss": 2.0086398124694824, "Pretrain/Loss (Raw)": 2.1276791095733643, "Pretrain/Step": 10054, "Pretrain/Step Time": 9.550442850217223} +{"Pretrain/Learning Rate": 2.401325528497082e-05, "Pretrain/Loss": 2.0076804161071777, "Pretrain/Loss (Raw)": 1.8481557369232178, "Pretrain/Step": 10055, "Pretrain/Step Time": 9.548046253621578} +{"Pretrain/Learning Rate": 2.4009013441192817e-05, "Pretrain/Loss": 2.007079601287842, "Pretrain/Loss (Raw)": 2.0020947456359863, "Pretrain/Step": 10056, "Pretrain/Step Time": 9.549185069277883} +{"Pretrain/Learning Rate": 2.40047716259892e-05, "Pretrain/Loss": 2.0060131549835205, "Pretrain/Loss (Raw)": 1.5051442384719849, "Pretrain/Step": 10057, "Pretrain/Step Time": 9.549094220623374} +{"Pretrain/Learning Rate": 2.4000529839482297e-05, "Pretrain/Loss": 2.0034542083740234, "Pretrain/Loss (Raw)": 1.9060419797897339, "Pretrain/Step": 10058, "Pretrain/Step Time": 9.547797072678804} +{"Pretrain/Learning Rate": 2.3996288081794407e-05, "Pretrain/Loss": 2.0048766136169434, "Pretrain/Loss (Raw)": 2.1425869464874268, "Pretrain/Step": 10059, "Pretrain/Step Time": 9.544591631740332} +{"Pretrain/Learning Rate": 2.3992046353047845e-05, "Pretrain/Loss": 2.0051701068878174, "Pretrain/Loss (Raw)": 2.089611530303955, "Pretrain/Step": 10060, "Pretrain/Step Time": 9.550246648490429} +{"Pretrain/Learning Rate": 2.3987804653364924e-05, "Pretrain/Loss": 2.0064752101898193, "Pretrain/Loss (Raw)": 1.9833945035934448, "Pretrain/Step": 10061, "Pretrain/Step Time": 9.55231312289834} +{"Pretrain/Learning Rate": 2.3983562982867933e-05, "Pretrain/Loss": 2.003787040710449, "Pretrain/Loss (Raw)": 1.8616501092910767, "Pretrain/Step": 10062, "Pretrain/Step Time": 9.549592459574342} +{"Pretrain/Learning Rate": 2.3979321341679186e-05, "Pretrain/Loss": 2.0036673545837402, "Pretrain/Loss (Raw)": 2.017063856124878, "Pretrain/Step": 10063, "Pretrain/Step Time": 9.549039386212826} +{"Pretrain/Learning Rate": 2.397507972992099e-05, "Pretrain/Loss": 2.002277374267578, "Pretrain/Loss (Raw)": 1.9724681377410889, "Pretrain/Step": 10064, "Pretrain/Step Time": 9.549674417823553} +{"Pretrain/Learning Rate": 2.397083814771565e-05, "Pretrain/Loss": 2.003725051879883, "Pretrain/Loss (Raw)": 2.092144727706909, "Pretrain/Step": 10065, "Pretrain/Step Time": 9.545700456947088} +{"Pretrain/Learning Rate": 2.396659659518547e-05, "Pretrain/Loss": 2.0041003227233887, "Pretrain/Loss (Raw)": 1.7893868684768677, "Pretrain/Step": 10066, "Pretrain/Step Time": 9.541667751967907} +{"Pretrain/Learning Rate": 2.3962355072452745e-05, "Pretrain/Loss": 2.002286672592163, "Pretrain/Loss (Raw)": 1.7642953395843506, "Pretrain/Step": 10067, "Pretrain/Step Time": 9.544384468346834} +{"Pretrain/Learning Rate": 2.3958113579639776e-05, "Pretrain/Loss": 2.002866268157959, "Pretrain/Loss (Raw)": 1.9006699323654175, "Pretrain/Step": 10068, "Pretrain/Step Time": 9.54204106144607} +{"Pretrain/Learning Rate": 2.395387211686887e-05, "Pretrain/Loss": 1.999504566192627, "Pretrain/Loss (Raw)": 1.7088686227798462, "Pretrain/Step": 10069, "Pretrain/Step Time": 9.542421711608768} +{"Pretrain/Learning Rate": 2.3949630684262323e-05, "Pretrain/Loss": 1.9985575675964355, "Pretrain/Loss (Raw)": 2.006544828414917, "Pretrain/Step": 10070, "Pretrain/Step Time": 9.542255561798811} +{"Pretrain/Learning Rate": 2.394538928194244e-05, "Pretrain/Loss": 1.995222806930542, "Pretrain/Loss (Raw)": 1.6786142587661743, "Pretrain/Step": 10071, "Pretrain/Step Time": 9.541419250890613} +{"Pretrain/Learning Rate": 2.3941147910031513e-05, "Pretrain/Loss": 1.993396282196045, "Pretrain/Loss (Raw)": 1.8107008934020996, "Pretrain/Step": 10072, "Pretrain/Step Time": 9.535807786509395} +{"Pretrain/Learning Rate": 2.3936906568651833e-05, "Pretrain/Loss": 1.9925943613052368, "Pretrain/Loss (Raw)": 2.0918328762054443, "Pretrain/Step": 10073, "Pretrain/Step Time": 9.543473925441504} +{"Pretrain/Learning Rate": 2.3932665257925703e-05, "Pretrain/Loss": 1.990485429763794, "Pretrain/Loss (Raw)": 1.848644495010376, "Pretrain/Step": 10074, "Pretrain/Step Time": 9.533883765339851} +{"Pretrain/Learning Rate": 2.3928423977975424e-05, "Pretrain/Loss": 1.9937326908111572, "Pretrain/Loss (Raw)": 2.337109327316284, "Pretrain/Step": 10075, "Pretrain/Step Time": 9.532550966367126} +{"Pretrain/Learning Rate": 2.3924182728923277e-05, "Pretrain/Loss": 1.9909274578094482, "Pretrain/Loss (Raw)": 1.5568698644638062, "Pretrain/Step": 10076, "Pretrain/Step Time": 9.533233232796192} +{"Pretrain/Learning Rate": 2.391994151089157e-05, "Pretrain/Loss": 1.9908645153045654, "Pretrain/Loss (Raw)": 2.0977110862731934, "Pretrain/Step": 10077, "Pretrain/Step Time": 9.536276761442423} +{"Pretrain/Learning Rate": 2.3915700324002586e-05, "Pretrain/Loss": 1.9899827241897583, "Pretrain/Loss (Raw)": 2.023980140686035, "Pretrain/Step": 10078, "Pretrain/Step Time": 9.534431552514434} +{"Pretrain/Learning Rate": 2.391145916837862e-05, "Pretrain/Loss": 1.9918437004089355, "Pretrain/Loss (Raw)": 2.0939412117004395, "Pretrain/Step": 10079, "Pretrain/Step Time": 9.540637778118253} +{"Pretrain/Learning Rate": 2.3907218044141956e-05, "Pretrain/Loss": 1.9907294511795044, "Pretrain/Loss (Raw)": 1.8789451122283936, "Pretrain/Step": 10080, "Pretrain/Step Time": 9.541786445304751} +{"Pretrain/Learning Rate": 2.3902976951414893e-05, "Pretrain/Loss": 1.9901565313339233, "Pretrain/Loss (Raw)": 2.0307304859161377, "Pretrain/Step": 10081, "Pretrain/Step Time": 9.542565675452352} +{"Pretrain/Learning Rate": 2.389873589031972e-05, "Pretrain/Loss": 1.9894986152648926, "Pretrain/Loss (Raw)": 1.956793189048767, "Pretrain/Step": 10082, "Pretrain/Step Time": 9.547456059604883} +{"Pretrain/Learning Rate": 2.3894494860978718e-05, "Pretrain/Loss": 1.987931728363037, "Pretrain/Loss (Raw)": 2.086265802383423, "Pretrain/Step": 10083, "Pretrain/Step Time": 9.542931526899338} +{"Pretrain/Learning Rate": 2.3890253863514174e-05, "Pretrain/Loss": 1.98687744140625, "Pretrain/Loss (Raw)": 2.067765474319458, "Pretrain/Step": 10084, "Pretrain/Step Time": 9.542788468301296} +{"Pretrain/Learning Rate": 2.388601289804838e-05, "Pretrain/Loss": 1.9897887706756592, "Pretrain/Loss (Raw)": 2.000516176223755, "Pretrain/Step": 10085, "Pretrain/Step Time": 9.552675615996122} +{"Pretrain/Learning Rate": 2.3881771964703618e-05, "Pretrain/Loss": 1.9896693229675293, "Pretrain/Loss (Raw)": 1.8891124725341797, "Pretrain/Step": 10086, "Pretrain/Step Time": 9.549822753295302} +{"Pretrain/Learning Rate": 2.3877531063602177e-05, "Pretrain/Loss": 1.988242506980896, "Pretrain/Loss (Raw)": 1.8020505905151367, "Pretrain/Step": 10087, "Pretrain/Step Time": 9.55378570780158} +{"Pretrain/Learning Rate": 2.3873290194866333e-05, "Pretrain/Loss": 1.9877418279647827, "Pretrain/Loss (Raw)": 1.9044911861419678, "Pretrain/Step": 10088, "Pretrain/Step Time": 9.550394121557474} +{"Pretrain/Learning Rate": 2.386904935861837e-05, "Pretrain/Loss": 1.9867740869522095, "Pretrain/Loss (Raw)": 1.9610675573349, "Pretrain/Step": 10089, "Pretrain/Step Time": 9.551835339516401} +{"Pretrain/Learning Rate": 2.3864808554980572e-05, "Pretrain/Loss": 1.9877766370773315, "Pretrain/Loss (Raw)": 2.200212240219116, "Pretrain/Step": 10090, "Pretrain/Step Time": 9.549291895702481} +{"Pretrain/Learning Rate": 2.386056778407522e-05, "Pretrain/Loss": 1.9900870323181152, "Pretrain/Loss (Raw)": 2.1145808696746826, "Pretrain/Step": 10091, "Pretrain/Step Time": 9.552198000252247} +{"Pretrain/Learning Rate": 2.38563270460246e-05, "Pretrain/Loss": 1.989298939704895, "Pretrain/Loss (Raw)": 1.9934141635894775, "Pretrain/Step": 10092, "Pretrain/Step Time": 9.553331991657615} +{"Pretrain/Learning Rate": 2.3852086340950975e-05, "Pretrain/Loss": 1.9876551628112793, "Pretrain/Loss (Raw)": 1.801809549331665, "Pretrain/Step": 10093, "Pretrain/Step Time": 9.553845161572099} +{"Pretrain/Learning Rate": 2.3847845668976632e-05, "Pretrain/Loss": 1.985851764678955, "Pretrain/Loss (Raw)": 2.0657639503479004, "Pretrain/Step": 10094, "Pretrain/Step Time": 9.55915722437203} +{"Pretrain/Learning Rate": 2.3843605030223847e-05, "Pretrain/Loss": 1.9851961135864258, "Pretrain/Loss (Raw)": 1.8983802795410156, "Pretrain/Step": 10095, "Pretrain/Step Time": 9.5584137737751} +{"Pretrain/Learning Rate": 2.3839364424814896e-05, "Pretrain/Loss": 1.985813856124878, "Pretrain/Loss (Raw)": 2.218576192855835, "Pretrain/Step": 10096, "Pretrain/Step Time": 9.551150344312191} +{"Pretrain/Learning Rate": 2.383512385287206e-05, "Pretrain/Loss": 1.984432578086853, "Pretrain/Loss (Raw)": 1.8771673440933228, "Pretrain/Step": 10097, "Pretrain/Step Time": 9.555114485323429} +{"Pretrain/Learning Rate": 2.38308833145176e-05, "Pretrain/Loss": 1.983719825744629, "Pretrain/Loss (Raw)": 2.008931875228882, "Pretrain/Step": 10098, "Pretrain/Step Time": 9.548442581668496} +{"Pretrain/Learning Rate": 2.3826642809873796e-05, "Pretrain/Loss": 1.9822580814361572, "Pretrain/Loss (Raw)": 1.8492686748504639, "Pretrain/Step": 10099, "Pretrain/Step Time": 9.551244746893644} +{"Pretrain/Learning Rate": 2.3822402339062918e-05, "Pretrain/Loss": 1.9772857427597046, "Pretrain/Loss (Raw)": 1.9819403886795044, "Pretrain/Step": 10100, "Pretrain/Step Time": 9.549016613513231} +{"Pretrain/Learning Rate": 2.381816190220724e-05, "Pretrain/Loss": 1.977370023727417, "Pretrain/Loss (Raw)": 2.2029285430908203, "Pretrain/Step": 10101, "Pretrain/Step Time": 9.550052631646395} +{"Pretrain/Learning Rate": 2.3813921499429033e-05, "Pretrain/Loss": 1.9765000343322754, "Pretrain/Loss (Raw)": 1.8497638702392578, "Pretrain/Step": 10102, "Pretrain/Step Time": 9.553909258916974} +{"Pretrain/Learning Rate": 2.3809681130850563e-05, "Pretrain/Loss": 1.976654052734375, "Pretrain/Loss (Raw)": 2.036431074142456, "Pretrain/Step": 10103, "Pretrain/Step Time": 9.554724268615246} +{"Pretrain/Learning Rate": 2.3805440796594094e-05, "Pretrain/Loss": 1.975836992263794, "Pretrain/Loss (Raw)": 1.9790866374969482, "Pretrain/Step": 10104, "Pretrain/Step Time": 9.553745431825519} +{"Pretrain/Learning Rate": 2.3801200496781898e-05, "Pretrain/Loss": 1.9762436151504517, "Pretrain/Loss (Raw)": 1.975728988647461, "Pretrain/Step": 10105, "Pretrain/Step Time": 9.554436014965177} +{"Pretrain/Learning Rate": 2.3796960231536243e-05, "Pretrain/Loss": 1.9759600162506104, "Pretrain/Loss (Raw)": 2.026763677597046, "Pretrain/Step": 10106, "Pretrain/Step Time": 9.555771259590983} +{"Pretrain/Learning Rate": 2.3792720000979395e-05, "Pretrain/Loss": 1.9771981239318848, "Pretrain/Loss (Raw)": 2.1007189750671387, "Pretrain/Step": 10107, "Pretrain/Step Time": 9.555105417966843} +{"Pretrain/Learning Rate": 2.378847980523361e-05, "Pretrain/Loss": 1.9749196767807007, "Pretrain/Loss (Raw)": 1.6982372999191284, "Pretrain/Step": 10108, "Pretrain/Step Time": 9.554371943697333} +{"Pretrain/Learning Rate": 2.3784239644421154e-05, "Pretrain/Loss": 1.9746613502502441, "Pretrain/Loss (Raw)": 1.994777798652649, "Pretrain/Step": 10109, "Pretrain/Step Time": 9.555841030552983} +{"Pretrain/Learning Rate": 2.3779999518664294e-05, "Pretrain/Loss": 1.9761698246002197, "Pretrain/Loss (Raw)": 2.141932964324951, "Pretrain/Step": 10110, "Pretrain/Step Time": 9.556809036061168} +{"Pretrain/Learning Rate": 2.3775759428085286e-05, "Pretrain/Loss": 1.9788613319396973, "Pretrain/Loss (Raw)": 2.0881190299987793, "Pretrain/Step": 10111, "Pretrain/Step Time": 9.553114347159863} +{"Pretrain/Learning Rate": 2.3771519372806393e-05, "Pretrain/Loss": 1.980057716369629, "Pretrain/Loss (Raw)": 2.174309492111206, "Pretrain/Step": 10112, "Pretrain/Step Time": 9.551759833469987} +{"Pretrain/Learning Rate": 2.376727935294988e-05, "Pretrain/Loss": 1.9794316291809082, "Pretrain/Loss (Raw)": 1.7798830270767212, "Pretrain/Step": 10113, "Pretrain/Step Time": 9.55518308840692} +{"Pretrain/Learning Rate": 2.3763039368637988e-05, "Pretrain/Loss": 1.9786992073059082, "Pretrain/Loss (Raw)": 2.023820161819458, "Pretrain/Step": 10114, "Pretrain/Step Time": 9.554510902613401} +{"Pretrain/Learning Rate": 2.3758799419992987e-05, "Pretrain/Loss": 1.9791393280029297, "Pretrain/Loss (Raw)": 2.0244364738464355, "Pretrain/Step": 10115, "Pretrain/Step Time": 9.546613140031695} +{"Pretrain/Learning Rate": 2.3754559507137124e-05, "Pretrain/Loss": 1.979271650314331, "Pretrain/Loss (Raw)": 1.8679441213607788, "Pretrain/Step": 10116, "Pretrain/Step Time": 9.550214728340507} +{"Pretrain/Learning Rate": 2.3750319630192676e-05, "Pretrain/Loss": 1.9807250499725342, "Pretrain/Loss (Raw)": 2.156147003173828, "Pretrain/Step": 10117, "Pretrain/Step Time": 9.548213107511401} +{"Pretrain/Learning Rate": 2.374607978928187e-05, "Pretrain/Loss": 1.9789679050445557, "Pretrain/Loss (Raw)": 1.9052573442459106, "Pretrain/Step": 10118, "Pretrain/Step Time": 9.549550227820873} +{"Pretrain/Learning Rate": 2.3741839984526968e-05, "Pretrain/Loss": 1.9796154499053955, "Pretrain/Loss (Raw)": 2.0329248905181885, "Pretrain/Step": 10119, "Pretrain/Step Time": 9.550087938085198} +{"Pretrain/Learning Rate": 2.373760021605023e-05, "Pretrain/Loss": 1.9797172546386719, "Pretrain/Loss (Raw)": 2.035958766937256, "Pretrain/Step": 10120, "Pretrain/Step Time": 9.551731595769525} +{"Pretrain/Learning Rate": 2.373336048397389e-05, "Pretrain/Loss": 1.9805166721343994, "Pretrain/Loss (Raw)": 2.0462288856506348, "Pretrain/Step": 10121, "Pretrain/Step Time": 9.547820033505559} +{"Pretrain/Learning Rate": 2.3729120788420213e-05, "Pretrain/Loss": 1.9827361106872559, "Pretrain/Loss (Raw)": 2.0491552352905273, "Pretrain/Step": 10122, "Pretrain/Step Time": 9.549772704020143} +{"Pretrain/Learning Rate": 2.3724881129511438e-05, "Pretrain/Loss": 1.9813284873962402, "Pretrain/Loss (Raw)": 1.8631360530853271, "Pretrain/Step": 10123, "Pretrain/Step Time": 9.549398422241211} +{"Pretrain/Learning Rate": 2.3720641507369818e-05, "Pretrain/Loss": 1.9809353351593018, "Pretrain/Loss (Raw)": 1.8931092023849487, "Pretrain/Step": 10124, "Pretrain/Step Time": 9.543369691818953} +{"Pretrain/Learning Rate": 2.3716401922117605e-05, "Pretrain/Loss": 1.9808932542800903, "Pretrain/Loss (Raw)": 1.8720943927764893, "Pretrain/Step": 10125, "Pretrain/Step Time": 9.542011626064777} +{"Pretrain/Learning Rate": 2.3712162373877032e-05, "Pretrain/Loss": 1.9808934926986694, "Pretrain/Loss (Raw)": 1.8890811204910278, "Pretrain/Step": 10126, "Pretrain/Step Time": 9.546183079481125} +{"Pretrain/Learning Rate": 2.370792286277035e-05, "Pretrain/Loss": 1.9820566177368164, "Pretrain/Loss (Raw)": 2.051577091217041, "Pretrain/Step": 10127, "Pretrain/Step Time": 9.54454487375915} +{"Pretrain/Learning Rate": 2.3703683388919797e-05, "Pretrain/Loss": 1.9808335304260254, "Pretrain/Loss (Raw)": 1.8115767240524292, "Pretrain/Step": 10128, "Pretrain/Step Time": 9.543280569836497} +{"Pretrain/Learning Rate": 2.3699443952447624e-05, "Pretrain/Loss": 1.9807145595550537, "Pretrain/Loss (Raw)": 1.9376288652420044, "Pretrain/Step": 10129, "Pretrain/Step Time": 8.475152481347322} +{"Pretrain/Learning Rate": 2.369520455347607e-05, "Pretrain/Loss": 1.9786344766616821, "Pretrain/Loss (Raw)": 1.8968536853790283, "Pretrain/Step": 10130, "Pretrain/Step Time": 8.478264903649688} +{"Pretrain/Learning Rate": 2.369096519212737e-05, "Pretrain/Loss": 1.9838061332702637, "Pretrain/Loss (Raw)": 2.7622151374816895, "Pretrain/Step": 10131, "Pretrain/Step Time": 8.480180198326707} +{"Pretrain/Learning Rate": 2.3686725868523762e-05, "Pretrain/Loss": 1.982323169708252, "Pretrain/Loss (Raw)": 1.7387924194335938, "Pretrain/Step": 10132, "Pretrain/Step Time": 8.476341407746077} +{"Pretrain/Learning Rate": 2.368248658278749e-05, "Pretrain/Loss": 1.9815561771392822, "Pretrain/Loss (Raw)": 2.049727201461792, "Pretrain/Step": 10133, "Pretrain/Step Time": 8.481066824868321} +{"Pretrain/Learning Rate": 2.3678247335040794e-05, "Pretrain/Loss": 1.982132077217102, "Pretrain/Loss (Raw)": 2.138460397720337, "Pretrain/Step": 10134, "Pretrain/Step Time": 8.481198092922568} +{"Pretrain/Learning Rate": 2.3674008125405904e-05, "Pretrain/Loss": 1.980633020401001, "Pretrain/Loss (Raw)": 1.9681000709533691, "Pretrain/Step": 10135, "Pretrain/Step Time": 8.482709171250463} +{"Pretrain/Learning Rate": 2.366976895400505e-05, "Pretrain/Loss": 1.981092929840088, "Pretrain/Loss (Raw)": 2.129944324493408, "Pretrain/Step": 10136, "Pretrain/Step Time": 8.475656669586897} +{"Pretrain/Learning Rate": 2.366552982096047e-05, "Pretrain/Loss": 1.9786738157272339, "Pretrain/Loss (Raw)": 2.01505184173584, "Pretrain/Step": 10137, "Pretrain/Step Time": 8.481114361435175} +{"Pretrain/Learning Rate": 2.3661290726394398e-05, "Pretrain/Loss": 1.9772018194198608, "Pretrain/Loss (Raw)": 1.8053427934646606, "Pretrain/Step": 10138, "Pretrain/Step Time": 8.480913175269961} +{"Pretrain/Learning Rate": 2.3657051670429065e-05, "Pretrain/Loss": 1.9780372381210327, "Pretrain/Loss (Raw)": 2.019355058670044, "Pretrain/Step": 10139, "Pretrain/Step Time": 8.475701732560992} +{"Pretrain/Learning Rate": 2.3652812653186697e-05, "Pretrain/Loss": 1.9769139289855957, "Pretrain/Loss (Raw)": 2.076119899749756, "Pretrain/Step": 10140, "Pretrain/Step Time": 8.476081930100918} +{"Pretrain/Learning Rate": 2.3648573674789538e-05, "Pretrain/Loss": 1.9766366481781006, "Pretrain/Loss (Raw)": 2.0022780895233154, "Pretrain/Step": 10141, "Pretrain/Step Time": 8.4764363206923} +{"Pretrain/Learning Rate": 2.3644334735359794e-05, "Pretrain/Loss": 1.9762499332427979, "Pretrain/Loss (Raw)": 1.9301254749298096, "Pretrain/Step": 10142, "Pretrain/Step Time": 8.476927187293768} +{"Pretrain/Learning Rate": 2.3640095835019703e-05, "Pretrain/Loss": 1.9799137115478516, "Pretrain/Loss (Raw)": 1.9206621646881104, "Pretrain/Step": 10143, "Pretrain/Step Time": 8.477168744429946} +{"Pretrain/Learning Rate": 2.363585697389149e-05, "Pretrain/Loss": 1.9769234657287598, "Pretrain/Loss (Raw)": 1.9559698104858398, "Pretrain/Step": 10144, "Pretrain/Step Time": 8.479499638080597} +{"Pretrain/Learning Rate": 2.3631618152097378e-05, "Pretrain/Loss": 1.9783196449279785, "Pretrain/Loss (Raw)": 2.09665846824646, "Pretrain/Step": 10145, "Pretrain/Step Time": 8.478556223213673} +{"Pretrain/Learning Rate": 2.36273793697596e-05, "Pretrain/Loss": 1.9763492345809937, "Pretrain/Loss (Raw)": 1.885177493095398, "Pretrain/Step": 10146, "Pretrain/Step Time": 8.474293557927012} +{"Pretrain/Learning Rate": 2.3623140627000364e-05, "Pretrain/Loss": 1.9761242866516113, "Pretrain/Loss (Raw)": 1.9909579753875732, "Pretrain/Step": 10147, "Pretrain/Step Time": 8.481464058160782} +{"Pretrain/Learning Rate": 2.36189019239419e-05, "Pretrain/Loss": 1.9776387214660645, "Pretrain/Loss (Raw)": 2.152930498123169, "Pretrain/Step": 10148, "Pretrain/Step Time": 8.477613933384418} +{"Pretrain/Learning Rate": 2.3614663260706422e-05, "Pretrain/Loss": 1.9815716743469238, "Pretrain/Loss (Raw)": 2.013786554336548, "Pretrain/Step": 10149, "Pretrain/Step Time": 8.477750280871987} +{"Pretrain/Learning Rate": 2.3610424637416155e-05, "Pretrain/Loss": 1.9826569557189941, "Pretrain/Loss (Raw)": 2.0941898822784424, "Pretrain/Step": 10150, "Pretrain/Step Time": 8.473113311454654} +{"Pretrain/Learning Rate": 2.3606186054193316e-05, "Pretrain/Loss": 1.983709692955017, "Pretrain/Loss (Raw)": 1.8465415239334106, "Pretrain/Step": 10151, "Pretrain/Step Time": 8.484590712934732} +{"Pretrain/Learning Rate": 2.3601947511160115e-05, "Pretrain/Loss": 1.9831249713897705, "Pretrain/Loss (Raw)": 1.9652901887893677, "Pretrain/Step": 10152, "Pretrain/Step Time": 8.479393059387803} +{"Pretrain/Learning Rate": 2.3597709008438773e-05, "Pretrain/Loss": 1.9828753471374512, "Pretrain/Loss (Raw)": 1.9827289581298828, "Pretrain/Step": 10153, "Pretrain/Step Time": 8.479795327410102} +{"Pretrain/Learning Rate": 2.35934705461515e-05, "Pretrain/Loss": 1.9828859567642212, "Pretrain/Loss (Raw)": 2.062995672225952, "Pretrain/Step": 10154, "Pretrain/Step Time": 8.483809150755405} +{"Pretrain/Learning Rate": 2.358923212442052e-05, "Pretrain/Loss": 1.9827454090118408, "Pretrain/Loss (Raw)": 2.0126140117645264, "Pretrain/Step": 10155, "Pretrain/Step Time": 8.483107740059495} +{"Pretrain/Learning Rate": 2.3584993743368037e-05, "Pretrain/Loss": 1.9812265634536743, "Pretrain/Loss (Raw)": 2.035365343093872, "Pretrain/Step": 10156, "Pretrain/Step Time": 8.479366011917591} +{"Pretrain/Learning Rate": 2.3580755403116258e-05, "Pretrain/Loss": 1.9846303462982178, "Pretrain/Loss (Raw)": 1.9597417116165161, "Pretrain/Step": 10157, "Pretrain/Step Time": 8.479154206812382} +{"Pretrain/Learning Rate": 2.3576517103787394e-05, "Pretrain/Loss": 1.9868555068969727, "Pretrain/Loss (Raw)": 2.2177302837371826, "Pretrain/Step": 10158, "Pretrain/Step Time": 8.475962620228529} +{"Pretrain/Learning Rate": 2.3572278845503657e-05, "Pretrain/Loss": 1.9864047765731812, "Pretrain/Loss (Raw)": 2.0404818058013916, "Pretrain/Step": 10159, "Pretrain/Step Time": 8.482464609667659} +{"Pretrain/Learning Rate": 2.3568040628387253e-05, "Pretrain/Loss": 1.9862077236175537, "Pretrain/Loss (Raw)": 1.9731029272079468, "Pretrain/Step": 10160, "Pretrain/Step Time": 8.480593331158161} +{"Pretrain/Learning Rate": 2.3563802452560395e-05, "Pretrain/Loss": 1.9873263835906982, "Pretrain/Loss (Raw)": 2.0128400325775146, "Pretrain/Step": 10161, "Pretrain/Step Time": 8.481155468150973} +{"Pretrain/Learning Rate": 2.3559564318145276e-05, "Pretrain/Loss": 1.9881049394607544, "Pretrain/Loss (Raw)": 2.0185346603393555, "Pretrain/Step": 10162, "Pretrain/Step Time": 8.482869012281299} +{"Pretrain/Learning Rate": 2.35553262252641e-05, "Pretrain/Loss": 1.9882216453552246, "Pretrain/Loss (Raw)": 1.952681064605713, "Pretrain/Step": 10163, "Pretrain/Step Time": 8.482753993943334} +{"Pretrain/Learning Rate": 2.3551088174039076e-05, "Pretrain/Loss": 1.985629916191101, "Pretrain/Loss (Raw)": 1.8563976287841797, "Pretrain/Step": 10164, "Pretrain/Step Time": 8.480055347084999} +{"Pretrain/Learning Rate": 2.3546850164592403e-05, "Pretrain/Loss": 1.983952522277832, "Pretrain/Loss (Raw)": 1.7641003131866455, "Pretrain/Step": 10165, "Pretrain/Step Time": 8.48461533524096} +{"Pretrain/Learning Rate": 2.3542612197046288e-05, "Pretrain/Loss": 1.9821542501449585, "Pretrain/Loss (Raw)": 1.902784824371338, "Pretrain/Step": 10166, "Pretrain/Step Time": 8.487637061625719} +{"Pretrain/Learning Rate": 2.3538374271522917e-05, "Pretrain/Loss": 1.9833083152770996, "Pretrain/Loss (Raw)": 2.019132375717163, "Pretrain/Step": 10167, "Pretrain/Step Time": 8.486716570332646} +{"Pretrain/Learning Rate": 2.3534136388144497e-05, "Pretrain/Loss": 1.98274827003479, "Pretrain/Loss (Raw)": 1.9416817426681519, "Pretrain/Step": 10168, "Pretrain/Step Time": 8.491584908217192} +{"Pretrain/Learning Rate": 2.3529898547033214e-05, "Pretrain/Loss": 1.9826152324676514, "Pretrain/Loss (Raw)": 1.8405054807662964, "Pretrain/Step": 10169, "Pretrain/Step Time": 8.492391442880034} +{"Pretrain/Learning Rate": 2.3525660748311272e-05, "Pretrain/Loss": 1.9805136919021606, "Pretrain/Loss (Raw)": 1.8115171194076538, "Pretrain/Step": 10170, "Pretrain/Step Time": 8.493251154199243} +{"Pretrain/Learning Rate": 2.3521422992100873e-05, "Pretrain/Loss": 1.9790953397750854, "Pretrain/Loss (Raw)": 1.9111121892929077, "Pretrain/Step": 10171, "Pretrain/Step Time": 8.49484166316688} +{"Pretrain/Learning Rate": 2.351718527852419e-05, "Pretrain/Loss": 1.9778227806091309, "Pretrain/Loss (Raw)": 1.8498094081878662, "Pretrain/Step": 10172, "Pretrain/Step Time": 8.492980575188994} +{"Pretrain/Learning Rate": 2.3512947607703424e-05, "Pretrain/Loss": 1.9763050079345703, "Pretrain/Loss (Raw)": 2.3136351108551025, "Pretrain/Step": 10173, "Pretrain/Step Time": 8.490368191152811} +{"Pretrain/Learning Rate": 2.3508709979760766e-05, "Pretrain/Loss": 1.9760897159576416, "Pretrain/Loss (Raw)": 1.814664602279663, "Pretrain/Step": 10174, "Pretrain/Step Time": 8.491603910923004} +{"Pretrain/Learning Rate": 2.3504472394818406e-05, "Pretrain/Loss": 1.9754242897033691, "Pretrain/Loss (Raw)": 2.0900444984436035, "Pretrain/Step": 10175, "Pretrain/Step Time": 8.49001157656312} +{"Pretrain/Learning Rate": 2.3500234852998528e-05, "Pretrain/Loss": 1.977382779121399, "Pretrain/Loss (Raw)": 2.1229958534240723, "Pretrain/Step": 10176, "Pretrain/Step Time": 8.493151547387242} +{"Pretrain/Learning Rate": 2.3495997354423327e-05, "Pretrain/Loss": 1.9787944555282593, "Pretrain/Loss (Raw)": 2.0872020721435547, "Pretrain/Step": 10177, "Pretrain/Step Time": 8.49254915304482} +{"Pretrain/Learning Rate": 2.3491759899214977e-05, "Pretrain/Loss": 1.9806504249572754, "Pretrain/Loss (Raw)": 2.2314467430114746, "Pretrain/Step": 10178, "Pretrain/Step Time": 8.485479108989239} +{"Pretrain/Learning Rate": 2.3487522487495666e-05, "Pretrain/Loss": 1.9794189929962158, "Pretrain/Loss (Raw)": 2.000819206237793, "Pretrain/Step": 10179, "Pretrain/Step Time": 8.47752384468913} +{"Pretrain/Learning Rate": 2.348328511938758e-05, "Pretrain/Loss": 1.9815599918365479, "Pretrain/Loss (Raw)": 2.066467761993408, "Pretrain/Step": 10180, "Pretrain/Step Time": 8.478610906749964} +{"Pretrain/Learning Rate": 2.34790477950129e-05, "Pretrain/Loss": 1.9809433221817017, "Pretrain/Loss (Raw)": 1.859334945678711, "Pretrain/Step": 10181, "Pretrain/Step Time": 8.478638788685203} +{"Pretrain/Learning Rate": 2.3474810514493807e-05, "Pretrain/Loss": 1.9814786911010742, "Pretrain/Loss (Raw)": 2.1962106227874756, "Pretrain/Step": 10182, "Pretrain/Step Time": 8.475894721224904} +{"Pretrain/Learning Rate": 2.347057327795247e-05, "Pretrain/Loss": 1.983086347579956, "Pretrain/Loss (Raw)": 2.0539190769195557, "Pretrain/Step": 10183, "Pretrain/Step Time": 8.479998962953687} +{"Pretrain/Learning Rate": 2.3466336085511077e-05, "Pretrain/Loss": 1.982583999633789, "Pretrain/Loss (Raw)": 1.9378039836883545, "Pretrain/Step": 10184, "Pretrain/Step Time": 8.47972890548408} +{"Pretrain/Learning Rate": 2.34620989372918e-05, "Pretrain/Loss": 1.9886927604675293, "Pretrain/Loss (Raw)": 2.2870562076568604, "Pretrain/Step": 10185, "Pretrain/Step Time": 8.478706195950508} +{"Pretrain/Learning Rate": 2.345786183341682e-05, "Pretrain/Loss": 1.9886329174041748, "Pretrain/Loss (Raw)": 1.8983904123306274, "Pretrain/Step": 10186, "Pretrain/Step Time": 8.477942299097776} +{"Pretrain/Learning Rate": 2.345362477400831e-05, "Pretrain/Loss": 1.987962007522583, "Pretrain/Loss (Raw)": 2.0567243099212646, "Pretrain/Step": 10187, "Pretrain/Step Time": 8.483640873804688} +{"Pretrain/Learning Rate": 2.344938775918843e-05, "Pretrain/Loss": 1.9876776933670044, "Pretrain/Loss (Raw)": 2.0532121658325195, "Pretrain/Step": 10188, "Pretrain/Step Time": 8.47964407876134} +{"Pretrain/Learning Rate": 2.3445150789079367e-05, "Pretrain/Loss": 1.987676739692688, "Pretrain/Loss (Raw)": 1.9832539558410645, "Pretrain/Step": 10189, "Pretrain/Step Time": 8.479425897821784} +{"Pretrain/Learning Rate": 2.344091386380328e-05, "Pretrain/Loss": 1.988353967666626, "Pretrain/Loss (Raw)": 1.9483397006988525, "Pretrain/Step": 10190, "Pretrain/Step Time": 8.483223550021648} +{"Pretrain/Learning Rate": 2.343667698348235e-05, "Pretrain/Loss": 1.9887727499008179, "Pretrain/Loss (Raw)": 2.0706868171691895, "Pretrain/Step": 10191, "Pretrain/Step Time": 8.482770077884197} +{"Pretrain/Learning Rate": 2.3432440148238737e-05, "Pretrain/Loss": 1.9879932403564453, "Pretrain/Loss (Raw)": 1.8726937770843506, "Pretrain/Step": 10192, "Pretrain/Step Time": 8.487086882814765} +{"Pretrain/Learning Rate": 2.3428203358194603e-05, "Pretrain/Loss": 1.9868448972702026, "Pretrain/Loss (Raw)": 1.9451467990875244, "Pretrain/Step": 10193, "Pretrain/Step Time": 8.485584001988173} +{"Pretrain/Learning Rate": 2.3423966613472115e-05, "Pretrain/Loss": 1.98677396774292, "Pretrain/Loss (Raw)": 1.7803105115890503, "Pretrain/Step": 10194, "Pretrain/Step Time": 8.487478490918875} +{"Pretrain/Learning Rate": 2.3419729914193442e-05, "Pretrain/Loss": 1.9899502992630005, "Pretrain/Loss (Raw)": 2.1708824634552, "Pretrain/Step": 10195, "Pretrain/Step Time": 8.484998039901257} +{"Pretrain/Learning Rate": 2.341549326048074e-05, "Pretrain/Loss": 1.9910495281219482, "Pretrain/Loss (Raw)": 2.0413544178009033, "Pretrain/Step": 10196, "Pretrain/Step Time": 8.490468798205256} +{"Pretrain/Learning Rate": 2.341125665245618e-05, "Pretrain/Loss": 1.9931259155273438, "Pretrain/Loss (Raw)": 1.974638819694519, "Pretrain/Step": 10197, "Pretrain/Step Time": 8.488841313868761} +{"Pretrain/Learning Rate": 2.340702009024191e-05, "Pretrain/Loss": 1.9924535751342773, "Pretrain/Loss (Raw)": 1.9204907417297363, "Pretrain/Step": 10198, "Pretrain/Step Time": 8.49001388810575} +{"Pretrain/Learning Rate": 2.3402783573960092e-05, "Pretrain/Loss": 1.9964491128921509, "Pretrain/Loss (Raw)": 2.190042018890381, "Pretrain/Step": 10199, "Pretrain/Step Time": 8.48960118368268} +{"Pretrain/Learning Rate": 2.339854710373288e-05, "Pretrain/Loss": 1.9980010986328125, "Pretrain/Loss (Raw)": 2.0093722343444824, "Pretrain/Step": 10200, "Pretrain/Step Time": 8.492418520152569} +{"Pretrain/Learning Rate": 2.339431067968245e-05, "Pretrain/Loss": 1.9979909658432007, "Pretrain/Loss (Raw)": 2.0905067920684814, "Pretrain/Step": 10201, "Pretrain/Step Time": 8.489220719784498} +{"Pretrain/Learning Rate": 2.3390074301930925e-05, "Pretrain/Loss": 1.9992742538452148, "Pretrain/Loss (Raw)": 2.0129222869873047, "Pretrain/Step": 10202, "Pretrain/Step Time": 8.491003531962633} +{"Pretrain/Learning Rate": 2.3385837970600475e-05, "Pretrain/Loss": 1.9954544305801392, "Pretrain/Loss (Raw)": 1.8481764793395996, "Pretrain/Step": 10203, "Pretrain/Step Time": 8.492742165923119} +{"Pretrain/Learning Rate": 2.338160168581325e-05, "Pretrain/Loss": 1.9988725185394287, "Pretrain/Loss (Raw)": 1.9943835735321045, "Pretrain/Step": 10204, "Pretrain/Step Time": 8.494029438123107} +{"Pretrain/Learning Rate": 2.3377365447691402e-05, "Pretrain/Loss": 1.9991906881332397, "Pretrain/Loss (Raw)": 2.138411045074463, "Pretrain/Step": 10205, "Pretrain/Step Time": 8.491692846640944} +{"Pretrain/Learning Rate": 2.337312925635707e-05, "Pretrain/Loss": 1.998368263244629, "Pretrain/Loss (Raw)": 1.9187253713607788, "Pretrain/Step": 10206, "Pretrain/Step Time": 8.494338620454073} +{"Pretrain/Learning Rate": 2.3368893111932412e-05, "Pretrain/Loss": 1.9969563484191895, "Pretrain/Loss (Raw)": 1.913216471672058, "Pretrain/Step": 10207, "Pretrain/Step Time": 8.48785231076181} +{"Pretrain/Learning Rate": 2.3364657014539574e-05, "Pretrain/Loss": 1.9978301525115967, "Pretrain/Loss (Raw)": 1.9908074140548706, "Pretrain/Step": 10208, "Pretrain/Step Time": 8.487582040950656} +{"Pretrain/Learning Rate": 2.3360420964300694e-05, "Pretrain/Loss": 1.9982645511627197, "Pretrain/Loss (Raw)": 2.0863168239593506, "Pretrain/Step": 10209, "Pretrain/Step Time": 8.48991334065795} +{"Pretrain/Learning Rate": 2.3356184961337927e-05, "Pretrain/Loss": 1.9997020959854126, "Pretrain/Loss (Raw)": 2.1407978534698486, "Pretrain/Step": 10210, "Pretrain/Step Time": 8.486275317147374} +{"Pretrain/Learning Rate": 2.33519490057734e-05, "Pretrain/Loss": 2.0002896785736084, "Pretrain/Loss (Raw)": 2.161482810974121, "Pretrain/Step": 10211, "Pretrain/Step Time": 8.485356360673904} +{"Pretrain/Learning Rate": 2.334771309772926e-05, "Pretrain/Loss": 2.000525951385498, "Pretrain/Loss (Raw)": 2.098026752471924, "Pretrain/Step": 10212, "Pretrain/Step Time": 8.487193880602717} +{"Pretrain/Learning Rate": 2.3343477237327656e-05, "Pretrain/Loss": 2.0002307891845703, "Pretrain/Loss (Raw)": 1.9627101421356201, "Pretrain/Step": 10213, "Pretrain/Step Time": 8.482217784970999} +{"Pretrain/Learning Rate": 2.3339241424690713e-05, "Pretrain/Loss": 1.997253656387329, "Pretrain/Loss (Raw)": 1.5080560445785522, "Pretrain/Step": 10214, "Pretrain/Step Time": 8.487189676612616} +{"Pretrain/Learning Rate": 2.3335005659940577e-05, "Pretrain/Loss": 1.999523401260376, "Pretrain/Loss (Raw)": 2.092569351196289, "Pretrain/Step": 10215, "Pretrain/Step Time": 8.484872613102198} +{"Pretrain/Learning Rate": 2.3330769943199375e-05, "Pretrain/Loss": 1.9993425607681274, "Pretrain/Loss (Raw)": 1.8813589811325073, "Pretrain/Step": 10216, "Pretrain/Step Time": 8.484020685777068} +{"Pretrain/Learning Rate": 2.3326534274589244e-05, "Pretrain/Loss": 2.0011000633239746, "Pretrain/Loss (Raw)": 2.1859824657440186, "Pretrain/Step": 10217, "Pretrain/Step Time": 8.48757816106081} +{"Pretrain/Learning Rate": 2.332229865423232e-05, "Pretrain/Loss": 2.000514507293701, "Pretrain/Loss (Raw)": 2.1253116130828857, "Pretrain/Step": 10218, "Pretrain/Step Time": 8.48816891014576} +{"Pretrain/Learning Rate": 2.3318063082250733e-05, "Pretrain/Loss": 1.998970866203308, "Pretrain/Loss (Raw)": 1.9169692993164062, "Pretrain/Step": 10219, "Pretrain/Step Time": 8.485481822863221} +{"Pretrain/Learning Rate": 2.3313827558766613e-05, "Pretrain/Loss": 1.9991661310195923, "Pretrain/Loss (Raw)": 2.018406629562378, "Pretrain/Step": 10220, "Pretrain/Step Time": 8.482083033770323} +{"Pretrain/Learning Rate": 2.3309592083902082e-05, "Pretrain/Loss": 2.000032663345337, "Pretrain/Loss (Raw)": 1.9127110242843628, "Pretrain/Step": 10221, "Pretrain/Step Time": 8.479901850223541} +{"Pretrain/Learning Rate": 2.3305356657779273e-05, "Pretrain/Loss": 1.9994230270385742, "Pretrain/Loss (Raw)": 1.9877653121948242, "Pretrain/Step": 10222, "Pretrain/Step Time": 8.474056709557772} +{"Pretrain/Learning Rate": 2.3301121280520307e-05, "Pretrain/Loss": 1.9995341300964355, "Pretrain/Loss (Raw)": 1.9125661849975586, "Pretrain/Step": 10223, "Pretrain/Step Time": 8.477300755679607} +{"Pretrain/Learning Rate": 2.3296885952247317e-05, "Pretrain/Loss": 1.9996768236160278, "Pretrain/Loss (Raw)": 2.2368555068969727, "Pretrain/Step": 10224, "Pretrain/Step Time": 8.479905113577843} +{"Pretrain/Learning Rate": 2.329265067308242e-05, "Pretrain/Loss": 2.0014500617980957, "Pretrain/Loss (Raw)": 2.1041202545166016, "Pretrain/Step": 10225, "Pretrain/Step Time": 8.478615619242191} +{"Pretrain/Learning Rate": 2.3288415443147733e-05, "Pretrain/Loss": 2.00040864944458, "Pretrain/Loss (Raw)": 1.875647783279419, "Pretrain/Step": 10226, "Pretrain/Step Time": 8.482454674318433} +{"Pretrain/Learning Rate": 2.328418026256538e-05, "Pretrain/Loss": 2.0020761489868164, "Pretrain/Loss (Raw)": 2.0627200603485107, "Pretrain/Step": 10227, "Pretrain/Step Time": 8.479193111881614} +{"Pretrain/Learning Rate": 2.327994513145748e-05, "Pretrain/Loss": 2.002164840698242, "Pretrain/Loss (Raw)": 1.993276596069336, "Pretrain/Step": 10228, "Pretrain/Step Time": 8.485425824299455} +{"Pretrain/Learning Rate": 2.327571004994615e-05, "Pretrain/Loss": 1.9993036985397339, "Pretrain/Loss (Raw)": 1.836714744567871, "Pretrain/Step": 10229, "Pretrain/Step Time": 8.484962657094002} +{"Pretrain/Learning Rate": 2.327147501815351e-05, "Pretrain/Loss": 1.9996193647384644, "Pretrain/Loss (Raw)": 1.8901805877685547, "Pretrain/Step": 10230, "Pretrain/Step Time": 8.488731268793344} +{"Pretrain/Learning Rate": 2.3267240036201666e-05, "Pretrain/Loss": 1.9997334480285645, "Pretrain/Loss (Raw)": 2.051013469696045, "Pretrain/Step": 10231, "Pretrain/Step Time": 8.485023237764835} +{"Pretrain/Learning Rate": 2.326300510421273e-05, "Pretrain/Loss": 1.9993895292282104, "Pretrain/Loss (Raw)": 1.9350699186325073, "Pretrain/Step": 10232, "Pretrain/Step Time": 8.489543657749891} +{"Pretrain/Learning Rate": 2.325877022230882e-05, "Pretrain/Loss": 2.001163959503174, "Pretrain/Loss (Raw)": 2.2028348445892334, "Pretrain/Step": 10233, "Pretrain/Step Time": 8.484163630753756} +{"Pretrain/Learning Rate": 2.3254535390612044e-05, "Pretrain/Loss": 2.0025792121887207, "Pretrain/Loss (Raw)": 2.2079381942749023, "Pretrain/Step": 10234, "Pretrain/Step Time": 8.486875170841813} +{"Pretrain/Learning Rate": 2.3250300609244514e-05, "Pretrain/Loss": 2.0005970001220703, "Pretrain/Loss (Raw)": 1.8470042943954468, "Pretrain/Step": 10235, "Pretrain/Step Time": 8.487286917865276} +{"Pretrain/Learning Rate": 2.3246065878328326e-05, "Pretrain/Loss": 2.002145767211914, "Pretrain/Loss (Raw)": 1.8964452743530273, "Pretrain/Step": 10236, "Pretrain/Step Time": 8.485240587964654} +{"Pretrain/Learning Rate": 2.3241831197985593e-05, "Pretrain/Loss": 2.003063678741455, "Pretrain/Loss (Raw)": 2.112318515777588, "Pretrain/Step": 10237, "Pretrain/Step Time": 8.486957663670182} +{"Pretrain/Learning Rate": 2.3237596568338418e-05, "Pretrain/Loss": 2.0006470680236816, "Pretrain/Loss (Raw)": 1.8326010704040527, "Pretrain/Step": 10238, "Pretrain/Step Time": 8.485687833279371} +{"Pretrain/Learning Rate": 2.3233361989508904e-05, "Pretrain/Loss": 2.0000991821289062, "Pretrain/Loss (Raw)": 2.017957925796509, "Pretrain/Step": 10239, "Pretrain/Step Time": 8.487096808850765} +{"Pretrain/Learning Rate": 2.3229127461619148e-05, "Pretrain/Loss": 2.0002119541168213, "Pretrain/Loss (Raw)": 2.188758373260498, "Pretrain/Step": 10240, "Pretrain/Step Time": 8.48651884496212} +{"Pretrain/Learning Rate": 2.3224892984791262e-05, "Pretrain/Loss": 2.0001258850097656, "Pretrain/Loss (Raw)": 1.7688523530960083, "Pretrain/Step": 10241, "Pretrain/Step Time": 8.485181968659163} +{"Pretrain/Learning Rate": 2.322065855914733e-05, "Pretrain/Loss": 2.0005407333374023, "Pretrain/Loss (Raw)": 2.076951742172241, "Pretrain/Step": 10242, "Pretrain/Step Time": 8.484563270583749} +{"Pretrain/Learning Rate": 2.3216424184809456e-05, "Pretrain/Loss": 1.998691439628601, "Pretrain/Loss (Raw)": 1.7877165079116821, "Pretrain/Step": 10243, "Pretrain/Step Time": 8.490598576143384} +{"Pretrain/Learning Rate": 2.3212189861899732e-05, "Pretrain/Loss": 1.999748945236206, "Pretrain/Loss (Raw)": 2.0032906532287598, "Pretrain/Step": 10244, "Pretrain/Step Time": 8.487779201939702} +{"Pretrain/Learning Rate": 2.3207955590540247e-05, "Pretrain/Loss": 1.9987573623657227, "Pretrain/Loss (Raw)": 2.029243230819702, "Pretrain/Step": 10245, "Pretrain/Step Time": 8.484102241694927} +{"Pretrain/Learning Rate": 2.3203721370853112e-05, "Pretrain/Loss": 2.0003395080566406, "Pretrain/Loss (Raw)": 2.107769250869751, "Pretrain/Step": 10246, "Pretrain/Step Time": 8.48727648332715} +{"Pretrain/Learning Rate": 2.3199487202960395e-05, "Pretrain/Loss": 1.999906301498413, "Pretrain/Loss (Raw)": 1.9774905443191528, "Pretrain/Step": 10247, "Pretrain/Step Time": 8.48705673031509} +{"Pretrain/Learning Rate": 2.3195253086984198e-05, "Pretrain/Loss": 1.9976508617401123, "Pretrain/Loss (Raw)": 1.7472399473190308, "Pretrain/Step": 10248, "Pretrain/Step Time": 8.487158689647913} +{"Pretrain/Learning Rate": 2.3191019023046605e-05, "Pretrain/Loss": 1.9953701496124268, "Pretrain/Loss (Raw)": 1.7543044090270996, "Pretrain/Step": 10249, "Pretrain/Step Time": 8.487640151754022} +{"Pretrain/Learning Rate": 2.3186785011269704e-05, "Pretrain/Loss": 1.995566725730896, "Pretrain/Loss (Raw)": 2.074321746826172, "Pretrain/Step": 10250, "Pretrain/Step Time": 8.483511041849852} +{"Pretrain/Learning Rate": 2.3182551051775587e-05, "Pretrain/Loss": 1.9961822032928467, "Pretrain/Loss (Raw)": 1.9419013261795044, "Pretrain/Step": 10251, "Pretrain/Step Time": 8.481124203652143} +{"Pretrain/Learning Rate": 2.3178317144686317e-05, "Pretrain/Loss": 1.998055100440979, "Pretrain/Loss (Raw)": 2.132845878601074, "Pretrain/Step": 10252, "Pretrain/Step Time": 8.481991553679109} +{"Pretrain/Learning Rate": 2.3174083290123993e-05, "Pretrain/Loss": 1.9988795518875122, "Pretrain/Loss (Raw)": 1.9776368141174316, "Pretrain/Step": 10253, "Pretrain/Step Time": 8.483479944989085} +{"Pretrain/Learning Rate": 2.316984948821069e-05, "Pretrain/Loss": 1.9996848106384277, "Pretrain/Loss (Raw)": 1.9921278953552246, "Pretrain/Step": 10254, "Pretrain/Step Time": 8.483822848647833} +{"Pretrain/Learning Rate": 2.3165615739068486e-05, "Pretrain/Loss": 2.0009374618530273, "Pretrain/Loss (Raw)": 2.2119078636169434, "Pretrain/Step": 10255, "Pretrain/Step Time": 8.483818463981152} +{"Pretrain/Learning Rate": 2.3161382042819463e-05, "Pretrain/Loss": 2.0061941146850586, "Pretrain/Loss (Raw)": 2.4844608306884766, "Pretrain/Step": 10256, "Pretrain/Step Time": 8.485661895945668} +{"Pretrain/Learning Rate": 2.315714839958569e-05, "Pretrain/Loss": 2.007359027862549, "Pretrain/Loss (Raw)": 2.0867137908935547, "Pretrain/Step": 10257, "Pretrain/Step Time": 8.486423566937447} +{"Pretrain/Learning Rate": 2.315291480948924e-05, "Pretrain/Loss": 2.008180618286133, "Pretrain/Loss (Raw)": 2.0020322799682617, "Pretrain/Step": 10258, "Pretrain/Step Time": 8.481849025934935} +{"Pretrain/Learning Rate": 2.3148681272652193e-05, "Pretrain/Loss": 2.0015735626220703, "Pretrain/Loss (Raw)": 1.9164997339248657, "Pretrain/Step": 10259, "Pretrain/Step Time": 8.482907986268401} +{"Pretrain/Learning Rate": 2.3144447789196613e-05, "Pretrain/Loss": 2.0029048919677734, "Pretrain/Loss (Raw)": 1.909184217453003, "Pretrain/Step": 10260, "Pretrain/Step Time": 8.485863151028752} +{"Pretrain/Learning Rate": 2.314021435924458e-05, "Pretrain/Loss": 2.002988576889038, "Pretrain/Loss (Raw)": 2.0604662895202637, "Pretrain/Step": 10261, "Pretrain/Step Time": 8.486405411735177} +{"Pretrain/Learning Rate": 2.3135980982918152e-05, "Pretrain/Loss": 2.000836133956909, "Pretrain/Loss (Raw)": 1.862932562828064, "Pretrain/Step": 10262, "Pretrain/Step Time": 8.486553018912673} +{"Pretrain/Learning Rate": 2.3131747660339394e-05, "Pretrain/Loss": 2.0009448528289795, "Pretrain/Loss (Raw)": 1.9820305109024048, "Pretrain/Step": 10263, "Pretrain/Step Time": 8.490890756249428} +{"Pretrain/Learning Rate": 2.312751439163038e-05, "Pretrain/Loss": 2.000377655029297, "Pretrain/Loss (Raw)": 2.0573415756225586, "Pretrain/Step": 10264, "Pretrain/Step Time": 8.493747614324093} +{"Pretrain/Learning Rate": 2.3123281176913166e-05, "Pretrain/Loss": 2.00020432472229, "Pretrain/Loss (Raw)": 1.9928704500198364, "Pretrain/Step": 10265, "Pretrain/Step Time": 8.486602578312159} +{"Pretrain/Learning Rate": 2.3119048016309817e-05, "Pretrain/Loss": 2.0019705295562744, "Pretrain/Loss (Raw)": 2.031416177749634, "Pretrain/Step": 10266, "Pretrain/Step Time": 8.489452736452222} +{"Pretrain/Learning Rate": 2.3114814909942392e-05, "Pretrain/Loss": 1.9991700649261475, "Pretrain/Loss (Raw)": 1.6608946323394775, "Pretrain/Step": 10267, "Pretrain/Step Time": 8.489424172788858} +{"Pretrain/Learning Rate": 2.311058185793295e-05, "Pretrain/Loss": 1.9985449314117432, "Pretrain/Loss (Raw)": 1.9961092472076416, "Pretrain/Step": 10268, "Pretrain/Step Time": 8.491746917366982} +{"Pretrain/Learning Rate": 2.310634886040355e-05, "Pretrain/Loss": 1.9953103065490723, "Pretrain/Loss (Raw)": 1.5882354974746704, "Pretrain/Step": 10269, "Pretrain/Step Time": 8.497337447479367} +{"Pretrain/Learning Rate": 2.310211591747624e-05, "Pretrain/Loss": 1.9944007396697998, "Pretrain/Loss (Raw)": 1.8136940002441406, "Pretrain/Step": 10270, "Pretrain/Step Time": 8.495773162692785} +{"Pretrain/Learning Rate": 2.309788302927309e-05, "Pretrain/Loss": 1.9934334754943848, "Pretrain/Loss (Raw)": 1.7968419790267944, "Pretrain/Step": 10271, "Pretrain/Step Time": 8.494032578542829} +{"Pretrain/Learning Rate": 2.3093650195916138e-05, "Pretrain/Loss": 1.995492696762085, "Pretrain/Loss (Raw)": 2.2195801734924316, "Pretrain/Step": 10272, "Pretrain/Step Time": 8.494492096826434} +{"Pretrain/Learning Rate": 2.308941741752743e-05, "Pretrain/Loss": 1.9959100484848022, "Pretrain/Loss (Raw)": 2.150059938430786, "Pretrain/Step": 10273, "Pretrain/Step Time": 8.49341455847025} +{"Pretrain/Learning Rate": 2.308518469422903e-05, "Pretrain/Loss": 1.9973440170288086, "Pretrain/Loss (Raw)": 2.068729877471924, "Pretrain/Step": 10274, "Pretrain/Step Time": 8.49919693544507} +{"Pretrain/Learning Rate": 2.308095202614298e-05, "Pretrain/Loss": 1.9978258609771729, "Pretrain/Loss (Raw)": 2.0526247024536133, "Pretrain/Step": 10275, "Pretrain/Step Time": 8.488146374002099} +{"Pretrain/Learning Rate": 2.3076719413391327e-05, "Pretrain/Loss": 1.9969254732131958, "Pretrain/Loss (Raw)": 2.0376853942871094, "Pretrain/Step": 10276, "Pretrain/Step Time": 8.489005709066987} +{"Pretrain/Learning Rate": 2.3072486856096117e-05, "Pretrain/Loss": 1.9968780279159546, "Pretrain/Loss (Raw)": 2.007720708847046, "Pretrain/Step": 10277, "Pretrain/Step Time": 8.490857977420092} +{"Pretrain/Learning Rate": 2.3068254354379383e-05, "Pretrain/Loss": 1.9944005012512207, "Pretrain/Loss (Raw)": 1.7770602703094482, "Pretrain/Step": 10278, "Pretrain/Step Time": 8.496235763654113} +{"Pretrain/Learning Rate": 2.3064021908363173e-05, "Pretrain/Loss": 1.9942022562026978, "Pretrain/Loss (Raw)": 1.8211654424667358, "Pretrain/Step": 10279, "Pretrain/Step Time": 8.487447591498494} +{"Pretrain/Learning Rate": 2.3059789518169528e-05, "Pretrain/Loss": 1.9941086769104004, "Pretrain/Loss (Raw)": 1.9533182382583618, "Pretrain/Step": 10280, "Pretrain/Step Time": 8.490108901634812} +{"Pretrain/Learning Rate": 2.3055557183920484e-05, "Pretrain/Loss": 1.99235999584198, "Pretrain/Loss (Raw)": 1.758895754814148, "Pretrain/Step": 10281, "Pretrain/Step Time": 8.485794255509973} +{"Pretrain/Learning Rate": 2.3051324905738083e-05, "Pretrain/Loss": 1.9913976192474365, "Pretrain/Loss (Raw)": 1.9398113489151, "Pretrain/Step": 10282, "Pretrain/Step Time": 8.484331069514155} +{"Pretrain/Learning Rate": 2.3047092683744348e-05, "Pretrain/Loss": 1.9928004741668701, "Pretrain/Loss (Raw)": 2.192186117172241, "Pretrain/Step": 10283, "Pretrain/Step Time": 8.482890244573355} +{"Pretrain/Learning Rate": 2.3042860518061322e-05, "Pretrain/Loss": 1.9930329322814941, "Pretrain/Loss (Raw)": 2.0651133060455322, "Pretrain/Step": 10284, "Pretrain/Step Time": 8.486509380862117} +{"Pretrain/Learning Rate": 2.303862840881103e-05, "Pretrain/Loss": 1.9932441711425781, "Pretrain/Loss (Raw)": 1.9867900609970093, "Pretrain/Step": 10285, "Pretrain/Step Time": 8.490948550403118} +{"Pretrain/Learning Rate": 2.3034396356115517e-05, "Pretrain/Loss": 1.9917851686477661, "Pretrain/Loss (Raw)": 2.030975818634033, "Pretrain/Step": 10286, "Pretrain/Step Time": 8.489982940256596} +{"Pretrain/Learning Rate": 2.303016436009679e-05, "Pretrain/Loss": 1.991941213607788, "Pretrain/Loss (Raw)": 2.060441493988037, "Pretrain/Step": 10287, "Pretrain/Step Time": 8.483374981209636} +{"Pretrain/Learning Rate": 2.3025932420876882e-05, "Pretrain/Loss": 1.9933220148086548, "Pretrain/Loss (Raw)": 2.149855375289917, "Pretrain/Step": 10288, "Pretrain/Step Time": 8.48131357692182} +{"Pretrain/Learning Rate": 2.3021700538577833e-05, "Pretrain/Loss": 1.9938381910324097, "Pretrain/Loss (Raw)": 2.0789144039154053, "Pretrain/Step": 10289, "Pretrain/Step Time": 8.485314343124628} +{"Pretrain/Learning Rate": 2.3017468713321644e-05, "Pretrain/Loss": 1.9925063848495483, "Pretrain/Loss (Raw)": 1.848061203956604, "Pretrain/Step": 10290, "Pretrain/Step Time": 8.488474901765585} +{"Pretrain/Learning Rate": 2.3013236945230345e-05, "Pretrain/Loss": 1.99226713180542, "Pretrain/Loss (Raw)": 1.922068476676941, "Pretrain/Step": 10291, "Pretrain/Step Time": 8.483842991292477} +{"Pretrain/Learning Rate": 2.3009005234425963e-05, "Pretrain/Loss": 1.993170976638794, "Pretrain/Loss (Raw)": 1.9720730781555176, "Pretrain/Step": 10292, "Pretrain/Step Time": 8.486329717561603} +{"Pretrain/Learning Rate": 2.300477358103051e-05, "Pretrain/Loss": 1.9961591958999634, "Pretrain/Loss (Raw)": 2.1466119289398193, "Pretrain/Step": 10293, "Pretrain/Step Time": 8.48441857099533} +{"Pretrain/Learning Rate": 2.3000541985166006e-05, "Pretrain/Loss": 1.9980096817016602, "Pretrain/Loss (Raw)": 2.1396310329437256, "Pretrain/Step": 10294, "Pretrain/Step Time": 8.480984961614013} +{"Pretrain/Learning Rate": 2.299631044695446e-05, "Pretrain/Loss": 1.9976292848587036, "Pretrain/Loss (Raw)": 1.970436930656433, "Pretrain/Step": 10295, "Pretrain/Step Time": 8.482259606942534} +{"Pretrain/Learning Rate": 2.2992078966517894e-05, "Pretrain/Loss": 1.9975347518920898, "Pretrain/Loss (Raw)": 1.92959463596344, "Pretrain/Step": 10296, "Pretrain/Step Time": 8.476495137438178} +{"Pretrain/Learning Rate": 2.2987847543978313e-05, "Pretrain/Loss": 1.9980366230010986, "Pretrain/Loss (Raw)": 1.9047482013702393, "Pretrain/Step": 10297, "Pretrain/Step Time": 8.476179532706738} +{"Pretrain/Learning Rate": 2.2983616179457728e-05, "Pretrain/Loss": 2.0034313201904297, "Pretrain/Loss (Raw)": 2.5020322799682617, "Pretrain/Step": 10298, "Pretrain/Step Time": 8.474146297201514} +{"Pretrain/Learning Rate": 2.297938487307816e-05, "Pretrain/Loss": 2.0031657218933105, "Pretrain/Loss (Raw)": 1.8771320581436157, "Pretrain/Step": 10299, "Pretrain/Step Time": 8.472429042682052} +{"Pretrain/Learning Rate": 2.2975153624961594e-05, "Pretrain/Loss": 2.0087151527404785, "Pretrain/Loss (Raw)": 2.560110569000244, "Pretrain/Step": 10300, "Pretrain/Step Time": 8.472898121923208} +{"Pretrain/Learning Rate": 2.2970922435230046e-05, "Pretrain/Loss": 2.008362054824829, "Pretrain/Loss (Raw)": 2.2684571743011475, "Pretrain/Step": 10301, "Pretrain/Step Time": 8.474154487252235} +{"Pretrain/Learning Rate": 2.296669130400552e-05, "Pretrain/Loss": 2.011152982711792, "Pretrain/Loss (Raw)": 2.171898365020752, "Pretrain/Step": 10302, "Pretrain/Step Time": 8.471995700150728} +{"Pretrain/Learning Rate": 2.2962460231410014e-05, "Pretrain/Loss": 2.0118188858032227, "Pretrain/Loss (Raw)": 2.1752710342407227, "Pretrain/Step": 10303, "Pretrain/Step Time": 8.47103650122881} +{"Pretrain/Learning Rate": 2.2958229217565535e-05, "Pretrain/Loss": 2.009512424468994, "Pretrain/Loss (Raw)": 1.8277429342269897, "Pretrain/Step": 10304, "Pretrain/Step Time": 8.467594189569354} +{"Pretrain/Learning Rate": 2.2953998262594083e-05, "Pretrain/Loss": 2.0100505352020264, "Pretrain/Loss (Raw)": 2.156127691268921, "Pretrain/Step": 10305, "Pretrain/Step Time": 8.470009813085198} +{"Pretrain/Learning Rate": 2.294976736661764e-05, "Pretrain/Loss": 2.01059627532959, "Pretrain/Loss (Raw)": 2.3012940883636475, "Pretrain/Step": 10306, "Pretrain/Step Time": 8.474805815145373} +{"Pretrain/Learning Rate": 2.2945536529758215e-05, "Pretrain/Loss": 2.010303258895874, "Pretrain/Loss (Raw)": 1.9633152484893799, "Pretrain/Step": 10307, "Pretrain/Step Time": 8.475531112402678} +{"Pretrain/Learning Rate": 2.294130575213779e-05, "Pretrain/Loss": 2.00889253616333, "Pretrain/Loss (Raw)": 1.8858639001846313, "Pretrain/Step": 10308, "Pretrain/Step Time": 8.47362756729126} +{"Pretrain/Learning Rate": 2.2937075033878366e-05, "Pretrain/Loss": 2.0094776153564453, "Pretrain/Loss (Raw)": 1.934260368347168, "Pretrain/Step": 10309, "Pretrain/Step Time": 8.471759371459484} +{"Pretrain/Learning Rate": 2.2932844375101933e-05, "Pretrain/Loss": 2.005887031555176, "Pretrain/Loss (Raw)": 1.7366122007369995, "Pretrain/Step": 10310, "Pretrain/Step Time": 8.473725026473403} +{"Pretrain/Learning Rate": 2.2928613775930472e-05, "Pretrain/Loss": 2.00606632232666, "Pretrain/Loss (Raw)": 2.076866865158081, "Pretrain/Step": 10311, "Pretrain/Step Time": 8.473770067095757} +{"Pretrain/Learning Rate": 2.2924383236485968e-05, "Pretrain/Loss": 2.006758213043213, "Pretrain/Loss (Raw)": 2.026364803314209, "Pretrain/Step": 10312, "Pretrain/Step Time": 8.470774095505476} +{"Pretrain/Learning Rate": 2.2920152756890413e-05, "Pretrain/Loss": 2.0047717094421387, "Pretrain/Loss (Raw)": 2.032797336578369, "Pretrain/Step": 10313, "Pretrain/Step Time": 8.469442805275321} +{"Pretrain/Learning Rate": 2.2915922337265787e-05, "Pretrain/Loss": 2.0069355964660645, "Pretrain/Loss (Raw)": 2.1753365993499756, "Pretrain/Step": 10314, "Pretrain/Step Time": 8.473077611997724} +{"Pretrain/Learning Rate": 2.291169197773408e-05, "Pretrain/Loss": 2.006166696548462, "Pretrain/Loss (Raw)": 1.9583271741867065, "Pretrain/Step": 10315, "Pretrain/Step Time": 8.469425169751048} +{"Pretrain/Learning Rate": 2.2907461678417253e-05, "Pretrain/Loss": 2.0060863494873047, "Pretrain/Loss (Raw)": 2.042903423309326, "Pretrain/Step": 10316, "Pretrain/Step Time": 8.467916624620557} +{"Pretrain/Learning Rate": 2.290323143943729e-05, "Pretrain/Loss": 2.006241798400879, "Pretrain/Loss (Raw)": 2.0031626224517822, "Pretrain/Step": 10317, "Pretrain/Step Time": 8.468507073819637} +{"Pretrain/Learning Rate": 2.2899001260916175e-05, "Pretrain/Loss": 2.006366729736328, "Pretrain/Loss (Raw)": 1.9643348455429077, "Pretrain/Step": 10318, "Pretrain/Step Time": 8.464683862403035} +{"Pretrain/Learning Rate": 2.289477114297588e-05, "Pretrain/Loss": 2.006431818008423, "Pretrain/Loss (Raw)": 2.079015016555786, "Pretrain/Step": 10319, "Pretrain/Step Time": 8.4647768586874} +{"Pretrain/Learning Rate": 2.2890541085738375e-05, "Pretrain/Loss": 2.0068821907043457, "Pretrain/Loss (Raw)": 1.930341362953186, "Pretrain/Step": 10320, "Pretrain/Step Time": 8.459292706102133} +{"Pretrain/Learning Rate": 2.288631108932563e-05, "Pretrain/Loss": 2.007479190826416, "Pretrain/Loss (Raw)": 2.021575450897217, "Pretrain/Step": 10321, "Pretrain/Step Time": 8.46421523950994} +{"Pretrain/Learning Rate": 2.2882081153859612e-05, "Pretrain/Loss": 2.0092220306396484, "Pretrain/Loss (Raw)": 2.0033953189849854, "Pretrain/Step": 10322, "Pretrain/Step Time": 8.464679095894098} +{"Pretrain/Learning Rate": 2.287785127946229e-05, "Pretrain/Loss": 2.0078277587890625, "Pretrain/Loss (Raw)": 1.9924123287200928, "Pretrain/Step": 10323, "Pretrain/Step Time": 8.466936754062772} +{"Pretrain/Learning Rate": 2.2873621466255633e-05, "Pretrain/Loss": 2.0075135231018066, "Pretrain/Loss (Raw)": 2.001114845275879, "Pretrain/Step": 10324, "Pretrain/Step Time": 8.463063199073076} +{"Pretrain/Learning Rate": 2.2869391714361604e-05, "Pretrain/Loss": 2.007450819015503, "Pretrain/Loss (Raw)": 1.9666318893432617, "Pretrain/Step": 10325, "Pretrain/Step Time": 8.459758488461375} +{"Pretrain/Learning Rate": 2.286516202390216e-05, "Pretrain/Loss": 2.0082693099975586, "Pretrain/Loss (Raw)": 2.0252296924591064, "Pretrain/Step": 10326, "Pretrain/Step Time": 8.461954295635223} +{"Pretrain/Learning Rate": 2.2860932394999264e-05, "Pretrain/Loss": 2.0064220428466797, "Pretrain/Loss (Raw)": 1.953580379486084, "Pretrain/Step": 10327, "Pretrain/Step Time": 8.461906362324953} +{"Pretrain/Learning Rate": 2.2856702827774874e-05, "Pretrain/Loss": 2.0058774948120117, "Pretrain/Loss (Raw)": 1.939677119255066, "Pretrain/Step": 10328, "Pretrain/Step Time": 8.462161464616656} +{"Pretrain/Learning Rate": 2.285247332235095e-05, "Pretrain/Loss": 2.0035743713378906, "Pretrain/Loss (Raw)": 1.7957096099853516, "Pretrain/Step": 10329, "Pretrain/Step Time": 8.45938959158957} +{"Pretrain/Learning Rate": 2.2848243878849443e-05, "Pretrain/Loss": 2.0018110275268555, "Pretrain/Loss (Raw)": 1.7872428894042969, "Pretrain/Step": 10330, "Pretrain/Step Time": 8.458085656166077} +{"Pretrain/Learning Rate": 2.2844014497392304e-05, "Pretrain/Loss": 2.001870632171631, "Pretrain/Loss (Raw)": 1.85579514503479, "Pretrain/Step": 10331, "Pretrain/Step Time": 8.459576742723584} +{"Pretrain/Learning Rate": 2.2839785178101488e-05, "Pretrain/Loss": 2.000002384185791, "Pretrain/Loss (Raw)": 1.7552587985992432, "Pretrain/Step": 10332, "Pretrain/Step Time": 8.465440114960074} +{"Pretrain/Learning Rate": 2.2835555921098944e-05, "Pretrain/Loss": 2.000575304031372, "Pretrain/Loss (Raw)": 2.211754083633423, "Pretrain/Step": 10333, "Pretrain/Step Time": 8.461688116192818} +{"Pretrain/Learning Rate": 2.2831326726506617e-05, "Pretrain/Loss": 2.0027637481689453, "Pretrain/Loss (Raw)": 2.198814868927002, "Pretrain/Step": 10334, "Pretrain/Step Time": 8.460310524329543} +{"Pretrain/Learning Rate": 2.2827097594446464e-05, "Pretrain/Loss": 2.0041770935058594, "Pretrain/Loss (Raw)": 2.0941460132598877, "Pretrain/Step": 10335, "Pretrain/Step Time": 8.461534148082137} +{"Pretrain/Learning Rate": 2.2822868525040413e-05, "Pretrain/Loss": 2.0036487579345703, "Pretrain/Loss (Raw)": 1.923150897026062, "Pretrain/Step": 10336, "Pretrain/Step Time": 8.460473919287324} +{"Pretrain/Learning Rate": 2.2818639518410414e-05, "Pretrain/Loss": 2.0018014907836914, "Pretrain/Loss (Raw)": 1.849884033203125, "Pretrain/Step": 10337, "Pretrain/Step Time": 8.4584259390831} +{"Pretrain/Learning Rate": 2.2814410574678404e-05, "Pretrain/Loss": 2.0024991035461426, "Pretrain/Loss (Raw)": 2.2300853729248047, "Pretrain/Step": 10338, "Pretrain/Step Time": 8.462515659630299} +{"Pretrain/Learning Rate": 2.281018169396633e-05, "Pretrain/Loss": 2.00114369392395, "Pretrain/Loss (Raw)": 1.9879906177520752, "Pretrain/Step": 10339, "Pretrain/Step Time": 8.464600384235382} +{"Pretrain/Learning Rate": 2.2805952876396117e-05, "Pretrain/Loss": 2.0014114379882812, "Pretrain/Loss (Raw)": 2.132310628890991, "Pretrain/Step": 10340, "Pretrain/Step Time": 8.463899821043015} +{"Pretrain/Learning Rate": 2.2801724122089714e-05, "Pretrain/Loss": 2.0024759769439697, "Pretrain/Loss (Raw)": 2.098970413208008, "Pretrain/Step": 10341, "Pretrain/Step Time": 8.460486808791757} +{"Pretrain/Learning Rate": 2.2797495431169043e-05, "Pretrain/Loss": 2.006514549255371, "Pretrain/Loss (Raw)": 2.0249717235565186, "Pretrain/Step": 10342, "Pretrain/Step Time": 8.45560490526259} +{"Pretrain/Learning Rate": 2.2793266803756033e-05, "Pretrain/Loss": 2.004538059234619, "Pretrain/Loss (Raw)": 1.8395729064941406, "Pretrain/Step": 10343, "Pretrain/Step Time": 8.456776838749647} +{"Pretrain/Learning Rate": 2.2789038239972625e-05, "Pretrain/Loss": 2.00339412689209, "Pretrain/Loss (Raw)": 1.7349413633346558, "Pretrain/Step": 10344, "Pretrain/Step Time": 8.461418436840177} +{"Pretrain/Learning Rate": 2.2784809739940736e-05, "Pretrain/Loss": 2.0028011798858643, "Pretrain/Loss (Raw)": 2.1101062297821045, "Pretrain/Step": 10345, "Pretrain/Step Time": 8.451163141056895} +{"Pretrain/Learning Rate": 2.2780581303782303e-05, "Pretrain/Loss": 2.001110076904297, "Pretrain/Loss (Raw)": 1.9088224172592163, "Pretrain/Step": 10346, "Pretrain/Step Time": 8.451853930950165} +{"Pretrain/Learning Rate": 2.277635293161924e-05, "Pretrain/Loss": 1.9993348121643066, "Pretrain/Loss (Raw)": 1.6897480487823486, "Pretrain/Step": 10347, "Pretrain/Step Time": 8.458722814917564} +{"Pretrain/Learning Rate": 2.277212462357347e-05, "Pretrain/Loss": 2.0001535415649414, "Pretrain/Loss (Raw)": 2.123196601867676, "Pretrain/Step": 10348, "Pretrain/Step Time": 8.45967803709209} +{"Pretrain/Learning Rate": 2.276789637976692e-05, "Pretrain/Loss": 2.0016276836395264, "Pretrain/Loss (Raw)": 2.101428985595703, "Pretrain/Step": 10349, "Pretrain/Step Time": 8.463380742818117} +{"Pretrain/Learning Rate": 2.2763668200321502e-05, "Pretrain/Loss": 2.001919746398926, "Pretrain/Loss (Raw)": 2.0251524448394775, "Pretrain/Step": 10350, "Pretrain/Step Time": 8.468090903013945} +{"Pretrain/Learning Rate": 2.275944008535914e-05, "Pretrain/Loss": 2.003702163696289, "Pretrain/Loss (Raw)": 2.1407008171081543, "Pretrain/Step": 10351, "Pretrain/Step Time": 8.46234418079257} +{"Pretrain/Learning Rate": 2.2755212035001737e-05, "Pretrain/Loss": 2.002262592315674, "Pretrain/Loss (Raw)": 2.0525970458984375, "Pretrain/Step": 10352, "Pretrain/Step Time": 8.46240497380495} +{"Pretrain/Learning Rate": 2.2750984049371215e-05, "Pretrain/Loss": 2.0013513565063477, "Pretrain/Loss (Raw)": 1.9874666929244995, "Pretrain/Step": 10353, "Pretrain/Step Time": 8.4597196765244} +{"Pretrain/Learning Rate": 2.2746756128589485e-05, "Pretrain/Loss": 2.0035743713378906, "Pretrain/Loss (Raw)": 2.1601905822753906, "Pretrain/Step": 10354, "Pretrain/Step Time": 8.458277143537998} +{"Pretrain/Learning Rate": 2.2742528272778447e-05, "Pretrain/Loss": 2.002683639526367, "Pretrain/Loss (Raw)": 1.948716640472412, "Pretrain/Step": 10355, "Pretrain/Step Time": 8.460536159574986} +{"Pretrain/Learning Rate": 2.2738300482060025e-05, "Pretrain/Loss": 2.004321575164795, "Pretrain/Loss (Raw)": 2.202946901321411, "Pretrain/Step": 10356, "Pretrain/Step Time": 8.460629627108574} +{"Pretrain/Learning Rate": 2.2734072756556106e-05, "Pretrain/Loss": 2.006901502609253, "Pretrain/Loss (Raw)": 2.1669347286224365, "Pretrain/Step": 10357, "Pretrain/Step Time": 8.460173282772303} +{"Pretrain/Learning Rate": 2.2729845096388602e-05, "Pretrain/Loss": 2.008631706237793, "Pretrain/Loss (Raw)": 2.1116199493408203, "Pretrain/Step": 10358, "Pretrain/Step Time": 8.45241280645132} +{"Pretrain/Learning Rate": 2.2725617501679415e-05, "Pretrain/Loss": 2.010220527648926, "Pretrain/Loss (Raw)": 2.254426956176758, "Pretrain/Step": 10359, "Pretrain/Step Time": 8.452658217400312} +{"Pretrain/Learning Rate": 2.2721389972550446e-05, "Pretrain/Loss": 2.0119667053222656, "Pretrain/Loss (Raw)": 2.1585443019866943, "Pretrain/Step": 10360, "Pretrain/Step Time": 8.454495193436742} +{"Pretrain/Learning Rate": 2.2717162509123592e-05, "Pretrain/Loss": 2.010315179824829, "Pretrain/Loss (Raw)": 1.9914741516113281, "Pretrain/Step": 10361, "Pretrain/Step Time": 8.453615128993988} +{"Pretrain/Learning Rate": 2.2712935111520747e-05, "Pretrain/Loss": 2.008869171142578, "Pretrain/Loss (Raw)": 2.0228421688079834, "Pretrain/Step": 10362, "Pretrain/Step Time": 8.454046284779906} +{"Pretrain/Learning Rate": 2.27087077798638e-05, "Pretrain/Loss": 2.0107803344726562, "Pretrain/Loss (Raw)": 2.0916390419006348, "Pretrain/Step": 10363, "Pretrain/Step Time": 8.454896122217178} +{"Pretrain/Learning Rate": 2.2704480514274656e-05, "Pretrain/Loss": 2.013848304748535, "Pretrain/Loss (Raw)": 2.2891123294830322, "Pretrain/Step": 10364, "Pretrain/Step Time": 8.456357762217522} +{"Pretrain/Learning Rate": 2.2700253314875196e-05, "Pretrain/Loss": 2.0131325721740723, "Pretrain/Loss (Raw)": 2.020728349685669, "Pretrain/Step": 10365, "Pretrain/Step Time": 8.454925766214728} +{"Pretrain/Learning Rate": 2.2696026181787313e-05, "Pretrain/Loss": 2.013979434967041, "Pretrain/Loss (Raw)": 1.9409863948822021, "Pretrain/Step": 10366, "Pretrain/Step Time": 8.453889396041632} +{"Pretrain/Learning Rate": 2.2691799115132885e-05, "Pretrain/Loss": 2.01275634765625, "Pretrain/Loss (Raw)": 1.8613966703414917, "Pretrain/Step": 10367, "Pretrain/Step Time": 8.453690193593502} +{"Pretrain/Learning Rate": 2.2687572115033806e-05, "Pretrain/Loss": 2.011141777038574, "Pretrain/Loss (Raw)": 1.982112169265747, "Pretrain/Step": 10368, "Pretrain/Step Time": 8.452272614464164} +{"Pretrain/Learning Rate": 2.2683345181611955e-05, "Pretrain/Loss": 2.0137410163879395, "Pretrain/Loss (Raw)": 2.1015615463256836, "Pretrain/Step": 10369, "Pretrain/Step Time": 8.450518809258938} +{"Pretrain/Learning Rate": 2.267911831498922e-05, "Pretrain/Loss": 2.014711618423462, "Pretrain/Loss (Raw)": 2.2011640071868896, "Pretrain/Step": 10370, "Pretrain/Step Time": 8.451187532395124} +{"Pretrain/Learning Rate": 2.2674891515287463e-05, "Pretrain/Loss": 2.0165441036224365, "Pretrain/Loss (Raw)": 2.022289276123047, "Pretrain/Step": 10371, "Pretrain/Step Time": 8.44732515886426} +{"Pretrain/Learning Rate": 2.267066478262857e-05, "Pretrain/Loss": 2.0167019367218018, "Pretrain/Loss (Raw)": 2.023489236831665, "Pretrain/Step": 10372, "Pretrain/Step Time": 8.44861107133329} +{"Pretrain/Learning Rate": 2.2666438117134415e-05, "Pretrain/Loss": 2.0146946907043457, "Pretrain/Loss (Raw)": 1.7723262310028076, "Pretrain/Step": 10373, "Pretrain/Step Time": 8.452312527224422} +{"Pretrain/Learning Rate": 2.266221151892688e-05, "Pretrain/Loss": 2.0126123428344727, "Pretrain/Loss (Raw)": 1.8412339687347412, "Pretrain/Step": 10374, "Pretrain/Step Time": 8.449472684413195} +{"Pretrain/Learning Rate": 2.265798498812782e-05, "Pretrain/Loss": 2.0113210678100586, "Pretrain/Loss (Raw)": 1.8121819496154785, "Pretrain/Step": 10375, "Pretrain/Step Time": 8.444968098774552} +{"Pretrain/Learning Rate": 2.2653758524859112e-05, "Pretrain/Loss": 2.0127692222595215, "Pretrain/Loss (Raw)": 1.9326320886611938, "Pretrain/Step": 10376, "Pretrain/Step Time": 8.44484688155353} +{"Pretrain/Learning Rate": 2.2649532129242623e-05, "Pretrain/Loss": 2.0166711807250977, "Pretrain/Loss (Raw)": 2.253754138946533, "Pretrain/Step": 10377, "Pretrain/Step Time": 8.443760879337788} +{"Pretrain/Learning Rate": 2.2645305801400218e-05, "Pretrain/Loss": 2.013657808303833, "Pretrain/Loss (Raw)": 1.6885981559753418, "Pretrain/Step": 10378, "Pretrain/Step Time": 8.449808355420828} +{"Pretrain/Learning Rate": 2.2641079541453765e-05, "Pretrain/Loss": 2.0136678218841553, "Pretrain/Loss (Raw)": 1.9431835412979126, "Pretrain/Step": 10379, "Pretrain/Step Time": 8.451999925076962} +{"Pretrain/Learning Rate": 2.2636853349525118e-05, "Pretrain/Loss": 2.0129780769348145, "Pretrain/Loss (Raw)": 2.044560432434082, "Pretrain/Step": 10380, "Pretrain/Step Time": 8.452769996598363} +{"Pretrain/Learning Rate": 2.263262722573614e-05, "Pretrain/Loss": 2.0130057334899902, "Pretrain/Loss (Raw)": 1.9811989068984985, "Pretrain/Step": 10381, "Pretrain/Step Time": 8.45132665336132} +{"Pretrain/Learning Rate": 2.2628401170208683e-05, "Pretrain/Loss": 2.011427402496338, "Pretrain/Loss (Raw)": 1.7900766134262085, "Pretrain/Step": 10382, "Pretrain/Step Time": 8.450795805081725} +{"Pretrain/Learning Rate": 2.2624175183064607e-05, "Pretrain/Loss": 2.008953094482422, "Pretrain/Loss (Raw)": 1.8951956033706665, "Pretrain/Step": 10383, "Pretrain/Step Time": 8.449737139046192} +{"Pretrain/Learning Rate": 2.261994926442577e-05, "Pretrain/Loss": 2.0018959045410156, "Pretrain/Loss (Raw)": 1.5811421871185303, "Pretrain/Step": 10384, "Pretrain/Step Time": 8.45440468005836} +{"Pretrain/Learning Rate": 2.2615723414414014e-05, "Pretrain/Loss": 2.001136064529419, "Pretrain/Loss (Raw)": 1.9894506931304932, "Pretrain/Step": 10385, "Pretrain/Step Time": 8.452787896618247} +{"Pretrain/Learning Rate": 2.261149763315119e-05, "Pretrain/Loss": 2.0004501342773438, "Pretrain/Loss (Raw)": 1.9141958951950073, "Pretrain/Step": 10386, "Pretrain/Step Time": 8.453655529767275} +{"Pretrain/Learning Rate": 2.2607271920759153e-05, "Pretrain/Loss": 2.0022473335266113, "Pretrain/Loss (Raw)": 2.146571397781372, "Pretrain/Step": 10387, "Pretrain/Step Time": 8.45309230312705} +{"Pretrain/Learning Rate": 2.260304627735974e-05, "Pretrain/Loss": 2.0018768310546875, "Pretrain/Loss (Raw)": 1.8617442846298218, "Pretrain/Step": 10388, "Pretrain/Step Time": 8.453095311298966} +{"Pretrain/Learning Rate": 2.25988207030748e-05, "Pretrain/Loss": 2.000244379043579, "Pretrain/Loss (Raw)": 1.8515393733978271, "Pretrain/Step": 10389, "Pretrain/Step Time": 8.451267257332802} +{"Pretrain/Learning Rate": 2.259459519802617e-05, "Pretrain/Loss": 2.0020337104797363, "Pretrain/Loss (Raw)": 2.0919458866119385, "Pretrain/Step": 10390, "Pretrain/Step Time": 8.443599000573158} +{"Pretrain/Learning Rate": 2.2590369762335695e-05, "Pretrain/Loss": 2.00254487991333, "Pretrain/Loss (Raw)": 2.047466993331909, "Pretrain/Step": 10391, "Pretrain/Step Time": 8.441820899024606} +{"Pretrain/Learning Rate": 2.2586144396125204e-05, "Pretrain/Loss": 2.0023293495178223, "Pretrain/Loss (Raw)": 2.0297842025756836, "Pretrain/Step": 10392, "Pretrain/Step Time": 8.443915171548724} +{"Pretrain/Learning Rate": 2.2581919099516542e-05, "Pretrain/Loss": 2.0012400150299072, "Pretrain/Loss (Raw)": 1.853410005569458, "Pretrain/Step": 10393, "Pretrain/Step Time": 8.446406777948141} +{"Pretrain/Learning Rate": 2.2577693872631543e-05, "Pretrain/Loss": 2.002328634262085, "Pretrain/Loss (Raw)": 2.170754909515381, "Pretrain/Step": 10394, "Pretrain/Step Time": 8.440489461645484} +{"Pretrain/Learning Rate": 2.2573468715592024e-05, "Pretrain/Loss": 2.004333734512329, "Pretrain/Loss (Raw)": 1.9175550937652588, "Pretrain/Step": 10395, "Pretrain/Step Time": 8.441601226106286} +{"Pretrain/Learning Rate": 2.2569243628519828e-05, "Pretrain/Loss": 2.005875587463379, "Pretrain/Loss (Raw)": 2.1934728622436523, "Pretrain/Step": 10396, "Pretrain/Step Time": 8.440752288326621} +{"Pretrain/Learning Rate": 2.256501861153678e-05, "Pretrain/Loss": 2.008848190307617, "Pretrain/Loss (Raw)": 1.9687291383743286, "Pretrain/Step": 10397, "Pretrain/Step Time": 8.434728484600782} +{"Pretrain/Learning Rate": 2.2560793664764698e-05, "Pretrain/Loss": 2.011849880218506, "Pretrain/Loss (Raw)": 2.1979176998138428, "Pretrain/Step": 10398, "Pretrain/Step Time": 8.437326956540346} +{"Pretrain/Learning Rate": 2.255656878832542e-05, "Pretrain/Loss": 2.013364315032959, "Pretrain/Loss (Raw)": 1.9906704425811768, "Pretrain/Step": 10399, "Pretrain/Step Time": 8.440666848793626} +{"Pretrain/Learning Rate": 2.2552343982340753e-05, "Pretrain/Loss": 2.012014865875244, "Pretrain/Loss (Raw)": 2.0468688011169434, "Pretrain/Step": 10400, "Pretrain/Step Time": 8.444083046168089} +{"Pretrain/Learning Rate": 2.2548119246932524e-05, "Pretrain/Loss": 2.01159930229187, "Pretrain/Loss (Raw)": 2.096855401992798, "Pretrain/Step": 10401, "Pretrain/Step Time": 8.44364975206554} +{"Pretrain/Learning Rate": 2.2543894582222543e-05, "Pretrain/Loss": 2.0098705291748047, "Pretrain/Loss (Raw)": 1.8474153280258179, "Pretrain/Step": 10402, "Pretrain/Step Time": 8.441527035087347} +{"Pretrain/Learning Rate": 2.253966998833263e-05, "Pretrain/Loss": 2.009617805480957, "Pretrain/Loss (Raw)": 2.0203113555908203, "Pretrain/Step": 10403, "Pretrain/Step Time": 8.446724439039826} +{"Pretrain/Learning Rate": 2.253544546538461e-05, "Pretrain/Loss": 2.0114331245422363, "Pretrain/Loss (Raw)": 2.2700393199920654, "Pretrain/Step": 10404, "Pretrain/Step Time": 8.44859397597611} +{"Pretrain/Learning Rate": 2.253122101350027e-05, "Pretrain/Loss": 2.0118021965026855, "Pretrain/Loss (Raw)": 2.0549581050872803, "Pretrain/Step": 10405, "Pretrain/Step Time": 8.444998811930418} +{"Pretrain/Learning Rate": 2.252699663280144e-05, "Pretrain/Loss": 2.014207363128662, "Pretrain/Loss (Raw)": 2.0849196910858154, "Pretrain/Step": 10406, "Pretrain/Step Time": 8.441062537953258} +{"Pretrain/Learning Rate": 2.2522772323409913e-05, "Pretrain/Loss": 2.0128798484802246, "Pretrain/Loss (Raw)": 1.6512715816497803, "Pretrain/Step": 10407, "Pretrain/Step Time": 8.442834762856364} +{"Pretrain/Learning Rate": 2.25185480854475e-05, "Pretrain/Loss": 2.0133957862854004, "Pretrain/Loss (Raw)": 2.019355297088623, "Pretrain/Step": 10408, "Pretrain/Step Time": 8.44366448931396} +{"Pretrain/Learning Rate": 2.2514323919036008e-05, "Pretrain/Loss": 2.015939712524414, "Pretrain/Loss (Raw)": 2.084517240524292, "Pretrain/Step": 10409, "Pretrain/Step Time": 8.446912406012416} +{"Pretrain/Learning Rate": 2.251009982429723e-05, "Pretrain/Loss": 2.016071319580078, "Pretrain/Loss (Raw)": 1.9566471576690674, "Pretrain/Step": 10410, "Pretrain/Step Time": 8.445672824978828} +{"Pretrain/Learning Rate": 2.250587580135297e-05, "Pretrain/Loss": 2.014718532562256, "Pretrain/Loss (Raw)": 2.0190200805664062, "Pretrain/Step": 10411, "Pretrain/Step Time": 8.444627257063985} +{"Pretrain/Learning Rate": 2.2501651850325023e-05, "Pretrain/Loss": 2.0135207176208496, "Pretrain/Loss (Raw)": 1.9117907285690308, "Pretrain/Step": 10412, "Pretrain/Step Time": 8.446971084922552} +{"Pretrain/Learning Rate": 2.2497427971335184e-05, "Pretrain/Loss": 2.013211488723755, "Pretrain/Loss (Raw)": 1.9472121000289917, "Pretrain/Step": 10413, "Pretrain/Step Time": 8.44500757008791} +{"Pretrain/Learning Rate": 2.249320416450524e-05, "Pretrain/Loss": 2.014308214187622, "Pretrain/Loss (Raw)": 2.1713433265686035, "Pretrain/Step": 10414, "Pretrain/Step Time": 8.449248539283872} +{"Pretrain/Learning Rate": 2.2488980429956997e-05, "Pretrain/Loss": 2.014678955078125, "Pretrain/Loss (Raw)": 2.1079154014587402, "Pretrain/Step": 10415, "Pretrain/Step Time": 8.456314966082573} +{"Pretrain/Learning Rate": 2.2484756767812227e-05, "Pretrain/Loss": 2.0132319927215576, "Pretrain/Loss (Raw)": 1.9646397829055786, "Pretrain/Step": 10416, "Pretrain/Step Time": 8.45733430981636} +{"Pretrain/Learning Rate": 2.248053317819272e-05, "Pretrain/Loss": 2.0136587619781494, "Pretrain/Loss (Raw)": 2.133559465408325, "Pretrain/Step": 10417, "Pretrain/Step Time": 8.455848444253206} +{"Pretrain/Learning Rate": 2.2476309661220266e-05, "Pretrain/Loss": 2.01444149017334, "Pretrain/Loss (Raw)": 1.948233962059021, "Pretrain/Step": 10418, "Pretrain/Step Time": 8.448443472385406} +{"Pretrain/Learning Rate": 2.247208621701664e-05, "Pretrain/Loss": 2.013331890106201, "Pretrain/Loss (Raw)": 1.780019760131836, "Pretrain/Step": 10419, "Pretrain/Step Time": 8.452151475474238} +{"Pretrain/Learning Rate": 2.2467862845703636e-05, "Pretrain/Loss": 2.0146093368530273, "Pretrain/Loss (Raw)": 2.1356215476989746, "Pretrain/Step": 10420, "Pretrain/Step Time": 8.450850624591112} +{"Pretrain/Learning Rate": 2.2463639547403014e-05, "Pretrain/Loss": 2.0163064002990723, "Pretrain/Loss (Raw)": 2.3638391494750977, "Pretrain/Step": 10421, "Pretrain/Step Time": 8.451143136247993} +{"Pretrain/Learning Rate": 2.2459416322236555e-05, "Pretrain/Loss": 2.015713691711426, "Pretrain/Loss (Raw)": 2.063735008239746, "Pretrain/Step": 10422, "Pretrain/Step Time": 8.45334998704493} +{"Pretrain/Learning Rate": 2.245519317032604e-05, "Pretrain/Loss": 2.015596389770508, "Pretrain/Loss (Raw)": 1.9554163217544556, "Pretrain/Step": 10423, "Pretrain/Step Time": 8.45323383063078} +{"Pretrain/Learning Rate": 2.2450970091793232e-05, "Pretrain/Loss": 2.0167312622070312, "Pretrain/Loss (Raw)": 2.074864625930786, "Pretrain/Step": 10424, "Pretrain/Step Time": 8.455708274617791} +{"Pretrain/Learning Rate": 2.2446747086759916e-05, "Pretrain/Loss": 2.014616012573242, "Pretrain/Loss (Raw)": 1.634009838104248, "Pretrain/Step": 10425, "Pretrain/Step Time": 8.460895819589496} +{"Pretrain/Learning Rate": 2.2442524155347834e-05, "Pretrain/Loss": 2.010434150695801, "Pretrain/Loss (Raw)": 1.9667621850967407, "Pretrain/Step": 10426, "Pretrain/Step Time": 8.457611506804824} +{"Pretrain/Learning Rate": 2.243830129767877e-05, "Pretrain/Loss": 2.0135581493377686, "Pretrain/Loss (Raw)": 2.2769975662231445, "Pretrain/Step": 10427, "Pretrain/Step Time": 8.464378036558628} +{"Pretrain/Learning Rate": 2.243407851387448e-05, "Pretrain/Loss": 2.0079877376556396, "Pretrain/Loss (Raw)": 1.847089409828186, "Pretrain/Step": 10428, "Pretrain/Step Time": 8.462350143119693} +{"Pretrain/Learning Rate": 2.2429855804056732e-05, "Pretrain/Loss": 2.003718852996826, "Pretrain/Loss (Raw)": 1.7220706939697266, "Pretrain/Step": 10429, "Pretrain/Step Time": 8.466703444719315} +{"Pretrain/Learning Rate": 2.242563316834728e-05, "Pretrain/Loss": 2.00184965133667, "Pretrain/Loss (Raw)": 1.9325929880142212, "Pretrain/Step": 10430, "Pretrain/Step Time": 8.463666398078203} +{"Pretrain/Learning Rate": 2.242141060686788e-05, "Pretrain/Loss": 1.999087929725647, "Pretrain/Loss (Raw)": 1.8217793703079224, "Pretrain/Step": 10431, "Pretrain/Step Time": 8.466243775561452} +{"Pretrain/Learning Rate": 2.2417188119740284e-05, "Pretrain/Loss": 2.0017662048339844, "Pretrain/Loss (Raw)": 2.1705803871154785, "Pretrain/Step": 10432, "Pretrain/Step Time": 8.466635523363948} +{"Pretrain/Learning Rate": 2.2412965707086246e-05, "Pretrain/Loss": 2.0004501342773438, "Pretrain/Loss (Raw)": 1.9876765012741089, "Pretrain/Step": 10433, "Pretrain/Step Time": 8.465748347342014} +{"Pretrain/Learning Rate": 2.2408743369027524e-05, "Pretrain/Loss": 1.9987655878067017, "Pretrain/Loss (Raw)": 2.0856525897979736, "Pretrain/Step": 10434, "Pretrain/Step Time": 8.460788425058126} +{"Pretrain/Learning Rate": 2.2404521105685862e-05, "Pretrain/Loss": 2.001646041870117, "Pretrain/Loss (Raw)": 2.33198881149292, "Pretrain/Step": 10435, "Pretrain/Step Time": 8.460026372224092} +{"Pretrain/Learning Rate": 2.2400298917183e-05, "Pretrain/Loss": 2.002107858657837, "Pretrain/Loss (Raw)": 1.945011019706726, "Pretrain/Step": 10436, "Pretrain/Step Time": 8.457743776962161} +{"Pretrain/Learning Rate": 2.2396076803640684e-05, "Pretrain/Loss": 2.003971576690674, "Pretrain/Loss (Raw)": 2.1728034019470215, "Pretrain/Step": 10437, "Pretrain/Step Time": 8.457936571910977} +{"Pretrain/Learning Rate": 2.239185476518066e-05, "Pretrain/Loss": 2.006793737411499, "Pretrain/Loss (Raw)": 2.097839117050171, "Pretrain/Step": 10438, "Pretrain/Step Time": 8.45977890305221} +{"Pretrain/Learning Rate": 2.238763280192466e-05, "Pretrain/Loss": 2.006666660308838, "Pretrain/Loss (Raw)": 2.0606181621551514, "Pretrain/Step": 10439, "Pretrain/Step Time": 8.457991065457463} +{"Pretrain/Learning Rate": 2.2383410913994436e-05, "Pretrain/Loss": 2.007171392440796, "Pretrain/Loss (Raw)": 2.0909736156463623, "Pretrain/Step": 10440, "Pretrain/Step Time": 8.462191376835108} +{"Pretrain/Learning Rate": 2.2379189101511712e-05, "Pretrain/Loss": 2.00827693939209, "Pretrain/Loss (Raw)": 2.174325704574585, "Pretrain/Step": 10441, "Pretrain/Step Time": 8.463451949879527} +{"Pretrain/Learning Rate": 2.2374967364598222e-05, "Pretrain/Loss": 2.0081634521484375, "Pretrain/Loss (Raw)": 2.1607882976531982, "Pretrain/Step": 10442, "Pretrain/Step Time": 8.461960725486279} +{"Pretrain/Learning Rate": 2.237074570337569e-05, "Pretrain/Loss": 2.008867025375366, "Pretrain/Loss (Raw)": 2.0483851432800293, "Pretrain/Step": 10443, "Pretrain/Step Time": 8.463897431269288} +{"Pretrain/Learning Rate": 2.2366524117965857e-05, "Pretrain/Loss": 2.007978916168213, "Pretrain/Loss (Raw)": 1.929248571395874, "Pretrain/Step": 10444, "Pretrain/Step Time": 8.466017523780465} +{"Pretrain/Learning Rate": 2.2362302608490448e-05, "Pretrain/Loss": 2.007556676864624, "Pretrain/Loss (Raw)": 1.9491103887557983, "Pretrain/Step": 10445, "Pretrain/Step Time": 8.468516629189253} +{"Pretrain/Learning Rate": 2.2358081175071187e-05, "Pretrain/Loss": 2.010986566543579, "Pretrain/Loss (Raw)": 2.4033284187316895, "Pretrain/Step": 10446, "Pretrain/Step Time": 8.467979719862342} +{"Pretrain/Learning Rate": 2.2353859817829783e-05, "Pretrain/Loss": 2.011742353439331, "Pretrain/Loss (Raw)": 2.1757705211639404, "Pretrain/Step": 10447, "Pretrain/Step Time": 8.468528980389237} +{"Pretrain/Learning Rate": 2.2349638536887972e-05, "Pretrain/Loss": 2.0116569995880127, "Pretrain/Loss (Raw)": 1.9194151163101196, "Pretrain/Step": 10448, "Pretrain/Step Time": 8.473028905689716} +{"Pretrain/Learning Rate": 2.234541733236746e-05, "Pretrain/Loss": 2.0124332904815674, "Pretrain/Loss (Raw)": 2.12095046043396, "Pretrain/Step": 10449, "Pretrain/Step Time": 8.469727681949735} +{"Pretrain/Learning Rate": 2.234119620438997e-05, "Pretrain/Loss": 2.0119102001190186, "Pretrain/Loss (Raw)": 1.9364333152770996, "Pretrain/Step": 10450, "Pretrain/Step Time": 8.468159480020404} +{"Pretrain/Learning Rate": 2.233697515307722e-05, "Pretrain/Loss": 2.0126194953918457, "Pretrain/Loss (Raw)": 2.0831775665283203, "Pretrain/Step": 10451, "Pretrain/Step Time": 8.46962852962315} +{"Pretrain/Learning Rate": 2.2332754178550908e-05, "Pretrain/Loss": 2.0142598152160645, "Pretrain/Loss (Raw)": 2.2110955715179443, "Pretrain/Step": 10452, "Pretrain/Step Time": 8.470252726227045} +{"Pretrain/Learning Rate": 2.232853328093275e-05, "Pretrain/Loss": 2.015376329421997, "Pretrain/Loss (Raw)": 2.109546422958374, "Pretrain/Step": 10453, "Pretrain/Step Time": 8.474107900634408} +{"Pretrain/Learning Rate": 2.232431246034446e-05, "Pretrain/Loss": 2.0160226821899414, "Pretrain/Loss (Raw)": 2.107978343963623, "Pretrain/Step": 10454, "Pretrain/Step Time": 8.473469303920865} +{"Pretrain/Learning Rate": 2.2320091716907723e-05, "Pretrain/Loss": 2.016947031021118, "Pretrain/Loss (Raw)": 2.071876287460327, "Pretrain/Step": 10455, "Pretrain/Step Time": 8.473662247881293} +{"Pretrain/Learning Rate": 2.231587105074425e-05, "Pretrain/Loss": 2.0180933475494385, "Pretrain/Loss (Raw)": 2.086435079574585, "Pretrain/Step": 10456, "Pretrain/Step Time": 8.475814258679748} +{"Pretrain/Learning Rate": 2.2311650461975745e-05, "Pretrain/Loss": 2.0195953845977783, "Pretrain/Loss (Raw)": 1.9879539012908936, "Pretrain/Step": 10457, "Pretrain/Step Time": 8.475664233788848} +{"Pretrain/Learning Rate": 2.2307429950723914e-05, "Pretrain/Loss": 2.0206151008605957, "Pretrain/Loss (Raw)": 1.917747139930725, "Pretrain/Step": 10458, "Pretrain/Step Time": 8.476406630128622} +{"Pretrain/Learning Rate": 2.230320951711043e-05, "Pretrain/Loss": 2.0240914821624756, "Pretrain/Loss (Raw)": 2.300783157348633, "Pretrain/Step": 10459, "Pretrain/Step Time": 8.47471166960895} +{"Pretrain/Learning Rate": 2.2298989161257005e-05, "Pretrain/Loss": 2.024535655975342, "Pretrain/Loss (Raw)": 1.8121519088745117, "Pretrain/Step": 10460, "Pretrain/Step Time": 8.476404670625925} +{"Pretrain/Learning Rate": 2.2294768883285318e-05, "Pretrain/Loss": 2.0240466594696045, "Pretrain/Loss (Raw)": 2.149122714996338, "Pretrain/Step": 10461, "Pretrain/Step Time": 8.48095641285181} +{"Pretrain/Learning Rate": 2.2290548683317068e-05, "Pretrain/Loss": 2.0216126441955566, "Pretrain/Loss (Raw)": 1.8872510194778442, "Pretrain/Step": 10462, "Pretrain/Step Time": 8.476349450647831} +{"Pretrain/Learning Rate": 2.2286328561473936e-05, "Pretrain/Loss": 2.020443916320801, "Pretrain/Loss (Raw)": 1.9445563554763794, "Pretrain/Step": 10463, "Pretrain/Step Time": 8.475830517709255} +{"Pretrain/Learning Rate": 2.2282108517877607e-05, "Pretrain/Loss": 2.020461082458496, "Pretrain/Loss (Raw)": 1.9253751039505005, "Pretrain/Step": 10464, "Pretrain/Step Time": 8.481522846966982} +{"Pretrain/Learning Rate": 2.2277888552649763e-05, "Pretrain/Loss": 2.0224831104278564, "Pretrain/Loss (Raw)": 2.108684778213501, "Pretrain/Step": 10465, "Pretrain/Step Time": 8.479121249169111} +{"Pretrain/Learning Rate": 2.2273668665912077e-05, "Pretrain/Loss": 2.0206894874572754, "Pretrain/Loss (Raw)": 2.0004897117614746, "Pretrain/Step": 10466, "Pretrain/Step Time": 8.47512019239366} +{"Pretrain/Learning Rate": 2.226944885778624e-05, "Pretrain/Loss": 2.0201120376586914, "Pretrain/Loss (Raw)": 1.9140846729278564, "Pretrain/Step": 10467, "Pretrain/Step Time": 8.474517622962594} +{"Pretrain/Learning Rate": 2.2265229128393926e-05, "Pretrain/Loss": 2.020596504211426, "Pretrain/Loss (Raw)": 2.194355010986328, "Pretrain/Step": 10468, "Pretrain/Step Time": 8.476276580244303} +{"Pretrain/Learning Rate": 2.2261009477856792e-05, "Pretrain/Loss": 2.019533395767212, "Pretrain/Loss (Raw)": 1.9628689289093018, "Pretrain/Step": 10469, "Pretrain/Step Time": 8.47468381933868} +{"Pretrain/Learning Rate": 2.2256789906296522e-05, "Pretrain/Loss": 2.018838405609131, "Pretrain/Loss (Raw)": 1.935998797416687, "Pretrain/Step": 10470, "Pretrain/Step Time": 8.479639384895563} +{"Pretrain/Learning Rate": 2.2252570413834778e-05, "Pretrain/Loss": 2.017381191253662, "Pretrain/Loss (Raw)": 1.6530261039733887, "Pretrain/Step": 10471, "Pretrain/Step Time": 8.476723147556186} +{"Pretrain/Learning Rate": 2.2248351000593233e-05, "Pretrain/Loss": 2.0204997062683105, "Pretrain/Loss (Raw)": 2.1341757774353027, "Pretrain/Step": 10472, "Pretrain/Step Time": 8.476648516952991} +{"Pretrain/Learning Rate": 2.2244131666693542e-05, "Pretrain/Loss": 2.0199077129364014, "Pretrain/Loss (Raw)": 2.034287929534912, "Pretrain/Step": 10473, "Pretrain/Step Time": 8.480852289125323} +{"Pretrain/Learning Rate": 2.2239912412257383e-05, "Pretrain/Loss": 2.019906520843506, "Pretrain/Loss (Raw)": 1.908698320388794, "Pretrain/Step": 10474, "Pretrain/Step Time": 8.48026262037456} +{"Pretrain/Learning Rate": 2.2235693237406397e-05, "Pretrain/Loss": 2.021167755126953, "Pretrain/Loss (Raw)": 1.8511873483657837, "Pretrain/Step": 10475, "Pretrain/Step Time": 8.476263219490647} +{"Pretrain/Learning Rate": 2.2231474142262247e-05, "Pretrain/Loss": 2.0205976963043213, "Pretrain/Loss (Raw)": 2.050229549407959, "Pretrain/Step": 10476, "Pretrain/Step Time": 8.486334415152669} +{"Pretrain/Learning Rate": 2.2227255126946586e-05, "Pretrain/Loss": 2.019843816757202, "Pretrain/Loss (Raw)": 2.004908323287964, "Pretrain/Step": 10477, "Pretrain/Step Time": 8.486168684437871} +{"Pretrain/Learning Rate": 2.222303619158107e-05, "Pretrain/Loss": 2.0205626487731934, "Pretrain/Loss (Raw)": 2.117185592651367, "Pretrain/Step": 10478, "Pretrain/Step Time": 8.478907292708755} +{"Pretrain/Learning Rate": 2.2218817336287355e-05, "Pretrain/Loss": 2.0174407958984375, "Pretrain/Loss (Raw)": 1.7410717010498047, "Pretrain/Step": 10479, "Pretrain/Step Time": 8.478537369519472} +{"Pretrain/Learning Rate": 2.2214598561187077e-05, "Pretrain/Loss": 2.017571449279785, "Pretrain/Loss (Raw)": 2.069347620010376, "Pretrain/Step": 10480, "Pretrain/Step Time": 8.480402670800686} +{"Pretrain/Learning Rate": 2.2210379866401883e-05, "Pretrain/Loss": 2.018155336380005, "Pretrain/Loss (Raw)": 2.062183380126953, "Pretrain/Step": 10481, "Pretrain/Step Time": 8.485654408112168} +{"Pretrain/Learning Rate": 2.220616125205342e-05, "Pretrain/Loss": 2.0155858993530273, "Pretrain/Loss (Raw)": 1.8313242197036743, "Pretrain/Step": 10482, "Pretrain/Step Time": 8.484324829652905} +{"Pretrain/Learning Rate": 2.2201942718263326e-05, "Pretrain/Loss": 2.0146446228027344, "Pretrain/Loss (Raw)": 1.828208088874817, "Pretrain/Step": 10483, "Pretrain/Step Time": 8.480716535821557} +{"Pretrain/Learning Rate": 2.219772426515325e-05, "Pretrain/Loss": 2.0114312171936035, "Pretrain/Loss (Raw)": 1.7916380167007446, "Pretrain/Step": 10484, "Pretrain/Step Time": 8.476397830992937} +{"Pretrain/Learning Rate": 2.2193505892844813e-05, "Pretrain/Loss": 2.0120182037353516, "Pretrain/Loss (Raw)": 2.2420690059661865, "Pretrain/Step": 10485, "Pretrain/Step Time": 8.475737929344177} +{"Pretrain/Learning Rate": 2.2189287601459653e-05, "Pretrain/Loss": 2.0123047828674316, "Pretrain/Loss (Raw)": 2.148327112197876, "Pretrain/Step": 10486, "Pretrain/Step Time": 8.478004017844796} +{"Pretrain/Learning Rate": 2.2185069391119405e-05, "Pretrain/Loss": 2.0100765228271484, "Pretrain/Loss (Raw)": 1.9692009687423706, "Pretrain/Step": 10487, "Pretrain/Step Time": 8.482865134254098} +{"Pretrain/Learning Rate": 2.2180851261945697e-05, "Pretrain/Loss": 2.009458303451538, "Pretrain/Loss (Raw)": 2.079413652420044, "Pretrain/Step": 10488, "Pretrain/Step Time": 8.475158171728253} +{"Pretrain/Learning Rate": 2.2176633214060165e-05, "Pretrain/Loss": 2.009676456451416, "Pretrain/Loss (Raw)": 2.0193989276885986, "Pretrain/Step": 10489, "Pretrain/Step Time": 8.479208137840033} +{"Pretrain/Learning Rate": 2.217241524758441e-05, "Pretrain/Loss": 2.0101282596588135, "Pretrain/Loss (Raw)": 2.0806641578674316, "Pretrain/Step": 10490, "Pretrain/Step Time": 8.47674679197371} +{"Pretrain/Learning Rate": 2.2168197362640074e-05, "Pretrain/Loss": 2.0097556114196777, "Pretrain/Loss (Raw)": 2.0439507961273193, "Pretrain/Step": 10491, "Pretrain/Step Time": 8.476641401648521} +{"Pretrain/Learning Rate": 2.216397955934877e-05, "Pretrain/Loss": 2.007643938064575, "Pretrain/Loss (Raw)": 2.0188002586364746, "Pretrain/Step": 10492, "Pretrain/Step Time": 8.47964977659285} +{"Pretrain/Learning Rate": 2.2159761837832114e-05, "Pretrain/Loss": 2.006735324859619, "Pretrain/Loss (Raw)": 1.9044383764266968, "Pretrain/Step": 10493, "Pretrain/Step Time": 8.481479993090034} +{"Pretrain/Learning Rate": 2.2155544198211732e-05, "Pretrain/Loss": 2.006680727005005, "Pretrain/Loss (Raw)": 1.933992624282837, "Pretrain/Step": 10494, "Pretrain/Step Time": 8.480422291904688} +{"Pretrain/Learning Rate": 2.215132664060922e-05, "Pretrain/Loss": 2.008047580718994, "Pretrain/Loss (Raw)": 2.0363636016845703, "Pretrain/Step": 10495, "Pretrain/Step Time": 8.480415027588606} +{"Pretrain/Learning Rate": 2.2147109165146195e-05, "Pretrain/Loss": 2.0114481449127197, "Pretrain/Loss (Raw)": 2.417362689971924, "Pretrain/Step": 10496, "Pretrain/Step Time": 8.481334598734975} +{"Pretrain/Learning Rate": 2.214289177194427e-05, "Pretrain/Loss": 2.012068271636963, "Pretrain/Loss (Raw)": 2.180940628051758, "Pretrain/Step": 10497, "Pretrain/Step Time": 8.482202786952257} +{"Pretrain/Learning Rate": 2.2138674461125042e-05, "Pretrain/Loss": 2.011301279067993, "Pretrain/Loss (Raw)": 2.102998971939087, "Pretrain/Step": 10498, "Pretrain/Step Time": 8.481647359207273} +{"Pretrain/Learning Rate": 2.2134457232810125e-05, "Pretrain/Loss": 2.010855197906494, "Pretrain/Loss (Raw)": 1.9651798009872437, "Pretrain/Step": 10499, "Pretrain/Step Time": 8.482712056487799} +{"Pretrain/Learning Rate": 2.213024008712111e-05, "Pretrain/Loss": 2.010108470916748, "Pretrain/Loss (Raw)": 1.9278874397277832, "Pretrain/Step": 10500, "Pretrain/Step Time": 8.481698624789715} +{"Pretrain/Learning Rate": 2.21260230241796e-05, "Pretrain/Loss": 2.0113420486450195, "Pretrain/Loss (Raw)": 1.93022620677948, "Pretrain/Step": 10501, "Pretrain/Step Time": 8.48117177002132} +{"Pretrain/Learning Rate": 2.212180604410719e-05, "Pretrain/Loss": 2.013388156890869, "Pretrain/Loss (Raw)": 2.103158473968506, "Pretrain/Step": 10502, "Pretrain/Step Time": 8.481336629018188} +{"Pretrain/Learning Rate": 2.2117589147025468e-05, "Pretrain/Loss": 2.0164685249328613, "Pretrain/Loss (Raw)": 2.2064507007598877, "Pretrain/Step": 10503, "Pretrain/Step Time": 8.482120452448726} +{"Pretrain/Learning Rate": 2.2113372333056042e-05, "Pretrain/Loss": 2.0180721282958984, "Pretrain/Loss (Raw)": 2.1379151344299316, "Pretrain/Step": 10504, "Pretrain/Step Time": 8.4803107958287} +{"Pretrain/Learning Rate": 2.2109155602320482e-05, "Pretrain/Loss": 2.015542507171631, "Pretrain/Loss (Raw)": 1.9299460649490356, "Pretrain/Step": 10505, "Pretrain/Step Time": 8.47947346419096} +{"Pretrain/Learning Rate": 2.2104938954940384e-05, "Pretrain/Loss": 2.0198731422424316, "Pretrain/Loss (Raw)": 2.2429399490356445, "Pretrain/Step": 10506, "Pretrain/Step Time": 8.47840541601181} +{"Pretrain/Learning Rate": 2.210072239103733e-05, "Pretrain/Loss": 2.021810293197632, "Pretrain/Loss (Raw)": 2.1911404132843018, "Pretrain/Step": 10507, "Pretrain/Step Time": 8.480549024417996} +{"Pretrain/Learning Rate": 2.20965059107329e-05, "Pretrain/Loss": 2.0211713314056396, "Pretrain/Loss (Raw)": 1.9627501964569092, "Pretrain/Step": 10508, "Pretrain/Step Time": 8.480762714520097} +{"Pretrain/Learning Rate": 2.209228951414868e-05, "Pretrain/Loss": 2.020869731903076, "Pretrain/Loss (Raw)": 1.9425818920135498, "Pretrain/Step": 10509, "Pretrain/Step Time": 8.4873279761523} +{"Pretrain/Learning Rate": 2.2088073201406246e-05, "Pretrain/Loss": 2.0230798721313477, "Pretrain/Loss (Raw)": 2.0729990005493164, "Pretrain/Step": 10510, "Pretrain/Step Time": 8.48971812427044} +{"Pretrain/Learning Rate": 2.208385697262716e-05, "Pretrain/Loss": 2.022582530975342, "Pretrain/Loss (Raw)": 1.8315601348876953, "Pretrain/Step": 10511, "Pretrain/Step Time": 8.487748323008418} +{"Pretrain/Learning Rate": 2.2079640827933005e-05, "Pretrain/Loss": 2.0266170501708984, "Pretrain/Loss (Raw)": 2.097536563873291, "Pretrain/Step": 10512, "Pretrain/Step Time": 8.488090613856912} +{"Pretrain/Learning Rate": 2.2075424767445346e-05, "Pretrain/Loss": 2.0264151096343994, "Pretrain/Loss (Raw)": 1.9636309146881104, "Pretrain/Step": 10513, "Pretrain/Step Time": 8.48834639787674} +{"Pretrain/Learning Rate": 2.2071208791285753e-05, "Pretrain/Loss": 2.0270938873291016, "Pretrain/Loss (Raw)": 2.0010595321655273, "Pretrain/Step": 10514, "Pretrain/Step Time": 8.489358028396964} +{"Pretrain/Learning Rate": 2.2066992899575796e-05, "Pretrain/Loss": 2.027836322784424, "Pretrain/Loss (Raw)": 2.241602659225464, "Pretrain/Step": 10515, "Pretrain/Step Time": 8.485821513459086} +{"Pretrain/Learning Rate": 2.2062777092437023e-05, "Pretrain/Loss": 2.029203176498413, "Pretrain/Loss (Raw)": 2.0366904735565186, "Pretrain/Step": 10516, "Pretrain/Step Time": 8.484263233840466} +{"Pretrain/Learning Rate": 2.2058561369991004e-05, "Pretrain/Loss": 2.0289456844329834, "Pretrain/Loss (Raw)": 1.8185780048370361, "Pretrain/Step": 10517, "Pretrain/Step Time": 8.482259128242731} +{"Pretrain/Learning Rate": 2.2054345732359295e-05, "Pretrain/Loss": 2.0306100845336914, "Pretrain/Loss (Raw)": 2.3049957752227783, "Pretrain/Step": 10518, "Pretrain/Step Time": 8.4884572327137} +{"Pretrain/Learning Rate": 2.205013017966345e-05, "Pretrain/Loss": 2.029232978820801, "Pretrain/Loss (Raw)": 1.871191382408142, "Pretrain/Step": 10519, "Pretrain/Step Time": 8.48944167420268} +{"Pretrain/Learning Rate": 2.2045914712025027e-05, "Pretrain/Loss": 2.0295817852020264, "Pretrain/Loss (Raw)": 2.0744261741638184, "Pretrain/Step": 10520, "Pretrain/Step Time": 8.48718255572021} +{"Pretrain/Learning Rate": 2.2041699329565565e-05, "Pretrain/Loss": 2.03004789352417, "Pretrain/Loss (Raw)": 1.913077473640442, "Pretrain/Step": 10521, "Pretrain/Step Time": 8.486491000279784} +{"Pretrain/Learning Rate": 2.203748403240662e-05, "Pretrain/Loss": 2.029621124267578, "Pretrain/Loss (Raw)": 2.1161391735076904, "Pretrain/Step": 10522, "Pretrain/Step Time": 8.490447985008359} +{"Pretrain/Learning Rate": 2.2033268820669728e-05, "Pretrain/Loss": 2.0298125743865967, "Pretrain/Loss (Raw)": 1.9420727491378784, "Pretrain/Step": 10523, "Pretrain/Step Time": 8.4948357809335} +{"Pretrain/Learning Rate": 2.2029053694476442e-05, "Pretrain/Loss": 2.0274391174316406, "Pretrain/Loss (Raw)": 1.8896522521972656, "Pretrain/Step": 10524, "Pretrain/Step Time": 8.49446819536388} +{"Pretrain/Learning Rate": 2.2024838653948304e-05, "Pretrain/Loss": 2.0278987884521484, "Pretrain/Loss (Raw)": 2.027562379837036, "Pretrain/Step": 10525, "Pretrain/Step Time": 8.493762006983161} +{"Pretrain/Learning Rate": 2.202062369920684e-05, "Pretrain/Loss": 2.0266289710998535, "Pretrain/Loss (Raw)": 2.0353939533233643, "Pretrain/Step": 10526, "Pretrain/Step Time": 8.493324667215347} +{"Pretrain/Learning Rate": 2.2016408830373595e-05, "Pretrain/Loss": 2.027585744857788, "Pretrain/Loss (Raw)": 2.113133192062378, "Pretrain/Step": 10527, "Pretrain/Step Time": 8.490900302305818} +{"Pretrain/Learning Rate": 2.2012194047570095e-05, "Pretrain/Loss": 2.0266597270965576, "Pretrain/Loss (Raw)": 1.9283379316329956, "Pretrain/Step": 10528, "Pretrain/Step Time": 8.485856100916862} +{"Pretrain/Learning Rate": 2.2007979350917872e-05, "Pretrain/Loss": 2.0245611667633057, "Pretrain/Loss (Raw)": 1.828243374824524, "Pretrain/Step": 10529, "Pretrain/Step Time": 8.488406075164676} +{"Pretrain/Learning Rate": 2.2003764740538462e-05, "Pretrain/Loss": 2.0268852710723877, "Pretrain/Loss (Raw)": 2.144890308380127, "Pretrain/Step": 10530, "Pretrain/Step Time": 8.48675605840981} +{"Pretrain/Learning Rate": 2.1999550216553377e-05, "Pretrain/Loss": 2.0255959033966064, "Pretrain/Loss (Raw)": 1.855276107788086, "Pretrain/Step": 10531, "Pretrain/Step Time": 8.485376216471195} +{"Pretrain/Learning Rate": 2.199533577908415e-05, "Pretrain/Loss": 2.0235280990600586, "Pretrain/Loss (Raw)": 2.005362033843994, "Pretrain/Step": 10532, "Pretrain/Step Time": 8.481773959472775} +{"Pretrain/Learning Rate": 2.1991121428252293e-05, "Pretrain/Loss": 2.022475004196167, "Pretrain/Loss (Raw)": 1.920164704322815, "Pretrain/Step": 10533, "Pretrain/Step Time": 8.485181599855423} +{"Pretrain/Learning Rate": 2.1986907164179333e-05, "Pretrain/Loss": 2.0224862098693848, "Pretrain/Loss (Raw)": 2.0863468647003174, "Pretrain/Step": 10534, "Pretrain/Step Time": 8.487679505720735} +{"Pretrain/Learning Rate": 2.1982692986986782e-05, "Pretrain/Loss": 2.0257420539855957, "Pretrain/Loss (Raw)": 2.068000555038452, "Pretrain/Step": 10535, "Pretrain/Step Time": 8.484154280275106} +{"Pretrain/Learning Rate": 2.197847889679615e-05, "Pretrain/Loss": 2.026632308959961, "Pretrain/Loss (Raw)": 2.1333260536193848, "Pretrain/Step": 10536, "Pretrain/Step Time": 8.481391403824091} +{"Pretrain/Learning Rate": 2.1974264893728944e-05, "Pretrain/Loss": 2.0247862339019775, "Pretrain/Loss (Raw)": 1.848205327987671, "Pretrain/Step": 10537, "Pretrain/Step Time": 8.482820300385356} +{"Pretrain/Learning Rate": 2.197005097790669e-05, "Pretrain/Loss": 2.026404619216919, "Pretrain/Loss (Raw)": 2.163832426071167, "Pretrain/Step": 10538, "Pretrain/Step Time": 8.482329547405243} +{"Pretrain/Learning Rate": 2.1965837149450873e-05, "Pretrain/Loss": 2.0282156467437744, "Pretrain/Loss (Raw)": 2.2508323192596436, "Pretrain/Step": 10539, "Pretrain/Step Time": 8.484566681087017} +{"Pretrain/Learning Rate": 2.1961623408482997e-05, "Pretrain/Loss": 2.0278007984161377, "Pretrain/Loss (Raw)": 1.8586827516555786, "Pretrain/Step": 10540, "Pretrain/Step Time": 8.47940637357533} +{"Pretrain/Learning Rate": 2.1957409755124572e-05, "Pretrain/Loss": 2.027589797973633, "Pretrain/Loss (Raw)": 1.920188069343567, "Pretrain/Step": 10541, "Pretrain/Step Time": 8.480820572003722} +{"Pretrain/Learning Rate": 2.195319618949709e-05, "Pretrain/Loss": 2.026803970336914, "Pretrain/Loss (Raw)": 2.070767402648926, "Pretrain/Step": 10542, "Pretrain/Step Time": 8.477258848026395} +{"Pretrain/Learning Rate": 2.1948982711722053e-05, "Pretrain/Loss": 2.025692939758301, "Pretrain/Loss (Raw)": 1.9657185077667236, "Pretrain/Step": 10543, "Pretrain/Step Time": 8.480110643431544} +{"Pretrain/Learning Rate": 2.1944769321920945e-05, "Pretrain/Loss": 2.025543212890625, "Pretrain/Loss (Raw)": 1.9454472064971924, "Pretrain/Step": 10544, "Pretrain/Step Time": 8.478439301252365} +{"Pretrain/Learning Rate": 2.194055602021526e-05, "Pretrain/Loss": 2.02270770072937, "Pretrain/Loss (Raw)": 1.7706184387207031, "Pretrain/Step": 10545, "Pretrain/Step Time": 8.477904977276921} +{"Pretrain/Learning Rate": 2.1936342806726485e-05, "Pretrain/Loss": 2.0234062671661377, "Pretrain/Loss (Raw)": 2.0376555919647217, "Pretrain/Step": 10546, "Pretrain/Step Time": 8.48139807023108} +{"Pretrain/Learning Rate": 2.1932129681576105e-05, "Pretrain/Loss": 2.0236337184906006, "Pretrain/Loss (Raw)": 1.809147596359253, "Pretrain/Step": 10547, "Pretrain/Step Time": 8.480373410508037} +{"Pretrain/Learning Rate": 2.1927916644885608e-05, "Pretrain/Loss": 2.021824598312378, "Pretrain/Loss (Raw)": 1.9040300846099854, "Pretrain/Step": 10548, "Pretrain/Step Time": 8.479213697835803} +{"Pretrain/Learning Rate": 2.192370369677646e-05, "Pretrain/Loss": 2.0198974609375, "Pretrain/Loss (Raw)": 2.117184638977051, "Pretrain/Step": 10549, "Pretrain/Step Time": 8.478615082800388} +{"Pretrain/Learning Rate": 2.1919490837370153e-05, "Pretrain/Loss": 2.0177032947540283, "Pretrain/Loss (Raw)": 1.7828946113586426, "Pretrain/Step": 10550, "Pretrain/Step Time": 8.4751618783921} +{"Pretrain/Learning Rate": 2.1915278066788155e-05, "Pretrain/Loss": 2.0170068740844727, "Pretrain/Loss (Raw)": 1.8662415742874146, "Pretrain/Step": 10551, "Pretrain/Step Time": 8.477671632543206} +{"Pretrain/Learning Rate": 2.1911065385151938e-05, "Pretrain/Loss": 2.0174646377563477, "Pretrain/Loss (Raw)": 2.1334831714630127, "Pretrain/Step": 10552, "Pretrain/Step Time": 8.473541650921106} +{"Pretrain/Learning Rate": 2.190685279258298e-05, "Pretrain/Loss": 2.0220913887023926, "Pretrain/Loss (Raw)": 2.2262234687805176, "Pretrain/Step": 10553, "Pretrain/Step Time": 8.47025048546493} +{"Pretrain/Learning Rate": 2.1902640289202732e-05, "Pretrain/Loss": 2.0218698978424072, "Pretrain/Loss (Raw)": 1.938418984413147, "Pretrain/Step": 10554, "Pretrain/Step Time": 8.473127584904432} +{"Pretrain/Learning Rate": 2.189842787513267e-05, "Pretrain/Loss": 2.019422769546509, "Pretrain/Loss (Raw)": 1.9637672901153564, "Pretrain/Step": 10555, "Pretrain/Step Time": 8.467546397820115} +{"Pretrain/Learning Rate": 2.1894215550494257e-05, "Pretrain/Loss": 2.0222861766815186, "Pretrain/Loss (Raw)": 2.2135918140411377, "Pretrain/Step": 10556, "Pretrain/Step Time": 8.466183105483651} +{"Pretrain/Learning Rate": 2.1890003315408947e-05, "Pretrain/Loss": 2.0244672298431396, "Pretrain/Loss (Raw)": 2.0012431144714355, "Pretrain/Step": 10557, "Pretrain/Step Time": 8.463888917118311} +{"Pretrain/Learning Rate": 2.1885791169998203e-05, "Pretrain/Loss": 2.024994373321533, "Pretrain/Loss (Raw)": 2.0000951290130615, "Pretrain/Step": 10558, "Pretrain/Step Time": 8.46757085248828} +{"Pretrain/Learning Rate": 2.188157911438347e-05, "Pretrain/Loss": 2.026569366455078, "Pretrain/Loss (Raw)": 2.02337646484375, "Pretrain/Step": 10559, "Pretrain/Step Time": 8.468857605010271} +{"Pretrain/Learning Rate": 2.1877367148686207e-05, "Pretrain/Loss": 2.025940418243408, "Pretrain/Loss (Raw)": 2.090045928955078, "Pretrain/Step": 10560, "Pretrain/Step Time": 8.472637437283993} +{"Pretrain/Learning Rate": 2.187315527302786e-05, "Pretrain/Loss": 2.023822784423828, "Pretrain/Loss (Raw)": 1.716628074645996, "Pretrain/Step": 10561, "Pretrain/Step Time": 8.474307090044022} +{"Pretrain/Learning Rate": 2.1868943487529875e-05, "Pretrain/Loss": 2.0231595039367676, "Pretrain/Loss (Raw)": 2.0007691383361816, "Pretrain/Step": 10562, "Pretrain/Step Time": 8.475661057978868} +{"Pretrain/Learning Rate": 2.1864731792313703e-05, "Pretrain/Loss": 2.0194835662841797, "Pretrain/Loss (Raw)": 1.8614388704299927, "Pretrain/Step": 10563, "Pretrain/Step Time": 8.475553520023823} +{"Pretrain/Learning Rate": 2.1860520187500775e-05, "Pretrain/Loss": 2.020476818084717, "Pretrain/Loss (Raw)": 2.0721676349639893, "Pretrain/Step": 10564, "Pretrain/Step Time": 8.475686160847545} +{"Pretrain/Learning Rate": 2.1856308673212535e-05, "Pretrain/Loss": 2.0175158977508545, "Pretrain/Loss (Raw)": 1.7937941551208496, "Pretrain/Step": 10565, "Pretrain/Step Time": 8.477746611461043} +{"Pretrain/Learning Rate": 2.1852097249570417e-05, "Pretrain/Loss": 2.0179524421691895, "Pretrain/Loss (Raw)": 2.1537203788757324, "Pretrain/Step": 10566, "Pretrain/Step Time": 8.47465137951076} +{"Pretrain/Learning Rate": 2.1847885916695854e-05, "Pretrain/Loss": 2.0158748626708984, "Pretrain/Loss (Raw)": 1.7947107553482056, "Pretrain/Step": 10567, "Pretrain/Step Time": 8.47559972666204} +{"Pretrain/Learning Rate": 2.1843674674710285e-05, "Pretrain/Loss": 2.0139341354370117, "Pretrain/Loss (Raw)": 1.8425579071044922, "Pretrain/Step": 10568, "Pretrain/Step Time": 8.473623123019934} +{"Pretrain/Learning Rate": 2.183946352373513e-05, "Pretrain/Loss": 2.0144894123077393, "Pretrain/Loss (Raw)": 2.2453784942626953, "Pretrain/Step": 10569, "Pretrain/Step Time": 8.469789035618305} +{"Pretrain/Learning Rate": 2.1835252463891813e-05, "Pretrain/Loss": 2.0142297744750977, "Pretrain/Loss (Raw)": 2.1275525093078613, "Pretrain/Step": 10570, "Pretrain/Step Time": 8.469766417518258} +{"Pretrain/Learning Rate": 2.183104149530176e-05, "Pretrain/Loss": 2.0141892433166504, "Pretrain/Loss (Raw)": 2.043224573135376, "Pretrain/Step": 10571, "Pretrain/Step Time": 8.46867217682302} +{"Pretrain/Learning Rate": 2.182683061808639e-05, "Pretrain/Loss": 2.018367290496826, "Pretrain/Loss (Raw)": 2.4640190601348877, "Pretrain/Step": 10572, "Pretrain/Step Time": 8.471835544332862} +{"Pretrain/Learning Rate": 2.1822619832367126e-05, "Pretrain/Loss": 2.01650333404541, "Pretrain/Loss (Raw)": 1.710511326789856, "Pretrain/Step": 10573, "Pretrain/Step Time": 8.467097949236631} +{"Pretrain/Learning Rate": 2.1818409138265385e-05, "Pretrain/Loss": 2.011495590209961, "Pretrain/Loss (Raw)": 1.7623578310012817, "Pretrain/Step": 10574, "Pretrain/Step Time": 8.471418904140592} +{"Pretrain/Learning Rate": 2.1814198535902563e-05, "Pretrain/Loss": 2.0094099044799805, "Pretrain/Loss (Raw)": 1.9087930917739868, "Pretrain/Step": 10575, "Pretrain/Step Time": 8.46704120375216} +{"Pretrain/Learning Rate": 2.1809988025400085e-05, "Pretrain/Loss": 2.0108678340911865, "Pretrain/Loss (Raw)": 2.106038808822632, "Pretrain/Step": 10576, "Pretrain/Step Time": 8.468538735061884} +{"Pretrain/Learning Rate": 2.180577760687935e-05, "Pretrain/Loss": 2.01035737991333, "Pretrain/Loss (Raw)": 2.0555994510650635, "Pretrain/Step": 10577, "Pretrain/Step Time": 8.467213667929173} +{"Pretrain/Learning Rate": 2.1801567280461768e-05, "Pretrain/Loss": 2.0108680725097656, "Pretrain/Loss (Raw)": 2.001797676086426, "Pretrain/Step": 10578, "Pretrain/Step Time": 8.468200001865625} +{"Pretrain/Learning Rate": 2.1797357046268746e-05, "Pretrain/Loss": 2.0106711387634277, "Pretrain/Loss (Raw)": 2.0579564571380615, "Pretrain/Step": 10579, "Pretrain/Step Time": 8.467237330973148} +{"Pretrain/Learning Rate": 2.1793146904421668e-05, "Pretrain/Loss": 2.009819507598877, "Pretrain/Loss (Raw)": 2.1021029949188232, "Pretrain/Step": 10580, "Pretrain/Step Time": 8.464326702058315} +{"Pretrain/Learning Rate": 2.1788936855041938e-05, "Pretrain/Loss": 2.0095908641815186, "Pretrain/Loss (Raw)": 2.080275297164917, "Pretrain/Step": 10581, "Pretrain/Step Time": 8.465945640578866} +{"Pretrain/Learning Rate": 2.1784726898250952e-05, "Pretrain/Loss": 2.0086240768432617, "Pretrain/Loss (Raw)": 1.984252691268921, "Pretrain/Step": 10582, "Pretrain/Step Time": 8.464726243168116} +{"Pretrain/Learning Rate": 2.1780517034170098e-05, "Pretrain/Loss": 2.00844407081604, "Pretrain/Loss (Raw)": 2.0488290786743164, "Pretrain/Step": 10583, "Pretrain/Step Time": 8.46504970639944} +{"Pretrain/Learning Rate": 2.177630726292077e-05, "Pretrain/Loss": 2.0065701007843018, "Pretrain/Loss (Raw)": 1.8465569019317627, "Pretrain/Step": 10584, "Pretrain/Step Time": 8.462836656719446} +{"Pretrain/Learning Rate": 2.1772097584624345e-05, "Pretrain/Loss": 2.006246566772461, "Pretrain/Loss (Raw)": 1.9465395212173462, "Pretrain/Step": 10585, "Pretrain/Step Time": 8.464412331581116} +{"Pretrain/Learning Rate": 2.176788799940221e-05, "Pretrain/Loss": 2.0054612159729004, "Pretrain/Loss (Raw)": 1.8172158002853394, "Pretrain/Step": 10586, "Pretrain/Step Time": 8.464531663805246} +{"Pretrain/Learning Rate": 2.1763678507375747e-05, "Pretrain/Loss": 2.0017316341400146, "Pretrain/Loss (Raw)": 1.8234115839004517, "Pretrain/Step": 10587, "Pretrain/Step Time": 8.464855823665857} +{"Pretrain/Learning Rate": 2.1759469108666337e-05, "Pretrain/Loss": 2.0036628246307373, "Pretrain/Loss (Raw)": 2.0593624114990234, "Pretrain/Step": 10588, "Pretrain/Step Time": 8.462534511461854} +{"Pretrain/Learning Rate": 2.175525980339535e-05, "Pretrain/Loss": 2.003077745437622, "Pretrain/Loss (Raw)": 2.0741891860961914, "Pretrain/Step": 10589, "Pretrain/Step Time": 8.461689831689} +{"Pretrain/Learning Rate": 2.1751050591684154e-05, "Pretrain/Loss": 2.004030227661133, "Pretrain/Loss (Raw)": 2.0091912746429443, "Pretrain/Step": 10590, "Pretrain/Step Time": 8.464574586600065} +{"Pretrain/Learning Rate": 2.1746841473654128e-05, "Pretrain/Loss": 2.0052037239074707, "Pretrain/Loss (Raw)": 2.094745397567749, "Pretrain/Step": 10591, "Pretrain/Step Time": 8.467357015237212} +{"Pretrain/Learning Rate": 2.174263244942663e-05, "Pretrain/Loss": 2.006645679473877, "Pretrain/Loss (Raw)": 2.1099765300750732, "Pretrain/Step": 10592, "Pretrain/Step Time": 8.460084147751331} +{"Pretrain/Learning Rate": 2.1738423519123032e-05, "Pretrain/Loss": 2.006793260574341, "Pretrain/Loss (Raw)": 2.127556085586548, "Pretrain/Step": 10593, "Pretrain/Step Time": 8.461201023310423} +{"Pretrain/Learning Rate": 2.1734214682864702e-05, "Pretrain/Loss": 2.0065362453460693, "Pretrain/Loss (Raw)": 1.9675968885421753, "Pretrain/Step": 10594, "Pretrain/Step Time": 8.460734048858285} +{"Pretrain/Learning Rate": 2.1730005940772976e-05, "Pretrain/Loss": 2.006791114807129, "Pretrain/Loss (Raw)": 1.9467096328735352, "Pretrain/Step": 10595, "Pretrain/Step Time": 8.464191554114223} +{"Pretrain/Learning Rate": 2.1725797292969228e-05, "Pretrain/Loss": 2.0052590370178223, "Pretrain/Loss (Raw)": 1.9982757568359375, "Pretrain/Step": 10596, "Pretrain/Step Time": 8.464952120557427} +{"Pretrain/Learning Rate": 2.1721588739574806e-05, "Pretrain/Loss": 2.0067834854125977, "Pretrain/Loss (Raw)": 2.157980442047119, "Pretrain/Step": 10597, "Pretrain/Step Time": 8.463806150481105} +{"Pretrain/Learning Rate": 2.171738028071106e-05, "Pretrain/Loss": 2.0048742294311523, "Pretrain/Loss (Raw)": 1.691575288772583, "Pretrain/Step": 10598, "Pretrain/Step Time": 8.466091210022569} +{"Pretrain/Learning Rate": 2.1713171916499347e-05, "Pretrain/Loss": 2.0083706378936768, "Pretrain/Loss (Raw)": 2.1006102561950684, "Pretrain/Step": 10599, "Pretrain/Step Time": 8.467332750558853} +{"Pretrain/Learning Rate": 2.1708963647060998e-05, "Pretrain/Loss": 2.006404399871826, "Pretrain/Loss (Raw)": 1.8825035095214844, "Pretrain/Step": 10600, "Pretrain/Step Time": 8.464871177449822} +{"Pretrain/Learning Rate": 2.1704755472517363e-05, "Pretrain/Loss": 2.0046920776367188, "Pretrain/Loss (Raw)": 1.8150774240493774, "Pretrain/Step": 10601, "Pretrain/Step Time": 8.464847728610039} +{"Pretrain/Learning Rate": 2.170054739298978e-05, "Pretrain/Loss": 2.003371477127075, "Pretrain/Loss (Raw)": 1.7396653890609741, "Pretrain/Step": 10602, "Pretrain/Step Time": 8.46744523011148} +{"Pretrain/Learning Rate": 2.169633940859959e-05, "Pretrain/Loss": 2.0037693977355957, "Pretrain/Loss (Raw)": 1.9021213054656982, "Pretrain/Step": 10603, "Pretrain/Step Time": 8.462334103882313} +{"Pretrain/Learning Rate": 2.169213151946813e-05, "Pretrain/Loss": 2.0001699924468994, "Pretrain/Loss (Raw)": 1.5895310640335083, "Pretrain/Step": 10604, "Pretrain/Step Time": 8.455743653699756} +{"Pretrain/Learning Rate": 2.1687923725716713e-05, "Pretrain/Loss": 1.9995038509368896, "Pretrain/Loss (Raw)": 1.9196066856384277, "Pretrain/Step": 10605, "Pretrain/Step Time": 8.454544307664037} +{"Pretrain/Learning Rate": 2.1683716027466687e-05, "Pretrain/Loss": 1.9968218803405762, "Pretrain/Loss (Raw)": 1.7739109992980957, "Pretrain/Step": 10606, "Pretrain/Step Time": 8.458505567163229} +{"Pretrain/Learning Rate": 2.167950842483937e-05, "Pretrain/Loss": 1.9985322952270508, "Pretrain/Loss (Raw)": 1.9600024223327637, "Pretrain/Step": 10607, "Pretrain/Step Time": 8.462862897664309} +{"Pretrain/Learning Rate": 2.167530091795609e-05, "Pretrain/Loss": 1.997380018234253, "Pretrain/Loss (Raw)": 1.921858549118042, "Pretrain/Step": 10608, "Pretrain/Step Time": 8.459724625572562} +{"Pretrain/Learning Rate": 2.1671093506938157e-05, "Pretrain/Loss": 1.9927940368652344, "Pretrain/Loss (Raw)": 1.475186824798584, "Pretrain/Step": 10609, "Pretrain/Step Time": 8.453771898522973} +{"Pretrain/Learning Rate": 2.1666886191906904e-05, "Pretrain/Loss": 1.9954146146774292, "Pretrain/Loss (Raw)": 2.166743755340576, "Pretrain/Step": 10610, "Pretrain/Step Time": 8.454544227570295} +{"Pretrain/Learning Rate": 2.1662678972983634e-05, "Pretrain/Loss": 1.9970359802246094, "Pretrain/Loss (Raw)": 2.0357542037963867, "Pretrain/Step": 10611, "Pretrain/Step Time": 8.453684195876122} +{"Pretrain/Learning Rate": 2.1658471850289664e-05, "Pretrain/Loss": 1.999025583267212, "Pretrain/Loss (Raw)": 2.046316146850586, "Pretrain/Step": 10612, "Pretrain/Step Time": 8.455244783312082} +{"Pretrain/Learning Rate": 2.16542648239463e-05, "Pretrain/Loss": 1.9966975450515747, "Pretrain/Loss (Raw)": 1.944077491760254, "Pretrain/Step": 10613, "Pretrain/Step Time": 8.455963736400008} +{"Pretrain/Learning Rate": 2.1650057894074854e-05, "Pretrain/Loss": 1.9945697784423828, "Pretrain/Loss (Raw)": 1.8759442567825317, "Pretrain/Step": 10614, "Pretrain/Step Time": 8.45692321844399} +{"Pretrain/Learning Rate": 2.164585106079663e-05, "Pretrain/Loss": 1.9953123331069946, "Pretrain/Loss (Raw)": 2.064274311065674, "Pretrain/Step": 10615, "Pretrain/Step Time": 8.453001696616411} +{"Pretrain/Learning Rate": 2.1641644324232923e-05, "Pretrain/Loss": 1.9948420524597168, "Pretrain/Loss (Raw)": 2.0192067623138428, "Pretrain/Step": 10616, "Pretrain/Step Time": 8.45312986895442} +{"Pretrain/Learning Rate": 2.1637437684505036e-05, "Pretrain/Loss": 1.9941990375518799, "Pretrain/Loss (Raw)": 1.9370917081832886, "Pretrain/Step": 10617, "Pretrain/Step Time": 8.452981462702155} +{"Pretrain/Learning Rate": 2.163323114173426e-05, "Pretrain/Loss": 1.993712067604065, "Pretrain/Loss (Raw)": 2.018331527709961, "Pretrain/Step": 10618, "Pretrain/Step Time": 8.454858748242259} +{"Pretrain/Learning Rate": 2.162902469604189e-05, "Pretrain/Loss": 1.9924957752227783, "Pretrain/Loss (Raw)": 1.8882689476013184, "Pretrain/Step": 10619, "Pretrain/Step Time": 8.454261790961027} +{"Pretrain/Learning Rate": 2.1624818347549222e-05, "Pretrain/Loss": 1.9923564195632935, "Pretrain/Loss (Raw)": 2.0009713172912598, "Pretrain/Step": 10620, "Pretrain/Step Time": 8.448868861421943} +{"Pretrain/Learning Rate": 2.1620612096377534e-05, "Pretrain/Loss": 1.9943242073059082, "Pretrain/Loss (Raw)": 2.1562952995300293, "Pretrain/Step": 10621, "Pretrain/Step Time": 8.449730481952429} +{"Pretrain/Learning Rate": 2.1616405942648123e-05, "Pretrain/Loss": 1.994107961654663, "Pretrain/Loss (Raw)": 1.9063303470611572, "Pretrain/Step": 10622, "Pretrain/Step Time": 8.449091091752052} +{"Pretrain/Learning Rate": 2.161219988648225e-05, "Pretrain/Loss": 1.9936509132385254, "Pretrain/Loss (Raw)": 1.977860689163208, "Pretrain/Step": 10623, "Pretrain/Step Time": 8.45117212086916} +{"Pretrain/Learning Rate": 2.1607993928001207e-05, "Pretrain/Loss": 1.9910666942596436, "Pretrain/Loss (Raw)": 2.0865650177001953, "Pretrain/Step": 10624, "Pretrain/Step Time": 8.453512396663427} +{"Pretrain/Learning Rate": 2.160378806732627e-05, "Pretrain/Loss": 1.9886181354522705, "Pretrain/Loss (Raw)": 1.86753249168396, "Pretrain/Step": 10625, "Pretrain/Step Time": 8.452874129638076} +{"Pretrain/Learning Rate": 2.1599582304578706e-05, "Pretrain/Loss": 1.9875448942184448, "Pretrain/Loss (Raw)": 1.965621829032898, "Pretrain/Step": 10626, "Pretrain/Step Time": 8.45238197594881} +{"Pretrain/Learning Rate": 2.1595376639879796e-05, "Pretrain/Loss": 1.9861446619033813, "Pretrain/Loss (Raw)": 1.785959243774414, "Pretrain/Step": 10627, "Pretrain/Step Time": 8.45166015625} +{"Pretrain/Learning Rate": 2.1591171073350795e-05, "Pretrain/Loss": 1.987044095993042, "Pretrain/Loss (Raw)": 2.043013334274292, "Pretrain/Step": 10628, "Pretrain/Step Time": 8.452434170991182} +{"Pretrain/Learning Rate": 2.158696560511297e-05, "Pretrain/Loss": 1.9881865978240967, "Pretrain/Loss (Raw)": 2.0764687061309814, "Pretrain/Step": 10629, "Pretrain/Step Time": 8.453997975215316} +{"Pretrain/Learning Rate": 2.1582760235287592e-05, "Pretrain/Loss": 1.9868855476379395, "Pretrain/Loss (Raw)": 1.9366282224655151, "Pretrain/Step": 10630, "Pretrain/Step Time": 8.451660944148898} +{"Pretrain/Learning Rate": 2.157855496399591e-05, "Pretrain/Loss": 1.9859215021133423, "Pretrain/Loss (Raw)": 2.083048105239868, "Pretrain/Step": 10631, "Pretrain/Step Time": 8.4514898378402} +{"Pretrain/Learning Rate": 2.1574349791359188e-05, "Pretrain/Loss": 1.984132170677185, "Pretrain/Loss (Raw)": 1.9088739156723022, "Pretrain/Step": 10632, "Pretrain/Step Time": 8.454135868698359} +{"Pretrain/Learning Rate": 2.1570144717498668e-05, "Pretrain/Loss": 1.9866440296173096, "Pretrain/Loss (Raw)": 2.251462936401367, "Pretrain/Step": 10633, "Pretrain/Step Time": 8.455961940810084} +{"Pretrain/Learning Rate": 2.1565939742535614e-05, "Pretrain/Loss": 1.9832603931427002, "Pretrain/Loss (Raw)": 1.8098371028900146, "Pretrain/Step": 10634, "Pretrain/Step Time": 8.452630857005715} +{"Pretrain/Learning Rate": 2.156173486659126e-05, "Pretrain/Loss": 1.9831576347351074, "Pretrain/Loss (Raw)": 2.177994728088379, "Pretrain/Step": 10635, "Pretrain/Step Time": 8.45298432931304} +{"Pretrain/Learning Rate": 2.1557530089786858e-05, "Pretrain/Loss": 1.982297420501709, "Pretrain/Loss (Raw)": 1.8526427745819092, "Pretrain/Step": 10636, "Pretrain/Step Time": 8.45576587319374} +{"Pretrain/Learning Rate": 2.1553325412243652e-05, "Pretrain/Loss": 1.9829509258270264, "Pretrain/Loss (Raw)": 2.0262253284454346, "Pretrain/Step": 10637, "Pretrain/Step Time": 8.447355698794127} +{"Pretrain/Learning Rate": 2.1549120834082882e-05, "Pretrain/Loss": 1.9858717918395996, "Pretrain/Loss (Raw)": 2.446871757507324, "Pretrain/Step": 10638, "Pretrain/Step Time": 8.442686328664422} +{"Pretrain/Learning Rate": 2.1544916355425777e-05, "Pretrain/Loss": 1.9883460998535156, "Pretrain/Loss (Raw)": 2.1482839584350586, "Pretrain/Step": 10639, "Pretrain/Step Time": 8.445034286007285} +{"Pretrain/Learning Rate": 2.1540711976393573e-05, "Pretrain/Loss": 1.986860990524292, "Pretrain/Loss (Raw)": 1.907421350479126, "Pretrain/Step": 10640, "Pretrain/Step Time": 8.443887876346707} +{"Pretrain/Learning Rate": 2.1536507697107494e-05, "Pretrain/Loss": 1.9866410493850708, "Pretrain/Loss (Raw)": 1.9354907274246216, "Pretrain/Step": 10641, "Pretrain/Step Time": 8.443476663902402} +{"Pretrain/Learning Rate": 2.153230351768878e-05, "Pretrain/Loss": 1.9877004623413086, "Pretrain/Loss (Raw)": 2.1366512775421143, "Pretrain/Step": 10642, "Pretrain/Step Time": 8.441871974617243} +{"Pretrain/Learning Rate": 2.1528099438258654e-05, "Pretrain/Loss": 1.9880403280258179, "Pretrain/Loss (Raw)": 2.285121202468872, "Pretrain/Step": 10643, "Pretrain/Step Time": 8.443551655858755} +{"Pretrain/Learning Rate": 2.1523895458938326e-05, "Pretrain/Loss": 1.9846919775009155, "Pretrain/Loss (Raw)": 1.6080925464630127, "Pretrain/Step": 10644, "Pretrain/Step Time": 8.447557868435979} +{"Pretrain/Learning Rate": 2.1519691579849024e-05, "Pretrain/Loss": 1.9878478050231934, "Pretrain/Loss (Raw)": 2.2225282192230225, "Pretrain/Step": 10645, "Pretrain/Step Time": 8.448673306033015} +{"Pretrain/Learning Rate": 2.151548780111196e-05, "Pretrain/Loss": 1.9864983558654785, "Pretrain/Loss (Raw)": 2.1322696208953857, "Pretrain/Step": 10646, "Pretrain/Step Time": 8.446545593440533} +{"Pretrain/Learning Rate": 2.151128412284835e-05, "Pretrain/Loss": 1.9870526790618896, "Pretrain/Loss (Raw)": 1.9421418905258179, "Pretrain/Step": 10647, "Pretrain/Step Time": 8.446684807538986} +{"Pretrain/Learning Rate": 2.150708054517941e-05, "Pretrain/Loss": 1.9875543117523193, "Pretrain/Loss (Raw)": 2.1386401653289795, "Pretrain/Step": 10648, "Pretrain/Step Time": 8.447826268151402} +{"Pretrain/Learning Rate": 2.1502877068226333e-05, "Pretrain/Loss": 1.987492322921753, "Pretrain/Loss (Raw)": 1.9051309823989868, "Pretrain/Step": 10649, "Pretrain/Step Time": 8.44918723590672} +{"Pretrain/Learning Rate": 2.149867369211033e-05, "Pretrain/Loss": 1.9860312938690186, "Pretrain/Loss (Raw)": 1.9291447401046753, "Pretrain/Step": 10650, "Pretrain/Step Time": 8.445467934012413} +{"Pretrain/Learning Rate": 2.1494470416952602e-05, "Pretrain/Loss": 1.985769510269165, "Pretrain/Loss (Raw)": 1.908560037612915, "Pretrain/Step": 10651, "Pretrain/Step Time": 8.442072305828333} +{"Pretrain/Learning Rate": 2.149026724287435e-05, "Pretrain/Loss": 1.9858198165893555, "Pretrain/Loss (Raw)": 1.8960907459259033, "Pretrain/Step": 10652, "Pretrain/Step Time": 8.438705019652843} +{"Pretrain/Learning Rate": 2.1486064169996774e-05, "Pretrain/Loss": 1.9860270023345947, "Pretrain/Loss (Raw)": 2.0540645122528076, "Pretrain/Step": 10653, "Pretrain/Step Time": 8.44023316539824} +{"Pretrain/Learning Rate": 2.1481861198441054e-05, "Pretrain/Loss": 1.9857361316680908, "Pretrain/Loss (Raw)": 1.998184084892273, "Pretrain/Step": 10654, "Pretrain/Step Time": 8.438056536018848} +{"Pretrain/Learning Rate": 2.1477658328328386e-05, "Pretrain/Loss": 1.983959436416626, "Pretrain/Loss (Raw)": 1.8857080936431885, "Pretrain/Step": 10655, "Pretrain/Step Time": 8.437708474695683} +{"Pretrain/Learning Rate": 2.1473455559779955e-05, "Pretrain/Loss": 1.9851704835891724, "Pretrain/Loss (Raw)": 2.083354949951172, "Pretrain/Step": 10656, "Pretrain/Step Time": 8.44078509695828} +{"Pretrain/Learning Rate": 2.146925289291695e-05, "Pretrain/Loss": 1.9860179424285889, "Pretrain/Loss (Raw)": 1.9367038011550903, "Pretrain/Step": 10657, "Pretrain/Step Time": 8.445572812110186} +{"Pretrain/Learning Rate": 2.1465050327860554e-05, "Pretrain/Loss": 1.9863336086273193, "Pretrain/Loss (Raw)": 2.1853177547454834, "Pretrain/Step": 10658, "Pretrain/Step Time": 8.445156190544367} +{"Pretrain/Learning Rate": 2.1460847864731933e-05, "Pretrain/Loss": 1.9850869178771973, "Pretrain/Loss (Raw)": 1.695690393447876, "Pretrain/Step": 10659, "Pretrain/Step Time": 8.444045817479491} +{"Pretrain/Learning Rate": 2.145664550365227e-05, "Pretrain/Loss": 1.9854862689971924, "Pretrain/Loss (Raw)": 2.0564751625061035, "Pretrain/Step": 10660, "Pretrain/Step Time": 8.450657311826944} +{"Pretrain/Learning Rate": 2.1452443244742736e-05, "Pretrain/Loss": 1.9873582124710083, "Pretrain/Loss (Raw)": 2.159776449203491, "Pretrain/Step": 10661, "Pretrain/Step Time": 8.448292898014188} +{"Pretrain/Learning Rate": 2.14482410881245e-05, "Pretrain/Loss": 1.986694097518921, "Pretrain/Loss (Raw)": 2.0013554096221924, "Pretrain/Step": 10662, "Pretrain/Step Time": 8.447722690179944} +{"Pretrain/Learning Rate": 2.144403903391873e-05, "Pretrain/Loss": 1.986223816871643, "Pretrain/Loss (Raw)": 2.00778865814209, "Pretrain/Step": 10663, "Pretrain/Step Time": 8.45252520404756} +{"Pretrain/Learning Rate": 2.143983708224659e-05, "Pretrain/Loss": 1.9847662448883057, "Pretrain/Loss (Raw)": 1.9467693567276, "Pretrain/Step": 10664, "Pretrain/Step Time": 8.45352253317833} +{"Pretrain/Learning Rate": 2.1435635233229232e-05, "Pretrain/Loss": 1.9876474142074585, "Pretrain/Loss (Raw)": 2.2169759273529053, "Pretrain/Step": 10665, "Pretrain/Step Time": 8.451146118342876} +{"Pretrain/Learning Rate": 2.143143348698782e-05, "Pretrain/Loss": 1.9903173446655273, "Pretrain/Loss (Raw)": 2.5055856704711914, "Pretrain/Step": 10666, "Pretrain/Step Time": 8.457181259989738} +{"Pretrain/Learning Rate": 2.142723184364351e-05, "Pretrain/Loss": 1.9883296489715576, "Pretrain/Loss (Raw)": 1.9964163303375244, "Pretrain/Step": 10667, "Pretrain/Step Time": 8.453169276937842} +{"Pretrain/Learning Rate": 2.1423030303317454e-05, "Pretrain/Loss": 1.9896365404129028, "Pretrain/Loss (Raw)": 2.0259556770324707, "Pretrain/Step": 10668, "Pretrain/Step Time": 8.453157015144825} +{"Pretrain/Learning Rate": 2.1418828866130795e-05, "Pretrain/Loss": 1.990053653717041, "Pretrain/Loss (Raw)": 1.97359037399292, "Pretrain/Step": 10669, "Pretrain/Step Time": 8.450406840071082} +{"Pretrain/Learning Rate": 2.141462753220468e-05, "Pretrain/Loss": 1.988424301147461, "Pretrain/Loss (Raw)": 1.8622055053710938, "Pretrain/Step": 10670, "Pretrain/Step Time": 8.45140427723527} +{"Pretrain/Learning Rate": 2.141042630166025e-05, "Pretrain/Loss": 1.9857722520828247, "Pretrain/Loss (Raw)": 1.6262552738189697, "Pretrain/Step": 10671, "Pretrain/Step Time": 8.442360579967499} +{"Pretrain/Learning Rate": 2.1406225174618648e-05, "Pretrain/Loss": 1.9866453409194946, "Pretrain/Loss (Raw)": 2.0572092533111572, "Pretrain/Step": 10672, "Pretrain/Step Time": 8.441871117800474} +{"Pretrain/Learning Rate": 2.140202415120101e-05, "Pretrain/Loss": 1.9872078895568848, "Pretrain/Loss (Raw)": 1.8425877094268799, "Pretrain/Step": 10673, "Pretrain/Step Time": 8.44786006398499} +{"Pretrain/Learning Rate": 2.139782323152848e-05, "Pretrain/Loss": 1.985231637954712, "Pretrain/Loss (Raw)": 1.7847306728363037, "Pretrain/Step": 10674, "Pretrain/Step Time": 8.45089933462441} +{"Pretrain/Learning Rate": 2.1393622415722166e-05, "Pretrain/Loss": 1.9856479167938232, "Pretrain/Loss (Raw)": 1.8624203205108643, "Pretrain/Step": 10675, "Pretrain/Step Time": 8.445071760565042} +{"Pretrain/Learning Rate": 2.138942170390321e-05, "Pretrain/Loss": 1.9888973236083984, "Pretrain/Loss (Raw)": 2.3199594020843506, "Pretrain/Step": 10676, "Pretrain/Step Time": 8.451746294274926} +{"Pretrain/Learning Rate": 2.138522109619273e-05, "Pretrain/Loss": 1.9877581596374512, "Pretrain/Loss (Raw)": 1.9713720083236694, "Pretrain/Step": 10677, "Pretrain/Step Time": 8.449719091877341} +{"Pretrain/Learning Rate": 2.1381020592711856e-05, "Pretrain/Loss": 1.9872550964355469, "Pretrain/Loss (Raw)": 1.7185100317001343, "Pretrain/Step": 10678, "Pretrain/Step Time": 8.45345508493483} +{"Pretrain/Learning Rate": 2.1376820193581706e-05, "Pretrain/Loss": 1.9883211851119995, "Pretrain/Loss (Raw)": 2.0026960372924805, "Pretrain/Step": 10679, "Pretrain/Step Time": 8.450646761804819} +{"Pretrain/Learning Rate": 2.1372619898923386e-05, "Pretrain/Loss": 1.9884542226791382, "Pretrain/Loss (Raw)": 2.1505048274993896, "Pretrain/Step": 10680, "Pretrain/Step Time": 8.450954029336572} +{"Pretrain/Learning Rate": 2.1368419708858013e-05, "Pretrain/Loss": 1.986264944076538, "Pretrain/Loss (Raw)": 1.9459959268569946, "Pretrain/Step": 10681, "Pretrain/Step Time": 8.450122816488147} +{"Pretrain/Learning Rate": 2.1364219623506702e-05, "Pretrain/Loss": 1.9859893321990967, "Pretrain/Loss (Raw)": 1.9031518697738647, "Pretrain/Step": 10682, "Pretrain/Step Time": 8.45230976305902} +{"Pretrain/Learning Rate": 2.136001964299055e-05, "Pretrain/Loss": 1.9864779710769653, "Pretrain/Loss (Raw)": 2.026306390762329, "Pretrain/Step": 10683, "Pretrain/Step Time": 8.451350644230843} +{"Pretrain/Learning Rate": 2.1355819767430673e-05, "Pretrain/Loss": 1.9850126504898071, "Pretrain/Loss (Raw)": 2.0260143280029297, "Pretrain/Step": 10684, "Pretrain/Step Time": 8.452773218974471} +{"Pretrain/Learning Rate": 2.135161999694816e-05, "Pretrain/Loss": 1.9824835062026978, "Pretrain/Loss (Raw)": 1.6775321960449219, "Pretrain/Step": 10685, "Pretrain/Step Time": 8.457475861534476} +{"Pretrain/Learning Rate": 2.134742033166411e-05, "Pretrain/Loss": 1.9780125617980957, "Pretrain/Loss (Raw)": 1.4278146028518677, "Pretrain/Step": 10686, "Pretrain/Step Time": 8.454428393393755} +{"Pretrain/Learning Rate": 2.134322077169962e-05, "Pretrain/Loss": 1.978424072265625, "Pretrain/Loss (Raw)": 2.0760509967803955, "Pretrain/Step": 10687, "Pretrain/Step Time": 8.455678272992373} +{"Pretrain/Learning Rate": 2.1339021317175784e-05, "Pretrain/Loss": 1.9782320261001587, "Pretrain/Loss (Raw)": 2.065458059310913, "Pretrain/Step": 10688, "Pretrain/Step Time": 8.44966202788055} +{"Pretrain/Learning Rate": 2.133482196821369e-05, "Pretrain/Loss": 1.9841382503509521, "Pretrain/Loss (Raw)": 2.4726133346557617, "Pretrain/Step": 10689, "Pretrain/Step Time": 8.453648505732417} +{"Pretrain/Learning Rate": 2.1330622724934414e-05, "Pretrain/Loss": 1.9830679893493652, "Pretrain/Loss (Raw)": 1.8637844324111938, "Pretrain/Step": 10690, "Pretrain/Step Time": 8.45436636544764} +{"Pretrain/Learning Rate": 2.132642358745905e-05, "Pretrain/Loss": 1.9817484617233276, "Pretrain/Loss (Raw)": 1.6925365924835205, "Pretrain/Step": 10691, "Pretrain/Step Time": 8.458129102364182} +{"Pretrain/Learning Rate": 2.1322224555908668e-05, "Pretrain/Loss": 1.9818004369735718, "Pretrain/Loss (Raw)": 2.0788183212280273, "Pretrain/Step": 10692, "Pretrain/Step Time": 8.460700742900372} +{"Pretrain/Learning Rate": 2.131802563040435e-05, "Pretrain/Loss": 1.985987901687622, "Pretrain/Loss (Raw)": 2.3297834396362305, "Pretrain/Step": 10693, "Pretrain/Step Time": 8.457360768690705} +{"Pretrain/Learning Rate": 2.1313826811067173e-05, "Pretrain/Loss": 1.983343482017517, "Pretrain/Loss (Raw)": 1.8152532577514648, "Pretrain/Step": 10694, "Pretrain/Step Time": 8.457917109131813} +{"Pretrain/Learning Rate": 2.1309628098018195e-05, "Pretrain/Loss": 1.9849653244018555, "Pretrain/Loss (Raw)": 2.002293586730957, "Pretrain/Step": 10695, "Pretrain/Step Time": 8.457088496536016} +{"Pretrain/Learning Rate": 2.130542949137849e-05, "Pretrain/Loss": 1.9866375923156738, "Pretrain/Loss (Raw)": 2.0566160678863525, "Pretrain/Step": 10696, "Pretrain/Step Time": 8.453381314873695} +{"Pretrain/Learning Rate": 2.130123099126912e-05, "Pretrain/Loss": 1.9853551387786865, "Pretrain/Loss (Raw)": 2.081214427947998, "Pretrain/Step": 10697, "Pretrain/Step Time": 8.457105446606874} +{"Pretrain/Learning Rate": 2.129703259781115e-05, "Pretrain/Loss": 1.985313057899475, "Pretrain/Loss (Raw)": 2.122174024581909, "Pretrain/Step": 10698, "Pretrain/Step Time": 8.454948564991355} +{"Pretrain/Learning Rate": 2.1292834311125634e-05, "Pretrain/Loss": 1.9845576286315918, "Pretrain/Loss (Raw)": 1.9465303421020508, "Pretrain/Step": 10699, "Pretrain/Step Time": 8.457408457994461} +{"Pretrain/Learning Rate": 2.1288636131333624e-05, "Pretrain/Loss": 1.9813324213027954, "Pretrain/Loss (Raw)": 2.0511841773986816, "Pretrain/Step": 10700, "Pretrain/Step Time": 8.453899934887886} +{"Pretrain/Learning Rate": 2.1284438058556177e-05, "Pretrain/Loss": 1.9833130836486816, "Pretrain/Loss (Raw)": 1.9640543460845947, "Pretrain/Step": 10701, "Pretrain/Step Time": 8.455406121909618} +{"Pretrain/Learning Rate": 2.128024009291434e-05, "Pretrain/Loss": 1.9834227561950684, "Pretrain/Loss (Raw)": 1.7763935327529907, "Pretrain/Step": 10702, "Pretrain/Step Time": 8.45188107341528} +{"Pretrain/Learning Rate": 2.1276042234529155e-05, "Pretrain/Loss": 1.9845149517059326, "Pretrain/Loss (Raw)": 2.0485928058624268, "Pretrain/Step": 10703, "Pretrain/Step Time": 8.453834272921085} +{"Pretrain/Learning Rate": 2.1271844483521676e-05, "Pretrain/Loss": 1.9846216440200806, "Pretrain/Loss (Raw)": 2.119685411453247, "Pretrain/Step": 10704, "Pretrain/Step Time": 8.45189499296248} +{"Pretrain/Learning Rate": 2.1267646840012923e-05, "Pretrain/Loss": 1.9850974082946777, "Pretrain/Loss (Raw)": 2.116511344909668, "Pretrain/Step": 10705, "Pretrain/Step Time": 8.453162532299757} +{"Pretrain/Learning Rate": 2.126344930412395e-05, "Pretrain/Loss": 1.987030029296875, "Pretrain/Loss (Raw)": 2.2491726875305176, "Pretrain/Step": 10706, "Pretrain/Step Time": 8.452423732727766} +{"Pretrain/Learning Rate": 2.1259251875975783e-05, "Pretrain/Loss": 1.9870258569717407, "Pretrain/Loss (Raw)": 2.05741024017334, "Pretrain/Step": 10707, "Pretrain/Step Time": 8.45045823045075} +{"Pretrain/Learning Rate": 2.1255054555689443e-05, "Pretrain/Loss": 1.9871115684509277, "Pretrain/Loss (Raw)": 2.1130776405334473, "Pretrain/Step": 10708, "Pretrain/Step Time": 8.451077349483967} +{"Pretrain/Learning Rate": 2.125085734338597e-05, "Pretrain/Loss": 1.987001657485962, "Pretrain/Loss (Raw)": 2.0662059783935547, "Pretrain/Step": 10709, "Pretrain/Step Time": 8.448425842449069} +{"Pretrain/Learning Rate": 2.1246660239186378e-05, "Pretrain/Loss": 1.9874627590179443, "Pretrain/Loss (Raw)": 2.043274164199829, "Pretrain/Step": 10710, "Pretrain/Step Time": 8.449360648170114} +{"Pretrain/Learning Rate": 2.124246324321169e-05, "Pretrain/Loss": 1.9852294921875, "Pretrain/Loss (Raw)": 1.7629783153533936, "Pretrain/Step": 10711, "Pretrain/Step Time": 8.448995711281896} +{"Pretrain/Learning Rate": 2.1238266355582937e-05, "Pretrain/Loss": 1.9858245849609375, "Pretrain/Loss (Raw)": 1.9227100610733032, "Pretrain/Step": 10712, "Pretrain/Step Time": 8.443058891221881} +{"Pretrain/Learning Rate": 2.1234069576421112e-05, "Pretrain/Loss": 1.985466718673706, "Pretrain/Loss (Raw)": 1.900736927986145, "Pretrain/Step": 10713, "Pretrain/Step Time": 8.445833567529917} +{"Pretrain/Learning Rate": 2.122987290584724e-05, "Pretrain/Loss": 1.9857754707336426, "Pretrain/Loss (Raw)": 1.8567429780960083, "Pretrain/Step": 10714, "Pretrain/Step Time": 8.448525730520487} +{"Pretrain/Learning Rate": 2.122567634398232e-05, "Pretrain/Loss": 1.986800193786621, "Pretrain/Loss (Raw)": 1.9545789957046509, "Pretrain/Step": 10715, "Pretrain/Step Time": 8.447412030771375} +{"Pretrain/Learning Rate": 2.1221479890947366e-05, "Pretrain/Loss": 1.9881012439727783, "Pretrain/Loss (Raw)": 2.225895643234253, "Pretrain/Step": 10716, "Pretrain/Step Time": 8.44523555971682} +{"Pretrain/Learning Rate": 2.1217283546863378e-05, "Pretrain/Loss": 1.9874727725982666, "Pretrain/Loss (Raw)": 1.9937540292739868, "Pretrain/Step": 10717, "Pretrain/Step Time": 8.444998489692807} +{"Pretrain/Learning Rate": 2.1213087311851347e-05, "Pretrain/Loss": 1.9878170490264893, "Pretrain/Loss (Raw)": 2.053248167037964, "Pretrain/Step": 10718, "Pretrain/Step Time": 8.445305064320564} +{"Pretrain/Learning Rate": 2.120889118603228e-05, "Pretrain/Loss": 1.9885921478271484, "Pretrain/Loss (Raw)": 2.1939609050750732, "Pretrain/Step": 10719, "Pretrain/Step Time": 8.44202021881938} +{"Pretrain/Learning Rate": 2.1204695169527156e-05, "Pretrain/Loss": 1.9880002737045288, "Pretrain/Loss (Raw)": 2.034207820892334, "Pretrain/Step": 10720, "Pretrain/Step Time": 8.446688804775476} +{"Pretrain/Learning Rate": 2.1200499262456976e-05, "Pretrain/Loss": 1.988083839416504, "Pretrain/Loss (Raw)": 2.1382522583007812, "Pretrain/Step": 10721, "Pretrain/Step Time": 8.449609853327274} +{"Pretrain/Learning Rate": 2.119630346494272e-05, "Pretrain/Loss": 1.9881956577301025, "Pretrain/Loss (Raw)": 1.9819236993789673, "Pretrain/Step": 10722, "Pretrain/Step Time": 8.450778288766742} +{"Pretrain/Learning Rate": 2.1192107777105372e-05, "Pretrain/Loss": 1.9875863790512085, "Pretrain/Loss (Raw)": 1.868708848953247, "Pretrain/Step": 10723, "Pretrain/Step Time": 8.448051610961556} +{"Pretrain/Learning Rate": 2.1187912199065913e-05, "Pretrain/Loss": 1.9878427982330322, "Pretrain/Loss (Raw)": 2.031107187271118, "Pretrain/Step": 10724, "Pretrain/Step Time": 8.442971853539348} +{"Pretrain/Learning Rate": 2.1183716730945312e-05, "Pretrain/Loss": 1.985844612121582, "Pretrain/Loss (Raw)": 1.9022129774093628, "Pretrain/Step": 10725, "Pretrain/Step Time": 8.443425316363573} +{"Pretrain/Learning Rate": 2.1179521372864554e-05, "Pretrain/Loss": 1.9888331890106201, "Pretrain/Loss (Raw)": 2.0740973949432373, "Pretrain/Step": 10726, "Pretrain/Step Time": 8.443197501823306} +{"Pretrain/Learning Rate": 2.1175326124944612e-05, "Pretrain/Loss": 1.9894119501113892, "Pretrain/Loss (Raw)": 2.174708604812622, "Pretrain/Step": 10727, "Pretrain/Step Time": 8.440049137920141} +{"Pretrain/Learning Rate": 2.1171130987306435e-05, "Pretrain/Loss": 1.9921369552612305, "Pretrain/Loss (Raw)": 2.2313029766082764, "Pretrain/Step": 10728, "Pretrain/Step Time": 8.442408796399832} +{"Pretrain/Learning Rate": 2.1166935960070996e-05, "Pretrain/Loss": 1.9930273294448853, "Pretrain/Loss (Raw)": 1.929025411605835, "Pretrain/Step": 10729, "Pretrain/Step Time": 8.44008838571608} +{"Pretrain/Learning Rate": 2.1162741043359256e-05, "Pretrain/Loss": 1.9940423965454102, "Pretrain/Loss (Raw)": 1.869603157043457, "Pretrain/Step": 10730, "Pretrain/Step Time": 8.435480004176497} +{"Pretrain/Learning Rate": 2.1158546237292177e-05, "Pretrain/Loss": 1.9950213432312012, "Pretrain/Loss (Raw)": 2.027431011199951, "Pretrain/Step": 10731, "Pretrain/Step Time": 8.447756078094244} +{"Pretrain/Learning Rate": 2.1154351541990712e-05, "Pretrain/Loss": 1.998194694519043, "Pretrain/Loss (Raw)": 1.9957354068756104, "Pretrain/Step": 10732, "Pretrain/Step Time": 8.44468766450882} +{"Pretrain/Learning Rate": 2.1150156957575808e-05, "Pretrain/Loss": 1.999788761138916, "Pretrain/Loss (Raw)": 2.1236412525177, "Pretrain/Step": 10733, "Pretrain/Step Time": 8.443399351090193} +{"Pretrain/Learning Rate": 2.1145962484168407e-05, "Pretrain/Loss": 2.0010170936584473, "Pretrain/Loss (Raw)": 1.931142807006836, "Pretrain/Step": 10734, "Pretrain/Step Time": 8.440222702920437} +{"Pretrain/Learning Rate": 2.1141768121889465e-05, "Pretrain/Loss": 2.0012621879577637, "Pretrain/Loss (Raw)": 1.9913772344589233, "Pretrain/Step": 10735, "Pretrain/Step Time": 8.43489488773048} +{"Pretrain/Learning Rate": 2.1137573870859918e-05, "Pretrain/Loss": 2.0013582706451416, "Pretrain/Loss (Raw)": 1.9341423511505127, "Pretrain/Step": 10736, "Pretrain/Step Time": 8.437996434047818} +{"Pretrain/Learning Rate": 2.113337973120071e-05, "Pretrain/Loss": 2.0045652389526367, "Pretrain/Loss (Raw)": 1.8856440782546997, "Pretrain/Step": 10737, "Pretrain/Step Time": 8.440429942682385} +{"Pretrain/Learning Rate": 2.1129185703032772e-05, "Pretrain/Loss": 2.003124713897705, "Pretrain/Loss (Raw)": 1.9824020862579346, "Pretrain/Step": 10738, "Pretrain/Step Time": 8.438837451860309} +{"Pretrain/Learning Rate": 2.1124991786477034e-05, "Pretrain/Loss": 2.0028152465820312, "Pretrain/Loss (Raw)": 1.996111512184143, "Pretrain/Step": 10739, "Pretrain/Step Time": 8.44660641439259} +{"Pretrain/Learning Rate": 2.1120797981654422e-05, "Pretrain/Loss": 2.0028254985809326, "Pretrain/Loss (Raw)": 2.04765248298645, "Pretrain/Step": 10740, "Pretrain/Step Time": 8.446686454117298} +{"Pretrain/Learning Rate": 2.111660428868587e-05, "Pretrain/Loss": 2.0032052993774414, "Pretrain/Loss (Raw)": 1.9926812648773193, "Pretrain/Step": 10741, "Pretrain/Step Time": 8.450400900095701} +{"Pretrain/Learning Rate": 2.111241070769229e-05, "Pretrain/Loss": 2.004549264907837, "Pretrain/Loss (Raw)": 2.0479791164398193, "Pretrain/Step": 10742, "Pretrain/Step Time": 8.447279488667846} +{"Pretrain/Learning Rate": 2.1108217238794616e-05, "Pretrain/Loss": 2.0036911964416504, "Pretrain/Loss (Raw)": 1.9544466733932495, "Pretrain/Step": 10743, "Pretrain/Step Time": 8.450269151479006} +{"Pretrain/Learning Rate": 2.1104023882113748e-05, "Pretrain/Loss": 2.0025875568389893, "Pretrain/Loss (Raw)": 1.8779290914535522, "Pretrain/Step": 10744, "Pretrain/Step Time": 8.44866264052689} +{"Pretrain/Learning Rate": 2.1099830637770604e-05, "Pretrain/Loss": 2.0033059120178223, "Pretrain/Loss (Raw)": 2.029014825820923, "Pretrain/Step": 10745, "Pretrain/Step Time": 8.450625363737345} +{"Pretrain/Learning Rate": 2.1095637505886094e-05, "Pretrain/Loss": 2.0039725303649902, "Pretrain/Loss (Raw)": 2.1036996841430664, "Pretrain/Step": 10746, "Pretrain/Step Time": 8.44965547695756} +{"Pretrain/Learning Rate": 2.1091444486581126e-05, "Pretrain/Loss": 2.004930019378662, "Pretrain/Loss (Raw)": 2.010815143585205, "Pretrain/Step": 10747, "Pretrain/Step Time": 8.45622336678207} +{"Pretrain/Learning Rate": 2.1087251579976608e-05, "Pretrain/Loss": 2.004734516143799, "Pretrain/Loss (Raw)": 1.9759496450424194, "Pretrain/Step": 10748, "Pretrain/Step Time": 8.45516062155366} +{"Pretrain/Learning Rate": 2.1083058786193423e-05, "Pretrain/Loss": 2.003455638885498, "Pretrain/Loss (Raw)": 1.9926025867462158, "Pretrain/Step": 10749, "Pretrain/Step Time": 8.455148635432124} +{"Pretrain/Learning Rate": 2.107886610535248e-05, "Pretrain/Loss": 2.003234624862671, "Pretrain/Loss (Raw)": 1.878024697303772, "Pretrain/Step": 10750, "Pretrain/Step Time": 8.457144737243652} +{"Pretrain/Learning Rate": 2.1074673537574667e-05, "Pretrain/Loss": 2.00068998336792, "Pretrain/Loss (Raw)": 1.6521837711334229, "Pretrain/Step": 10751, "Pretrain/Step Time": 8.454241840168834} +{"Pretrain/Learning Rate": 2.1070481082980873e-05, "Pretrain/Loss": 1.9989302158355713, "Pretrain/Loss (Raw)": 1.8612827062606812, "Pretrain/Step": 10752, "Pretrain/Step Time": 8.450498525053263} +{"Pretrain/Learning Rate": 2.1066288741691995e-05, "Pretrain/Loss": 2.0022549629211426, "Pretrain/Loss (Raw)": 2.2930893898010254, "Pretrain/Step": 10753, "Pretrain/Step Time": 8.45463147200644} +{"Pretrain/Learning Rate": 2.1062096513828904e-05, "Pretrain/Loss": 2.0011110305786133, "Pretrain/Loss (Raw)": 1.8192274570465088, "Pretrain/Step": 10754, "Pretrain/Step Time": 8.455523755401373} +{"Pretrain/Learning Rate": 2.105790439951248e-05, "Pretrain/Loss": 2.0012402534484863, "Pretrain/Loss (Raw)": 1.8024874925613403, "Pretrain/Step": 10755, "Pretrain/Step Time": 8.460728492587805} +{"Pretrain/Learning Rate": 2.1053712398863608e-05, "Pretrain/Loss": 2.000885486602783, "Pretrain/Loss (Raw)": 1.997586727142334, "Pretrain/Step": 10756, "Pretrain/Step Time": 8.459340512752533} +{"Pretrain/Learning Rate": 2.104952051200315e-05, "Pretrain/Loss": 2.0014750957489014, "Pretrain/Loss (Raw)": 2.1519668102264404, "Pretrain/Step": 10757, "Pretrain/Step Time": 8.46054040454328} +{"Pretrain/Learning Rate": 2.1045328739051994e-05, "Pretrain/Loss": 2.002204418182373, "Pretrain/Loss (Raw)": 2.029968500137329, "Pretrain/Step": 10758, "Pretrain/Step Time": 8.464007567614317} +{"Pretrain/Learning Rate": 2.104113708013099e-05, "Pretrain/Loss": 2.0051651000976562, "Pretrain/Loss (Raw)": 2.462021589279175, "Pretrain/Step": 10759, "Pretrain/Step Time": 8.465313974767923} +{"Pretrain/Learning Rate": 2.103694553536101e-05, "Pretrain/Loss": 2.005192756652832, "Pretrain/Loss (Raw)": 1.912427544593811, "Pretrain/Step": 10760, "Pretrain/Step Time": 8.461268642917275} +{"Pretrain/Learning Rate": 2.1032754104862906e-05, "Pretrain/Loss": 2.003502368927002, "Pretrain/Loss (Raw)": 2.0350914001464844, "Pretrain/Step": 10761, "Pretrain/Step Time": 8.459306007251143} +{"Pretrain/Learning Rate": 2.1028562788757545e-05, "Pretrain/Loss": 2.0056371688842773, "Pretrain/Loss (Raw)": 2.083078384399414, "Pretrain/Step": 10762, "Pretrain/Step Time": 8.465093975886703} +{"Pretrain/Learning Rate": 2.1024371587165782e-05, "Pretrain/Loss": 2.0045433044433594, "Pretrain/Loss (Raw)": 2.0379478931427, "Pretrain/Step": 10763, "Pretrain/Step Time": 8.461232656612992} +{"Pretrain/Learning Rate": 2.1020180500208454e-05, "Pretrain/Loss": 2.0061302185058594, "Pretrain/Loss (Raw)": 2.0557990074157715, "Pretrain/Step": 10764, "Pretrain/Step Time": 8.456926198676229} +{"Pretrain/Learning Rate": 2.1015989528006417e-05, "Pretrain/Loss": 2.0063443183898926, "Pretrain/Loss (Raw)": 2.053616523742676, "Pretrain/Step": 10765, "Pretrain/Step Time": 8.46169251948595} +{"Pretrain/Learning Rate": 2.101179867068051e-05, "Pretrain/Loss": 2.0024752616882324, "Pretrain/Loss (Raw)": 1.9516359567642212, "Pretrain/Step": 10766, "Pretrain/Step Time": 8.461832851171494} +{"Pretrain/Learning Rate": 2.100760792835158e-05, "Pretrain/Loss": 2.001070737838745, "Pretrain/Loss (Raw)": 1.9685171842575073, "Pretrain/Step": 10767, "Pretrain/Step Time": 8.460820637643337} +{"Pretrain/Learning Rate": 2.1003417301140466e-05, "Pretrain/Loss": 2.003457546234131, "Pretrain/Loss (Raw)": 2.212916374206543, "Pretrain/Step": 10768, "Pretrain/Step Time": 8.453648466616869} +{"Pretrain/Learning Rate": 2.099922678916799e-05, "Pretrain/Loss": 2.0030829906463623, "Pretrain/Loss (Raw)": 1.8875635862350464, "Pretrain/Step": 10769, "Pretrain/Step Time": 8.455087823793292} +{"Pretrain/Learning Rate": 2.0995036392554993e-05, "Pretrain/Loss": 2.002424955368042, "Pretrain/Loss (Raw)": 2.0524232387542725, "Pretrain/Step": 10770, "Pretrain/Step Time": 8.456810250878334} +{"Pretrain/Learning Rate": 2.0990846111422297e-05, "Pretrain/Loss": 2.0004987716674805, "Pretrain/Loss (Raw)": 2.0385751724243164, "Pretrain/Step": 10771, "Pretrain/Step Time": 8.464460482820868} +{"Pretrain/Learning Rate": 2.0986655945890722e-05, "Pretrain/Loss": 2.0046072006225586, "Pretrain/Loss (Raw)": 2.1339564323425293, "Pretrain/Step": 10772, "Pretrain/Step Time": 8.4593516997993} +{"Pretrain/Learning Rate": 2.09824658960811e-05, "Pretrain/Loss": 2.0022244453430176, "Pretrain/Loss (Raw)": 1.9175481796264648, "Pretrain/Step": 10773, "Pretrain/Step Time": 8.458809977397323} +{"Pretrain/Learning Rate": 2.0978275962114245e-05, "Pretrain/Loss": 2.001739501953125, "Pretrain/Loss (Raw)": 2.0701980590820312, "Pretrain/Step": 10774, "Pretrain/Step Time": 8.461100434884429} +{"Pretrain/Learning Rate": 2.097408614411096e-05, "Pretrain/Loss": 2.004070520401001, "Pretrain/Loss (Raw)": 2.240502119064331, "Pretrain/Step": 10775, "Pretrain/Step Time": 8.45691004768014} +{"Pretrain/Learning Rate": 2.0969896442192066e-05, "Pretrain/Loss": 2.002990245819092, "Pretrain/Loss (Raw)": 2.000340700149536, "Pretrain/Step": 10776, "Pretrain/Step Time": 8.45509916357696} +{"Pretrain/Learning Rate": 2.0965706856478365e-05, "Pretrain/Loss": 2.002307891845703, "Pretrain/Loss (Raw)": 1.8178001642227173, "Pretrain/Step": 10777, "Pretrain/Step Time": 8.452408945187926} +{"Pretrain/Learning Rate": 2.096151738709066e-05, "Pretrain/Loss": 2.003636360168457, "Pretrain/Loss (Raw)": 2.0992000102996826, "Pretrain/Step": 10778, "Pretrain/Step Time": 8.45373178832233} +{"Pretrain/Learning Rate": 2.0957328034149763e-05, "Pretrain/Loss": 2.003781318664551, "Pretrain/Loss (Raw)": 1.9270954132080078, "Pretrain/Step": 10779, "Pretrain/Step Time": 8.451925730332732} +{"Pretrain/Learning Rate": 2.0953138797776462e-05, "Pretrain/Loss": 2.002631187438965, "Pretrain/Loss (Raw)": 1.7488937377929688, "Pretrain/Step": 10780, "Pretrain/Step Time": 8.454168958589435} +{"Pretrain/Learning Rate": 2.0948949678091544e-05, "Pretrain/Loss": 2.0004048347473145, "Pretrain/Loss (Raw)": 1.769087314605713, "Pretrain/Step": 10781, "Pretrain/Step Time": 8.453916504979134} +{"Pretrain/Learning Rate": 2.0944760675215807e-05, "Pretrain/Loss": 2.000209331512451, "Pretrain/Loss (Raw)": 1.9731602668762207, "Pretrain/Step": 10782, "Pretrain/Step Time": 8.456523422151804} +{"Pretrain/Learning Rate": 2.0940571789270038e-05, "Pretrain/Loss": 2.000042200088501, "Pretrain/Loss (Raw)": 1.8643128871917725, "Pretrain/Step": 10783, "Pretrain/Step Time": 8.456862078979611} +{"Pretrain/Learning Rate": 2.0936383020375027e-05, "Pretrain/Loss": 2.000497341156006, "Pretrain/Loss (Raw)": 2.141603946685791, "Pretrain/Step": 10784, "Pretrain/Step Time": 8.453813724219799} +{"Pretrain/Learning Rate": 2.093219436865154e-05, "Pretrain/Loss": 2.001145362854004, "Pretrain/Loss (Raw)": 2.019667387008667, "Pretrain/Step": 10785, "Pretrain/Step Time": 8.446672353893518} +{"Pretrain/Learning Rate": 2.092800583422036e-05, "Pretrain/Loss": 1.9996607303619385, "Pretrain/Loss (Raw)": 1.9952800273895264, "Pretrain/Step": 10786, "Pretrain/Step Time": 8.448906145989895} +{"Pretrain/Learning Rate": 2.0923817417202264e-05, "Pretrain/Loss": 2.0029988288879395, "Pretrain/Loss (Raw)": 2.122957706451416, "Pretrain/Step": 10787, "Pretrain/Step Time": 8.44719280488789} +{"Pretrain/Learning Rate": 2.0919629117718015e-05, "Pretrain/Loss": 2.0042953491210938, "Pretrain/Loss (Raw)": 2.2224364280700684, "Pretrain/Step": 10788, "Pretrain/Step Time": 8.447003748267889} +{"Pretrain/Learning Rate": 2.0915440935888393e-05, "Pretrain/Loss": 2.0020694732666016, "Pretrain/Loss (Raw)": 1.8748728036880493, "Pretrain/Step": 10789, "Pretrain/Step Time": 8.448126427829266} +{"Pretrain/Learning Rate": 2.091125287183415e-05, "Pretrain/Loss": 2.0018210411071777, "Pretrain/Loss (Raw)": 1.969543218612671, "Pretrain/Step": 10790, "Pretrain/Step Time": 8.450579948723316} +{"Pretrain/Learning Rate": 2.0907064925676046e-05, "Pretrain/Loss": 2.0010855197906494, "Pretrain/Loss (Raw)": 1.9136488437652588, "Pretrain/Step": 10791, "Pretrain/Step Time": 8.444546146318316} +{"Pretrain/Learning Rate": 2.090287709753484e-05, "Pretrain/Loss": 2.0011167526245117, "Pretrain/Loss (Raw)": 1.9507629871368408, "Pretrain/Step": 10792, "Pretrain/Step Time": 8.446036396548152} +{"Pretrain/Learning Rate": 2.089868938753128e-05, "Pretrain/Loss": 1.999671459197998, "Pretrain/Loss (Raw)": 2.0319807529449463, "Pretrain/Step": 10793, "Pretrain/Step Time": 8.445431228727102} +{"Pretrain/Learning Rate": 2.089450179578612e-05, "Pretrain/Loss": 1.9960970878601074, "Pretrain/Loss (Raw)": 2.0480668544769287, "Pretrain/Step": 10794, "Pretrain/Step Time": 8.4416395239532} +{"Pretrain/Learning Rate": 2.089031432242011e-05, "Pretrain/Loss": 1.9969290494918823, "Pretrain/Loss (Raw)": 2.1029157638549805, "Pretrain/Step": 10795, "Pretrain/Step Time": 8.444769717752934} +{"Pretrain/Learning Rate": 2.0886126967553993e-05, "Pretrain/Loss": 1.9985461235046387, "Pretrain/Loss (Raw)": 2.2329282760620117, "Pretrain/Step": 10796, "Pretrain/Step Time": 8.442530583590269} +{"Pretrain/Learning Rate": 2.08819397313085e-05, "Pretrain/Loss": 1.9985263347625732, "Pretrain/Loss (Raw)": 1.9710667133331299, "Pretrain/Step": 10797, "Pretrain/Step Time": 8.448222637176514} +{"Pretrain/Learning Rate": 2.0877752613804367e-05, "Pretrain/Loss": 1.9996678829193115, "Pretrain/Loss (Raw)": 2.008319139480591, "Pretrain/Step": 10798, "Pretrain/Step Time": 8.449395298957825} +{"Pretrain/Learning Rate": 2.0873565615162337e-05, "Pretrain/Loss": 2.00535249710083, "Pretrain/Loss (Raw)": 2.35390305519104, "Pretrain/Step": 10799, "Pretrain/Step Time": 8.44793777167797} +{"Pretrain/Learning Rate": 2.0869378735503133e-05, "Pretrain/Loss": 2.0037527084350586, "Pretrain/Loss (Raw)": 1.852419137954712, "Pretrain/Step": 10800, "Pretrain/Step Time": 8.45072877779603} +{"Pretrain/Learning Rate": 2.0865191974947486e-05, "Pretrain/Loss": 2.0062170028686523, "Pretrain/Loss (Raw)": 2.1580185890197754, "Pretrain/Step": 10801, "Pretrain/Step Time": 8.443026283755898} +{"Pretrain/Learning Rate": 2.086100533361611e-05, "Pretrain/Loss": 2.0068397521972656, "Pretrain/Loss (Raw)": 1.8644357919692993, "Pretrain/Step": 10802, "Pretrain/Step Time": 8.443136360496283} +{"Pretrain/Learning Rate": 2.0856818811629724e-05, "Pretrain/Loss": 2.0066757202148438, "Pretrain/Loss (Raw)": 1.8414448499679565, "Pretrain/Step": 10803, "Pretrain/Step Time": 8.450006233528256} +{"Pretrain/Learning Rate": 2.0852632409109048e-05, "Pretrain/Loss": 2.0046420097351074, "Pretrain/Loss (Raw)": 2.0596375465393066, "Pretrain/Step": 10804, "Pretrain/Step Time": 8.445881675928831} +{"Pretrain/Learning Rate": 2.084844612617479e-05, "Pretrain/Loss": 2.004973888397217, "Pretrain/Loss (Raw)": 2.013848066329956, "Pretrain/Step": 10805, "Pretrain/Step Time": 8.445112152025104} +{"Pretrain/Learning Rate": 2.084425996294767e-05, "Pretrain/Loss": 2.0060861110687256, "Pretrain/Loss (Raw)": 1.860865592956543, "Pretrain/Step": 10806, "Pretrain/Step Time": 8.44875474832952} +{"Pretrain/Learning Rate": 2.084007391954838e-05, "Pretrain/Loss": 2.0077149868011475, "Pretrain/Loss (Raw)": 2.211198091506958, "Pretrain/Step": 10807, "Pretrain/Step Time": 8.44489947333932} +{"Pretrain/Learning Rate": 2.0835887996097626e-05, "Pretrain/Loss": 2.005077838897705, "Pretrain/Loss (Raw)": 1.8129416704177856, "Pretrain/Step": 10808, "Pretrain/Step Time": 8.445439334958792} +{"Pretrain/Learning Rate": 2.0831702192716104e-05, "Pretrain/Loss": 2.0046379566192627, "Pretrain/Loss (Raw)": 1.8897061347961426, "Pretrain/Step": 10809, "Pretrain/Step Time": 8.443266211077571} +{"Pretrain/Learning Rate": 2.0827516509524515e-05, "Pretrain/Loss": 2.0042529106140137, "Pretrain/Loss (Raw)": 1.853867769241333, "Pretrain/Step": 10810, "Pretrain/Step Time": 8.447480848059058} +{"Pretrain/Learning Rate": 2.082333094664354e-05, "Pretrain/Loss": 1.999121904373169, "Pretrain/Loss (Raw)": 1.3695313930511475, "Pretrain/Step": 10811, "Pretrain/Step Time": 8.44853619299829} +{"Pretrain/Learning Rate": 2.0819145504193883e-05, "Pretrain/Loss": 2.000380039215088, "Pretrain/Loss (Raw)": 2.1870644092559814, "Pretrain/Step": 10812, "Pretrain/Step Time": 8.445198256522417} +{"Pretrain/Learning Rate": 2.081496018229621e-05, "Pretrain/Loss": 2.003385305404663, "Pretrain/Loss (Raw)": 2.0622050762176514, "Pretrain/Step": 10813, "Pretrain/Step Time": 8.439290022477508} +{"Pretrain/Learning Rate": 2.0810774981071208e-05, "Pretrain/Loss": 2.0087344646453857, "Pretrain/Loss (Raw)": 2.1124961376190186, "Pretrain/Step": 10814, "Pretrain/Step Time": 8.444301139563322} +{"Pretrain/Learning Rate": 2.080658990063956e-05, "Pretrain/Loss": 2.006553888320923, "Pretrain/Loss (Raw)": 1.7969435453414917, "Pretrain/Step": 10815, "Pretrain/Step Time": 8.439486568793654} +{"Pretrain/Learning Rate": 2.0802404941121933e-05, "Pretrain/Loss": 2.004270553588867, "Pretrain/Loss (Raw)": 1.7731776237487793, "Pretrain/Step": 10816, "Pretrain/Step Time": 8.446001715958118} +{"Pretrain/Learning Rate": 2.079822010263901e-05, "Pretrain/Loss": 2.000304698944092, "Pretrain/Loss (Raw)": 1.9650064706802368, "Pretrain/Step": 10817, "Pretrain/Step Time": 8.437325539067388} +{"Pretrain/Learning Rate": 2.079403538531144e-05, "Pretrain/Loss": 2.0018537044525146, "Pretrain/Loss (Raw)": 2.0620479583740234, "Pretrain/Step": 10818, "Pretrain/Step Time": 8.43865124695003} +{"Pretrain/Learning Rate": 2.078985078925989e-05, "Pretrain/Loss": 2.0019619464874268, "Pretrain/Loss (Raw)": 1.706407904624939, "Pretrain/Step": 10819, "Pretrain/Step Time": 8.436636285856366} +{"Pretrain/Learning Rate": 2.0785666314605035e-05, "Pretrain/Loss": 2.001269817352295, "Pretrain/Loss (Raw)": 1.9902063608169556, "Pretrain/Step": 10820, "Pretrain/Step Time": 8.43519781716168} +{"Pretrain/Learning Rate": 2.0781481961467514e-05, "Pretrain/Loss": 1.9966367483139038, "Pretrain/Loss (Raw)": 1.7367581129074097, "Pretrain/Step": 10821, "Pretrain/Step Time": 8.443123003467917} +{"Pretrain/Learning Rate": 2.0777297729967993e-05, "Pretrain/Loss": 1.9983477592468262, "Pretrain/Loss (Raw)": 2.034259557723999, "Pretrain/Step": 10822, "Pretrain/Step Time": 8.442024894058704} +{"Pretrain/Learning Rate": 2.077311362022711e-05, "Pretrain/Loss": 1.9971163272857666, "Pretrain/Loss (Raw)": 1.8446675539016724, "Pretrain/Step": 10823, "Pretrain/Step Time": 8.44253401644528} +{"Pretrain/Learning Rate": 2.0768929632365518e-05, "Pretrain/Loss": 1.9950811862945557, "Pretrain/Loss (Raw)": 1.7961128950119019, "Pretrain/Step": 10824, "Pretrain/Step Time": 8.443317577242851} +{"Pretrain/Learning Rate": 2.0764745766503856e-05, "Pretrain/Loss": 1.993967056274414, "Pretrain/Loss (Raw)": 1.9386240243911743, "Pretrain/Step": 10825, "Pretrain/Step Time": 8.441889682784677} +{"Pretrain/Learning Rate": 2.0760562022762762e-05, "Pretrain/Loss": 1.9948651790618896, "Pretrain/Loss (Raw)": 2.237121343612671, "Pretrain/Step": 10826, "Pretrain/Step Time": 8.444567387923598} +{"Pretrain/Learning Rate": 2.075637840126288e-05, "Pretrain/Loss": 1.995742678642273, "Pretrain/Loss (Raw)": 2.0588533878326416, "Pretrain/Step": 10827, "Pretrain/Step Time": 8.442615440115333} +{"Pretrain/Learning Rate": 2.0752194902124832e-05, "Pretrain/Loss": 1.9956791400909424, "Pretrain/Loss (Raw)": 2.043039321899414, "Pretrain/Step": 10828, "Pretrain/Step Time": 8.439078142866492} +{"Pretrain/Learning Rate": 2.0748011525469247e-05, "Pretrain/Loss": 1.9962310791015625, "Pretrain/Loss (Raw)": 2.03471302986145, "Pretrain/Step": 10829, "Pretrain/Step Time": 8.438168907538056} +{"Pretrain/Learning Rate": 2.0743828271416756e-05, "Pretrain/Loss": 1.9987969398498535, "Pretrain/Loss (Raw)": 2.104837656021118, "Pretrain/Step": 10830, "Pretrain/Step Time": 8.43954680301249} +{"Pretrain/Learning Rate": 2.073964514008797e-05, "Pretrain/Loss": 1.9986175298690796, "Pretrain/Loss (Raw)": 2.025604724884033, "Pretrain/Step": 10831, "Pretrain/Step Time": 8.44655434973538} +{"Pretrain/Learning Rate": 2.0735462131603524e-05, "Pretrain/Loss": 1.9989697933197021, "Pretrain/Loss (Raw)": 2.1647753715515137, "Pretrain/Step": 10832, "Pretrain/Step Time": 8.444422774016857} +{"Pretrain/Learning Rate": 2.073127924608401e-05, "Pretrain/Loss": 1.9961540699005127, "Pretrain/Loss (Raw)": 1.7561079263687134, "Pretrain/Step": 10833, "Pretrain/Step Time": 8.443334633484483} +{"Pretrain/Learning Rate": 2.072709648365006e-05, "Pretrain/Loss": 1.9943222999572754, "Pretrain/Loss (Raw)": 2.0147173404693604, "Pretrain/Step": 10834, "Pretrain/Step Time": 8.4416548255831} +{"Pretrain/Learning Rate": 2.072291384442226e-05, "Pretrain/Loss": 1.9916892051696777, "Pretrain/Loss (Raw)": 1.7203612327575684, "Pretrain/Step": 10835, "Pretrain/Step Time": 8.443742640316486} +{"Pretrain/Learning Rate": 2.071873132852123e-05, "Pretrain/Loss": 1.9906052350997925, "Pretrain/Loss (Raw)": 1.9743309020996094, "Pretrain/Step": 10836, "Pretrain/Step Time": 8.446684690192342} +{"Pretrain/Learning Rate": 2.071454893606757e-05, "Pretrain/Loss": 1.9898303747177124, "Pretrain/Loss (Raw)": 1.9670183658599854, "Pretrain/Step": 10837, "Pretrain/Step Time": 8.449005069211125} +{"Pretrain/Learning Rate": 2.071036666718186e-05, "Pretrain/Loss": 1.9902925491333008, "Pretrain/Loss (Raw)": 2.1024582386016846, "Pretrain/Step": 10838, "Pretrain/Step Time": 8.447364477440715} +{"Pretrain/Learning Rate": 2.0706184521984706e-05, "Pretrain/Loss": 1.991868019104004, "Pretrain/Loss (Raw)": 1.9646083116531372, "Pretrain/Step": 10839, "Pretrain/Step Time": 8.446093427017331} +{"Pretrain/Learning Rate": 2.0702002500596697e-05, "Pretrain/Loss": 1.990978717803955, "Pretrain/Loss (Raw)": 1.808894157409668, "Pretrain/Step": 10840, "Pretrain/Step Time": 8.450804589316249} +{"Pretrain/Learning Rate": 2.069782060313841e-05, "Pretrain/Loss": 1.9938232898712158, "Pretrain/Loss (Raw)": 2.2648403644561768, "Pretrain/Step": 10841, "Pretrain/Step Time": 8.45058529265225} +{"Pretrain/Learning Rate": 2.0693638829730434e-05, "Pretrain/Loss": 1.993943214416504, "Pretrain/Loss (Raw)": 1.8721104860305786, "Pretrain/Step": 10842, "Pretrain/Step Time": 8.446911534294486} +{"Pretrain/Learning Rate": 2.0689457180493358e-05, "Pretrain/Loss": 1.9939334392547607, "Pretrain/Loss (Raw)": 1.953306794166565, "Pretrain/Step": 10843, "Pretrain/Step Time": 8.448561649769545} +{"Pretrain/Learning Rate": 2.0685275655547738e-05, "Pretrain/Loss": 1.9920766353607178, "Pretrain/Loss (Raw)": 1.9882311820983887, "Pretrain/Step": 10844, "Pretrain/Step Time": 8.445823876187205} +{"Pretrain/Learning Rate": 2.068109425501415e-05, "Pretrain/Loss": 1.9910825490951538, "Pretrain/Loss (Raw)": 1.8664878606796265, "Pretrain/Step": 10845, "Pretrain/Step Time": 8.446216564625502} +{"Pretrain/Learning Rate": 2.0676912979013164e-05, "Pretrain/Loss": 1.9916276931762695, "Pretrain/Loss (Raw)": 2.123061180114746, "Pretrain/Step": 10846, "Pretrain/Step Time": 8.448426311835647} +{"Pretrain/Learning Rate": 2.0672731827665347e-05, "Pretrain/Loss": 1.9891515970230103, "Pretrain/Loss (Raw)": 1.8769989013671875, "Pretrain/Step": 10847, "Pretrain/Step Time": 8.449978729709983} +{"Pretrain/Learning Rate": 2.0668550801091263e-05, "Pretrain/Loss": 1.9902153015136719, "Pretrain/Loss (Raw)": 2.1703531742095947, "Pretrain/Step": 10848, "Pretrain/Step Time": 8.449292290955782} +{"Pretrain/Learning Rate": 2.0664369899411456e-05, "Pretrain/Loss": 1.9905074834823608, "Pretrain/Loss (Raw)": 2.175666332244873, "Pretrain/Step": 10849, "Pretrain/Step Time": 8.442544668912888} +{"Pretrain/Learning Rate": 2.0660189122746488e-05, "Pretrain/Loss": 1.9897817373275757, "Pretrain/Loss (Raw)": 1.8890317678451538, "Pretrain/Step": 10850, "Pretrain/Step Time": 8.444252882152796} +{"Pretrain/Learning Rate": 2.0656008471216906e-05, "Pretrain/Loss": 1.9915074110031128, "Pretrain/Loss (Raw)": 2.0895843505859375, "Pretrain/Step": 10851, "Pretrain/Step Time": 8.44361563026905} +{"Pretrain/Learning Rate": 2.065182794494326e-05, "Pretrain/Loss": 1.9924217462539673, "Pretrain/Loss (Raw)": 2.148141860961914, "Pretrain/Step": 10852, "Pretrain/Step Time": 8.444249054417014} +{"Pretrain/Learning Rate": 2.0647647544046088e-05, "Pretrain/Loss": 1.9950313568115234, "Pretrain/Loss (Raw)": 2.23624587059021, "Pretrain/Step": 10853, "Pretrain/Step Time": 8.450068486854434} +{"Pretrain/Learning Rate": 2.064346726864593e-05, "Pretrain/Loss": 1.9932687282562256, "Pretrain/Loss (Raw)": 1.8484950065612793, "Pretrain/Step": 10854, "Pretrain/Step Time": 8.445208799093962} +{"Pretrain/Learning Rate": 2.0639287118863326e-05, "Pretrain/Loss": 1.9916740655899048, "Pretrain/Loss (Raw)": 1.9705705642700195, "Pretrain/Step": 10855, "Pretrain/Step Time": 8.449860455468297} +{"Pretrain/Learning Rate": 2.06351070948188e-05, "Pretrain/Loss": 1.9891352653503418, "Pretrain/Loss (Raw)": 1.9063405990600586, "Pretrain/Step": 10856, "Pretrain/Step Time": 8.447738159447908} +{"Pretrain/Learning Rate": 2.0630927196632888e-05, "Pretrain/Loss": 1.9892536401748657, "Pretrain/Loss (Raw)": 1.9441856145858765, "Pretrain/Step": 10857, "Pretrain/Step Time": 8.44774455577135} +{"Pretrain/Learning Rate": 2.062674742442611e-05, "Pretrain/Loss": 1.9903221130371094, "Pretrain/Loss (Raw)": 2.0063772201538086, "Pretrain/Step": 10858, "Pretrain/Step Time": 8.453399684280157} +{"Pretrain/Learning Rate": 2.0622567778318986e-05, "Pretrain/Loss": 1.9902420043945312, "Pretrain/Loss (Raw)": 2.0171616077423096, "Pretrain/Step": 10859, "Pretrain/Step Time": 8.442349836230278} +{"Pretrain/Learning Rate": 2.0618388258432032e-05, "Pretrain/Loss": 1.992020606994629, "Pretrain/Loss (Raw)": 2.223393678665161, "Pretrain/Step": 10860, "Pretrain/Step Time": 8.443665036931634} +{"Pretrain/Learning Rate": 2.0614208864885764e-05, "Pretrain/Loss": 1.9902082681655884, "Pretrain/Loss (Raw)": 1.8916685581207275, "Pretrain/Step": 10861, "Pretrain/Step Time": 8.44327231682837} +{"Pretrain/Learning Rate": 2.061002959780069e-05, "Pretrain/Loss": 1.9889652729034424, "Pretrain/Loss (Raw)": 1.7720533609390259, "Pretrain/Step": 10862, "Pretrain/Step Time": 8.446907348930836} +{"Pretrain/Learning Rate": 2.0605850457297325e-05, "Pretrain/Loss": 1.987636923789978, "Pretrain/Loss (Raw)": 1.8213303089141846, "Pretrain/Step": 10863, "Pretrain/Step Time": 8.451745746657252} +{"Pretrain/Learning Rate": 2.060167144349616e-05, "Pretrain/Loss": 1.9879181385040283, "Pretrain/Loss (Raw)": 1.9701379537582397, "Pretrain/Step": 10864, "Pretrain/Step Time": 8.451092852279544} +{"Pretrain/Learning Rate": 2.0597492556517697e-05, "Pretrain/Loss": 1.9896619319915771, "Pretrain/Loss (Raw)": 2.1088645458221436, "Pretrain/Step": 10865, "Pretrain/Step Time": 8.452902175486088} +{"Pretrain/Learning Rate": 2.059331379648243e-05, "Pretrain/Loss": 1.9895449876785278, "Pretrain/Loss (Raw)": 1.967417597770691, "Pretrain/Step": 10866, "Pretrain/Step Time": 8.453386532142758} +{"Pretrain/Learning Rate": 2.058913516351086e-05, "Pretrain/Loss": 1.9897258281707764, "Pretrain/Loss (Raw)": 2.01926589012146, "Pretrain/Step": 10867, "Pretrain/Step Time": 8.446898246183991} +{"Pretrain/Learning Rate": 2.058495665772347e-05, "Pretrain/Loss": 1.9908956289291382, "Pretrain/Loss (Raw)": 2.197376012802124, "Pretrain/Step": 10868, "Pretrain/Step Time": 8.447961401194334} +{"Pretrain/Learning Rate": 2.0580778279240733e-05, "Pretrain/Loss": 1.988487720489502, "Pretrain/Loss (Raw)": 1.6844666004180908, "Pretrain/Step": 10869, "Pretrain/Step Time": 8.448360703885555} +{"Pretrain/Learning Rate": 2.0576600028183143e-05, "Pretrain/Loss": 1.9875041246414185, "Pretrain/Loss (Raw)": 1.9220894575119019, "Pretrain/Step": 10870, "Pretrain/Step Time": 8.451018953695893} +{"Pretrain/Learning Rate": 2.057242190467117e-05, "Pretrain/Loss": 1.98797607421875, "Pretrain/Loss (Raw)": 2.014859914779663, "Pretrain/Step": 10871, "Pretrain/Step Time": 8.448997551575303} +{"Pretrain/Learning Rate": 2.0568243908825293e-05, "Pretrain/Loss": 1.9875435829162598, "Pretrain/Loss (Raw)": 1.822575330734253, "Pretrain/Step": 10872, "Pretrain/Step Time": 8.45220904611051} +{"Pretrain/Learning Rate": 2.0564066040765987e-05, "Pretrain/Loss": 1.9889880418777466, "Pretrain/Loss (Raw)": 2.2138965129852295, "Pretrain/Step": 10873, "Pretrain/Step Time": 8.446217950433493} +{"Pretrain/Learning Rate": 2.0559888300613704e-05, "Pretrain/Loss": 1.987678050994873, "Pretrain/Loss (Raw)": 1.9360272884368896, "Pretrain/Step": 10874, "Pretrain/Step Time": 8.444661136716604} +{"Pretrain/Learning Rate": 2.055571068848891e-05, "Pretrain/Loss": 1.9875073432922363, "Pretrain/Loss (Raw)": 1.98896324634552, "Pretrain/Step": 10875, "Pretrain/Step Time": 8.441901583224535} +{"Pretrain/Learning Rate": 2.0551533204512068e-05, "Pretrain/Loss": 1.9874415397644043, "Pretrain/Loss (Raw)": 1.9675157070159912, "Pretrain/Step": 10876, "Pretrain/Step Time": 8.44311628676951} +{"Pretrain/Learning Rate": 2.0547355848803625e-05, "Pretrain/Loss": 1.9878240823745728, "Pretrain/Loss (Raw)": 2.041583299636841, "Pretrain/Step": 10877, "Pretrain/Step Time": 8.44470757059753} +{"Pretrain/Learning Rate": 2.0543178621484038e-05, "Pretrain/Loss": 1.9867115020751953, "Pretrain/Loss (Raw)": 1.7356112003326416, "Pretrain/Step": 10878, "Pretrain/Step Time": 8.442658314481378} +{"Pretrain/Learning Rate": 2.0539001522673752e-05, "Pretrain/Loss": 1.9912132024765015, "Pretrain/Loss (Raw)": 2.228391408920288, "Pretrain/Step": 10879, "Pretrain/Step Time": 8.444623051211238} +{"Pretrain/Learning Rate": 2.0534824552493216e-05, "Pretrain/Loss": 1.992763876914978, "Pretrain/Loss (Raw)": 2.059767723083496, "Pretrain/Step": 10880, "Pretrain/Step Time": 8.444473017007113} +{"Pretrain/Learning Rate": 2.053064771106287e-05, "Pretrain/Loss": 1.9908850193023682, "Pretrain/Loss (Raw)": 2.0526156425476074, "Pretrain/Step": 10881, "Pretrain/Step Time": 8.442548457533121} +{"Pretrain/Learning Rate": 2.052647099850314e-05, "Pretrain/Loss": 1.9924030303955078, "Pretrain/Loss (Raw)": 2.0135061740875244, "Pretrain/Step": 10882, "Pretrain/Step Time": 8.442506270483136} +{"Pretrain/Learning Rate": 2.0522294414934467e-05, "Pretrain/Loss": 1.994704246520996, "Pretrain/Loss (Raw)": 2.0970458984375, "Pretrain/Step": 10883, "Pretrain/Step Time": 8.438006846234202} +{"Pretrain/Learning Rate": 2.0518117960477275e-05, "Pretrain/Loss": 1.9942303895950317, "Pretrain/Loss (Raw)": 1.9369442462921143, "Pretrain/Step": 10884, "Pretrain/Step Time": 8.43879826925695} +{"Pretrain/Learning Rate": 2.0513941635251995e-05, "Pretrain/Loss": 1.992584466934204, "Pretrain/Loss (Raw)": 1.9412885904312134, "Pretrain/Step": 10885, "Pretrain/Step Time": 8.436340592801571} +{"Pretrain/Learning Rate": 2.0509765439379052e-05, "Pretrain/Loss": 1.9940043687820435, "Pretrain/Loss (Raw)": 2.2117035388946533, "Pretrain/Step": 10886, "Pretrain/Step Time": 8.441139483824372} +{"Pretrain/Learning Rate": 2.0505589372978848e-05, "Pretrain/Loss": 1.9912775754928589, "Pretrain/Loss (Raw)": 2.1130077838897705, "Pretrain/Step": 10887, "Pretrain/Step Time": 8.440867071971297} +{"Pretrain/Learning Rate": 2.0501413436171805e-05, "Pretrain/Loss": 1.992281198501587, "Pretrain/Loss (Raw)": 2.040902614593506, "Pretrain/Step": 10888, "Pretrain/Step Time": 8.443073533475399} +{"Pretrain/Learning Rate": 2.0497237629078338e-05, "Pretrain/Loss": 1.9923646450042725, "Pretrain/Loss (Raw)": 2.045755624771118, "Pretrain/Step": 10889, "Pretrain/Step Time": 8.440705170854926} +{"Pretrain/Learning Rate": 2.049306195181885e-05, "Pretrain/Loss": 1.9918015003204346, "Pretrain/Loss (Raw)": 2.0109899044036865, "Pretrain/Step": 10890, "Pretrain/Step Time": 8.436170747503638} +{"Pretrain/Learning Rate": 2.0488886404513745e-05, "Pretrain/Loss": 1.9899518489837646, "Pretrain/Loss (Raw)": 1.8012036085128784, "Pretrain/Step": 10891, "Pretrain/Step Time": 8.440969632938504} +{"Pretrain/Learning Rate": 2.048471098728342e-05, "Pretrain/Loss": 1.9886409044265747, "Pretrain/Loss (Raw)": 1.8880043029785156, "Pretrain/Step": 10892, "Pretrain/Step Time": 8.443361880257726} +{"Pretrain/Learning Rate": 2.0480535700248267e-05, "Pretrain/Loss": 1.9894715547561646, "Pretrain/Loss (Raw)": 2.1599340438842773, "Pretrain/Step": 10893, "Pretrain/Step Time": 8.443096539005637} +{"Pretrain/Learning Rate": 2.0476360543528682e-05, "Pretrain/Loss": 1.989344835281372, "Pretrain/Loss (Raw)": 1.9354029893875122, "Pretrain/Step": 10894, "Pretrain/Step Time": 8.440279262140393} +{"Pretrain/Learning Rate": 2.0472185517245053e-05, "Pretrain/Loss": 1.9895652532577515, "Pretrain/Loss (Raw)": 1.9967412948608398, "Pretrain/Step": 10895, "Pretrain/Step Time": 8.442757410928607} +{"Pretrain/Learning Rate": 2.0468010621517766e-05, "Pretrain/Loss": 1.9860575199127197, "Pretrain/Loss (Raw)": 1.7639378309249878, "Pretrain/Step": 10896, "Pretrain/Step Time": 8.450203960761428} +{"Pretrain/Learning Rate": 2.0463835856467195e-05, "Pretrain/Loss": 1.984995722770691, "Pretrain/Loss (Raw)": 1.7516469955444336, "Pretrain/Step": 10897, "Pretrain/Step Time": 8.449284808710217} +{"Pretrain/Learning Rate": 2.0459661222213717e-05, "Pretrain/Loss": 1.9854544401168823, "Pretrain/Loss (Raw)": 2.1111228466033936, "Pretrain/Step": 10898, "Pretrain/Step Time": 8.444653565064073} +{"Pretrain/Learning Rate": 2.045548671887771e-05, "Pretrain/Loss": 1.9842965602874756, "Pretrain/Loss (Raw)": 1.8903776407241821, "Pretrain/Step": 10899, "Pretrain/Step Time": 8.442557210102677} +{"Pretrain/Learning Rate": 2.0451312346579537e-05, "Pretrain/Loss": 1.9832866191864014, "Pretrain/Loss (Raw)": 2.004687786102295, "Pretrain/Step": 10900, "Pretrain/Step Time": 8.443993166089058} +{"Pretrain/Learning Rate": 2.044713810543957e-05, "Pretrain/Loss": 1.9840155839920044, "Pretrain/Loss (Raw)": 2.0108494758605957, "Pretrain/Step": 10901, "Pretrain/Step Time": 8.444778146222234} +{"Pretrain/Learning Rate": 2.044296399557816e-05, "Pretrain/Loss": 1.9829738140106201, "Pretrain/Loss (Raw)": 1.9368386268615723, "Pretrain/Step": 10902, "Pretrain/Step Time": 8.444614263251424} +{"Pretrain/Learning Rate": 2.0438790017115677e-05, "Pretrain/Loss": 1.9812815189361572, "Pretrain/Loss (Raw)": 2.023902654647827, "Pretrain/Step": 10903, "Pretrain/Step Time": 8.446087408810854} +{"Pretrain/Learning Rate": 2.0434616170172466e-05, "Pretrain/Loss": 1.9806239604949951, "Pretrain/Loss (Raw)": 1.9161888360977173, "Pretrain/Step": 10904, "Pretrain/Step Time": 8.44677259027958} +{"Pretrain/Learning Rate": 2.0430442454868875e-05, "Pretrain/Loss": 1.9815341234207153, "Pretrain/Loss (Raw)": 1.9342904090881348, "Pretrain/Step": 10905, "Pretrain/Step Time": 8.445224415510893} +{"Pretrain/Learning Rate": 2.042626887132526e-05, "Pretrain/Loss": 1.9801385402679443, "Pretrain/Loss (Raw)": 1.9205604791641235, "Pretrain/Step": 10906, "Pretrain/Step Time": 8.448394313454628} +{"Pretrain/Learning Rate": 2.042209541966196e-05, "Pretrain/Loss": 1.9810078144073486, "Pretrain/Loss (Raw)": 2.038356065750122, "Pretrain/Step": 10907, "Pretrain/Step Time": 8.453046947717667} +{"Pretrain/Learning Rate": 2.0417922099999307e-05, "Pretrain/Loss": 1.9847406148910522, "Pretrain/Loss (Raw)": 2.226700782775879, "Pretrain/Step": 10908, "Pretrain/Step Time": 8.450367722660303} +{"Pretrain/Learning Rate": 2.041374891245764e-05, "Pretrain/Loss": 1.984736680984497, "Pretrain/Loss (Raw)": 1.7685778141021729, "Pretrain/Step": 10909, "Pretrain/Step Time": 8.451545370742679} +{"Pretrain/Learning Rate": 2.0409575857157288e-05, "Pretrain/Loss": 1.9854602813720703, "Pretrain/Loss (Raw)": 2.065778970718384, "Pretrain/Step": 10910, "Pretrain/Step Time": 8.450383242219687} +{"Pretrain/Learning Rate": 2.0405402934218582e-05, "Pretrain/Loss": 1.985365867614746, "Pretrain/Loss (Raw)": 1.8522387742996216, "Pretrain/Step": 10911, "Pretrain/Step Time": 8.451763935387135} +{"Pretrain/Learning Rate": 2.0401230143761853e-05, "Pretrain/Loss": 1.9837708473205566, "Pretrain/Loss (Raw)": 1.9374428987503052, "Pretrain/Step": 10912, "Pretrain/Step Time": 8.45217197574675} +{"Pretrain/Learning Rate": 2.0397057485907396e-05, "Pretrain/Loss": 1.9856102466583252, "Pretrain/Loss (Raw)": 2.2551016807556152, "Pretrain/Step": 10913, "Pretrain/Step Time": 8.452236142009497} +{"Pretrain/Learning Rate": 2.039288496077555e-05, "Pretrain/Loss": 1.9855356216430664, "Pretrain/Loss (Raw)": 1.985710859298706, "Pretrain/Step": 10914, "Pretrain/Step Time": 8.448843309655786} +{"Pretrain/Learning Rate": 2.0388712568486616e-05, "Pretrain/Loss": 1.9840991497039795, "Pretrain/Loss (Raw)": 1.93909752368927, "Pretrain/Step": 10915, "Pretrain/Step Time": 8.459410754963756} +{"Pretrain/Learning Rate": 2.03845403091609e-05, "Pretrain/Loss": 1.9827017784118652, "Pretrain/Loss (Raw)": 2.0435791015625, "Pretrain/Step": 10916, "Pretrain/Step Time": 8.454827465116978} +{"Pretrain/Learning Rate": 2.038036818291872e-05, "Pretrain/Loss": 1.9833636283874512, "Pretrain/Loss (Raw)": 1.959610104560852, "Pretrain/Step": 10917, "Pretrain/Step Time": 8.45370352268219} +{"Pretrain/Learning Rate": 2.037619618988036e-05, "Pretrain/Loss": 1.983243465423584, "Pretrain/Loss (Raw)": 1.9541290998458862, "Pretrain/Step": 10918, "Pretrain/Step Time": 8.454040795564651} +{"Pretrain/Learning Rate": 2.0372024330166124e-05, "Pretrain/Loss": 1.980912685394287, "Pretrain/Loss (Raw)": 1.6153225898742676, "Pretrain/Step": 10919, "Pretrain/Step Time": 8.457139793783426} +{"Pretrain/Learning Rate": 2.0367852603896308e-05, "Pretrain/Loss": 1.980010986328125, "Pretrain/Loss (Raw)": 1.835365891456604, "Pretrain/Step": 10920, "Pretrain/Step Time": 8.455718781799078} +{"Pretrain/Learning Rate": 2.036368101119119e-05, "Pretrain/Loss": 1.980727195739746, "Pretrain/Loss (Raw)": 2.123645782470703, "Pretrain/Step": 10921, "Pretrain/Step Time": 8.452645217999816} +{"Pretrain/Learning Rate": 2.035950955217107e-05, "Pretrain/Loss": 1.9793387651443481, "Pretrain/Loss (Raw)": 1.870335578918457, "Pretrain/Step": 10922, "Pretrain/Step Time": 8.4528115298599} +{"Pretrain/Learning Rate": 2.0355338226956216e-05, "Pretrain/Loss": 1.9782869815826416, "Pretrain/Loss (Raw)": 1.96829092502594, "Pretrain/Step": 10923, "Pretrain/Step Time": 8.450816502794623} +{"Pretrain/Learning Rate": 2.0351167035666906e-05, "Pretrain/Loss": 1.974125623703003, "Pretrain/Loss (Raw)": 1.700265884399414, "Pretrain/Step": 10924, "Pretrain/Step Time": 8.455261724069715} +{"Pretrain/Learning Rate": 2.034699597842342e-05, "Pretrain/Loss": 1.9734320640563965, "Pretrain/Loss (Raw)": 1.882295846939087, "Pretrain/Step": 10925, "Pretrain/Step Time": 8.45059566758573} +{"Pretrain/Learning Rate": 2.034282505534603e-05, "Pretrain/Loss": 1.9731131792068481, "Pretrain/Loss (Raw)": 1.9675031900405884, "Pretrain/Step": 10926, "Pretrain/Step Time": 8.451581940054893} +{"Pretrain/Learning Rate": 2.0338654266554997e-05, "Pretrain/Loss": 1.9698494672775269, "Pretrain/Loss (Raw)": 1.9361536502838135, "Pretrain/Step": 10927, "Pretrain/Step Time": 8.454890048131347} +{"Pretrain/Learning Rate": 2.0334483612170576e-05, "Pretrain/Loss": 1.9709386825561523, "Pretrain/Loss (Raw)": 1.9918509721755981, "Pretrain/Step": 10928, "Pretrain/Step Time": 8.454448573291302} +{"Pretrain/Learning Rate": 2.033031309231303e-05, "Pretrain/Loss": 1.971193552017212, "Pretrain/Loss (Raw)": 2.190622568130493, "Pretrain/Step": 10929, "Pretrain/Step Time": 8.456159679219127} +{"Pretrain/Learning Rate": 2.0326142707102616e-05, "Pretrain/Loss": 1.9690897464752197, "Pretrain/Loss (Raw)": 1.595138669013977, "Pretrain/Step": 10930, "Pretrain/Step Time": 8.45181174762547} +{"Pretrain/Learning Rate": 2.032197245665958e-05, "Pretrain/Loss": 1.9700937271118164, "Pretrain/Loss (Raw)": 1.9699616432189941, "Pretrain/Step": 10931, "Pretrain/Step Time": 8.450388694182038} +{"Pretrain/Learning Rate": 2.0317802341104182e-05, "Pretrain/Loss": 1.9703024625778198, "Pretrain/Loss (Raw)": 2.086366891860962, "Pretrain/Step": 10932, "Pretrain/Step Time": 8.454651098698378} +{"Pretrain/Learning Rate": 2.0313632360556642e-05, "Pretrain/Loss": 1.9731426239013672, "Pretrain/Loss (Raw)": 2.377380847930908, "Pretrain/Step": 10933, "Pretrain/Step Time": 8.458459813147783} +{"Pretrain/Learning Rate": 2.030946251513721e-05, "Pretrain/Loss": 1.97065007686615, "Pretrain/Loss (Raw)": 1.5418238639831543, "Pretrain/Step": 10934, "Pretrain/Step Time": 8.453192809596658} +{"Pretrain/Learning Rate": 2.030529280496612e-05, "Pretrain/Loss": 1.968040943145752, "Pretrain/Loss (Raw)": 1.8772292137145996, "Pretrain/Step": 10935, "Pretrain/Step Time": 8.454325368627906} +{"Pretrain/Learning Rate": 2.0301123230163603e-05, "Pretrain/Loss": 1.9695632457733154, "Pretrain/Loss (Raw)": 2.007805347442627, "Pretrain/Step": 10936, "Pretrain/Step Time": 8.454330226406455} +{"Pretrain/Learning Rate": 2.0296953790849893e-05, "Pretrain/Loss": 1.966667652130127, "Pretrain/Loss (Raw)": 1.5190545320510864, "Pretrain/Step": 10937, "Pretrain/Step Time": 8.457414941862226} +{"Pretrain/Learning Rate": 2.0292784487145195e-05, "Pretrain/Loss": 1.9689898490905762, "Pretrain/Loss (Raw)": 2.151103973388672, "Pretrain/Step": 10938, "Pretrain/Step Time": 8.450560374185443} +{"Pretrain/Learning Rate": 2.028861531916974e-05, "Pretrain/Loss": 1.97443425655365, "Pretrain/Loss (Raw)": 2.0664260387420654, "Pretrain/Step": 10939, "Pretrain/Step Time": 8.45137787424028} +{"Pretrain/Learning Rate": 2.028444628704374e-05, "Pretrain/Loss": 1.9738473892211914, "Pretrain/Loss (Raw)": 2.1119580268859863, "Pretrain/Step": 10940, "Pretrain/Step Time": 8.453007562085986} +{"Pretrain/Learning Rate": 2.028027739088741e-05, "Pretrain/Loss": 1.9728143215179443, "Pretrain/Loss (Raw)": 1.929970622062683, "Pretrain/Step": 10941, "Pretrain/Step Time": 8.455605782568455} +{"Pretrain/Learning Rate": 2.027610863082095e-05, "Pretrain/Loss": 1.971233606338501, "Pretrain/Loss (Raw)": 1.910168170928955, "Pretrain/Step": 10942, "Pretrain/Step Time": 8.453056087717414} +{"Pretrain/Learning Rate": 2.0271940006964577e-05, "Pretrain/Loss": 1.9715604782104492, "Pretrain/Loss (Raw)": 1.8387656211853027, "Pretrain/Step": 10943, "Pretrain/Step Time": 8.453761586919427} +{"Pretrain/Learning Rate": 2.0267771519438472e-05, "Pretrain/Loss": 1.9742181301116943, "Pretrain/Loss (Raw)": 2.113365411758423, "Pretrain/Step": 10944, "Pretrain/Step Time": 8.454001169651747} +{"Pretrain/Learning Rate": 2.026360316836284e-05, "Pretrain/Loss": 1.974872350692749, "Pretrain/Loss (Raw)": 2.048741579055786, "Pretrain/Step": 10945, "Pretrain/Step Time": 8.454948529601097} +{"Pretrain/Learning Rate": 2.0259434953857874e-05, "Pretrain/Loss": 1.9746240377426147, "Pretrain/Loss (Raw)": 2.030266046524048, "Pretrain/Step": 10946, "Pretrain/Step Time": 8.452463783323765} +{"Pretrain/Learning Rate": 2.0255266876043757e-05, "Pretrain/Loss": 1.9768905639648438, "Pretrain/Loss (Raw)": 1.9965070486068726, "Pretrain/Step": 10947, "Pretrain/Step Time": 8.454685280099511} +{"Pretrain/Learning Rate": 2.025109893504068e-05, "Pretrain/Loss": 1.9759018421173096, "Pretrain/Loss (Raw)": 1.8636722564697266, "Pretrain/Step": 10948, "Pretrain/Step Time": 8.455537619069219} +{"Pretrain/Learning Rate": 2.0246931130968816e-05, "Pretrain/Loss": 1.9777839183807373, "Pretrain/Loss (Raw)": 1.9776668548583984, "Pretrain/Step": 10949, "Pretrain/Step Time": 8.44928483106196} +{"Pretrain/Learning Rate": 2.024276346394834e-05, "Pretrain/Loss": 1.9769306182861328, "Pretrain/Loss (Raw)": 1.925022840499878, "Pretrain/Step": 10950, "Pretrain/Step Time": 8.451609821990132} +{"Pretrain/Learning Rate": 2.0238595934099423e-05, "Pretrain/Loss": 1.9787472486495972, "Pretrain/Loss (Raw)": 2.0771970748901367, "Pretrain/Step": 10951, "Pretrain/Step Time": 8.44930474087596} +{"Pretrain/Learning Rate": 2.0234428541542238e-05, "Pretrain/Loss": 1.9808930158615112, "Pretrain/Loss (Raw)": 2.0707781314849854, "Pretrain/Step": 10952, "Pretrain/Step Time": 8.451134890317917} +{"Pretrain/Learning Rate": 2.0230261286396952e-05, "Pretrain/Loss": 1.9827324151992798, "Pretrain/Loss (Raw)": 2.1740641593933105, "Pretrain/Step": 10953, "Pretrain/Step Time": 8.452907804399729} +{"Pretrain/Learning Rate": 2.022609416878371e-05, "Pretrain/Loss": 1.979051113128662, "Pretrain/Loss (Raw)": 1.7659262418746948, "Pretrain/Step": 10954, "Pretrain/Step Time": 8.454304484650493} +{"Pretrain/Learning Rate": 2.0221927188822683e-05, "Pretrain/Loss": 1.9806857109069824, "Pretrain/Loss (Raw)": 2.268059492111206, "Pretrain/Step": 10955, "Pretrain/Step Time": 8.453163018450141} +{"Pretrain/Learning Rate": 2.0217760346634016e-05, "Pretrain/Loss": 1.9798450469970703, "Pretrain/Loss (Raw)": 1.9354485273361206, "Pretrain/Step": 10956, "Pretrain/Step Time": 8.455237625166774} +{"Pretrain/Learning Rate": 2.0213593642337854e-05, "Pretrain/Loss": 1.9797475337982178, "Pretrain/Loss (Raw)": 2.0222415924072266, "Pretrain/Step": 10957, "Pretrain/Step Time": 8.458659328520298} +{"Pretrain/Learning Rate": 2.020942707605436e-05, "Pretrain/Loss": 1.978248119354248, "Pretrain/Loss (Raw)": 1.9129068851470947, "Pretrain/Step": 10958, "Pretrain/Step Time": 8.45670548081398} +{"Pretrain/Learning Rate": 2.0205260647903648e-05, "Pretrain/Loss": 1.9776949882507324, "Pretrain/Loss (Raw)": 1.9547920227050781, "Pretrain/Step": 10959, "Pretrain/Step Time": 8.452917993068695} +{"Pretrain/Learning Rate": 2.020109435800587e-05, "Pretrain/Loss": 1.975642204284668, "Pretrain/Loss (Raw)": 1.9020224809646606, "Pretrain/Step": 10960, "Pretrain/Step Time": 8.451568650081754} +{"Pretrain/Learning Rate": 2.0196928206481147e-05, "Pretrain/Loss": 1.9778361320495605, "Pretrain/Loss (Raw)": 2.0369272232055664, "Pretrain/Step": 10961, "Pretrain/Step Time": 8.451914904639125} +{"Pretrain/Learning Rate": 2.0192762193449617e-05, "Pretrain/Loss": 1.9757611751556396, "Pretrain/Loss (Raw)": 1.7491422891616821, "Pretrain/Step": 10962, "Pretrain/Step Time": 8.454048899933696} +{"Pretrain/Learning Rate": 2.0188596319031393e-05, "Pretrain/Loss": 1.9783201217651367, "Pretrain/Loss (Raw)": 2.047893524169922, "Pretrain/Step": 10963, "Pretrain/Step Time": 8.454490220174193} +{"Pretrain/Learning Rate": 2.018443058334661e-05, "Pretrain/Loss": 1.9769083261489868, "Pretrain/Loss (Raw)": 1.793618083000183, "Pretrain/Step": 10964, "Pretrain/Step Time": 8.452773600816727} +{"Pretrain/Learning Rate": 2.0180264986515376e-05, "Pretrain/Loss": 1.9773898124694824, "Pretrain/Loss (Raw)": 2.028641700744629, "Pretrain/Step": 10965, "Pretrain/Step Time": 8.447770645841956} +{"Pretrain/Learning Rate": 2.01760995286578e-05, "Pretrain/Loss": 1.9767134189605713, "Pretrain/Loss (Raw)": 2.015876531600952, "Pretrain/Step": 10966, "Pretrain/Step Time": 8.452642939984798} +{"Pretrain/Learning Rate": 2.0171934209893994e-05, "Pretrain/Loss": 1.9768660068511963, "Pretrain/Loss (Raw)": 1.9841411113739014, "Pretrain/Step": 10967, "Pretrain/Step Time": 8.454752942547202} +{"Pretrain/Learning Rate": 2.0167769030344063e-05, "Pretrain/Loss": 1.9770745038986206, "Pretrain/Loss (Raw)": 1.835588812828064, "Pretrain/Step": 10968, "Pretrain/Step Time": 8.455009585246444} +{"Pretrain/Learning Rate": 2.01636039901281e-05, "Pretrain/Loss": 1.974428653717041, "Pretrain/Loss (Raw)": 1.9261623620986938, "Pretrain/Step": 10969, "Pretrain/Step Time": 8.448333775624633} +{"Pretrain/Learning Rate": 2.0159439089366213e-05, "Pretrain/Loss": 1.97539222240448, "Pretrain/Loss (Raw)": 1.9954564571380615, "Pretrain/Step": 10970, "Pretrain/Step Time": 8.45377621985972} +{"Pretrain/Learning Rate": 2.0155274328178493e-05, "Pretrain/Loss": 1.975917935371399, "Pretrain/Loss (Raw)": 2.0205936431884766, "Pretrain/Step": 10971, "Pretrain/Step Time": 8.44940746948123} +{"Pretrain/Learning Rate": 2.015110970668501e-05, "Pretrain/Loss": 1.9758275747299194, "Pretrain/Loss (Raw)": 1.976672649383545, "Pretrain/Step": 10972, "Pretrain/Step Time": 8.451103264465928} +{"Pretrain/Learning Rate": 2.0146945225005868e-05, "Pretrain/Loss": 1.9765474796295166, "Pretrain/Loss (Raw)": 1.9586435556411743, "Pretrain/Step": 10973, "Pretrain/Step Time": 8.45113867148757} +{"Pretrain/Learning Rate": 2.0142780883261134e-05, "Pretrain/Loss": 1.9731948375701904, "Pretrain/Loss (Raw)": 1.6939111948013306, "Pretrain/Step": 10974, "Pretrain/Step Time": 8.447591682896018} +{"Pretrain/Learning Rate": 2.013861668157089e-05, "Pretrain/Loss": 1.9727689027786255, "Pretrain/Loss (Raw)": 1.8224703073501587, "Pretrain/Step": 10975, "Pretrain/Step Time": 8.450035031884909} +{"Pretrain/Learning Rate": 2.0134452620055213e-05, "Pretrain/Loss": 1.9704214334487915, "Pretrain/Loss (Raw)": 1.8698840141296387, "Pretrain/Step": 10976, "Pretrain/Step Time": 8.446251962333918} +{"Pretrain/Learning Rate": 2.013028869883416e-05, "Pretrain/Loss": 1.9695141315460205, "Pretrain/Loss (Raw)": 2.059535503387451, "Pretrain/Step": 10977, "Pretrain/Step Time": 8.452352922409773} +{"Pretrain/Learning Rate": 2.01261249180278e-05, "Pretrain/Loss": 1.9713718891143799, "Pretrain/Loss (Raw)": 2.1268298625946045, "Pretrain/Step": 10978, "Pretrain/Step Time": 8.45149813592434} +{"Pretrain/Learning Rate": 2.012196127775619e-05, "Pretrain/Loss": 1.9697680473327637, "Pretrain/Loss (Raw)": 1.8842840194702148, "Pretrain/Step": 10979, "Pretrain/Step Time": 8.455206295475364} +{"Pretrain/Learning Rate": 2.011779777813939e-05, "Pretrain/Loss": 1.968942403793335, "Pretrain/Loss (Raw)": 2.042459726333618, "Pretrain/Step": 10980, "Pretrain/Step Time": 8.455031119287014} +{"Pretrain/Learning Rate": 2.0113634419297453e-05, "Pretrain/Loss": 1.9677410125732422, "Pretrain/Loss (Raw)": 2.082468271255493, "Pretrain/Step": 10981, "Pretrain/Step Time": 8.450511997565627} +{"Pretrain/Learning Rate": 2.010947120135042e-05, "Pretrain/Loss": 1.9702813625335693, "Pretrain/Loss (Raw)": 2.173670768737793, "Pretrain/Step": 10982, "Pretrain/Step Time": 8.450772877782583} +{"Pretrain/Learning Rate": 2.0105308124418336e-05, "Pretrain/Loss": 1.9700586795806885, "Pretrain/Loss (Raw)": 1.942054033279419, "Pretrain/Step": 10983, "Pretrain/Step Time": 8.448179760947824} +{"Pretrain/Learning Rate": 2.010114518862124e-05, "Pretrain/Loss": 1.9704889059066772, "Pretrain/Loss (Raw)": 1.9614064693450928, "Pretrain/Step": 10984, "Pretrain/Step Time": 8.452165510505438} +{"Pretrain/Learning Rate": 2.009698239407917e-05, "Pretrain/Loss": 1.9692175388336182, "Pretrain/Loss (Raw)": 1.7814675569534302, "Pretrain/Step": 10985, "Pretrain/Step Time": 8.452109929174185} +{"Pretrain/Learning Rate": 2.009281974091216e-05, "Pretrain/Loss": 1.9683325290679932, "Pretrain/Loss (Raw)": 1.893093466758728, "Pretrain/Step": 10986, "Pretrain/Step Time": 8.450432479381561} +{"Pretrain/Learning Rate": 2.0088657229240233e-05, "Pretrain/Loss": 1.9692436456680298, "Pretrain/Loss (Raw)": 2.1337730884552, "Pretrain/Step": 10987, "Pretrain/Step Time": 8.450914569199085} +{"Pretrain/Learning Rate": 2.008449485918341e-05, "Pretrain/Loss": 1.968793272972107, "Pretrain/Loss (Raw)": 2.1657543182373047, "Pretrain/Step": 10988, "Pretrain/Step Time": 8.44895862415433} +{"Pretrain/Learning Rate": 2.008033263086171e-05, "Pretrain/Loss": 1.9698872566223145, "Pretrain/Loss (Raw)": 2.0316877365112305, "Pretrain/Step": 10989, "Pretrain/Step Time": 8.449924314394593} +{"Pretrain/Learning Rate": 2.007617054439515e-05, "Pretrain/Loss": 1.9725898504257202, "Pretrain/Loss (Raw)": 2.1179957389831543, "Pretrain/Step": 10990, "Pretrain/Step Time": 8.447520921006799} +{"Pretrain/Learning Rate": 2.0072008599903752e-05, "Pretrain/Loss": 1.974716305732727, "Pretrain/Loss (Raw)": 2.093505620956421, "Pretrain/Step": 10991, "Pretrain/Step Time": 8.44953840970993} +{"Pretrain/Learning Rate": 2.0067846797507504e-05, "Pretrain/Loss": 1.9759259223937988, "Pretrain/Loss (Raw)": 2.1249783039093018, "Pretrain/Step": 10992, "Pretrain/Step Time": 8.447965255007148} +{"Pretrain/Learning Rate": 2.0063685137326417e-05, "Pretrain/Loss": 1.974834680557251, "Pretrain/Loss (Raw)": 1.9691933393478394, "Pretrain/Step": 10993, "Pretrain/Step Time": 8.452164713293314} +{"Pretrain/Learning Rate": 2.0059523619480486e-05, "Pretrain/Loss": 1.9751136302947998, "Pretrain/Loss (Raw)": 2.003117561340332, "Pretrain/Step": 10994, "Pretrain/Step Time": 8.450988369062543} +{"Pretrain/Learning Rate": 2.0055362244089712e-05, "Pretrain/Loss": 1.9768812656402588, "Pretrain/Loss (Raw)": 2.2455153465270996, "Pretrain/Step": 10995, "Pretrain/Step Time": 8.452594285830855} +{"Pretrain/Learning Rate": 2.0051201011274088e-05, "Pretrain/Loss": 1.975699543952942, "Pretrain/Loss (Raw)": 2.0461151599884033, "Pretrain/Step": 10996, "Pretrain/Step Time": 8.452559465542436} +{"Pretrain/Learning Rate": 2.0047039921153585e-05, "Pretrain/Loss": 1.9779465198516846, "Pretrain/Loss (Raw)": 1.9720910787582397, "Pretrain/Step": 10997, "Pretrain/Step Time": 8.452986024320126} +{"Pretrain/Learning Rate": 2.0042878973848197e-05, "Pretrain/Loss": 1.9791334867477417, "Pretrain/Loss (Raw)": 2.0740134716033936, "Pretrain/Step": 10998, "Pretrain/Step Time": 8.45171487890184} +{"Pretrain/Learning Rate": 2.00387181694779e-05, "Pretrain/Loss": 1.978529930114746, "Pretrain/Loss (Raw)": 1.9375959634780884, "Pretrain/Step": 10999, "Pretrain/Step Time": 8.451100770384073} +{"Pretrain/Learning Rate": 2.0034557508162667e-05, "Pretrain/Loss": 1.9802056550979614, "Pretrain/Loss (Raw)": 2.0370752811431885, "Pretrain/Step": 11000, "Pretrain/Step Time": 8.450503576546907} +{"Pretrain/Learning Rate": 2.003039699002247e-05, "Pretrain/Loss": 1.9796513319015503, "Pretrain/Loss (Raw)": 2.142944574356079, "Pretrain/Step": 11001, "Pretrain/Step Time": 8.46029957383871} +{"Pretrain/Learning Rate": 2.0026236615177268e-05, "Pretrain/Loss": 1.9804644584655762, "Pretrain/Loss (Raw)": 2.040097951889038, "Pretrain/Step": 11002, "Pretrain/Step Time": 8.462162014096975} +{"Pretrain/Learning Rate": 2.002207638374703e-05, "Pretrain/Loss": 1.9810479879379272, "Pretrain/Loss (Raw)": 2.06365704536438, "Pretrain/Step": 11003, "Pretrain/Step Time": 8.459483128041029} +{"Pretrain/Learning Rate": 2.001791629585171e-05, "Pretrain/Loss": 1.9815256595611572, "Pretrain/Loss (Raw)": 2.028679609298706, "Pretrain/Step": 11004, "Pretrain/Step Time": 8.457446666434407} +{"Pretrain/Learning Rate": 2.0013756351611258e-05, "Pretrain/Loss": 1.9823884963989258, "Pretrain/Loss (Raw)": 2.1520192623138428, "Pretrain/Step": 11005, "Pretrain/Step Time": 8.453858343884349} +{"Pretrain/Learning Rate": 2.0009596551145628e-05, "Pretrain/Loss": 1.984458327293396, "Pretrain/Loss (Raw)": 2.000546932220459, "Pretrain/Step": 11006, "Pretrain/Step Time": 8.455126509070396} +{"Pretrain/Learning Rate": 2.000543689457477e-05, "Pretrain/Loss": 1.9833437204360962, "Pretrain/Loss (Raw)": 2.085709571838379, "Pretrain/Step": 11007, "Pretrain/Step Time": 8.460625691339374} +{"Pretrain/Learning Rate": 2.0001277382018613e-05, "Pretrain/Loss": 1.9822916984558105, "Pretrain/Loss (Raw)": 1.9251171350479126, "Pretrain/Step": 11008, "Pretrain/Step Time": 8.463842574506998} +{"Pretrain/Learning Rate": 1.9997118013597096e-05, "Pretrain/Loss": 1.983246922492981, "Pretrain/Loss (Raw)": 2.174877405166626, "Pretrain/Step": 11009, "Pretrain/Step Time": 8.461964847519994} +{"Pretrain/Learning Rate": 1.9992958789430155e-05, "Pretrain/Loss": 1.9841692447662354, "Pretrain/Loss (Raw)": 2.1315677165985107, "Pretrain/Step": 11010, "Pretrain/Step Time": 8.46023721061647} +{"Pretrain/Learning Rate": 1.998879970963772e-05, "Pretrain/Loss": 1.9824190139770508, "Pretrain/Loss (Raw)": 1.873005986213684, "Pretrain/Step": 11011, "Pretrain/Step Time": 8.459577372297645} +{"Pretrain/Learning Rate": 1.9984640774339717e-05, "Pretrain/Loss": 1.9814372062683105, "Pretrain/Loss (Raw)": 1.8112952709197998, "Pretrain/Step": 11012, "Pretrain/Step Time": 8.463549066334963} +{"Pretrain/Learning Rate": 1.998048198365606e-05, "Pretrain/Loss": 1.982252836227417, "Pretrain/Loss (Raw)": 2.0456793308258057, "Pretrain/Step": 11013, "Pretrain/Step Time": 8.464327471330762} +{"Pretrain/Learning Rate": 1.997632333770666e-05, "Pretrain/Loss": 1.9803316593170166, "Pretrain/Loss (Raw)": 1.9657953977584839, "Pretrain/Step": 11014, "Pretrain/Step Time": 8.45804287493229} +{"Pretrain/Learning Rate": 1.9972164836611437e-05, "Pretrain/Loss": 1.9801782369613647, "Pretrain/Loss (Raw)": 2.093364953994751, "Pretrain/Step": 11015, "Pretrain/Step Time": 8.454505136236548} +{"Pretrain/Learning Rate": 1.9968006480490297e-05, "Pretrain/Loss": 1.9780083894729614, "Pretrain/Loss (Raw)": 1.7631627321243286, "Pretrain/Step": 11016, "Pretrain/Step Time": 8.45807516016066} +{"Pretrain/Learning Rate": 1.9963848269463147e-05, "Pretrain/Loss": 1.9772508144378662, "Pretrain/Loss (Raw)": 1.948775053024292, "Pretrain/Step": 11017, "Pretrain/Step Time": 8.462584527209401} +{"Pretrain/Learning Rate": 1.995969020364988e-05, "Pretrain/Loss": 1.977712631225586, "Pretrain/Loss (Raw)": 2.0701167583465576, "Pretrain/Step": 11018, "Pretrain/Step Time": 8.465144503861666} +{"Pretrain/Learning Rate": 1.995553228317039e-05, "Pretrain/Loss": 1.9794238805770874, "Pretrain/Loss (Raw)": 2.020235776901245, "Pretrain/Step": 11019, "Pretrain/Step Time": 8.463034005835652} +{"Pretrain/Learning Rate": 1.995137450814457e-05, "Pretrain/Loss": 1.9829075336456299, "Pretrain/Loss (Raw)": 2.333919048309326, "Pretrain/Step": 11020, "Pretrain/Step Time": 8.457158599048853} +{"Pretrain/Learning Rate": 1.994721687869231e-05, "Pretrain/Loss": 1.9815926551818848, "Pretrain/Loss (Raw)": 1.9916149377822876, "Pretrain/Step": 11021, "Pretrain/Step Time": 8.455131696537137} +{"Pretrain/Learning Rate": 1.9943059394933493e-05, "Pretrain/Loss": 1.978717565536499, "Pretrain/Loss (Raw)": 1.5673998594284058, "Pretrain/Step": 11022, "Pretrain/Step Time": 8.45697039924562} +{"Pretrain/Learning Rate": 1.993890205698799e-05, "Pretrain/Loss": 1.9797663688659668, "Pretrain/Loss (Raw)": 2.130993127822876, "Pretrain/Step": 11023, "Pretrain/Step Time": 8.45429477095604} +{"Pretrain/Learning Rate": 1.9934744864975674e-05, "Pretrain/Loss": 1.982135534286499, "Pretrain/Loss (Raw)": 2.067194700241089, "Pretrain/Step": 11024, "Pretrain/Step Time": 8.458622792735696} +{"Pretrain/Learning Rate": 1.993058781901642e-05, "Pretrain/Loss": 1.9885972738265991, "Pretrain/Loss (Raw)": 2.578740358352661, "Pretrain/Step": 11025, "Pretrain/Step Time": 8.46221623942256} +{"Pretrain/Learning Rate": 1.9926430919230093e-05, "Pretrain/Loss": 1.9909121990203857, "Pretrain/Loss (Raw)": 2.407454013824463, "Pretrain/Step": 11026, "Pretrain/Step Time": 8.464213892817497} +{"Pretrain/Learning Rate": 1.992227416573656e-05, "Pretrain/Loss": 1.9905979633331299, "Pretrain/Loss (Raw)": 1.8501317501068115, "Pretrain/Step": 11027, "Pretrain/Step Time": 8.459237717092037} +{"Pretrain/Learning Rate": 1.991811755865567e-05, "Pretrain/Loss": 1.9910773038864136, "Pretrain/Loss (Raw)": 2.0660650730133057, "Pretrain/Step": 11028, "Pretrain/Step Time": 8.461871679872274} +{"Pretrain/Learning Rate": 1.9913961098107272e-05, "Pretrain/Loss": 1.9885668754577637, "Pretrain/Loss (Raw)": 1.689502477645874, "Pretrain/Step": 11029, "Pretrain/Step Time": 8.462786855176091} +{"Pretrain/Learning Rate": 1.9909804784211222e-05, "Pretrain/Loss": 1.9888505935668945, "Pretrain/Loss (Raw)": 1.9731513261795044, "Pretrain/Step": 11030, "Pretrain/Step Time": 8.464526614174247} +{"Pretrain/Learning Rate": 1.9905648617087364e-05, "Pretrain/Loss": 1.9880298376083374, "Pretrain/Loss (Raw)": 1.918851613998413, "Pretrain/Step": 11031, "Pretrain/Step Time": 8.466509187594056} +{"Pretrain/Learning Rate": 1.9901492596855543e-05, "Pretrain/Loss": 1.9878700971603394, "Pretrain/Loss (Raw)": 1.8957431316375732, "Pretrain/Step": 11032, "Pretrain/Step Time": 8.466659819707274} +{"Pretrain/Learning Rate": 1.9897336723635583e-05, "Pretrain/Loss": 1.9887720346450806, "Pretrain/Loss (Raw)": 2.0497305393218994, "Pretrain/Step": 11033, "Pretrain/Step Time": 8.466902000829577} +{"Pretrain/Learning Rate": 1.989318099754732e-05, "Pretrain/Loss": 1.9917405843734741, "Pretrain/Loss (Raw)": 2.300550937652588, "Pretrain/Step": 11034, "Pretrain/Step Time": 8.470616463571787} +{"Pretrain/Learning Rate": 1.9889025418710582e-05, "Pretrain/Loss": 1.992329478263855, "Pretrain/Loss (Raw)": 2.113715410232544, "Pretrain/Step": 11035, "Pretrain/Step Time": 8.466490702703595} +{"Pretrain/Learning Rate": 1.9884869987245193e-05, "Pretrain/Loss": 1.9902527332305908, "Pretrain/Loss (Raw)": 1.9609025716781616, "Pretrain/Step": 11036, "Pretrain/Step Time": 8.469840876758099} +{"Pretrain/Learning Rate": 1.988071470327098e-05, "Pretrain/Loss": 1.9883309602737427, "Pretrain/Loss (Raw)": 1.5225682258605957, "Pretrain/Step": 11037, "Pretrain/Step Time": 8.466794671490788} +{"Pretrain/Learning Rate": 1.9876559566907744e-05, "Pretrain/Loss": 1.9881302118301392, "Pretrain/Loss (Raw)": 2.040088653564453, "Pretrain/Step": 11038, "Pretrain/Step Time": 8.464767141267657} +{"Pretrain/Learning Rate": 1.98724045782753e-05, "Pretrain/Loss": 1.9894349575042725, "Pretrain/Loss (Raw)": 2.0192465782165527, "Pretrain/Step": 11039, "Pretrain/Step Time": 8.464309552684426} +{"Pretrain/Learning Rate": 1.9868249737493455e-05, "Pretrain/Loss": 1.9899370670318604, "Pretrain/Loss (Raw)": 2.001718759536743, "Pretrain/Step": 11040, "Pretrain/Step Time": 8.465498907491565} +{"Pretrain/Learning Rate": 1.986409504468201e-05, "Pretrain/Loss": 1.9873955249786377, "Pretrain/Loss (Raw)": 1.9297816753387451, "Pretrain/Step": 11041, "Pretrain/Step Time": 8.467661537230015} +{"Pretrain/Learning Rate": 1.9859940499960776e-05, "Pretrain/Loss": 1.986860990524292, "Pretrain/Loss (Raw)": 1.9173005819320679, "Pretrain/Step": 11042, "Pretrain/Step Time": 8.472438199445605} +{"Pretrain/Learning Rate": 1.9855786103449525e-05, "Pretrain/Loss": 1.9882892370224, "Pretrain/Loss (Raw)": 2.121901750564575, "Pretrain/Step": 11043, "Pretrain/Step Time": 8.46123811043799} +{"Pretrain/Learning Rate": 1.9851631855268055e-05, "Pretrain/Loss": 1.988553524017334, "Pretrain/Loss (Raw)": 2.0774223804473877, "Pretrain/Step": 11044, "Pretrain/Step Time": 8.462225506082177} +{"Pretrain/Learning Rate": 1.9847477755536153e-05, "Pretrain/Loss": 1.9888176918029785, "Pretrain/Loss (Raw)": 1.9934077262878418, "Pretrain/Step": 11045, "Pretrain/Step Time": 8.462978303432465} +{"Pretrain/Learning Rate": 1.9843323804373596e-05, "Pretrain/Loss": 1.987194538116455, "Pretrain/Loss (Raw)": 1.7463597059249878, "Pretrain/Step": 11046, "Pretrain/Step Time": 8.464246936142445} +{"Pretrain/Learning Rate": 1.983917000190016e-05, "Pretrain/Loss": 1.9902186393737793, "Pretrain/Loss (Raw)": 2.0024023056030273, "Pretrain/Step": 11047, "Pretrain/Step Time": 8.463433858007193} +{"Pretrain/Learning Rate": 1.983501634823562e-05, "Pretrain/Loss": 1.9908976554870605, "Pretrain/Loss (Raw)": 1.9223084449768066, "Pretrain/Step": 11048, "Pretrain/Step Time": 8.462629966437817} +{"Pretrain/Learning Rate": 1.983086284349974e-05, "Pretrain/Loss": 1.9914464950561523, "Pretrain/Loss (Raw)": 2.1938884258270264, "Pretrain/Step": 11049, "Pretrain/Step Time": 8.464647818356752} +{"Pretrain/Learning Rate": 1.9826709487812294e-05, "Pretrain/Loss": 1.9936449527740479, "Pretrain/Loss (Raw)": 2.151726245880127, "Pretrain/Step": 11050, "Pretrain/Step Time": 8.46551020257175} +{"Pretrain/Learning Rate": 1.9822556281293027e-05, "Pretrain/Loss": 1.9947842359542847, "Pretrain/Loss (Raw)": 2.1141140460968018, "Pretrain/Step": 11051, "Pretrain/Step Time": 8.466999242082238} +{"Pretrain/Learning Rate": 1.98184032240617e-05, "Pretrain/Loss": 1.9974128007888794, "Pretrain/Loss (Raw)": 2.0367352962493896, "Pretrain/Step": 11052, "Pretrain/Step Time": 8.46241725794971} +{"Pretrain/Learning Rate": 1.981425031623806e-05, "Pretrain/Loss": 1.9990140199661255, "Pretrain/Loss (Raw)": 2.0872466564178467, "Pretrain/Step": 11053, "Pretrain/Step Time": 8.463310906663537} +{"Pretrain/Learning Rate": 1.981009755794186e-05, "Pretrain/Loss": 1.9990487098693848, "Pretrain/Loss (Raw)": 1.9719537496566772, "Pretrain/Step": 11054, "Pretrain/Step Time": 8.461975010111928} +{"Pretrain/Learning Rate": 1.9805944949292843e-05, "Pretrain/Loss": 1.9996275901794434, "Pretrain/Loss (Raw)": 2.010223627090454, "Pretrain/Step": 11055, "Pretrain/Step Time": 8.460560984909534} +{"Pretrain/Learning Rate": 1.9801792490410737e-05, "Pretrain/Loss": 1.9984760284423828, "Pretrain/Loss (Raw)": 1.8444771766662598, "Pretrain/Step": 11056, "Pretrain/Step Time": 8.460077250376344} +{"Pretrain/Learning Rate": 1.9797640181415278e-05, "Pretrain/Loss": 1.9971868991851807, "Pretrain/Loss (Raw)": 2.025601625442505, "Pretrain/Step": 11057, "Pretrain/Step Time": 8.461133323609829} +{"Pretrain/Learning Rate": 1.97934880224262e-05, "Pretrain/Loss": 2.000196933746338, "Pretrain/Loss (Raw)": 1.9804476499557495, "Pretrain/Step": 11058, "Pretrain/Step Time": 8.460805518552661} +{"Pretrain/Learning Rate": 1.978933601356322e-05, "Pretrain/Loss": 2.001782178878784, "Pretrain/Loss (Raw)": 2.172860622406006, "Pretrain/Step": 11059, "Pretrain/Step Time": 8.460745714604855} +{"Pretrain/Learning Rate": 1.9785184154946075e-05, "Pretrain/Loss": 2.000340461730957, "Pretrain/Loss (Raw)": 1.901835560798645, "Pretrain/Step": 11060, "Pretrain/Step Time": 8.45474997907877} +{"Pretrain/Learning Rate": 1.9781032446694456e-05, "Pretrain/Loss": 1.9968714714050293, "Pretrain/Loss (Raw)": 1.9333306550979614, "Pretrain/Step": 11061, "Pretrain/Step Time": 8.457199892029166} +{"Pretrain/Learning Rate": 1.977688088892809e-05, "Pretrain/Loss": 1.9988958835601807, "Pretrain/Loss (Raw)": 1.8009403944015503, "Pretrain/Step": 11062, "Pretrain/Step Time": 8.458274103701115} +{"Pretrain/Learning Rate": 1.9772729481766683e-05, "Pretrain/Loss": 1.999875545501709, "Pretrain/Loss (Raw)": 2.0026278495788574, "Pretrain/Step": 11063, "Pretrain/Step Time": 8.46308564953506} +{"Pretrain/Learning Rate": 1.9768578225329936e-05, "Pretrain/Loss": 1.999788522720337, "Pretrain/Loss (Raw)": 1.9966830015182495, "Pretrain/Step": 11064, "Pretrain/Step Time": 8.462706562131643} +{"Pretrain/Learning Rate": 1.9764427119737554e-05, "Pretrain/Loss": 2.0004758834838867, "Pretrain/Loss (Raw)": 1.6070502996444702, "Pretrain/Step": 11065, "Pretrain/Step Time": 8.463127978146076} +{"Pretrain/Learning Rate": 1.9760276165109214e-05, "Pretrain/Loss": 1.9994924068450928, "Pretrain/Loss (Raw)": 2.0251989364624023, "Pretrain/Step": 11066, "Pretrain/Step Time": 8.464833244681358} +{"Pretrain/Learning Rate": 1.9756125361564623e-05, "Pretrain/Loss": 1.9990828037261963, "Pretrain/Loss (Raw)": 2.0139858722686768, "Pretrain/Step": 11067, "Pretrain/Step Time": 8.462665243074298} +{"Pretrain/Learning Rate": 1.9751974709223457e-05, "Pretrain/Loss": 1.9938287734985352, "Pretrain/Loss (Raw)": 1.439465880393982, "Pretrain/Step": 11068, "Pretrain/Step Time": 8.460453508421779} +{"Pretrain/Learning Rate": 1.9747824208205408e-05, "Pretrain/Loss": 1.9956386089324951, "Pretrain/Loss (Raw)": 2.1616227626800537, "Pretrain/Step": 11069, "Pretrain/Step Time": 8.457404682412744} +{"Pretrain/Learning Rate": 1.9743673858630138e-05, "Pretrain/Loss": 1.9943466186523438, "Pretrain/Loss (Raw)": 1.744783878326416, "Pretrain/Step": 11070, "Pretrain/Step Time": 8.460984012112021} +{"Pretrain/Learning Rate": 1.9739523660617336e-05, "Pretrain/Loss": 1.9929579496383667, "Pretrain/Loss (Raw)": 1.6610099077224731, "Pretrain/Step": 11071, "Pretrain/Step Time": 8.463745409622788} +{"Pretrain/Learning Rate": 1.973537361428665e-05, "Pretrain/Loss": 1.9936413764953613, "Pretrain/Loss (Raw)": 2.200868606567383, "Pretrain/Step": 11072, "Pretrain/Step Time": 8.460411228239536} +{"Pretrain/Learning Rate": 1.973122371975776e-05, "Pretrain/Loss": 1.9924473762512207, "Pretrain/Loss (Raw)": 1.8958892822265625, "Pretrain/Step": 11073, "Pretrain/Step Time": 8.46834653057158} +{"Pretrain/Learning Rate": 1.972707397715032e-05, "Pretrain/Loss": 1.9932395219802856, "Pretrain/Loss (Raw)": 2.1316721439361572, "Pretrain/Step": 11074, "Pretrain/Step Time": 8.469405515119433} +{"Pretrain/Learning Rate": 1.972292438658398e-05, "Pretrain/Loss": 1.9925493001937866, "Pretrain/Loss (Raw)": 1.9081579446792603, "Pretrain/Step": 11075, "Pretrain/Step Time": 8.470600074157119} +{"Pretrain/Learning Rate": 1.9718774948178402e-05, "Pretrain/Loss": 1.9936132431030273, "Pretrain/Loss (Raw)": 1.999861478805542, "Pretrain/Step": 11076, "Pretrain/Step Time": 8.469270957633853} +{"Pretrain/Learning Rate": 1.9714625662053224e-05, "Pretrain/Loss": 1.9935753345489502, "Pretrain/Loss (Raw)": 1.9727959632873535, "Pretrain/Step": 11077, "Pretrain/Step Time": 8.46802813373506} +{"Pretrain/Learning Rate": 1.9710476528328088e-05, "Pretrain/Loss": 1.9937851428985596, "Pretrain/Loss (Raw)": 1.9518800973892212, "Pretrain/Step": 11078, "Pretrain/Step Time": 8.471947405487299} +{"Pretrain/Learning Rate": 1.9706327547122628e-05, "Pretrain/Loss": 1.9929378032684326, "Pretrain/Loss (Raw)": 1.9687473773956299, "Pretrain/Step": 11079, "Pretrain/Step Time": 8.472360806539655} +{"Pretrain/Learning Rate": 1.9702178718556486e-05, "Pretrain/Loss": 1.9922828674316406, "Pretrain/Loss (Raw)": 1.9869349002838135, "Pretrain/Step": 11080, "Pretrain/Step Time": 8.475359478965402} +{"Pretrain/Learning Rate": 1.9698030042749288e-05, "Pretrain/Loss": 1.990041732788086, "Pretrain/Loss (Raw)": 1.8872076272964478, "Pretrain/Step": 11081, "Pretrain/Step Time": 8.479405380785465} +{"Pretrain/Learning Rate": 1.9693881519820653e-05, "Pretrain/Loss": 1.9922196865081787, "Pretrain/Loss (Raw)": 2.044698476791382, "Pretrain/Step": 11082, "Pretrain/Step Time": 8.477423457428813} +{"Pretrain/Learning Rate": 1.96897331498902e-05, "Pretrain/Loss": 1.9893568754196167, "Pretrain/Loss (Raw)": 1.901623249053955, "Pretrain/Step": 11083, "Pretrain/Step Time": 8.478958198800683} +{"Pretrain/Learning Rate": 1.9685584933077552e-05, "Pretrain/Loss": 1.990403413772583, "Pretrain/Loss (Raw)": 2.069417715072632, "Pretrain/Step": 11084, "Pretrain/Step Time": 8.476562391966581} +{"Pretrain/Learning Rate": 1.968143686950232e-05, "Pretrain/Loss": 1.9905568361282349, "Pretrain/Loss (Raw)": 2.0418686866760254, "Pretrain/Step": 11085, "Pretrain/Step Time": 8.473425723612309} +{"Pretrain/Learning Rate": 1.9677288959284104e-05, "Pretrain/Loss": 1.9886398315429688, "Pretrain/Loss (Raw)": 1.6675208806991577, "Pretrain/Step": 11086, "Pretrain/Step Time": 8.472696328535676} +{"Pretrain/Learning Rate": 1.9673141202542507e-05, "Pretrain/Loss": 1.9872428178787231, "Pretrain/Loss (Raw)": 1.7759822607040405, "Pretrain/Step": 11087, "Pretrain/Step Time": 8.473764197900891} +{"Pretrain/Learning Rate": 1.9668993599397127e-05, "Pretrain/Loss": 1.9891254901885986, "Pretrain/Loss (Raw)": 2.1430141925811768, "Pretrain/Step": 11088, "Pretrain/Step Time": 8.477476676926017} +{"Pretrain/Learning Rate": 1.9664846149967557e-05, "Pretrain/Loss": 1.9899091720581055, "Pretrain/Loss (Raw)": 2.137234926223755, "Pretrain/Step": 11089, "Pretrain/Step Time": 8.47935688123107} +{"Pretrain/Learning Rate": 1.966069885437339e-05, "Pretrain/Loss": 1.9901663064956665, "Pretrain/Loss (Raw)": 1.7820395231246948, "Pretrain/Step": 11090, "Pretrain/Step Time": 8.47975143045187} +{"Pretrain/Learning Rate": 1.9656551712734213e-05, "Pretrain/Loss": 1.9888290166854858, "Pretrain/Loss (Raw)": 1.8767317533493042, "Pretrain/Step": 11091, "Pretrain/Step Time": 8.481146492064} +{"Pretrain/Learning Rate": 1.965240472516959e-05, "Pretrain/Loss": 1.9882802963256836, "Pretrain/Loss (Raw)": 1.7233728170394897, "Pretrain/Step": 11092, "Pretrain/Step Time": 8.486300081014633} +{"Pretrain/Learning Rate": 1.9648257891799115e-05, "Pretrain/Loss": 1.9901823997497559, "Pretrain/Loss (Raw)": 2.2721118927001953, "Pretrain/Step": 11093, "Pretrain/Step Time": 8.487652203068137} +{"Pretrain/Learning Rate": 1.964411121274235e-05, "Pretrain/Loss": 1.9896445274353027, "Pretrain/Loss (Raw)": 1.9470324516296387, "Pretrain/Step": 11094, "Pretrain/Step Time": 8.484340865164995} +{"Pretrain/Learning Rate": 1.963996468811886e-05, "Pretrain/Loss": 1.9909671545028687, "Pretrain/Loss (Raw)": 2.15343976020813, "Pretrain/Step": 11095, "Pretrain/Step Time": 8.48516976647079} +{"Pretrain/Learning Rate": 1.9635818318048212e-05, "Pretrain/Loss": 1.993239402770996, "Pretrain/Loss (Raw)": 2.1264309883117676, "Pretrain/Step": 11096, "Pretrain/Step Time": 8.4821731839329} +{"Pretrain/Learning Rate": 1.9631672102649958e-05, "Pretrain/Loss": 1.9951108694076538, "Pretrain/Loss (Raw)": 2.165727138519287, "Pretrain/Step": 11097, "Pretrain/Step Time": 8.485673973336816} +{"Pretrain/Learning Rate": 1.9627526042043655e-05, "Pretrain/Loss": 1.9953997135162354, "Pretrain/Loss (Raw)": 2.0324158668518066, "Pretrain/Step": 11098, "Pretrain/Step Time": 8.485112596303225} +{"Pretrain/Learning Rate": 1.9623380136348853e-05, "Pretrain/Loss": 1.9939048290252686, "Pretrain/Loss (Raw)": 1.8292555809020996, "Pretrain/Step": 11099, "Pretrain/Step Time": 8.485255982726812} +{"Pretrain/Learning Rate": 1.9619234385685092e-05, "Pretrain/Loss": 1.9944956302642822, "Pretrain/Loss (Raw)": 2.052285671234131, "Pretrain/Step": 11100, "Pretrain/Step Time": 8.490004520863295} +{"Pretrain/Learning Rate": 1.9615088790171922e-05, "Pretrain/Loss": 1.995779037475586, "Pretrain/Loss (Raw)": 2.1229310035705566, "Pretrain/Step": 11101, "Pretrain/Step Time": 8.48940945789218} +{"Pretrain/Learning Rate": 1.9610943349928863e-05, "Pretrain/Loss": 1.9991397857666016, "Pretrain/Loss (Raw)": 2.1240792274475098, "Pretrain/Step": 11102, "Pretrain/Step Time": 8.489607110619545} +{"Pretrain/Learning Rate": 1.9606798065075456e-05, "Pretrain/Loss": 2.0004146099090576, "Pretrain/Loss (Raw)": 1.985652208328247, "Pretrain/Step": 11103, "Pretrain/Step Time": 8.486682707443833} +{"Pretrain/Learning Rate": 1.9602652935731222e-05, "Pretrain/Loss": 2.0019466876983643, "Pretrain/Loss (Raw)": 2.065983295440674, "Pretrain/Step": 11104, "Pretrain/Step Time": 8.490266103297472} +{"Pretrain/Learning Rate": 1.9598507962015686e-05, "Pretrain/Loss": 2.0029406547546387, "Pretrain/Loss (Raw)": 2.1867568492889404, "Pretrain/Step": 11105, "Pretrain/Step Time": 8.48834759183228} +{"Pretrain/Learning Rate": 1.9594363144048367e-05, "Pretrain/Loss": 2.000739574432373, "Pretrain/Loss (Raw)": 1.8451052904129028, "Pretrain/Step": 11106, "Pretrain/Step Time": 8.491690799593925} +{"Pretrain/Learning Rate": 1.959021848194878e-05, "Pretrain/Loss": 2.000063896179199, "Pretrain/Loss (Raw)": 1.7978075742721558, "Pretrain/Step": 11107, "Pretrain/Step Time": 8.48578703776002} +{"Pretrain/Learning Rate": 1.9586073975836424e-05, "Pretrain/Loss": 1.9998664855957031, "Pretrain/Loss (Raw)": 2.017183780670166, "Pretrain/Step": 11108, "Pretrain/Step Time": 8.49528394639492} +{"Pretrain/Learning Rate": 1.9581929625830807e-05, "Pretrain/Loss": 1.9991261959075928, "Pretrain/Loss (Raw)": 1.9876976013183594, "Pretrain/Step": 11109, "Pretrain/Step Time": 8.493842925876379} +{"Pretrain/Learning Rate": 1.957778543205143e-05, "Pretrain/Loss": 1.998203158378601, "Pretrain/Loss (Raw)": 2.0555264949798584, "Pretrain/Step": 11110, "Pretrain/Step Time": 8.492288991808891} +{"Pretrain/Learning Rate": 1.9573641394617794e-05, "Pretrain/Loss": 1.9995183944702148, "Pretrain/Loss (Raw)": 2.110407829284668, "Pretrain/Step": 11111, "Pretrain/Step Time": 8.494648080319166} +{"Pretrain/Learning Rate": 1.9569497513649383e-05, "Pretrain/Loss": 1.9988795518875122, "Pretrain/Loss (Raw)": 1.879628300666809, "Pretrain/Step": 11112, "Pretrain/Step Time": 8.489719105884433} +{"Pretrain/Learning Rate": 1.956535378926568e-05, "Pretrain/Loss": 2.000821352005005, "Pretrain/Loss (Raw)": 2.030027389526367, "Pretrain/Step": 11113, "Pretrain/Step Time": 8.489222960546613} +{"Pretrain/Learning Rate": 1.9561210221586166e-05, "Pretrain/Loss": 2.0020179748535156, "Pretrain/Loss (Raw)": 2.0462710857391357, "Pretrain/Step": 11114, "Pretrain/Step Time": 8.489385006949306} +{"Pretrain/Learning Rate": 1.9557066810730325e-05, "Pretrain/Loss": 2.000952959060669, "Pretrain/Loss (Raw)": 1.9974428415298462, "Pretrain/Step": 11115, "Pretrain/Step Time": 8.493036551401019} +{"Pretrain/Learning Rate": 1.955292355681762e-05, "Pretrain/Loss": 2.0006697177886963, "Pretrain/Loss (Raw)": 2.129490613937378, "Pretrain/Step": 11116, "Pretrain/Step Time": 8.491432782262564} +{"Pretrain/Learning Rate": 1.9548780459967534e-05, "Pretrain/Loss": 2.0006918907165527, "Pretrain/Loss (Raw)": 2.034511089324951, "Pretrain/Step": 11117, "Pretrain/Step Time": 8.492586459964514} +{"Pretrain/Learning Rate": 1.9544637520299512e-05, "Pretrain/Loss": 1.997472882270813, "Pretrain/Loss (Raw)": 1.7059800624847412, "Pretrain/Step": 11118, "Pretrain/Step Time": 8.491610554978251} +{"Pretrain/Learning Rate": 1.9540494737933024e-05, "Pretrain/Loss": 1.9959335327148438, "Pretrain/Loss (Raw)": 1.8964709043502808, "Pretrain/Step": 11119, "Pretrain/Step Time": 8.487042794004083} +{"Pretrain/Learning Rate": 1.953635211298752e-05, "Pretrain/Loss": 1.9950013160705566, "Pretrain/Loss (Raw)": 2.005646228790283, "Pretrain/Step": 11120, "Pretrain/Step Time": 8.48650635778904} +{"Pretrain/Learning Rate": 1.953220964558245e-05, "Pretrain/Loss": 1.9941680431365967, "Pretrain/Loss (Raw)": 1.8625576496124268, "Pretrain/Step": 11121, "Pretrain/Step Time": 8.479911921545863} +{"Pretrain/Learning Rate": 1.952806733583727e-05, "Pretrain/Loss": 1.993903398513794, "Pretrain/Loss (Raw)": 1.9692152738571167, "Pretrain/Step": 11122, "Pretrain/Step Time": 8.481426857411861} +{"Pretrain/Learning Rate": 1.9523925183871405e-05, "Pretrain/Loss": 1.9917361736297607, "Pretrain/Loss (Raw)": 1.9681061506271362, "Pretrain/Step": 11123, "Pretrain/Step Time": 8.4883882869035} +{"Pretrain/Learning Rate": 1.9519783189804294e-05, "Pretrain/Loss": 1.9908510446548462, "Pretrain/Loss (Raw)": 1.9328426122665405, "Pretrain/Step": 11124, "Pretrain/Step Time": 8.48993037454784} +{"Pretrain/Learning Rate": 1.9515641353755374e-05, "Pretrain/Loss": 1.9909780025482178, "Pretrain/Loss (Raw)": 1.9883180856704712, "Pretrain/Step": 11125, "Pretrain/Step Time": 8.484635220840573} +{"Pretrain/Learning Rate": 1.9511499675844077e-05, "Pretrain/Loss": 1.990422248840332, "Pretrain/Loss (Raw)": 2.0028774738311768, "Pretrain/Step": 11126, "Pretrain/Step Time": 8.4865662753582} +{"Pretrain/Learning Rate": 1.950735815618981e-05, "Pretrain/Loss": 1.9902690649032593, "Pretrain/Loss (Raw)": 1.9179965257644653, "Pretrain/Step": 11127, "Pretrain/Step Time": 8.483912218362093} +{"Pretrain/Learning Rate": 1.9503216794911995e-05, "Pretrain/Loss": 1.9901771545410156, "Pretrain/Loss (Raw)": 2.0253217220306396, "Pretrain/Step": 11128, "Pretrain/Step Time": 8.48742019943893} +{"Pretrain/Learning Rate": 1.949907559213006e-05, "Pretrain/Loss": 1.9905515909194946, "Pretrain/Loss (Raw)": 2.1908743381500244, "Pretrain/Step": 11129, "Pretrain/Step Time": 8.480275068432093} +{"Pretrain/Learning Rate": 1.9494934547963393e-05, "Pretrain/Loss": 1.990206003189087, "Pretrain/Loss (Raw)": 1.995855689048767, "Pretrain/Step": 11130, "Pretrain/Step Time": 8.480355512350798} +{"Pretrain/Learning Rate": 1.9490793662531408e-05, "Pretrain/Loss": 1.9905807971954346, "Pretrain/Loss (Raw)": 2.111628293991089, "Pretrain/Step": 11131, "Pretrain/Step Time": 8.482358867302537} +{"Pretrain/Learning Rate": 1.9486652935953503e-05, "Pretrain/Loss": 1.9902015924453735, "Pretrain/Loss (Raw)": 1.9801411628723145, "Pretrain/Step": 11132, "Pretrain/Step Time": 8.481881951913238} +{"Pretrain/Learning Rate": 1.9482512368349073e-05, "Pretrain/Loss": 1.988603115081787, "Pretrain/Loss (Raw)": 1.9473986625671387, "Pretrain/Step": 11133, "Pretrain/Step Time": 8.485237710177898} +{"Pretrain/Learning Rate": 1.947837195983752e-05, "Pretrain/Loss": 1.9873311519622803, "Pretrain/Loss (Raw)": 1.8377586603164673, "Pretrain/Step": 11134, "Pretrain/Step Time": 8.481994811445475} +{"Pretrain/Learning Rate": 1.9474231710538208e-05, "Pretrain/Loss": 1.9859895706176758, "Pretrain/Loss (Raw)": 1.913973093032837, "Pretrain/Step": 11135, "Pretrain/Step Time": 8.47614086419344} +{"Pretrain/Learning Rate": 1.9470091620570534e-05, "Pretrain/Loss": 1.9862462282180786, "Pretrain/Loss (Raw)": 1.9579845666885376, "Pretrain/Step": 11136, "Pretrain/Step Time": 8.474879179149866} +{"Pretrain/Learning Rate": 1.946595169005386e-05, "Pretrain/Loss": 1.9852876663208008, "Pretrain/Loss (Raw)": 2.052187204360962, "Pretrain/Step": 11137, "Pretrain/Step Time": 8.477660223841667} +{"Pretrain/Learning Rate": 1.946181191910758e-05, "Pretrain/Loss": 1.9826937913894653, "Pretrain/Loss (Raw)": 1.799531102180481, "Pretrain/Step": 11138, "Pretrain/Step Time": 8.481266871094704} +{"Pretrain/Learning Rate": 1.9457672307851043e-05, "Pretrain/Loss": 1.9832334518432617, "Pretrain/Loss (Raw)": 1.942081093788147, "Pretrain/Step": 11139, "Pretrain/Step Time": 8.48342908732593} +{"Pretrain/Learning Rate": 1.9453532856403626e-05, "Pretrain/Loss": 1.9861857891082764, "Pretrain/Loss (Raw)": 2.1892011165618896, "Pretrain/Step": 11140, "Pretrain/Step Time": 8.482156971469522} +{"Pretrain/Learning Rate": 1.944939356488467e-05, "Pretrain/Loss": 1.98551344871521, "Pretrain/Loss (Raw)": 1.959613561630249, "Pretrain/Step": 11141, "Pretrain/Step Time": 8.47933897189796} +{"Pretrain/Learning Rate": 1.944525443341354e-05, "Pretrain/Loss": 1.9852126836776733, "Pretrain/Loss (Raw)": 1.9273079633712769, "Pretrain/Step": 11142, "Pretrain/Step Time": 8.47818816639483} +{"Pretrain/Learning Rate": 1.9441115462109582e-05, "Pretrain/Loss": 1.983902931213379, "Pretrain/Loss (Raw)": 1.9257198572158813, "Pretrain/Step": 11143, "Pretrain/Step Time": 8.489457298070192} +{"Pretrain/Learning Rate": 1.9436976651092144e-05, "Pretrain/Loss": 1.9845962524414062, "Pretrain/Loss (Raw)": 1.8519072532653809, "Pretrain/Step": 11144, "Pretrain/Step Time": 8.484118243679404} +{"Pretrain/Learning Rate": 1.9432838000480564e-05, "Pretrain/Loss": 1.98582124710083, "Pretrain/Loss (Raw)": 2.1055819988250732, "Pretrain/Step": 11145, "Pretrain/Step Time": 8.483587494120002} +{"Pretrain/Learning Rate": 1.9428699510394173e-05, "Pretrain/Loss": 1.9842407703399658, "Pretrain/Loss (Raw)": 1.8678007125854492, "Pretrain/Step": 11146, "Pretrain/Step Time": 8.481208097189665} +{"Pretrain/Learning Rate": 1.94245611809523e-05, "Pretrain/Loss": 1.985055685043335, "Pretrain/Loss (Raw)": 2.1245336532592773, "Pretrain/Step": 11147, "Pretrain/Step Time": 8.48001323826611} +{"Pretrain/Learning Rate": 1.9420423012274277e-05, "Pretrain/Loss": 1.9813716411590576, "Pretrain/Loss (Raw)": 1.862380862236023, "Pretrain/Step": 11148, "Pretrain/Step Time": 8.487928764894605} +{"Pretrain/Learning Rate": 1.9416285004479423e-05, "Pretrain/Loss": 1.9809808731079102, "Pretrain/Loss (Raw)": 1.9415971040725708, "Pretrain/Step": 11149, "Pretrain/Step Time": 8.485618434846401} +{"Pretrain/Learning Rate": 1.9412147157687064e-05, "Pretrain/Loss": 1.986781358718872, "Pretrain/Loss (Raw)": 2.30985426902771, "Pretrain/Step": 11150, "Pretrain/Step Time": 8.48722136951983} +{"Pretrain/Learning Rate": 1.9408009472016492e-05, "Pretrain/Loss": 1.9845322370529175, "Pretrain/Loss (Raw)": 1.8431065082550049, "Pretrain/Step": 11151, "Pretrain/Step Time": 8.486654497683048} +{"Pretrain/Learning Rate": 1.9403871947587027e-05, "Pretrain/Loss": 1.983568787574768, "Pretrain/Loss (Raw)": 1.9438817501068115, "Pretrain/Step": 11152, "Pretrain/Step Time": 8.48234025388956} +{"Pretrain/Learning Rate": 1.9399734584517972e-05, "Pretrain/Loss": 1.9818333387374878, "Pretrain/Loss (Raw)": 2.3566088676452637, "Pretrain/Step": 11153, "Pretrain/Step Time": 8.479985909536481} +{"Pretrain/Learning Rate": 1.9395597382928616e-05, "Pretrain/Loss": 1.9783155918121338, "Pretrain/Loss (Raw)": 1.9571770429611206, "Pretrain/Step": 11154, "Pretrain/Step Time": 8.480709517374635} +{"Pretrain/Learning Rate": 1.9391460342938266e-05, "Pretrain/Loss": 1.9818346500396729, "Pretrain/Loss (Raw)": 2.3005599975585938, "Pretrain/Step": 11155, "Pretrain/Step Time": 8.48009855300188} +{"Pretrain/Learning Rate": 1.93873234646662e-05, "Pretrain/Loss": 1.9812607765197754, "Pretrain/Loss (Raw)": 1.992600679397583, "Pretrain/Step": 11156, "Pretrain/Step Time": 8.47871177829802} +{"Pretrain/Learning Rate": 1.9383186748231703e-05, "Pretrain/Loss": 1.9836571216583252, "Pretrain/Loss (Raw)": 1.9962496757507324, "Pretrain/Step": 11157, "Pretrain/Step Time": 8.476964998990297} +{"Pretrain/Learning Rate": 1.937905019375406e-05, "Pretrain/Loss": 1.9840314388275146, "Pretrain/Loss (Raw)": 2.021066427230835, "Pretrain/Step": 11158, "Pretrain/Step Time": 8.478984059765935} +{"Pretrain/Learning Rate": 1.937491380135254e-05, "Pretrain/Loss": 1.9851062297821045, "Pretrain/Loss (Raw)": 2.0564303398132324, "Pretrain/Step": 11159, "Pretrain/Step Time": 8.480301178991795} +{"Pretrain/Learning Rate": 1.937077757114642e-05, "Pretrain/Loss": 1.9873816967010498, "Pretrain/Loss (Raw)": 2.186988353729248, "Pretrain/Step": 11160, "Pretrain/Step Time": 8.476588102057576} +{"Pretrain/Learning Rate": 1.9366641503254957e-05, "Pretrain/Loss": 1.9862661361694336, "Pretrain/Loss (Raw)": 1.9069385528564453, "Pretrain/Step": 11161, "Pretrain/Step Time": 8.484357841312885} +{"Pretrain/Learning Rate": 1.9362505597797412e-05, "Pretrain/Loss": 1.98462975025177, "Pretrain/Loss (Raw)": 2.091096878051758, "Pretrain/Step": 11162, "Pretrain/Step Time": 8.47609367966652} +{"Pretrain/Learning Rate": 1.9358369854893046e-05, "Pretrain/Loss": 1.9839963912963867, "Pretrain/Loss (Raw)": 2.032639980316162, "Pretrain/Step": 11163, "Pretrain/Step Time": 8.476833363994956} +{"Pretrain/Learning Rate": 1.9354234274661107e-05, "Pretrain/Loss": 1.984107494354248, "Pretrain/Loss (Raw)": 1.9751255512237549, "Pretrain/Step": 11164, "Pretrain/Step Time": 8.479431817308068} +{"Pretrain/Learning Rate": 1.935009885722085e-05, "Pretrain/Loss": 1.9886176586151123, "Pretrain/Loss (Raw)": 2.0998899936676025, "Pretrain/Step": 11165, "Pretrain/Step Time": 8.48019291460514} +{"Pretrain/Learning Rate": 1.9345963602691504e-05, "Pretrain/Loss": 1.9877252578735352, "Pretrain/Loss (Raw)": 1.9258450269699097, "Pretrain/Step": 11166, "Pretrain/Step Time": 8.480724969878793} +{"Pretrain/Learning Rate": 1.934182851119231e-05, "Pretrain/Loss": 1.9879615306854248, "Pretrain/Loss (Raw)": 2.0494978427886963, "Pretrain/Step": 11167, "Pretrain/Step Time": 8.477949326857924} +{"Pretrain/Learning Rate": 1.93376935828425e-05, "Pretrain/Loss": 1.9884895086288452, "Pretrain/Loss (Raw)": 2.069293737411499, "Pretrain/Step": 11168, "Pretrain/Step Time": 8.47769895195961} +{"Pretrain/Learning Rate": 1.9333558817761307e-05, "Pretrain/Loss": 1.9898560047149658, "Pretrain/Loss (Raw)": 2.1047098636627197, "Pretrain/Step": 11169, "Pretrain/Step Time": 8.476354228332639} +{"Pretrain/Learning Rate": 1.9329424216067958e-05, "Pretrain/Loss": 1.988553524017334, "Pretrain/Loss (Raw)": 1.7505614757537842, "Pretrain/Step": 11170, "Pretrain/Step Time": 8.47389267385006} +{"Pretrain/Learning Rate": 1.9325289777881655e-05, "Pretrain/Loss": 1.988520622253418, "Pretrain/Loss (Raw)": 2.1176865100860596, "Pretrain/Step": 11171, "Pretrain/Step Time": 8.480962384492159} +{"Pretrain/Learning Rate": 1.932115550332162e-05, "Pretrain/Loss": 1.987409234046936, "Pretrain/Loss (Raw)": 1.9351705312728882, "Pretrain/Step": 11172, "Pretrain/Step Time": 8.480931105092168} +{"Pretrain/Learning Rate": 1.9317021392507067e-05, "Pretrain/Loss": 1.9886136054992676, "Pretrain/Loss (Raw)": 2.1475656032562256, "Pretrain/Step": 11173, "Pretrain/Step Time": 8.48197976499796} +{"Pretrain/Learning Rate": 1.9312887445557193e-05, "Pretrain/Loss": 1.988776683807373, "Pretrain/Loss (Raw)": 1.7672337293624878, "Pretrain/Step": 11174, "Pretrain/Step Time": 8.4776067212224} +{"Pretrain/Learning Rate": 1.9308753662591203e-05, "Pretrain/Loss": 1.9888241291046143, "Pretrain/Loss (Raw)": 2.0084757804870605, "Pretrain/Step": 11175, "Pretrain/Step Time": 8.479261927306652} +{"Pretrain/Learning Rate": 1.9304620043728296e-05, "Pretrain/Loss": 1.9888967275619507, "Pretrain/Loss (Raw)": 1.931599736213684, "Pretrain/Step": 11176, "Pretrain/Step Time": 8.477746600285172} +{"Pretrain/Learning Rate": 1.9300486589087645e-05, "Pretrain/Loss": 1.988410472869873, "Pretrain/Loss (Raw)": 2.1316494941711426, "Pretrain/Step": 11177, "Pretrain/Step Time": 8.479348693042994} +{"Pretrain/Learning Rate": 1.9296353298788445e-05, "Pretrain/Loss": 1.9898103475570679, "Pretrain/Loss (Raw)": 2.330909252166748, "Pretrain/Step": 11178, "Pretrain/Step Time": 8.475915130227804} +{"Pretrain/Learning Rate": 1.929222017294988e-05, "Pretrain/Loss": 1.9917596578598022, "Pretrain/Loss (Raw)": 2.3636255264282227, "Pretrain/Step": 11179, "Pretrain/Step Time": 8.474723992869258} +{"Pretrain/Learning Rate": 1.9288087211691118e-05, "Pretrain/Loss": 1.9896975755691528, "Pretrain/Loss (Raw)": 1.7727888822555542, "Pretrain/Step": 11180, "Pretrain/Step Time": 8.478933611884713} +{"Pretrain/Learning Rate": 1.9283954415131343e-05, "Pretrain/Loss": 1.9888343811035156, "Pretrain/Loss (Raw)": 1.9767615795135498, "Pretrain/Step": 11181, "Pretrain/Step Time": 8.480580208823085} +{"Pretrain/Learning Rate": 1.9279821783389713e-05, "Pretrain/Loss": 1.9896832704544067, "Pretrain/Loss (Raw)": 2.0806095600128174, "Pretrain/Step": 11182, "Pretrain/Step Time": 8.479274675250053} +{"Pretrain/Learning Rate": 1.9275689316585383e-05, "Pretrain/Loss": 1.9880616664886475, "Pretrain/Loss (Raw)": 1.8026766777038574, "Pretrain/Step": 11183, "Pretrain/Step Time": 8.479735914617777} +{"Pretrain/Learning Rate": 1.9271557014837516e-05, "Pretrain/Loss": 1.9907195568084717, "Pretrain/Loss (Raw)": 2.1846816539764404, "Pretrain/Step": 11184, "Pretrain/Step Time": 8.479354172945023} +{"Pretrain/Learning Rate": 1.9267424878265268e-05, "Pretrain/Loss": 1.9903104305267334, "Pretrain/Loss (Raw)": 1.9732249975204468, "Pretrain/Step": 11185, "Pretrain/Step Time": 8.478390553966165} +{"Pretrain/Learning Rate": 1.9263292906987783e-05, "Pretrain/Loss": 1.9899685382843018, "Pretrain/Loss (Raw)": 1.9366737604141235, "Pretrain/Step": 11186, "Pretrain/Step Time": 8.478302950039506} +{"Pretrain/Learning Rate": 1.92591611011242e-05, "Pretrain/Loss": 1.989764928817749, "Pretrain/Loss (Raw)": 2.146810531616211, "Pretrain/Step": 11187, "Pretrain/Step Time": 8.478296818211675} +{"Pretrain/Learning Rate": 1.9255029460793662e-05, "Pretrain/Loss": 1.9925868511199951, "Pretrain/Loss (Raw)": 2.26304030418396, "Pretrain/Step": 11188, "Pretrain/Step Time": 8.478429524227977} +{"Pretrain/Learning Rate": 1.9250897986115297e-05, "Pretrain/Loss": 1.9927061796188354, "Pretrain/Loss (Raw)": 1.948606252670288, "Pretrain/Step": 11189, "Pretrain/Step Time": 8.477549558505416} +{"Pretrain/Learning Rate": 1.9246766677208232e-05, "Pretrain/Loss": 1.994638442993164, "Pretrain/Loss (Raw)": 2.048274040222168, "Pretrain/Step": 11190, "Pretrain/Step Time": 8.477647103369236} +{"Pretrain/Learning Rate": 1.9242635534191605e-05, "Pretrain/Loss": 1.9950100183486938, "Pretrain/Loss (Raw)": 2.050182580947876, "Pretrain/Step": 11191, "Pretrain/Step Time": 8.476807445287704} +{"Pretrain/Learning Rate": 1.9238504557184517e-05, "Pretrain/Loss": 1.9947643280029297, "Pretrain/Loss (Raw)": 1.9652472734451294, "Pretrain/Step": 11192, "Pretrain/Step Time": 8.477595446631312} +{"Pretrain/Learning Rate": 1.923437374630609e-05, "Pretrain/Loss": 1.9981658458709717, "Pretrain/Loss (Raw)": 2.0424249172210693, "Pretrain/Step": 11193, "Pretrain/Step Time": 8.474617436528206} +{"Pretrain/Learning Rate": 1.9230243101675428e-05, "Pretrain/Loss": 1.9973053932189941, "Pretrain/Loss (Raw)": 1.9150713682174683, "Pretrain/Step": 11194, "Pretrain/Step Time": 8.47536939010024} +{"Pretrain/Learning Rate": 1.922611262341164e-05, "Pretrain/Loss": 1.998098611831665, "Pretrain/Loss (Raw)": 2.1155240535736084, "Pretrain/Step": 11195, "Pretrain/Step Time": 8.473803360015154} +{"Pretrain/Learning Rate": 1.922198231163383e-05, "Pretrain/Loss": 2.0034377574920654, "Pretrain/Loss (Raw)": 2.1228718757629395, "Pretrain/Step": 11196, "Pretrain/Step Time": 8.4795261900872} +{"Pretrain/Learning Rate": 1.921785216646108e-05, "Pretrain/Loss": 2.001664400100708, "Pretrain/Loss (Raw)": 1.9346221685409546, "Pretrain/Step": 11197, "Pretrain/Step Time": 8.480495523661375} +{"Pretrain/Learning Rate": 1.921372218801249e-05, "Pretrain/Loss": 2.0001935958862305, "Pretrain/Loss (Raw)": 1.5565464496612549, "Pretrain/Step": 11198, "Pretrain/Step Time": 8.474980605766177} +{"Pretrain/Learning Rate": 1.920959237640714e-05, "Pretrain/Loss": 2.001718759536743, "Pretrain/Loss (Raw)": 1.85621976852417, "Pretrain/Step": 11199, "Pretrain/Step Time": 8.477399440482259} +{"Pretrain/Learning Rate": 1.9205462731764113e-05, "Pretrain/Loss": 2.000229835510254, "Pretrain/Loss (Raw)": 2.010291814804077, "Pretrain/Step": 11200, "Pretrain/Step Time": 8.477663541212678} +{"Pretrain/Learning Rate": 1.9201333254202487e-05, "Pretrain/Loss": 1.9993667602539062, "Pretrain/Loss (Raw)": 1.7853825092315674, "Pretrain/Step": 11201, "Pretrain/Step Time": 8.471394035965204} +{"Pretrain/Learning Rate": 1.9197203943841323e-05, "Pretrain/Loss": 1.9987516403198242, "Pretrain/Loss (Raw)": 2.052950620651245, "Pretrain/Step": 11202, "Pretrain/Step Time": 8.469949129968882} +{"Pretrain/Learning Rate": 1.9193074800799693e-05, "Pretrain/Loss": 1.998843789100647, "Pretrain/Loss (Raw)": 1.919962763786316, "Pretrain/Step": 11203, "Pretrain/Step Time": 8.469093168154359} +{"Pretrain/Learning Rate": 1.918894582519666e-05, "Pretrain/Loss": 1.9978086948394775, "Pretrain/Loss (Raw)": 1.8673583269119263, "Pretrain/Step": 11204, "Pretrain/Step Time": 8.468334950506687} +{"Pretrain/Learning Rate": 1.9184817017151275e-05, "Pretrain/Loss": 1.9975793361663818, "Pretrain/Loss (Raw)": 1.9434412717819214, "Pretrain/Step": 11205, "Pretrain/Step Time": 8.475100433453918} +{"Pretrain/Learning Rate": 1.918068837678259e-05, "Pretrain/Loss": 1.9985381364822388, "Pretrain/Loss (Raw)": 2.0746114253997803, "Pretrain/Step": 11206, "Pretrain/Step Time": 8.470094233751297} +{"Pretrain/Learning Rate": 1.9176559904209663e-05, "Pretrain/Loss": 2.000211238861084, "Pretrain/Loss (Raw)": 2.1828877925872803, "Pretrain/Step": 11207, "Pretrain/Step Time": 8.471966689452529} +{"Pretrain/Learning Rate": 1.9172431599551517e-05, "Pretrain/Loss": 1.9991166591644287, "Pretrain/Loss (Raw)": 1.8468608856201172, "Pretrain/Step": 11208, "Pretrain/Step Time": 8.470723785459995} +{"Pretrain/Learning Rate": 1.91683034629272e-05, "Pretrain/Loss": 1.9995384216308594, "Pretrain/Loss (Raw)": 1.9411605596542358, "Pretrain/Step": 11209, "Pretrain/Step Time": 8.467884618788958} +{"Pretrain/Learning Rate": 1.9164175494455737e-05, "Pretrain/Loss": 1.998153567314148, "Pretrain/Loss (Raw)": 1.8674609661102295, "Pretrain/Step": 11210, "Pretrain/Step Time": 8.467539029195905} +{"Pretrain/Learning Rate": 1.9160047694256177e-05, "Pretrain/Loss": 1.9985125064849854, "Pretrain/Loss (Raw)": 1.9475685358047485, "Pretrain/Step": 11211, "Pretrain/Step Time": 8.466654984280467} +{"Pretrain/Learning Rate": 1.915592006244751e-05, "Pretrain/Loss": 1.9984090328216553, "Pretrain/Loss (Raw)": 2.056156635284424, "Pretrain/Step": 11212, "Pretrain/Step Time": 8.466408271342516} +{"Pretrain/Learning Rate": 1.9151792599148772e-05, "Pretrain/Loss": 1.9981666803359985, "Pretrain/Loss (Raw)": 2.0108563899993896, "Pretrain/Step": 11213, "Pretrain/Step Time": 8.467370610684156} +{"Pretrain/Learning Rate": 1.9147665304478973e-05, "Pretrain/Loss": 2.0016307830810547, "Pretrain/Loss (Raw)": 2.1109261512756348, "Pretrain/Step": 11214, "Pretrain/Step Time": 8.467695059254766} +{"Pretrain/Learning Rate": 1.9143538178557115e-05, "Pretrain/Loss": 2.002617835998535, "Pretrain/Loss (Raw)": 1.9023387432098389, "Pretrain/Step": 11215, "Pretrain/Step Time": 8.468130188062787} +{"Pretrain/Learning Rate": 1.9139411221502208e-05, "Pretrain/Loss": 2.001607656478882, "Pretrain/Loss (Raw)": 2.013695478439331, "Pretrain/Step": 11216, "Pretrain/Step Time": 8.465186988934875} +{"Pretrain/Learning Rate": 1.9135284433433243e-05, "Pretrain/Loss": 2.0011208057403564, "Pretrain/Loss (Raw)": 2.0749051570892334, "Pretrain/Step": 11217, "Pretrain/Step Time": 8.463204335421324} +{"Pretrain/Learning Rate": 1.913115781446922e-05, "Pretrain/Loss": 2.004708766937256, "Pretrain/Loss (Raw)": 2.241300582885742, "Pretrain/Step": 11218, "Pretrain/Step Time": 8.46077074110508} +{"Pretrain/Learning Rate": 1.9127031364729124e-05, "Pretrain/Loss": 2.006030559539795, "Pretrain/Loss (Raw)": 2.045933723449707, "Pretrain/Step": 11219, "Pretrain/Step Time": 8.455881187692285} +{"Pretrain/Learning Rate": 1.912290508433194e-05, "Pretrain/Loss": 2.0117812156677246, "Pretrain/Loss (Raw)": 2.459465980529785, "Pretrain/Step": 11220, "Pretrain/Step Time": 8.450482310727239} +{"Pretrain/Learning Rate": 1.911877897339664e-05, "Pretrain/Loss": 2.0093836784362793, "Pretrain/Loss (Raw)": 1.9652113914489746, "Pretrain/Step": 11221, "Pretrain/Step Time": 8.453995183110237} +{"Pretrain/Learning Rate": 1.9114653032042206e-05, "Pretrain/Loss": 2.008972644805908, "Pretrain/Loss (Raw)": 1.8944214582443237, "Pretrain/Step": 11222, "Pretrain/Step Time": 8.455115642398596} +{"Pretrain/Learning Rate": 1.91105272603876e-05, "Pretrain/Loss": 2.007012128829956, "Pretrain/Loss (Raw)": 1.9024890661239624, "Pretrain/Step": 11223, "Pretrain/Step Time": 8.454524144530296} +{"Pretrain/Learning Rate": 1.9106401658551796e-05, "Pretrain/Loss": 2.0085058212280273, "Pretrain/Loss (Raw)": 2.317636251449585, "Pretrain/Step": 11224, "Pretrain/Step Time": 8.45524818263948} +{"Pretrain/Learning Rate": 1.9102276226653737e-05, "Pretrain/Loss": 2.006538152694702, "Pretrain/Loss (Raw)": 1.9138586521148682, "Pretrain/Step": 11225, "Pretrain/Step Time": 8.459582846611738} +{"Pretrain/Learning Rate": 1.909815096481239e-05, "Pretrain/Loss": 2.0068769454956055, "Pretrain/Loss (Raw)": 2.0757646560668945, "Pretrain/Step": 11226, "Pretrain/Step Time": 8.458034692332149} +{"Pretrain/Learning Rate": 1.9094025873146694e-05, "Pretrain/Loss": 2.0079972743988037, "Pretrain/Loss (Raw)": 1.9726793766021729, "Pretrain/Step": 11227, "Pretrain/Step Time": 8.461559779942036} +{"Pretrain/Learning Rate": 1.9089900951775603e-05, "Pretrain/Loss": 2.006833076477051, "Pretrain/Loss (Raw)": 1.90328049659729, "Pretrain/Step": 11228, "Pretrain/Step Time": 8.454226644709706} +{"Pretrain/Learning Rate": 1.9085776200818055e-05, "Pretrain/Loss": 2.0065836906433105, "Pretrain/Loss (Raw)": 2.091012954711914, "Pretrain/Step": 11229, "Pretrain/Step Time": 8.45518341474235} +{"Pretrain/Learning Rate": 1.9081651620392975e-05, "Pretrain/Loss": 2.00620174407959, "Pretrain/Loss (Raw)": 2.0751900672912598, "Pretrain/Step": 11230, "Pretrain/Step Time": 8.452406577765942} +{"Pretrain/Learning Rate": 1.90775272106193e-05, "Pretrain/Loss": 2.004620313644409, "Pretrain/Loss (Raw)": 1.7832142114639282, "Pretrain/Step": 11231, "Pretrain/Step Time": 8.453503580763936} +{"Pretrain/Learning Rate": 1.9073402971615957e-05, "Pretrain/Loss": 2.001586437225342, "Pretrain/Loss (Raw)": 1.6776515245437622, "Pretrain/Step": 11232, "Pretrain/Step Time": 8.450882581993937} +{"Pretrain/Learning Rate": 1.9069278903501853e-05, "Pretrain/Loss": 1.9998729228973389, "Pretrain/Loss (Raw)": 1.9674205780029297, "Pretrain/Step": 11233, "Pretrain/Step Time": 8.45148815959692} +{"Pretrain/Learning Rate": 1.906515500639592e-05, "Pretrain/Loss": 2.001523971557617, "Pretrain/Loss (Raw)": 2.0564472675323486, "Pretrain/Step": 11234, "Pretrain/Step Time": 8.446784736588597} +{"Pretrain/Learning Rate": 1.9061031280417055e-05, "Pretrain/Loss": 2.0015273094177246, "Pretrain/Loss (Raw)": 1.7982151508331299, "Pretrain/Step": 11235, "Pretrain/Step Time": 8.450096651911736} +{"Pretrain/Learning Rate": 1.9056907725684164e-05, "Pretrain/Loss": 2.0014209747314453, "Pretrain/Loss (Raw)": 2.0035781860351562, "Pretrain/Step": 11236, "Pretrain/Step Time": 8.440392322838306} +{"Pretrain/Learning Rate": 1.905278434231615e-05, "Pretrain/Loss": 2.003657102584839, "Pretrain/Loss (Raw)": 2.2739338874816895, "Pretrain/Step": 11237, "Pretrain/Step Time": 8.445879807695746} +{"Pretrain/Learning Rate": 1.9048661130431906e-05, "Pretrain/Loss": 2.0032382011413574, "Pretrain/Loss (Raw)": 2.0019004344940186, "Pretrain/Step": 11238, "Pretrain/Step Time": 8.447169175371528} +{"Pretrain/Learning Rate": 1.9044538090150324e-05, "Pretrain/Loss": 2.002863645553589, "Pretrain/Loss (Raw)": 2.0624594688415527, "Pretrain/Step": 11239, "Pretrain/Step Time": 8.444123152643442} +{"Pretrain/Learning Rate": 1.9040415221590293e-05, "Pretrain/Loss": 2.0043575763702393, "Pretrain/Loss (Raw)": 2.070859670639038, "Pretrain/Step": 11240, "Pretrain/Step Time": 8.448657870292664} +{"Pretrain/Learning Rate": 1.9036292524870682e-05, "Pretrain/Loss": 2.004793882369995, "Pretrain/Loss (Raw)": 2.085886240005493, "Pretrain/Step": 11241, "Pretrain/Step Time": 8.456421671435237} +{"Pretrain/Learning Rate": 1.9032170000110374e-05, "Pretrain/Loss": 2.003481864929199, "Pretrain/Loss (Raw)": 1.878319263458252, "Pretrain/Step": 11242, "Pretrain/Step Time": 8.454379346221685} +{"Pretrain/Learning Rate": 1.902804764742823e-05, "Pretrain/Loss": 2.0049490928649902, "Pretrain/Loss (Raw)": 2.1852574348449707, "Pretrain/Step": 11243, "Pretrain/Step Time": 8.451848646625876} +{"Pretrain/Learning Rate": 1.9023925466943132e-05, "Pretrain/Loss": 2.004887580871582, "Pretrain/Loss (Raw)": 2.121609926223755, "Pretrain/Step": 11244, "Pretrain/Step Time": 8.453487580642104} +{"Pretrain/Learning Rate": 1.901980345877393e-05, "Pretrain/Loss": 2.0045905113220215, "Pretrain/Loss (Raw)": 1.9964793920516968, "Pretrain/Step": 11245, "Pretrain/Step Time": 8.459684768691659} +{"Pretrain/Learning Rate": 1.9015681623039475e-05, "Pretrain/Loss": 2.006944417953491, "Pretrain/Loss (Raw)": 2.0073046684265137, "Pretrain/Step": 11246, "Pretrain/Step Time": 8.460877664387226} +{"Pretrain/Learning Rate": 1.901155995985862e-05, "Pretrain/Loss": 2.0068812370300293, "Pretrain/Loss (Raw)": 1.8883627653121948, "Pretrain/Step": 11247, "Pretrain/Step Time": 8.460735563188791} +{"Pretrain/Learning Rate": 1.9007438469350217e-05, "Pretrain/Loss": 2.00795316696167, "Pretrain/Loss (Raw)": 2.14282488822937, "Pretrain/Step": 11248, "Pretrain/Step Time": 8.459468258544803} +{"Pretrain/Learning Rate": 1.9003317151633095e-05, "Pretrain/Loss": 2.009870767593384, "Pretrain/Loss (Raw)": 2.1080312728881836, "Pretrain/Step": 11249, "Pretrain/Step Time": 8.461932333186269} +{"Pretrain/Learning Rate": 1.8999196006826105e-05, "Pretrain/Loss": 2.010885715484619, "Pretrain/Loss (Raw)": 2.0991201400756836, "Pretrain/Step": 11250, "Pretrain/Step Time": 8.462590647861362} +{"Pretrain/Learning Rate": 1.8995075035048064e-05, "Pretrain/Loss": 2.0124082565307617, "Pretrain/Loss (Raw)": 2.1630125045776367, "Pretrain/Step": 11251, "Pretrain/Step Time": 8.45330629311502} +{"Pretrain/Learning Rate": 1.8990954236417798e-05, "Pretrain/Loss": 2.0143237113952637, "Pretrain/Loss (Raw)": 2.1780200004577637, "Pretrain/Step": 11252, "Pretrain/Step Time": 8.45177530311048} +{"Pretrain/Learning Rate": 1.898683361105413e-05, "Pretrain/Loss": 2.0162405967712402, "Pretrain/Loss (Raw)": 2.2336807250976562, "Pretrain/Step": 11253, "Pretrain/Step Time": 8.454609729349613} +{"Pretrain/Learning Rate": 1.8982713159075877e-05, "Pretrain/Loss": 2.0173749923706055, "Pretrain/Loss (Raw)": 2.148092031478882, "Pretrain/Step": 11254, "Pretrain/Step Time": 8.451331241056323} +{"Pretrain/Learning Rate": 1.8978592880601852e-05, "Pretrain/Loss": 2.016916036605835, "Pretrain/Loss (Raw)": 1.859236717224121, "Pretrain/Step": 11255, "Pretrain/Step Time": 8.45735402032733} +{"Pretrain/Learning Rate": 1.8974472775750855e-05, "Pretrain/Loss": 2.0185155868530273, "Pretrain/Loss (Raw)": 2.2300426959991455, "Pretrain/Step": 11256, "Pretrain/Step Time": 8.454336732625961} +{"Pretrain/Learning Rate": 1.8970352844641688e-05, "Pretrain/Loss": 2.01975154876709, "Pretrain/Loss (Raw)": 2.349100112915039, "Pretrain/Step": 11257, "Pretrain/Step Time": 8.453345270827413} +{"Pretrain/Learning Rate": 1.896623308739314e-05, "Pretrain/Loss": 2.0212349891662598, "Pretrain/Loss (Raw)": 2.1857261657714844, "Pretrain/Step": 11258, "Pretrain/Step Time": 8.454401647672057} +{"Pretrain/Learning Rate": 1.8962113504124013e-05, "Pretrain/Loss": 2.0194485187530518, "Pretrain/Loss (Raw)": 1.8829725980758667, "Pretrain/Step": 11259, "Pretrain/Step Time": 8.452570168301463} +{"Pretrain/Learning Rate": 1.895799409495309e-05, "Pretrain/Loss": 2.019589900970459, "Pretrain/Loss (Raw)": 1.998217225074768, "Pretrain/Step": 11260, "Pretrain/Step Time": 8.453052535653114} +{"Pretrain/Learning Rate": 1.8953874859999142e-05, "Pretrain/Loss": 2.017263650894165, "Pretrain/Loss (Raw)": 1.6496340036392212, "Pretrain/Step": 11261, "Pretrain/Step Time": 8.449574150145054} +{"Pretrain/Learning Rate": 1.894975579938095e-05, "Pretrain/Loss": 2.0178914070129395, "Pretrain/Loss (Raw)": 1.9181467294692993, "Pretrain/Step": 11262, "Pretrain/Step Time": 8.453266179189086} +{"Pretrain/Learning Rate": 1.8945636913217285e-05, "Pretrain/Loss": 2.0174789428710938, "Pretrain/Loss (Raw)": 1.861159086227417, "Pretrain/Step": 11263, "Pretrain/Step Time": 8.45343372784555} +{"Pretrain/Learning Rate": 1.8941518201626914e-05, "Pretrain/Loss": 2.016216278076172, "Pretrain/Loss (Raw)": 1.7963368892669678, "Pretrain/Step": 11264, "Pretrain/Step Time": 8.452150164172053} +{"Pretrain/Learning Rate": 1.8937399664728594e-05, "Pretrain/Loss": 2.0162434577941895, "Pretrain/Loss (Raw)": 2.0557007789611816, "Pretrain/Step": 11265, "Pretrain/Step Time": 8.451510068029165} +{"Pretrain/Learning Rate": 1.8933281302641083e-05, "Pretrain/Loss": 2.017672061920166, "Pretrain/Loss (Raw)": 1.9824055433273315, "Pretrain/Step": 11266, "Pretrain/Step Time": 8.447292156517506} +{"Pretrain/Learning Rate": 1.8929163115483124e-05, "Pretrain/Loss": 2.0185885429382324, "Pretrain/Loss (Raw)": 2.0593912601470947, "Pretrain/Step": 11267, "Pretrain/Step Time": 8.446559365838766} +{"Pretrain/Learning Rate": 1.892504510337347e-05, "Pretrain/Loss": 2.0173444747924805, "Pretrain/Loss (Raw)": 2.0299437046051025, "Pretrain/Step": 11268, "Pretrain/Step Time": 8.443852912634611} +{"Pretrain/Learning Rate": 1.8920927266430853e-05, "Pretrain/Loss": 2.017103433609009, "Pretrain/Loss (Raw)": 1.9287519454956055, "Pretrain/Step": 11269, "Pretrain/Step Time": 8.445867475122213} +{"Pretrain/Learning Rate": 1.8916809604774023e-05, "Pretrain/Loss": 2.0230162143707275, "Pretrain/Loss (Raw)": 2.6841516494750977, "Pretrain/Step": 11270, "Pretrain/Step Time": 8.446291269734502} +{"Pretrain/Learning Rate": 1.8912692118521692e-05, "Pretrain/Loss": 2.0234756469726562, "Pretrain/Loss (Raw)": 1.9845249652862549, "Pretrain/Step": 11271, "Pretrain/Step Time": 8.438877301290631} +{"Pretrain/Learning Rate": 1.890857480779259e-05, "Pretrain/Loss": 2.02339768409729, "Pretrain/Loss (Raw)": 1.8419109582901, "Pretrain/Step": 11272, "Pretrain/Step Time": 8.438781524077058} +{"Pretrain/Learning Rate": 1.8904457672705443e-05, "Pretrain/Loss": 2.024468183517456, "Pretrain/Loss (Raw)": 2.242621421813965, "Pretrain/Step": 11273, "Pretrain/Step Time": 8.439036210998893} +{"Pretrain/Learning Rate": 1.890034071337896e-05, "Pretrain/Loss": 2.0247299671173096, "Pretrain/Loss (Raw)": 1.901313304901123, "Pretrain/Step": 11274, "Pretrain/Step Time": 8.440509278327227} +{"Pretrain/Learning Rate": 1.8896223929931855e-05, "Pretrain/Loss": 2.0253000259399414, "Pretrain/Loss (Raw)": 2.1974895000457764, "Pretrain/Step": 11275, "Pretrain/Step Time": 8.440961996093392} +{"Pretrain/Learning Rate": 1.889210732248283e-05, "Pretrain/Loss": 2.0262644290924072, "Pretrain/Loss (Raw)": 1.9858365058898926, "Pretrain/Step": 11276, "Pretrain/Step Time": 8.439266726374626} +{"Pretrain/Learning Rate": 1.8887990891150586e-05, "Pretrain/Loss": 2.027303695678711, "Pretrain/Loss (Raw)": 2.074622392654419, "Pretrain/Step": 11277, "Pretrain/Step Time": 8.438461793586612} +{"Pretrain/Learning Rate": 1.8883874636053814e-05, "Pretrain/Loss": 2.024892807006836, "Pretrain/Loss (Raw)": 2.001283884048462, "Pretrain/Step": 11278, "Pretrain/Step Time": 8.436639769002795} +{"Pretrain/Learning Rate": 1.8879758557311206e-05, "Pretrain/Loss": 2.025418281555176, "Pretrain/Loss (Raw)": 1.910334587097168, "Pretrain/Step": 11279, "Pretrain/Step Time": 8.438544370234013} +{"Pretrain/Learning Rate": 1.887564265504144e-05, "Pretrain/Loss": 2.0248634815216064, "Pretrain/Loss (Raw)": 1.8728711605072021, "Pretrain/Step": 11280, "Pretrain/Step Time": 8.43799482472241} +{"Pretrain/Learning Rate": 1.8871526929363213e-05, "Pretrain/Loss": 2.020031452178955, "Pretrain/Loss (Raw)": 1.7381188869476318, "Pretrain/Step": 11281, "Pretrain/Step Time": 8.43708703480661} +{"Pretrain/Learning Rate": 1.8867411380395177e-05, "Pretrain/Loss": 2.019918918609619, "Pretrain/Loss (Raw)": 1.9427484273910522, "Pretrain/Step": 11282, "Pretrain/Step Time": 8.434520315378904} +{"Pretrain/Learning Rate": 1.8863296008256012e-05, "Pretrain/Loss": 2.018050193786621, "Pretrain/Loss (Raw)": 2.0614049434661865, "Pretrain/Step": 11283, "Pretrain/Step Time": 8.434787528589368} +{"Pretrain/Learning Rate": 1.885918081306438e-05, "Pretrain/Loss": 2.0183522701263428, "Pretrain/Loss (Raw)": 2.0312302112579346, "Pretrain/Step": 11284, "Pretrain/Step Time": 8.434712912887335} +{"Pretrain/Learning Rate": 1.8855065794938943e-05, "Pretrain/Loss": 2.0180246829986572, "Pretrain/Loss (Raw)": 1.95433509349823, "Pretrain/Step": 11285, "Pretrain/Step Time": 8.437063107267022} +{"Pretrain/Learning Rate": 1.8850950953998354e-05, "Pretrain/Loss": 2.019524335861206, "Pretrain/Loss (Raw)": 2.213029146194458, "Pretrain/Step": 11286, "Pretrain/Step Time": 8.430034222081304} +{"Pretrain/Learning Rate": 1.8846836290361257e-05, "Pretrain/Loss": 2.0183308124542236, "Pretrain/Loss (Raw)": 1.9036390781402588, "Pretrain/Step": 11287, "Pretrain/Step Time": 8.42765973508358} +{"Pretrain/Learning Rate": 1.8842721804146296e-05, "Pretrain/Loss": 2.0175421237945557, "Pretrain/Loss (Raw)": 2.0860517024993896, "Pretrain/Step": 11288, "Pretrain/Step Time": 8.433256758376956} +{"Pretrain/Learning Rate": 1.883860749547211e-05, "Pretrain/Loss": 2.0165998935699463, "Pretrain/Loss (Raw)": 1.7863212823867798, "Pretrain/Step": 11289, "Pretrain/Step Time": 8.425808185711503} +{"Pretrain/Learning Rate": 1.8834493364457333e-05, "Pretrain/Loss": 2.018394947052002, "Pretrain/Loss (Raw)": 2.3208680152893066, "Pretrain/Step": 11290, "Pretrain/Step Time": 8.434655578806996} +{"Pretrain/Learning Rate": 1.8830379411220602e-05, "Pretrain/Loss": 2.018019437789917, "Pretrain/Loss (Raw)": 1.984575629234314, "Pretrain/Step": 11291, "Pretrain/Step Time": 8.434305822476745} +{"Pretrain/Learning Rate": 1.8826265635880526e-05, "Pretrain/Loss": 2.0176942348480225, "Pretrain/Loss (Raw)": 1.9334951639175415, "Pretrain/Step": 11292, "Pretrain/Step Time": 8.428545394912362} +{"Pretrain/Learning Rate": 1.8822152038555723e-05, "Pretrain/Loss": 2.016394853591919, "Pretrain/Loss (Raw)": 1.9335778951644897, "Pretrain/Step": 11293, "Pretrain/Step Time": 8.42769299633801} +{"Pretrain/Learning Rate": 1.8818038619364815e-05, "Pretrain/Loss": 2.016221046447754, "Pretrain/Loss (Raw)": 1.9035851955413818, "Pretrain/Step": 11294, "Pretrain/Step Time": 8.426732659339905} +{"Pretrain/Learning Rate": 1.8813925378426417e-05, "Pretrain/Loss": 2.01591157913208, "Pretrain/Loss (Raw)": 2.0098843574523926, "Pretrain/Step": 11295, "Pretrain/Step Time": 8.42719823308289} +{"Pretrain/Learning Rate": 1.8809812315859108e-05, "Pretrain/Loss": 2.0147860050201416, "Pretrain/Loss (Raw)": 1.9252197742462158, "Pretrain/Step": 11296, "Pretrain/Step Time": 8.428937565535307} +{"Pretrain/Learning Rate": 1.8805699431781495e-05, "Pretrain/Loss": 2.0142815113067627, "Pretrain/Loss (Raw)": 2.040142774581909, "Pretrain/Step": 11297, "Pretrain/Step Time": 8.429963177070022} +{"Pretrain/Learning Rate": 1.880158672631218e-05, "Pretrain/Loss": 2.016620397567749, "Pretrain/Loss (Raw)": 2.0499320030212402, "Pretrain/Step": 11298, "Pretrain/Step Time": 8.428554750978947} +{"Pretrain/Learning Rate": 1.8797474199569737e-05, "Pretrain/Loss": 2.0136795043945312, "Pretrain/Loss (Raw)": 1.7412673234939575, "Pretrain/Step": 11299, "Pretrain/Step Time": 8.427223460748792} +{"Pretrain/Learning Rate": 1.8793361851672752e-05, "Pretrain/Loss": 2.014862298965454, "Pretrain/Loss (Raw)": 2.086549758911133, "Pretrain/Step": 11300, "Pretrain/Step Time": 8.42361286841333} +{"Pretrain/Learning Rate": 1.87892496827398e-05, "Pretrain/Loss": 2.0128841400146484, "Pretrain/Loss (Raw)": 1.8943941593170166, "Pretrain/Step": 11301, "Pretrain/Step Time": 8.428717538714409} +{"Pretrain/Learning Rate": 1.878513769288946e-05, "Pretrain/Loss": 2.0159614086151123, "Pretrain/Loss (Raw)": 2.161118745803833, "Pretrain/Step": 11302, "Pretrain/Step Time": 8.425362272188067} +{"Pretrain/Learning Rate": 1.8781025882240292e-05, "Pretrain/Loss": 2.017514944076538, "Pretrain/Loss (Raw)": 2.207306146621704, "Pretrain/Step": 11303, "Pretrain/Step Time": 8.422146316617727} +{"Pretrain/Learning Rate": 1.8776914250910862e-05, "Pretrain/Loss": 2.0167574882507324, "Pretrain/Loss (Raw)": 1.8346456289291382, "Pretrain/Step": 11304, "Pretrain/Step Time": 8.424591964110732} +{"Pretrain/Learning Rate": 1.877280279901972e-05, "Pretrain/Loss": 2.016561508178711, "Pretrain/Loss (Raw)": 2.1065447330474854, "Pretrain/Step": 11305, "Pretrain/Step Time": 8.42725184559822} +{"Pretrain/Learning Rate": 1.8768691526685416e-05, "Pretrain/Loss": 2.012956142425537, "Pretrain/Loss (Raw)": 1.8694629669189453, "Pretrain/Step": 11306, "Pretrain/Step Time": 8.430235963314772} +{"Pretrain/Learning Rate": 1.87645804340265e-05, "Pretrain/Loss": 2.0086493492126465, "Pretrain/Loss (Raw)": 1.8123406171798706, "Pretrain/Step": 11307, "Pretrain/Step Time": 8.428683428093791} +{"Pretrain/Learning Rate": 1.8760469521161513e-05, "Pretrain/Loss": 2.0101165771484375, "Pretrain/Loss (Raw)": 1.9606008529663086, "Pretrain/Step": 11308, "Pretrain/Step Time": 8.425761574879289} +{"Pretrain/Learning Rate": 1.8756358788208993e-05, "Pretrain/Loss": 2.0111489295959473, "Pretrain/Loss (Raw)": 2.1089181900024414, "Pretrain/Step": 11309, "Pretrain/Step Time": 8.423180064186454} +{"Pretrain/Learning Rate": 1.875224823528746e-05, "Pretrain/Loss": 2.009622573852539, "Pretrain/Loss (Raw)": 1.8852099180221558, "Pretrain/Step": 11310, "Pretrain/Step Time": 8.42336805537343} +{"Pretrain/Learning Rate": 1.8748137862515448e-05, "Pretrain/Loss": 2.010587215423584, "Pretrain/Loss (Raw)": 1.9261552095413208, "Pretrain/Step": 11311, "Pretrain/Step Time": 8.422638427466154} +{"Pretrain/Learning Rate": 1.874402767001147e-05, "Pretrain/Loss": 2.010024070739746, "Pretrain/Loss (Raw)": 2.112577438354492, "Pretrain/Step": 11312, "Pretrain/Step Time": 8.423165852203965} +{"Pretrain/Learning Rate": 1.8739917657894047e-05, "Pretrain/Loss": 2.0101757049560547, "Pretrain/Loss (Raw)": 1.9926631450653076, "Pretrain/Step": 11313, "Pretrain/Step Time": 8.423801014199853} +{"Pretrain/Learning Rate": 1.8735807826281687e-05, "Pretrain/Loss": 2.011044502258301, "Pretrain/Loss (Raw)": 2.0478742122650146, "Pretrain/Step": 11314, "Pretrain/Step Time": 8.424024688079953} +{"Pretrain/Learning Rate": 1.8731698175292893e-05, "Pretrain/Loss": 2.007864236831665, "Pretrain/Loss (Raw)": 1.7397236824035645, "Pretrain/Step": 11315, "Pretrain/Step Time": 8.41987807303667} +{"Pretrain/Learning Rate": 1.8727588705046157e-05, "Pretrain/Loss": 2.007857084274292, "Pretrain/Loss (Raw)": 2.2621281147003174, "Pretrain/Step": 11316, "Pretrain/Step Time": 8.425690369680524} +{"Pretrain/Learning Rate": 1.872347941565998e-05, "Pretrain/Loss": 2.0065460205078125, "Pretrain/Loss (Raw)": 1.7808177471160889, "Pretrain/Step": 11317, "Pretrain/Step Time": 8.425071209669113} +{"Pretrain/Learning Rate": 1.871937030725285e-05, "Pretrain/Loss": 2.005636215209961, "Pretrain/Loss (Raw)": 1.9317846298217773, "Pretrain/Step": 11318, "Pretrain/Step Time": 8.423840841278434} +{"Pretrain/Learning Rate": 1.8715261379943256e-05, "Pretrain/Loss": 2.0064029693603516, "Pretrain/Loss (Raw)": 2.148322105407715, "Pretrain/Step": 11319, "Pretrain/Step Time": 8.423625124618411} +{"Pretrain/Learning Rate": 1.8711152633849666e-05, "Pretrain/Loss": 2.0070295333862305, "Pretrain/Loss (Raw)": 2.0454654693603516, "Pretrain/Step": 11320, "Pretrain/Step Time": 8.422240514308214} +{"Pretrain/Learning Rate": 1.8707044069090552e-05, "Pretrain/Loss": 2.0055460929870605, "Pretrain/Loss (Raw)": 1.852520227432251, "Pretrain/Step": 11321, "Pretrain/Step Time": 8.421646874397993} +{"Pretrain/Learning Rate": 1.870293568578439e-05, "Pretrain/Loss": 2.0072901248931885, "Pretrain/Loss (Raw)": 2.1383235454559326, "Pretrain/Step": 11322, "Pretrain/Step Time": 8.423963157460093} +{"Pretrain/Learning Rate": 1.8698827484049634e-05, "Pretrain/Loss": 2.007255792617798, "Pretrain/Loss (Raw)": 2.111144781112671, "Pretrain/Step": 11323, "Pretrain/Step Time": 8.427266422659159} +{"Pretrain/Learning Rate": 1.8694719464004755e-05, "Pretrain/Loss": 2.0064244270324707, "Pretrain/Loss (Raw)": 2.0164639949798584, "Pretrain/Step": 11324, "Pretrain/Step Time": 8.422798542305827} +{"Pretrain/Learning Rate": 1.869061162576819e-05, "Pretrain/Loss": 2.0058422088623047, "Pretrain/Loss (Raw)": 1.8600820302963257, "Pretrain/Step": 11325, "Pretrain/Step Time": 8.424120580777526} +{"Pretrain/Learning Rate": 1.868650396945839e-05, "Pretrain/Loss": 2.0098729133605957, "Pretrain/Loss (Raw)": 2.072479486465454, "Pretrain/Step": 11326, "Pretrain/Step Time": 8.425128005445004} +{"Pretrain/Learning Rate": 1.8682396495193792e-05, "Pretrain/Loss": 2.0120511054992676, "Pretrain/Loss (Raw)": 2.1350157260894775, "Pretrain/Step": 11327, "Pretrain/Step Time": 8.419008346274495} +{"Pretrain/Learning Rate": 1.8678289203092843e-05, "Pretrain/Loss": 2.0130462646484375, "Pretrain/Loss (Raw)": 2.1376826763153076, "Pretrain/Step": 11328, "Pretrain/Step Time": 8.418238416314125} +{"Pretrain/Learning Rate": 1.8674182093273973e-05, "Pretrain/Loss": 2.01716947555542, "Pretrain/Loss (Raw)": 2.3131606578826904, "Pretrain/Step": 11329, "Pretrain/Step Time": 8.421497808769345} +{"Pretrain/Learning Rate": 1.8670075165855598e-05, "Pretrain/Loss": 2.016061782836914, "Pretrain/Loss (Raw)": 1.911148190498352, "Pretrain/Step": 11330, "Pretrain/Step Time": 8.41981602832675} +{"Pretrain/Learning Rate": 1.8665968420956143e-05, "Pretrain/Loss": 2.0203137397766113, "Pretrain/Loss (Raw)": 2.4642457962036133, "Pretrain/Step": 11331, "Pretrain/Step Time": 8.418623391538858} +{"Pretrain/Learning Rate": 1.8661861858694024e-05, "Pretrain/Loss": 2.0208470821380615, "Pretrain/Loss (Raw)": 1.935611367225647, "Pretrain/Step": 11332, "Pretrain/Step Time": 8.420350087806582} +{"Pretrain/Learning Rate": 1.865775547918765e-05, "Pretrain/Loss": 2.0217418670654297, "Pretrain/Loss (Raw)": 2.0579538345336914, "Pretrain/Step": 11333, "Pretrain/Step Time": 8.41532652080059} +{"Pretrain/Learning Rate": 1.865364928255543e-05, "Pretrain/Loss": 2.0217971801757812, "Pretrain/Loss (Raw)": 2.0816879272460938, "Pretrain/Step": 11334, "Pretrain/Step Time": 8.419744649901986} +{"Pretrain/Learning Rate": 1.8649543268915755e-05, "Pretrain/Loss": 2.021723747253418, "Pretrain/Loss (Raw)": 2.1734814643859863, "Pretrain/Step": 11335, "Pretrain/Step Time": 8.41898855380714} +{"Pretrain/Learning Rate": 1.864543743838702e-05, "Pretrain/Loss": 2.0236010551452637, "Pretrain/Loss (Raw)": 2.087207555770874, "Pretrain/Step": 11336, "Pretrain/Step Time": 8.415890535339713} +{"Pretrain/Learning Rate": 1.864133179108762e-05, "Pretrain/Loss": 2.0244123935699463, "Pretrain/Loss (Raw)": 2.044975996017456, "Pretrain/Step": 11337, "Pretrain/Step Time": 8.419234171509743} +{"Pretrain/Learning Rate": 1.863722632713593e-05, "Pretrain/Loss": 2.0251505374908447, "Pretrain/Loss (Raw)": 1.9619457721710205, "Pretrain/Step": 11338, "Pretrain/Step Time": 8.424313113093376} +{"Pretrain/Learning Rate": 1.863312104665034e-05, "Pretrain/Loss": 2.024869441986084, "Pretrain/Loss (Raw)": 1.9115781784057617, "Pretrain/Step": 11339, "Pretrain/Step Time": 8.42158791795373} +{"Pretrain/Learning Rate": 1.862901594974922e-05, "Pretrain/Loss": 2.0234270095825195, "Pretrain/Loss (Raw)": 1.8715425729751587, "Pretrain/Step": 11340, "Pretrain/Step Time": 8.424389563500881} +{"Pretrain/Learning Rate": 1.8624911036550927e-05, "Pretrain/Loss": 2.022855758666992, "Pretrain/Loss (Raw)": 1.937722086906433, "Pretrain/Step": 11341, "Pretrain/Step Time": 8.42206952162087} +{"Pretrain/Learning Rate": 1.862080630717383e-05, "Pretrain/Loss": 2.0229835510253906, "Pretrain/Loss (Raw)": 2.127264976501465, "Pretrain/Step": 11342, "Pretrain/Step Time": 8.423933118581772} +{"Pretrain/Learning Rate": 1.861670176173629e-05, "Pretrain/Loss": 2.023542881011963, "Pretrain/Loss (Raw)": 1.9739396572113037, "Pretrain/Step": 11343, "Pretrain/Step Time": 8.420220075175166} +{"Pretrain/Learning Rate": 1.861259740035665e-05, "Pretrain/Loss": 2.0234932899475098, "Pretrain/Loss (Raw)": 2.00736141204834, "Pretrain/Step": 11344, "Pretrain/Step Time": 8.419249894097447} +{"Pretrain/Learning Rate": 1.8608493223153267e-05, "Pretrain/Loss": 2.0227673053741455, "Pretrain/Loss (Raw)": 1.9819890260696411, "Pretrain/Step": 11345, "Pretrain/Step Time": 8.427503328770399} +{"Pretrain/Learning Rate": 1.8604389230244474e-05, "Pretrain/Loss": 2.020252227783203, "Pretrain/Loss (Raw)": 1.9193698167800903, "Pretrain/Step": 11346, "Pretrain/Step Time": 8.429789997637272} +{"Pretrain/Learning Rate": 1.8600285421748602e-05, "Pretrain/Loss": 2.0205130577087402, "Pretrain/Loss (Raw)": 2.079310894012451, "Pretrain/Step": 11347, "Pretrain/Step Time": 8.432812867686152} +{"Pretrain/Learning Rate": 1.8596181797783997e-05, "Pretrain/Loss": 2.0176339149475098, "Pretrain/Loss (Raw)": 2.090977191925049, "Pretrain/Step": 11348, "Pretrain/Step Time": 8.435409381985664} +{"Pretrain/Learning Rate": 1.8592078358468972e-05, "Pretrain/Loss": 2.0187952518463135, "Pretrain/Loss (Raw)": 2.1138415336608887, "Pretrain/Step": 11349, "Pretrain/Step Time": 8.433228401467204} +{"Pretrain/Learning Rate": 1.8587975103921853e-05, "Pretrain/Loss": 2.0182533264160156, "Pretrain/Loss (Raw)": 1.8250306844711304, "Pretrain/Step": 11350, "Pretrain/Step Time": 8.43544664233923} +{"Pretrain/Learning Rate": 1.858387203426095e-05, "Pretrain/Loss": 2.0204803943634033, "Pretrain/Loss (Raw)": 2.187567710876465, "Pretrain/Step": 11351, "Pretrain/Step Time": 8.434956485405564} +{"Pretrain/Learning Rate": 1.857976914960457e-05, "Pretrain/Loss": 2.018108367919922, "Pretrain/Loss (Raw)": 2.014031410217285, "Pretrain/Step": 11352, "Pretrain/Step Time": 8.434635523706675} +{"Pretrain/Learning Rate": 1.8575666450071024e-05, "Pretrain/Loss": 2.0185444355010986, "Pretrain/Loss (Raw)": 1.969658374786377, "Pretrain/Step": 11353, "Pretrain/Step Time": 8.430217683315277} +{"Pretrain/Learning Rate": 1.8571563935778607e-05, "Pretrain/Loss": 2.0186870098114014, "Pretrain/Loss (Raw)": 2.094024658203125, "Pretrain/Step": 11354, "Pretrain/Step Time": 8.433066260069609} +{"Pretrain/Learning Rate": 1.8567461606845616e-05, "Pretrain/Loss": 2.018428325653076, "Pretrain/Loss (Raw)": 1.9395464658737183, "Pretrain/Step": 11355, "Pretrain/Step Time": 8.43059608899057} +{"Pretrain/Learning Rate": 1.856335946339033e-05, "Pretrain/Loss": 2.020172119140625, "Pretrain/Loss (Raw)": 2.126509189605713, "Pretrain/Step": 11356, "Pretrain/Step Time": 8.432761199772358} +{"Pretrain/Learning Rate": 1.8559257505531038e-05, "Pretrain/Loss": 2.021541118621826, "Pretrain/Loss (Raw)": 2.266223430633545, "Pretrain/Step": 11357, "Pretrain/Step Time": 8.429855803027749} +{"Pretrain/Learning Rate": 1.8555155733386013e-05, "Pretrain/Loss": 2.022545099258423, "Pretrain/Loss (Raw)": 2.203697681427002, "Pretrain/Step": 11358, "Pretrain/Step Time": 8.431214939802885} +{"Pretrain/Learning Rate": 1.8551054147073533e-05, "Pretrain/Loss": 2.024717330932617, "Pretrain/Loss (Raw)": 2.0612616539001465, "Pretrain/Step": 11359, "Pretrain/Step Time": 8.431322567164898} +{"Pretrain/Learning Rate": 1.8546952746711858e-05, "Pretrain/Loss": 2.026524543762207, "Pretrain/Loss (Raw)": 1.9089733362197876, "Pretrain/Step": 11360, "Pretrain/Step Time": 8.436213141307235} +{"Pretrain/Learning Rate": 1.8542851532419253e-05, "Pretrain/Loss": 2.0277609825134277, "Pretrain/Loss (Raw)": 2.1256895065307617, "Pretrain/Step": 11361, "Pretrain/Step Time": 8.434567846357822} +{"Pretrain/Learning Rate": 1.853875050431397e-05, "Pretrain/Loss": 2.026501178741455, "Pretrain/Loss (Raw)": 1.8951842784881592, "Pretrain/Step": 11362, "Pretrain/Step Time": 8.436065711081028} +{"Pretrain/Learning Rate": 1.8534649662514265e-05, "Pretrain/Loss": 2.0283687114715576, "Pretrain/Loss (Raw)": 2.0372753143310547, "Pretrain/Step": 11363, "Pretrain/Step Time": 8.437682481482625} +{"Pretrain/Learning Rate": 1.8530549007138372e-05, "Pretrain/Loss": 2.0286765098571777, "Pretrain/Loss (Raw)": 2.0429739952087402, "Pretrain/Step": 11364, "Pretrain/Step Time": 8.437942788004875} +{"Pretrain/Learning Rate": 1.8526448538304546e-05, "Pretrain/Loss": 2.0265145301818848, "Pretrain/Loss (Raw)": 1.997195839881897, "Pretrain/Step": 11365, "Pretrain/Step Time": 8.43969527259469} +{"Pretrain/Learning Rate": 1.852234825613101e-05, "Pretrain/Loss": 2.025365114212036, "Pretrain/Loss (Raw)": 1.854779601097107, "Pretrain/Step": 11366, "Pretrain/Step Time": 8.439422564581037} +{"Pretrain/Learning Rate": 1.8518248160735994e-05, "Pretrain/Loss": 2.0228662490844727, "Pretrain/Loss (Raw)": 1.742594838142395, "Pretrain/Step": 11367, "Pretrain/Step Time": 8.444622108712792} +{"Pretrain/Learning Rate": 1.8514148252237722e-05, "Pretrain/Loss": 2.022094249725342, "Pretrain/Loss (Raw)": 1.9720567464828491, "Pretrain/Step": 11368, "Pretrain/Step Time": 8.43952931649983} +{"Pretrain/Learning Rate": 1.8510048530754414e-05, "Pretrain/Loss": 2.0193803310394287, "Pretrain/Loss (Raw)": 1.7384997606277466, "Pretrain/Step": 11369, "Pretrain/Step Time": 8.445316404104233} +{"Pretrain/Learning Rate": 1.8505948996404287e-05, "Pretrain/Loss": 2.0201029777526855, "Pretrain/Loss (Raw)": 1.9708185195922852, "Pretrain/Step": 11370, "Pretrain/Step Time": 8.448435213416815} +{"Pretrain/Learning Rate": 1.8501849649305537e-05, "Pretrain/Loss": 2.0183138847351074, "Pretrain/Loss (Raw)": 1.9562808275222778, "Pretrain/Step": 11371, "Pretrain/Step Time": 8.446752609685063} +{"Pretrain/Learning Rate": 1.849775048957637e-05, "Pretrain/Loss": 2.0168542861938477, "Pretrain/Loss (Raw)": 1.9347765445709229, "Pretrain/Step": 11372, "Pretrain/Step Time": 8.447365881875157} +{"Pretrain/Learning Rate": 1.8493651517334986e-05, "Pretrain/Loss": 2.0174527168273926, "Pretrain/Loss (Raw)": 2.073033332824707, "Pretrain/Step": 11373, "Pretrain/Step Time": 8.437514247372746} +{"Pretrain/Learning Rate": 1.848955273269957e-05, "Pretrain/Loss": 2.0187666416168213, "Pretrain/Loss (Raw)": 2.175509214401245, "Pretrain/Step": 11374, "Pretrain/Step Time": 8.435077168047428} +{"Pretrain/Learning Rate": 1.8485454135788315e-05, "Pretrain/Loss": 2.0210447311401367, "Pretrain/Loss (Raw)": 2.179943561553955, "Pretrain/Step": 11375, "Pretrain/Step Time": 8.436647329479456} +{"Pretrain/Learning Rate": 1.8481355726719404e-05, "Pretrain/Loss": 2.018099784851074, "Pretrain/Loss (Raw)": 1.7658878564834595, "Pretrain/Step": 11376, "Pretrain/Step Time": 8.437965521588922} +{"Pretrain/Learning Rate": 1.8477257505610997e-05, "Pretrain/Loss": 2.0171217918395996, "Pretrain/Loss (Raw)": 1.9828321933746338, "Pretrain/Step": 11377, "Pretrain/Step Time": 8.433937180787325} +{"Pretrain/Learning Rate": 1.8473159472581276e-05, "Pretrain/Loss": 2.015202283859253, "Pretrain/Loss (Raw)": 1.8534348011016846, "Pretrain/Step": 11378, "Pretrain/Step Time": 8.431184938177466} +{"Pretrain/Learning Rate": 1.846906162774841e-05, "Pretrain/Loss": 2.0147900581359863, "Pretrain/Loss (Raw)": 2.1102356910705566, "Pretrain/Step": 11379, "Pretrain/Step Time": 8.438654068857431} +{"Pretrain/Learning Rate": 1.846496397123053e-05, "Pretrain/Loss": 2.012749671936035, "Pretrain/Loss (Raw)": 1.9168885946273804, "Pretrain/Step": 11380, "Pretrain/Step Time": 8.441370444372296} +{"Pretrain/Learning Rate": 1.8460866503145812e-05, "Pretrain/Loss": 2.010800361633301, "Pretrain/Loss (Raw)": 1.9841630458831787, "Pretrain/Step": 11381, "Pretrain/Step Time": 8.442548539489508} +{"Pretrain/Learning Rate": 1.84567692236124e-05, "Pretrain/Loss": 2.0085196495056152, "Pretrain/Loss (Raw)": 1.8561674356460571, "Pretrain/Step": 11382, "Pretrain/Step Time": 8.445555666461587} +{"Pretrain/Learning Rate": 1.8452672132748437e-05, "Pretrain/Loss": 2.0102806091308594, "Pretrain/Loss (Raw)": 2.084623336791992, "Pretrain/Step": 11383, "Pretrain/Step Time": 8.441451346501708} +{"Pretrain/Learning Rate": 1.8448575230672055e-05, "Pretrain/Loss": 2.009457588195801, "Pretrain/Loss (Raw)": 2.1247215270996094, "Pretrain/Step": 11384, "Pretrain/Step Time": 8.437398791313171} +{"Pretrain/Learning Rate": 1.844447851750139e-05, "Pretrain/Loss": 2.0068624019622803, "Pretrain/Loss (Raw)": 2.0168967247009277, "Pretrain/Step": 11385, "Pretrain/Step Time": 8.438510743901134} +{"Pretrain/Learning Rate": 1.844038199335456e-05, "Pretrain/Loss": 2.005976438522339, "Pretrain/Loss (Raw)": 2.072322368621826, "Pretrain/Step": 11386, "Pretrain/Step Time": 8.441547729074955} +{"Pretrain/Learning Rate": 1.8436285658349694e-05, "Pretrain/Loss": 2.0065317153930664, "Pretrain/Loss (Raw)": 1.9540599584579468, "Pretrain/Step": 11387, "Pretrain/Step Time": 8.441927736625075} +{"Pretrain/Learning Rate": 1.8432189512604908e-05, "Pretrain/Loss": 2.006538152694702, "Pretrain/Loss (Raw)": 1.9990298748016357, "Pretrain/Step": 11388, "Pretrain/Step Time": 8.444529999047518} +{"Pretrain/Learning Rate": 1.84280935562383e-05, "Pretrain/Loss": 2.01004958152771, "Pretrain/Loss (Raw)": 2.0990889072418213, "Pretrain/Step": 11389, "Pretrain/Step Time": 8.444625828415155} +{"Pretrain/Learning Rate": 1.8423997789367985e-05, "Pretrain/Loss": 2.009840965270996, "Pretrain/Loss (Raw)": 1.8914363384246826, "Pretrain/Step": 11390, "Pretrain/Step Time": 8.442730769515038} +{"Pretrain/Learning Rate": 1.8419902212112058e-05, "Pretrain/Loss": 2.010209798812866, "Pretrain/Loss (Raw)": 1.9083751440048218, "Pretrain/Step": 11391, "Pretrain/Step Time": 8.442269142717123} +{"Pretrain/Learning Rate": 1.841580682458861e-05, "Pretrain/Loss": 2.0123353004455566, "Pretrain/Loss (Raw)": 2.0684025287628174, "Pretrain/Step": 11392, "Pretrain/Step Time": 8.445132186636329} +{"Pretrain/Learning Rate": 1.841171162691574e-05, "Pretrain/Loss": 2.012345790863037, "Pretrain/Loss (Raw)": 2.0570502281188965, "Pretrain/Step": 11393, "Pretrain/Step Time": 8.440023196861148} +{"Pretrain/Learning Rate": 1.8407616619211513e-05, "Pretrain/Loss": 2.0119106769561768, "Pretrain/Loss (Raw)": 1.9267120361328125, "Pretrain/Step": 11394, "Pretrain/Step Time": 8.44374093785882} +{"Pretrain/Learning Rate": 1.8403521801594012e-05, "Pretrain/Loss": 2.0117902755737305, "Pretrain/Loss (Raw)": 2.0439605712890625, "Pretrain/Step": 11395, "Pretrain/Step Time": 8.44272692874074} +{"Pretrain/Learning Rate": 1.839942717418131e-05, "Pretrain/Loss": 2.012418270111084, "Pretrain/Loss (Raw)": 2.1103498935699463, "Pretrain/Step": 11396, "Pretrain/Step Time": 8.446588210761547} +{"Pretrain/Learning Rate": 1.8395332737091477e-05, "Pretrain/Loss": 2.012125253677368, "Pretrain/Loss (Raw)": 1.8912571668624878, "Pretrain/Step": 11397, "Pretrain/Step Time": 8.446185819804668} +{"Pretrain/Learning Rate": 1.8391238490442568e-05, "Pretrain/Loss": 2.006612539291382, "Pretrain/Loss (Raw)": 1.9785053730010986, "Pretrain/Step": 11398, "Pretrain/Step Time": 8.449208855628967} +{"Pretrain/Learning Rate": 1.8387144434352633e-05, "Pretrain/Loss": 2.008277416229248, "Pretrain/Loss (Raw)": 2.197624444961548, "Pretrain/Step": 11399, "Pretrain/Step Time": 8.451385959982872} +{"Pretrain/Learning Rate": 1.8383050568939732e-05, "Pretrain/Loss": 2.010214328765869, "Pretrain/Loss (Raw)": 2.0898666381835938, "Pretrain/Step": 11400, "Pretrain/Step Time": 8.452758545055985} +{"Pretrain/Learning Rate": 1.8378956894321896e-05, "Pretrain/Loss": 2.0094058513641357, "Pretrain/Loss (Raw)": 2.1391191482543945, "Pretrain/Step": 11401, "Pretrain/Step Time": 8.453576516360044} +{"Pretrain/Learning Rate": 1.8374863410617173e-05, "Pretrain/Loss": 2.0102717876434326, "Pretrain/Loss (Raw)": 2.012166976928711, "Pretrain/Step": 11402, "Pretrain/Step Time": 8.454694090411067} +{"Pretrain/Learning Rate": 1.8370770117943597e-05, "Pretrain/Loss": 2.0108542442321777, "Pretrain/Loss (Raw)": 2.2719979286193848, "Pretrain/Step": 11403, "Pretrain/Step Time": 8.453723583370447} +{"Pretrain/Learning Rate": 1.8366677016419194e-05, "Pretrain/Loss": 2.011913776397705, "Pretrain/Loss (Raw)": 2.121473550796509, "Pretrain/Step": 11404, "Pretrain/Step Time": 8.451139500364661} +{"Pretrain/Learning Rate": 1.8362584106161975e-05, "Pretrain/Loss": 2.0111093521118164, "Pretrain/Loss (Raw)": 1.9716490507125854, "Pretrain/Step": 11405, "Pretrain/Step Time": 8.451588140800595} +{"Pretrain/Learning Rate": 1.8358491387289968e-05, "Pretrain/Loss": 2.0119504928588867, "Pretrain/Loss (Raw)": 2.1089913845062256, "Pretrain/Step": 11406, "Pretrain/Step Time": 8.455544924363494} +{"Pretrain/Learning Rate": 1.835439885992118e-05, "Pretrain/Loss": 2.0117146968841553, "Pretrain/Loss (Raw)": 1.8801201581954956, "Pretrain/Step": 11407, "Pretrain/Step Time": 8.452651020139456} +{"Pretrain/Learning Rate": 1.8350306524173613e-05, "Pretrain/Loss": 2.0149874687194824, "Pretrain/Loss (Raw)": 2.291778802871704, "Pretrain/Step": 11408, "Pretrain/Step Time": 8.448512589558959} +{"Pretrain/Learning Rate": 1.834621438016528e-05, "Pretrain/Loss": 2.016767740249634, "Pretrain/Loss (Raw)": 1.9660043716430664, "Pretrain/Step": 11409, "Pretrain/Step Time": 8.45045917108655} +{"Pretrain/Learning Rate": 1.8342122428014153e-05, "Pretrain/Loss": 2.0165483951568604, "Pretrain/Loss (Raw)": 1.9146755933761597, "Pretrain/Step": 11410, "Pretrain/Step Time": 8.44986355677247} +{"Pretrain/Learning Rate": 1.8338030667838236e-05, "Pretrain/Loss": 2.014828681945801, "Pretrain/Loss (Raw)": 1.8412635326385498, "Pretrain/Step": 11411, "Pretrain/Step Time": 8.448461525142193} +{"Pretrain/Learning Rate": 1.8333939099755508e-05, "Pretrain/Loss": 2.0133795738220215, "Pretrain/Loss (Raw)": 1.845746636390686, "Pretrain/Step": 11412, "Pretrain/Step Time": 8.451664447784424} +{"Pretrain/Learning Rate": 1.8329847723883946e-05, "Pretrain/Loss": 2.013679265975952, "Pretrain/Loss (Raw)": 1.9927185773849487, "Pretrain/Step": 11413, "Pretrain/Step Time": 8.449380200356245} +{"Pretrain/Learning Rate": 1.8325756540341527e-05, "Pretrain/Loss": 2.0131664276123047, "Pretrain/Loss (Raw)": 2.147390127182007, "Pretrain/Step": 11414, "Pretrain/Step Time": 8.453133124858141} +{"Pretrain/Learning Rate": 1.8321665549246208e-05, "Pretrain/Loss": 2.0144386291503906, "Pretrain/Loss (Raw)": 2.066450595855713, "Pretrain/Step": 11415, "Pretrain/Step Time": 8.452422548085451} +{"Pretrain/Learning Rate": 1.831757475071596e-05, "Pretrain/Loss": 2.016873836517334, "Pretrain/Loss (Raw)": 2.397770643234253, "Pretrain/Step": 11416, "Pretrain/Step Time": 8.448896327987313} +{"Pretrain/Learning Rate": 1.831348414486873e-05, "Pretrain/Loss": 2.020106315612793, "Pretrain/Loss (Raw)": 2.2000813484191895, "Pretrain/Step": 11417, "Pretrain/Step Time": 8.45224192366004} +{"Pretrain/Learning Rate": 1.830939373182247e-05, "Pretrain/Loss": 2.0165963172912598, "Pretrain/Loss (Raw)": 1.8716129064559937, "Pretrain/Step": 11418, "Pretrain/Step Time": 8.447300685569644} +{"Pretrain/Learning Rate": 1.8305303511695128e-05, "Pretrain/Loss": 2.0173916816711426, "Pretrain/Loss (Raw)": 2.08634614944458, "Pretrain/Step": 11419, "Pretrain/Step Time": 8.444922752678394} +{"Pretrain/Learning Rate": 1.830121348460464e-05, "Pretrain/Loss": 2.0188746452331543, "Pretrain/Loss (Raw)": 2.1233017444610596, "Pretrain/Step": 11420, "Pretrain/Step Time": 8.450009679421782} +{"Pretrain/Learning Rate": 1.8297123650668936e-05, "Pretrain/Loss": 2.01853346824646, "Pretrain/Loss (Raw)": 1.8899269104003906, "Pretrain/Step": 11421, "Pretrain/Step Time": 8.452436529099941} +{"Pretrain/Learning Rate": 1.8293034010005948e-05, "Pretrain/Loss": 2.0189766883850098, "Pretrain/Loss (Raw)": 1.960338830947876, "Pretrain/Step": 11422, "Pretrain/Step Time": 8.453979447484016} +{"Pretrain/Learning Rate": 1.8288944562733593e-05, "Pretrain/Loss": 2.019340991973877, "Pretrain/Loss (Raw)": 2.056474208831787, "Pretrain/Step": 11423, "Pretrain/Step Time": 8.45775605365634} +{"Pretrain/Learning Rate": 1.8284855308969798e-05, "Pretrain/Loss": 2.0183699131011963, "Pretrain/Loss (Raw)": 1.800942063331604, "Pretrain/Step": 11424, "Pretrain/Step Time": 8.454881466925144} +{"Pretrain/Learning Rate": 1.828076624883246e-05, "Pretrain/Loss": 2.0174479484558105, "Pretrain/Loss (Raw)": 1.9221526384353638, "Pretrain/Step": 11425, "Pretrain/Step Time": 8.453513208776712} +{"Pretrain/Learning Rate": 1.827667738243949e-05, "Pretrain/Loss": 2.0176196098327637, "Pretrain/Loss (Raw)": 2.071876287460327, "Pretrain/Step": 11426, "Pretrain/Step Time": 8.45631905272603} +{"Pretrain/Learning Rate": 1.827258870990879e-05, "Pretrain/Loss": 2.0200209617614746, "Pretrain/Loss (Raw)": 2.0486745834350586, "Pretrain/Step": 11427, "Pretrain/Step Time": 8.45410218462348} +{"Pretrain/Learning Rate": 1.8268500231358254e-05, "Pretrain/Loss": 2.018484592437744, "Pretrain/Loss (Raw)": 1.8898577690124512, "Pretrain/Step": 11428, "Pretrain/Step Time": 8.460200864821672} +{"Pretrain/Learning Rate": 1.826441194690577e-05, "Pretrain/Loss": 2.0195839405059814, "Pretrain/Loss (Raw)": 2.035127878189087, "Pretrain/Step": 11429, "Pretrain/Step Time": 8.457558272406459} +{"Pretrain/Learning Rate": 1.8260323856669216e-05, "Pretrain/Loss": 2.0177035331726074, "Pretrain/Loss (Raw)": 1.9204250574111938, "Pretrain/Step": 11430, "Pretrain/Step Time": 8.458436043933034} +{"Pretrain/Learning Rate": 1.8256235960766472e-05, "Pretrain/Loss": 2.0165815353393555, "Pretrain/Loss (Raw)": 2.063697576522827, "Pretrain/Step": 11431, "Pretrain/Step Time": 8.460823928937316} +{"Pretrain/Learning Rate": 1.825214825931541e-05, "Pretrain/Loss": 2.01668643951416, "Pretrain/Loss (Raw)": 1.8480697870254517, "Pretrain/Step": 11432, "Pretrain/Step Time": 8.46734730899334} +{"Pretrain/Learning Rate": 1.824806075243389e-05, "Pretrain/Loss": 2.016387939453125, "Pretrain/Loss (Raw)": 2.068340301513672, "Pretrain/Step": 11433, "Pretrain/Step Time": 8.464630909264088} +{"Pretrain/Learning Rate": 1.8243973440239794e-05, "Pretrain/Loss": 2.016486644744873, "Pretrain/Loss (Raw)": 1.8820815086364746, "Pretrain/Step": 11434, "Pretrain/Step Time": 8.464291535317898} +{"Pretrain/Learning Rate": 1.8239886322850948e-05, "Pretrain/Loss": 2.016937732696533, "Pretrain/Loss (Raw)": 1.870059847831726, "Pretrain/Step": 11435, "Pretrain/Step Time": 8.464677184820175} +{"Pretrain/Learning Rate": 1.8235799400385217e-05, "Pretrain/Loss": 2.0184683799743652, "Pretrain/Loss (Raw)": 2.156538486480713, "Pretrain/Step": 11436, "Pretrain/Step Time": 8.472198216244578} +{"Pretrain/Learning Rate": 1.8231712672960443e-05, "Pretrain/Loss": 2.0148026943206787, "Pretrain/Loss (Raw)": 1.6397184133529663, "Pretrain/Step": 11437, "Pretrain/Step Time": 8.470743026584387} +{"Pretrain/Learning Rate": 1.8227626140694462e-05, "Pretrain/Loss": 2.014634609222412, "Pretrain/Loss (Raw)": 1.8637140989303589, "Pretrain/Step": 11438, "Pretrain/Step Time": 8.478996912017465} +{"Pretrain/Learning Rate": 1.8223539803705107e-05, "Pretrain/Loss": 2.014883518218994, "Pretrain/Loss (Raw)": 1.957986831665039, "Pretrain/Step": 11439, "Pretrain/Step Time": 8.478598289191723} +{"Pretrain/Learning Rate": 1.8219453662110207e-05, "Pretrain/Loss": 2.013184070587158, "Pretrain/Loss (Raw)": 1.8950687646865845, "Pretrain/Step": 11440, "Pretrain/Step Time": 8.476313119754195} +{"Pretrain/Learning Rate": 1.821536771602758e-05, "Pretrain/Loss": 2.013495683670044, "Pretrain/Loss (Raw)": 2.0325443744659424, "Pretrain/Step": 11441, "Pretrain/Step Time": 8.4759641289711} +{"Pretrain/Learning Rate": 1.8211281965575043e-05, "Pretrain/Loss": 2.012538194656372, "Pretrain/Loss (Raw)": 1.9252989292144775, "Pretrain/Step": 11442, "Pretrain/Step Time": 8.473412871360779} +{"Pretrain/Learning Rate": 1.82071964108704e-05, "Pretrain/Loss": 2.0155975818634033, "Pretrain/Loss (Raw)": 2.131349802017212, "Pretrain/Step": 11443, "Pretrain/Step Time": 8.474472409114242} +{"Pretrain/Learning Rate": 1.8203111052031464e-05, "Pretrain/Loss": 2.01314640045166, "Pretrain/Loss (Raw)": 1.9483624696731567, "Pretrain/Step": 11444, "Pretrain/Step Time": 8.47403222322464} +{"Pretrain/Learning Rate": 1.819902588917603e-05, "Pretrain/Loss": 2.0119686126708984, "Pretrain/Loss (Raw)": 1.630056381225586, "Pretrain/Step": 11445, "Pretrain/Step Time": 8.474525993689895} +{"Pretrain/Learning Rate": 1.819494092242189e-05, "Pretrain/Loss": 2.012413501739502, "Pretrain/Loss (Raw)": 1.9887112379074097, "Pretrain/Step": 11446, "Pretrain/Step Time": 8.47416608966887} +{"Pretrain/Learning Rate": 1.8190856151886826e-05, "Pretrain/Loss": 2.0118465423583984, "Pretrain/Loss (Raw)": 2.0757763385772705, "Pretrain/Step": 11447, "Pretrain/Step Time": 8.470092562958598} +{"Pretrain/Learning Rate": 1.8186771577688627e-05, "Pretrain/Loss": 2.0112266540527344, "Pretrain/Loss (Raw)": 1.9661424160003662, "Pretrain/Step": 11448, "Pretrain/Step Time": 8.469355221837759} +{"Pretrain/Learning Rate": 1.818268719994507e-05, "Pretrain/Loss": 2.0132193565368652, "Pretrain/Loss (Raw)": 2.1075828075408936, "Pretrain/Step": 11449, "Pretrain/Step Time": 8.476337864995003} +{"Pretrain/Learning Rate": 1.8178603018773923e-05, "Pretrain/Loss": 2.012148380279541, "Pretrain/Loss (Raw)": 2.001234769821167, "Pretrain/Step": 11450, "Pretrain/Step Time": 8.477551318705082} +{"Pretrain/Learning Rate": 1.8174519034292944e-05, "Pretrain/Loss": 2.0123119354248047, "Pretrain/Loss (Raw)": 2.1320693492889404, "Pretrain/Step": 11451, "Pretrain/Step Time": 8.476249964907765} +{"Pretrain/Learning Rate": 1.8170435246619898e-05, "Pretrain/Loss": 2.012545347213745, "Pretrain/Loss (Raw)": 2.0463507175445557, "Pretrain/Step": 11452, "Pretrain/Step Time": 8.474862854927778} +{"Pretrain/Learning Rate": 1.8166351655872538e-05, "Pretrain/Loss": 2.0138773918151855, "Pretrain/Loss (Raw)": 2.0305609703063965, "Pretrain/Step": 11453, "Pretrain/Step Time": 8.474969627335668} +{"Pretrain/Learning Rate": 1.816226826216861e-05, "Pretrain/Loss": 2.013953924179077, "Pretrain/Loss (Raw)": 2.082296848297119, "Pretrain/Step": 11454, "Pretrain/Step Time": 8.475988365709782} +{"Pretrain/Learning Rate": 1.815818506562586e-05, "Pretrain/Loss": 2.012559175491333, "Pretrain/Loss (Raw)": 1.9564636945724487, "Pretrain/Step": 11455, "Pretrain/Step Time": 8.478279681876302} +{"Pretrain/Learning Rate": 1.8154102066362018e-05, "Pretrain/Loss": 2.012195110321045, "Pretrain/Loss (Raw)": 2.0911049842834473, "Pretrain/Step": 11456, "Pretrain/Step Time": 8.476474119350314} +{"Pretrain/Learning Rate": 1.8150019264494816e-05, "Pretrain/Loss": 2.007129669189453, "Pretrain/Loss (Raw)": 1.664751648902893, "Pretrain/Step": 11457, "Pretrain/Step Time": 8.474526504054666} +{"Pretrain/Learning Rate": 1.8145936660141975e-05, "Pretrain/Loss": 2.0074775218963623, "Pretrain/Loss (Raw)": 1.9556809663772583, "Pretrain/Step": 11458, "Pretrain/Step Time": 8.476419143378735} +{"Pretrain/Learning Rate": 1.8141854253421227e-05, "Pretrain/Loss": 2.004869222640991, "Pretrain/Loss (Raw)": 2.1303882598876953, "Pretrain/Step": 11459, "Pretrain/Step Time": 8.471658626571298} +{"Pretrain/Learning Rate": 1.8137772044450274e-05, "Pretrain/Loss": 2.0037431716918945, "Pretrain/Loss (Raw)": 1.7914958000183105, "Pretrain/Step": 11460, "Pretrain/Step Time": 8.473941503092647} +{"Pretrain/Learning Rate": 1.8133690033346828e-05, "Pretrain/Loss": 1.9993761777877808, "Pretrain/Loss (Raw)": 1.4989814758300781, "Pretrain/Step": 11461, "Pretrain/Step Time": 8.481961369514465} +{"Pretrain/Learning Rate": 1.8129608220228582e-05, "Pretrain/Loss": 1.9982417821884155, "Pretrain/Loss (Raw)": 1.93648099899292, "Pretrain/Step": 11462, "Pretrain/Step Time": 8.476542180404067} +{"Pretrain/Learning Rate": 1.812552660521326e-05, "Pretrain/Loss": 1.9962711334228516, "Pretrain/Loss (Raw)": 1.9212414026260376, "Pretrain/Step": 11463, "Pretrain/Step Time": 8.47601199708879} +{"Pretrain/Learning Rate": 1.8121445188418514e-05, "Pretrain/Loss": 1.9962034225463867, "Pretrain/Loss (Raw)": 2.0785276889801025, "Pretrain/Step": 11464, "Pretrain/Step Time": 8.478007100522518} +{"Pretrain/Learning Rate": 1.811736396996205e-05, "Pretrain/Loss": 1.996852993965149, "Pretrain/Loss (Raw)": 2.128127336502075, "Pretrain/Step": 11465, "Pretrain/Step Time": 8.475523922592402} +{"Pretrain/Learning Rate": 1.811328294996154e-05, "Pretrain/Loss": 1.9995726346969604, "Pretrain/Loss (Raw)": 2.310051918029785, "Pretrain/Step": 11466, "Pretrain/Step Time": 8.46766097843647} +{"Pretrain/Learning Rate": 1.8109202128534673e-05, "Pretrain/Loss": 2.0011181831359863, "Pretrain/Loss (Raw)": 2.1094138622283936, "Pretrain/Step": 11467, "Pretrain/Step Time": 8.472600057721138} +{"Pretrain/Learning Rate": 1.8105121505799095e-05, "Pretrain/Loss": 2.0015666484832764, "Pretrain/Loss (Raw)": 1.9289515018463135, "Pretrain/Step": 11468, "Pretrain/Step Time": 8.47188551723957} +{"Pretrain/Learning Rate": 1.810104108187248e-05, "Pretrain/Loss": 2.0028066635131836, "Pretrain/Loss (Raw)": 2.096409797668457, "Pretrain/Step": 11469, "Pretrain/Step Time": 8.479247553274035} +{"Pretrain/Learning Rate": 1.809696085687248e-05, "Pretrain/Loss": 2.0019450187683105, "Pretrain/Loss (Raw)": 2.017017126083374, "Pretrain/Step": 11470, "Pretrain/Step Time": 8.479216625913978} +{"Pretrain/Learning Rate": 1.809288083091675e-05, "Pretrain/Loss": 2.003702402114868, "Pretrain/Loss (Raw)": 2.1988556385040283, "Pretrain/Step": 11471, "Pretrain/Step Time": 8.4766054302454} +{"Pretrain/Learning Rate": 1.808880100412293e-05, "Pretrain/Loss": 2.004143238067627, "Pretrain/Loss (Raw)": 2.063793897628784, "Pretrain/Step": 11472, "Pretrain/Step Time": 8.480853233486414} +{"Pretrain/Learning Rate": 1.8084721376608664e-05, "Pretrain/Loss": 2.0045480728149414, "Pretrain/Loss (Raw)": 2.0337963104248047, "Pretrain/Step": 11473, "Pretrain/Step Time": 8.473529243841767} +{"Pretrain/Learning Rate": 1.8080641948491583e-05, "Pretrain/Loss": 2.0058794021606445, "Pretrain/Loss (Raw)": 2.0897743701934814, "Pretrain/Step": 11474, "Pretrain/Step Time": 8.470174480229616} +{"Pretrain/Learning Rate": 1.8076562719889312e-05, "Pretrain/Loss": 2.0052342414855957, "Pretrain/Loss (Raw)": 1.9967602491378784, "Pretrain/Step": 11475, "Pretrain/Step Time": 8.467430468648672} +{"Pretrain/Learning Rate": 1.8072483690919473e-05, "Pretrain/Loss": 2.0051894187927246, "Pretrain/Loss (Raw)": 2.0852293968200684, "Pretrain/Step": 11476, "Pretrain/Step Time": 8.467859715223312} +{"Pretrain/Learning Rate": 1.806840486169968e-05, "Pretrain/Loss": 2.0029821395874023, "Pretrain/Loss (Raw)": 1.8313332796096802, "Pretrain/Step": 11477, "Pretrain/Step Time": 8.467127604410052} +{"Pretrain/Learning Rate": 1.8064326232347555e-05, "Pretrain/Loss": 2.0033342838287354, "Pretrain/Loss (Raw)": 1.8700990676879883, "Pretrain/Step": 11478, "Pretrain/Step Time": 8.465447951108217} +{"Pretrain/Learning Rate": 1.806024780298069e-05, "Pretrain/Loss": 2.0021169185638428, "Pretrain/Loss (Raw)": 2.031733989715576, "Pretrain/Step": 11479, "Pretrain/Step Time": 8.466010183095932} +{"Pretrain/Learning Rate": 1.8056169573716683e-05, "Pretrain/Loss": 2.0030384063720703, "Pretrain/Loss (Raw)": 2.132005214691162, "Pretrain/Step": 11480, "Pretrain/Step Time": 8.465091401711106} +{"Pretrain/Learning Rate": 1.8052091544673134e-05, "Pretrain/Loss": 2.003624439239502, "Pretrain/Loss (Raw)": 2.0446267127990723, "Pretrain/Step": 11481, "Pretrain/Step Time": 8.46991353482008} +{"Pretrain/Learning Rate": 1.8048013715967626e-05, "Pretrain/Loss": 2.000734329223633, "Pretrain/Loss (Raw)": 1.724083423614502, "Pretrain/Step": 11482, "Pretrain/Step Time": 8.464547272771597} +{"Pretrain/Learning Rate": 1.804393608771775e-05, "Pretrain/Loss": 2.0017800331115723, "Pretrain/Loss (Raw)": 2.0734312534332275, "Pretrain/Step": 11483, "Pretrain/Step Time": 8.466276407241821} +{"Pretrain/Learning Rate": 1.8039858660041064e-05, "Pretrain/Loss": 2.0003409385681152, "Pretrain/Loss (Raw)": 1.9422805309295654, "Pretrain/Step": 11484, "Pretrain/Step Time": 8.47270299680531} +{"Pretrain/Learning Rate": 1.8035781433055148e-05, "Pretrain/Loss": 1.9974216222763062, "Pretrain/Loss (Raw)": 1.8925806283950806, "Pretrain/Step": 11485, "Pretrain/Step Time": 8.478503627702594} +{"Pretrain/Learning Rate": 1.8031704406877568e-05, "Pretrain/Loss": 1.9966106414794922, "Pretrain/Loss (Raw)": 2.099879741668701, "Pretrain/Step": 11486, "Pretrain/Step Time": 8.476155322045088} +{"Pretrain/Learning Rate": 1.8027627581625877e-05, "Pretrain/Loss": 1.9966411590576172, "Pretrain/Loss (Raw)": 2.065167188644409, "Pretrain/Step": 11487, "Pretrain/Step Time": 8.477590532973409} +{"Pretrain/Learning Rate": 1.8023550957417635e-05, "Pretrain/Loss": 1.9979726076126099, "Pretrain/Loss (Raw)": 2.079392433166504, "Pretrain/Step": 11488, "Pretrain/Step Time": 8.47233417071402} +{"Pretrain/Learning Rate": 1.8019474534370377e-05, "Pretrain/Loss": 1.9965288639068604, "Pretrain/Loss (Raw)": 1.9408931732177734, "Pretrain/Step": 11489, "Pretrain/Step Time": 8.473120849579573} +{"Pretrain/Learning Rate": 1.801539831260165e-05, "Pretrain/Loss": 1.9981873035430908, "Pretrain/Loss (Raw)": 2.107470989227295, "Pretrain/Step": 11490, "Pretrain/Step Time": 8.475853906944394} +{"Pretrain/Learning Rate": 1.8011322292228988e-05, "Pretrain/Loss": 1.9985452890396118, "Pretrain/Loss (Raw)": 2.0830938816070557, "Pretrain/Step": 11491, "Pretrain/Step Time": 8.47280926629901} +{"Pretrain/Learning Rate": 1.800724647336992e-05, "Pretrain/Loss": 1.9977606534957886, "Pretrain/Loss (Raw)": 1.9425406455993652, "Pretrain/Step": 11492, "Pretrain/Step Time": 8.473513003438711} +{"Pretrain/Learning Rate": 1.8003170856141982e-05, "Pretrain/Loss": 1.9978660345077515, "Pretrain/Loss (Raw)": 2.010698080062866, "Pretrain/Step": 11493, "Pretrain/Step Time": 8.47084229066968} +{"Pretrain/Learning Rate": 1.7999095440662665e-05, "Pretrain/Loss": 1.9975711107254028, "Pretrain/Loss (Raw)": 1.817029356956482, "Pretrain/Step": 11494, "Pretrain/Step Time": 8.47251794487238} +{"Pretrain/Learning Rate": 1.7995020227049503e-05, "Pretrain/Loss": 2.0018153190612793, "Pretrain/Loss (Raw)": 2.28582501411438, "Pretrain/Step": 11495, "Pretrain/Step Time": 8.46750496327877} +{"Pretrain/Learning Rate": 1.7990945215419995e-05, "Pretrain/Loss": 2.0024828910827637, "Pretrain/Loss (Raw)": 2.057528018951416, "Pretrain/Step": 11496, "Pretrain/Step Time": 8.469140715897083} +{"Pretrain/Learning Rate": 1.7986870405891636e-05, "Pretrain/Loss": 2.006392240524292, "Pretrain/Loss (Raw)": 2.2388832569122314, "Pretrain/Step": 11497, "Pretrain/Step Time": 8.458971355110407} +{"Pretrain/Learning Rate": 1.7982795798581934e-05, "Pretrain/Loss": 2.0072569847106934, "Pretrain/Loss (Raw)": 2.0815181732177734, "Pretrain/Step": 11498, "Pretrain/Step Time": 8.457639902830124} +{"Pretrain/Learning Rate": 1.7978721393608362e-05, "Pretrain/Loss": 2.0084593296051025, "Pretrain/Loss (Raw)": 2.1101815700531006, "Pretrain/Step": 11499, "Pretrain/Step Time": 8.455924989655614} +{"Pretrain/Learning Rate": 1.7974647191088408e-05, "Pretrain/Loss": 2.0084285736083984, "Pretrain/Loss (Raw)": 1.9308276176452637, "Pretrain/Step": 11500, "Pretrain/Step Time": 8.457417348399758} +{"Pretrain/Learning Rate": 1.797057319113955e-05, "Pretrain/Loss": 2.0062036514282227, "Pretrain/Loss (Raw)": 1.7882623672485352, "Pretrain/Step": 11501, "Pretrain/Step Time": 8.470482412725687} +{"Pretrain/Learning Rate": 1.796649939387926e-05, "Pretrain/Loss": 2.005276679992676, "Pretrain/Loss (Raw)": 2.0568671226501465, "Pretrain/Step": 11502, "Pretrain/Step Time": 8.470267225056887} +{"Pretrain/Learning Rate": 1.7962425799424997e-05, "Pretrain/Loss": 2.0045766830444336, "Pretrain/Loss (Raw)": 2.090348482131958, "Pretrain/Step": 11503, "Pretrain/Step Time": 8.469981838017702} +{"Pretrain/Learning Rate": 1.7958352407894234e-05, "Pretrain/Loss": 2.007722854614258, "Pretrain/Loss (Raw)": 2.168593406677246, "Pretrain/Step": 11504, "Pretrain/Step Time": 8.472215872257948} +{"Pretrain/Learning Rate": 1.7954279219404414e-05, "Pretrain/Loss": 2.0078957080841064, "Pretrain/Loss (Raw)": 2.00494384765625, "Pretrain/Step": 11505, "Pretrain/Step Time": 8.478193208575249} +{"Pretrain/Learning Rate": 1.795020623407298e-05, "Pretrain/Loss": 2.008915424346924, "Pretrain/Loss (Raw)": 1.9839738607406616, "Pretrain/Step": 11506, "Pretrain/Step Time": 8.482326839119196} +{"Pretrain/Learning Rate": 1.7946133452017382e-05, "Pretrain/Loss": 2.0051565170288086, "Pretrain/Loss (Raw)": 1.6290678977966309, "Pretrain/Step": 11507, "Pretrain/Step Time": 8.476051876321435} +{"Pretrain/Learning Rate": 1.7942060873355048e-05, "Pretrain/Loss": 2.009328842163086, "Pretrain/Loss (Raw)": 2.4509410858154297, "Pretrain/Step": 11508, "Pretrain/Step Time": 8.47686062939465} +{"Pretrain/Learning Rate": 1.793798849820342e-05, "Pretrain/Loss": 2.010288715362549, "Pretrain/Loss (Raw)": 2.1070191860198975, "Pretrain/Step": 11509, "Pretrain/Step Time": 8.476153254508972} +{"Pretrain/Learning Rate": 1.7933916326679918e-05, "Pretrain/Loss": 2.013327121734619, "Pretrain/Loss (Raw)": 2.245121479034424, "Pretrain/Step": 11510, "Pretrain/Step Time": 8.473244924098253} +{"Pretrain/Learning Rate": 1.792984435890195e-05, "Pretrain/Loss": 2.0122756958007812, "Pretrain/Loss (Raw)": 1.9500300884246826, "Pretrain/Step": 11511, "Pretrain/Step Time": 8.480399703606963} +{"Pretrain/Learning Rate": 1.792577259498694e-05, "Pretrain/Loss": 2.011964797973633, "Pretrain/Loss (Raw)": 2.0849127769470215, "Pretrain/Step": 11512, "Pretrain/Step Time": 8.482022944837809} +{"Pretrain/Learning Rate": 1.7921701035052288e-05, "Pretrain/Loss": 2.0132172107696533, "Pretrain/Loss (Raw)": 2.1772050857543945, "Pretrain/Step": 11513, "Pretrain/Step Time": 8.482726857066154} +{"Pretrain/Learning Rate": 1.7917629679215404e-05, "Pretrain/Loss": 2.012929677963257, "Pretrain/Loss (Raw)": 2.035515546798706, "Pretrain/Step": 11514, "Pretrain/Step Time": 8.477240400388837} +{"Pretrain/Learning Rate": 1.7913558527593664e-05, "Pretrain/Loss": 2.0137228965759277, "Pretrain/Loss (Raw)": 2.055605411529541, "Pretrain/Step": 11515, "Pretrain/Step Time": 8.475478174164891} +{"Pretrain/Learning Rate": 1.7909487580304474e-05, "Pretrain/Loss": 2.015068531036377, "Pretrain/Loss (Raw)": 2.171255350112915, "Pretrain/Step": 11516, "Pretrain/Step Time": 8.477235632017255} +{"Pretrain/Learning Rate": 1.7905416837465212e-05, "Pretrain/Loss": 2.015211820602417, "Pretrain/Loss (Raw)": 2.1174356937408447, "Pretrain/Step": 11517, "Pretrain/Step Time": 8.48307984508574} +{"Pretrain/Learning Rate": 1.790134629919325e-05, "Pretrain/Loss": 2.014902114868164, "Pretrain/Loss (Raw)": 1.8518027067184448, "Pretrain/Step": 11518, "Pretrain/Step Time": 8.480464685708284} +{"Pretrain/Learning Rate": 1.789727596560597e-05, "Pretrain/Loss": 2.015092372894287, "Pretrain/Loss (Raw)": 1.9327418804168701, "Pretrain/Step": 11519, "Pretrain/Step Time": 8.481646293774247} +{"Pretrain/Learning Rate": 1.7893205836820725e-05, "Pretrain/Loss": 2.0140185356140137, "Pretrain/Loss (Raw)": 1.9309521913528442, "Pretrain/Step": 11520, "Pretrain/Step Time": 8.481455881148577} +{"Pretrain/Learning Rate": 1.788913591295488e-05, "Pretrain/Loss": 2.012547016143799, "Pretrain/Loss (Raw)": 1.8686963319778442, "Pretrain/Step": 11521, "Pretrain/Step Time": 8.483540935441852} +{"Pretrain/Learning Rate": 1.788506619412579e-05, "Pretrain/Loss": 2.0123109817504883, "Pretrain/Loss (Raw)": 1.8964954614639282, "Pretrain/Step": 11522, "Pretrain/Step Time": 8.483505828306079} +{"Pretrain/Learning Rate": 1.78809966804508e-05, "Pretrain/Loss": 2.0132341384887695, "Pretrain/Loss (Raw)": 2.1621227264404297, "Pretrain/Step": 11523, "Pretrain/Step Time": 8.482954548671842} +{"Pretrain/Learning Rate": 1.7876927372047254e-05, "Pretrain/Loss": 2.0126383304595947, "Pretrain/Loss (Raw)": 2.03405499458313, "Pretrain/Step": 11524, "Pretrain/Step Time": 8.480355255305767} +{"Pretrain/Learning Rate": 1.7872858269032482e-05, "Pretrain/Loss": 2.0174500942230225, "Pretrain/Loss (Raw)": 2.507176160812378, "Pretrain/Step": 11525, "Pretrain/Step Time": 8.48429880850017} +{"Pretrain/Learning Rate": 1.786878937152382e-05, "Pretrain/Loss": 2.018425464630127, "Pretrain/Loss (Raw)": 2.1033754348754883, "Pretrain/Step": 11526, "Pretrain/Step Time": 8.483803246170282} +{"Pretrain/Learning Rate": 1.786472067963859e-05, "Pretrain/Loss": 2.016225814819336, "Pretrain/Loss (Raw)": 1.9160555601119995, "Pretrain/Step": 11527, "Pretrain/Step Time": 8.480622213333845} +{"Pretrain/Learning Rate": 1.7860652193494104e-05, "Pretrain/Loss": 2.018056869506836, "Pretrain/Loss (Raw)": 2.3242359161376953, "Pretrain/Step": 11528, "Pretrain/Step Time": 8.48153473995626} +{"Pretrain/Learning Rate": 1.7856583913207686e-05, "Pretrain/Loss": 2.0143446922302246, "Pretrain/Loss (Raw)": 1.6639741659164429, "Pretrain/Step": 11529, "Pretrain/Step Time": 8.481809651479125} +{"Pretrain/Learning Rate": 1.7852515838896633e-05, "Pretrain/Loss": 2.0163302421569824, "Pretrain/Loss (Raw)": 2.2663261890411377, "Pretrain/Step": 11530, "Pretrain/Step Time": 8.475352928042412} +{"Pretrain/Learning Rate": 1.7848447970678245e-05, "Pretrain/Loss": 2.0151166915893555, "Pretrain/Loss (Raw)": 2.1166396141052246, "Pretrain/Step": 11531, "Pretrain/Step Time": 8.475846050307155} +{"Pretrain/Learning Rate": 1.7844380308669817e-05, "Pretrain/Loss": 2.0155673027038574, "Pretrain/Loss (Raw)": 2.1791462898254395, "Pretrain/Step": 11532, "Pretrain/Step Time": 8.479699697345495} +{"Pretrain/Learning Rate": 1.784031285298864e-05, "Pretrain/Loss": 2.0165884494781494, "Pretrain/Loss (Raw)": 2.102353811264038, "Pretrain/Step": 11533, "Pretrain/Step Time": 8.484824733808637} +{"Pretrain/Learning Rate": 1.7836245603752e-05, "Pretrain/Loss": 2.0156900882720947, "Pretrain/Loss (Raw)": 1.9940173625946045, "Pretrain/Step": 11534, "Pretrain/Step Time": 8.478801907971501} +{"Pretrain/Learning Rate": 1.783217856107716e-05, "Pretrain/Loss": 2.0152316093444824, "Pretrain/Loss (Raw)": 1.821401596069336, "Pretrain/Step": 11535, "Pretrain/Step Time": 8.488110639154911} +{"Pretrain/Learning Rate": 1.7828111725081402e-05, "Pretrain/Loss": 2.0141706466674805, "Pretrain/Loss (Raw)": 2.155984878540039, "Pretrain/Step": 11536, "Pretrain/Step Time": 8.487649723887444} +{"Pretrain/Learning Rate": 1.7824045095881985e-05, "Pretrain/Loss": 2.0144729614257812, "Pretrain/Loss (Raw)": 2.0047199726104736, "Pretrain/Step": 11537, "Pretrain/Step Time": 8.487405268475413} +{"Pretrain/Learning Rate": 1.781997867359617e-05, "Pretrain/Loss": 2.0144262313842773, "Pretrain/Loss (Raw)": 1.9086908102035522, "Pretrain/Step": 11538, "Pretrain/Step Time": 8.486781265586615} +{"Pretrain/Learning Rate": 1.781591245834121e-05, "Pretrain/Loss": 2.016605854034424, "Pretrain/Loss (Raw)": 2.120255708694458, "Pretrain/Step": 11539, "Pretrain/Step Time": 8.489586189389229} +{"Pretrain/Learning Rate": 1.7811846450234353e-05, "Pretrain/Loss": 2.0192878246307373, "Pretrain/Loss (Raw)": 2.189030647277832, "Pretrain/Step": 11540, "Pretrain/Step Time": 8.484105102717876} +{"Pretrain/Learning Rate": 1.780778064939283e-05, "Pretrain/Loss": 2.019538640975952, "Pretrain/Loss (Raw)": 2.024819850921631, "Pretrain/Step": 11541, "Pretrain/Step Time": 8.490089736878872} +{"Pretrain/Learning Rate": 1.7803715055933883e-05, "Pretrain/Loss": 2.019296407699585, "Pretrain/Loss (Raw)": 2.116401433944702, "Pretrain/Step": 11542, "Pretrain/Step Time": 8.488004410639405} +{"Pretrain/Learning Rate": 1.779964966997474e-05, "Pretrain/Loss": 2.017505168914795, "Pretrain/Loss (Raw)": 1.837167739868164, "Pretrain/Step": 11543, "Pretrain/Step Time": 8.486947705969214} +{"Pretrain/Learning Rate": 1.779558449163262e-05, "Pretrain/Loss": 2.0147693157196045, "Pretrain/Loss (Raw)": 2.0475966930389404, "Pretrain/Step": 11544, "Pretrain/Step Time": 8.491616366431117} +{"Pretrain/Learning Rate": 1.7791519521024748e-05, "Pretrain/Loss": 2.0129308700561523, "Pretrain/Loss (Raw)": 1.9647551774978638, "Pretrain/Step": 11545, "Pretrain/Step Time": 8.490761268883944} +{"Pretrain/Learning Rate": 1.7787454758268322e-05, "Pretrain/Loss": 2.013373851776123, "Pretrain/Loss (Raw)": 1.9283148050308228, "Pretrain/Step": 11546, "Pretrain/Step Time": 8.489562110975385} +{"Pretrain/Learning Rate": 1.7783390203480573e-05, "Pretrain/Loss": 2.0114634037017822, "Pretrain/Loss (Raw)": 1.841802954673767, "Pretrain/Step": 11547, "Pretrain/Step Time": 8.492593666538596} +{"Pretrain/Learning Rate": 1.777932585677866e-05, "Pretrain/Loss": 2.0105032920837402, "Pretrain/Loss (Raw)": 2.0003931522369385, "Pretrain/Step": 11548, "Pretrain/Step Time": 8.492645736783743} +{"Pretrain/Learning Rate": 1.77752617182798e-05, "Pretrain/Loss": 2.0111989974975586, "Pretrain/Loss (Raw)": 1.9789572954177856, "Pretrain/Step": 11549, "Pretrain/Step Time": 8.489676542580128} +{"Pretrain/Learning Rate": 1.7771197788101174e-05, "Pretrain/Loss": 2.0063655376434326, "Pretrain/Loss (Raw)": 1.341697096824646, "Pretrain/Step": 11550, "Pretrain/Step Time": 8.493917685002089} +{"Pretrain/Learning Rate": 1.7767134066359964e-05, "Pretrain/Loss": 2.0052239894866943, "Pretrain/Loss (Raw)": 1.9103326797485352, "Pretrain/Step": 11551, "Pretrain/Step Time": 8.494382657110691} +{"Pretrain/Learning Rate": 1.776307055317335e-05, "Pretrain/Loss": 2.008157730102539, "Pretrain/Loss (Raw)": 2.1764872074127197, "Pretrain/Step": 11552, "Pretrain/Step Time": 8.493931204080582} +{"Pretrain/Learning Rate": 1.775900724865849e-05, "Pretrain/Loss": 2.0085370540618896, "Pretrain/Loss (Raw)": 1.970699667930603, "Pretrain/Step": 11553, "Pretrain/Step Time": 8.493289174512029} +{"Pretrain/Learning Rate": 1.775494415293255e-05, "Pretrain/Loss": 2.008572578430176, "Pretrain/Loss (Raw)": 2.0764243602752686, "Pretrain/Step": 11554, "Pretrain/Step Time": 8.494637252762914} +{"Pretrain/Learning Rate": 1.775088126611269e-05, "Pretrain/Loss": 2.0081019401550293, "Pretrain/Loss (Raw)": 1.9884374141693115, "Pretrain/Step": 11555, "Pretrain/Step Time": 8.491347547620535} +{"Pretrain/Learning Rate": 1.7746818588316058e-05, "Pretrain/Loss": 2.0090370178222656, "Pretrain/Loss (Raw)": 2.009521961212158, "Pretrain/Step": 11556, "Pretrain/Step Time": 8.489038787782192} +{"Pretrain/Learning Rate": 1.7742756119659804e-05, "Pretrain/Loss": 2.007918357849121, "Pretrain/Loss (Raw)": 1.891945481300354, "Pretrain/Step": 11557, "Pretrain/Step Time": 8.4857456125319} +{"Pretrain/Learning Rate": 1.7738693860261055e-05, "Pretrain/Loss": 2.008080005645752, "Pretrain/Loss (Raw)": 1.9411214590072632, "Pretrain/Step": 11558, "Pretrain/Step Time": 8.489741710945964} +{"Pretrain/Learning Rate": 1.773463181023695e-05, "Pretrain/Loss": 2.0059571266174316, "Pretrain/Loss (Raw)": 1.7919719219207764, "Pretrain/Step": 11559, "Pretrain/Step Time": 8.489335304126143} +{"Pretrain/Learning Rate": 1.7730569969704614e-05, "Pretrain/Loss": 2.006929397583008, "Pretrain/Loss (Raw)": 1.972538709640503, "Pretrain/Step": 11560, "Pretrain/Step Time": 8.48533578030765} +{"Pretrain/Learning Rate": 1.772650833878117e-05, "Pretrain/Loss": 2.0074620246887207, "Pretrain/Loss (Raw)": 2.136481523513794, "Pretrain/Step": 11561, "Pretrain/Step Time": 8.48105177283287} +{"Pretrain/Learning Rate": 1.7722446917583735e-05, "Pretrain/Loss": 2.008863925933838, "Pretrain/Loss (Raw)": 2.061530590057373, "Pretrain/Step": 11562, "Pretrain/Step Time": 8.482623171061277} +{"Pretrain/Learning Rate": 1.7718385706229405e-05, "Pretrain/Loss": 2.0098652839660645, "Pretrain/Loss (Raw)": 1.998253583908081, "Pretrain/Step": 11563, "Pretrain/Step Time": 8.483922341838479} +{"Pretrain/Learning Rate": 1.7714324704835295e-05, "Pretrain/Loss": 2.0118508338928223, "Pretrain/Loss (Raw)": 2.4106836318969727, "Pretrain/Step": 11564, "Pretrain/Step Time": 8.477474551647902} +{"Pretrain/Learning Rate": 1.7710263913518492e-05, "Pretrain/Loss": 2.014571189880371, "Pretrain/Loss (Raw)": 1.9879077672958374, "Pretrain/Step": 11565, "Pretrain/Step Time": 8.47978688776493} +{"Pretrain/Learning Rate": 1.7706203332396093e-05, "Pretrain/Loss": 2.016622304916382, "Pretrain/Loss (Raw)": 2.126270055770874, "Pretrain/Step": 11566, "Pretrain/Step Time": 8.476432161405683} +{"Pretrain/Learning Rate": 1.7702142961585184e-05, "Pretrain/Loss": 2.0158472061157227, "Pretrain/Loss (Raw)": 1.858789086341858, "Pretrain/Step": 11567, "Pretrain/Step Time": 8.48111112602055} +{"Pretrain/Learning Rate": 1.7698082801202834e-05, "Pretrain/Loss": 2.016709327697754, "Pretrain/Loss (Raw)": 2.005397319793701, "Pretrain/Step": 11568, "Pretrain/Step Time": 8.48166025429964} +{"Pretrain/Learning Rate": 1.7694022851366114e-05, "Pretrain/Loss": 2.011806011199951, "Pretrain/Loss (Raw)": 1.404911994934082, "Pretrain/Step": 11569, "Pretrain/Step Time": 8.48077379912138} +{"Pretrain/Learning Rate": 1.76899631121921e-05, "Pretrain/Loss": 2.011366128921509, "Pretrain/Loss (Raw)": 1.8689942359924316, "Pretrain/Step": 11570, "Pretrain/Step Time": 8.485109543427825} +{"Pretrain/Learning Rate": 1.7685903583797843e-05, "Pretrain/Loss": 2.009964942932129, "Pretrain/Loss (Raw)": 1.952009677886963, "Pretrain/Step": 11571, "Pretrain/Step Time": 8.485983308404684} +{"Pretrain/Learning Rate": 1.76818442663004e-05, "Pretrain/Loss": 2.0103673934936523, "Pretrain/Loss (Raw)": 1.999864101409912, "Pretrain/Step": 11572, "Pretrain/Step Time": 8.481119889765978} +{"Pretrain/Learning Rate": 1.767778515981683e-05, "Pretrain/Loss": 2.0114657878875732, "Pretrain/Loss (Raw)": 1.7706636190414429, "Pretrain/Step": 11573, "Pretrain/Step Time": 8.479070143774152} +{"Pretrain/Learning Rate": 1.767372626446415e-05, "Pretrain/Loss": 2.0111727714538574, "Pretrain/Loss (Raw)": 1.951183557510376, "Pretrain/Step": 11574, "Pretrain/Step Time": 8.480544889345765} +{"Pretrain/Learning Rate": 1.766966758035941e-05, "Pretrain/Loss": 2.011035442352295, "Pretrain/Loss (Raw)": 2.0582215785980225, "Pretrain/Step": 11575, "Pretrain/Step Time": 8.483839793130755} +{"Pretrain/Learning Rate": 1.766560910761964e-05, "Pretrain/Loss": 2.0110411643981934, "Pretrain/Loss (Raw)": 1.9668421745300293, "Pretrain/Step": 11576, "Pretrain/Step Time": 8.485752897337079} +{"Pretrain/Learning Rate": 1.7661550846361864e-05, "Pretrain/Loss": 2.0113673210144043, "Pretrain/Loss (Raw)": 2.1493427753448486, "Pretrain/Step": 11577, "Pretrain/Step Time": 8.481905154883862} +{"Pretrain/Learning Rate": 1.7657492796703096e-05, "Pretrain/Loss": 2.010732412338257, "Pretrain/Loss (Raw)": 1.919979214668274, "Pretrain/Step": 11578, "Pretrain/Step Time": 8.478610161691904} +{"Pretrain/Learning Rate": 1.7653434958760343e-05, "Pretrain/Loss": 2.0087814331054688, "Pretrain/Loss (Raw)": 1.8823338747024536, "Pretrain/Step": 11579, "Pretrain/Step Time": 8.4762719348073} +{"Pretrain/Learning Rate": 1.7649377332650612e-05, "Pretrain/Loss": 2.006908416748047, "Pretrain/Loss (Raw)": 1.8066017627716064, "Pretrain/Step": 11580, "Pretrain/Step Time": 8.48001035116613} +{"Pretrain/Learning Rate": 1.7645319918490907e-05, "Pretrain/Loss": 2.0073561668395996, "Pretrain/Loss (Raw)": 2.0878868103027344, "Pretrain/Step": 11581, "Pretrain/Step Time": 8.478404317051172} +{"Pretrain/Learning Rate": 1.7641262716398216e-05, "Pretrain/Loss": 2.005977153778076, "Pretrain/Loss (Raw)": 1.9057979583740234, "Pretrain/Step": 11582, "Pretrain/Step Time": 8.476051794365048} +{"Pretrain/Learning Rate": 1.7637205726489535e-05, "Pretrain/Loss": 2.006995677947998, "Pretrain/Loss (Raw)": 2.0868473052978516, "Pretrain/Step": 11583, "Pretrain/Step Time": 8.482950342819095} +{"Pretrain/Learning Rate": 1.763314894888183e-05, "Pretrain/Loss": 2.0060713291168213, "Pretrain/Loss (Raw)": 1.9727565050125122, "Pretrain/Step": 11584, "Pretrain/Step Time": 8.484711728990078} +{"Pretrain/Learning Rate": 1.762909238369208e-05, "Pretrain/Loss": 2.008267402648926, "Pretrain/Loss (Raw)": 1.9458550214767456, "Pretrain/Step": 11585, "Pretrain/Step Time": 8.484039213508368} +{"Pretrain/Learning Rate": 1.7625036031037256e-05, "Pretrain/Loss": 2.0087122917175293, "Pretrain/Loss (Raw)": 2.0126097202301025, "Pretrain/Step": 11586, "Pretrain/Step Time": 8.482350559905171} +{"Pretrain/Learning Rate": 1.762097989103432e-05, "Pretrain/Loss": 2.0073742866516113, "Pretrain/Loss (Raw)": 1.9591325521469116, "Pretrain/Step": 11587, "Pretrain/Step Time": 8.488719686865807} +{"Pretrain/Learning Rate": 1.7616923963800227e-05, "Pretrain/Loss": 2.0100903511047363, "Pretrain/Loss (Raw)": 2.1391494274139404, "Pretrain/Step": 11588, "Pretrain/Step Time": 8.485171211883426} +{"Pretrain/Learning Rate": 1.7612868249451926e-05, "Pretrain/Loss": 2.0130534172058105, "Pretrain/Loss (Raw)": 1.878275990486145, "Pretrain/Step": 11589, "Pretrain/Step Time": 8.476013898849487} +{"Pretrain/Learning Rate": 1.7608812748106363e-05, "Pretrain/Loss": 2.012995958328247, "Pretrain/Loss (Raw)": 1.9291175603866577, "Pretrain/Step": 11590, "Pretrain/Step Time": 8.475753901526332} +{"Pretrain/Learning Rate": 1.7604757459880472e-05, "Pretrain/Loss": 2.013606548309326, "Pretrain/Loss (Raw)": 1.9993951320648193, "Pretrain/Step": 11591, "Pretrain/Step Time": 8.475620681419969} +{"Pretrain/Learning Rate": 1.7600702384891186e-05, "Pretrain/Loss": 2.013002395629883, "Pretrain/Loss (Raw)": 2.0011746883392334, "Pretrain/Step": 11592, "Pretrain/Step Time": 8.474992347881198} +{"Pretrain/Learning Rate": 1.7596647523255432e-05, "Pretrain/Loss": 2.0120162963867188, "Pretrain/Loss (Raw)": 2.001929521560669, "Pretrain/Step": 11593, "Pretrain/Step Time": 8.469699503853917} +{"Pretrain/Learning Rate": 1.759259287509013e-05, "Pretrain/Loss": 2.011101245880127, "Pretrain/Loss (Raw)": 2.192918539047241, "Pretrain/Step": 11594, "Pretrain/Step Time": 8.474571695551276} +{"Pretrain/Learning Rate": 1.7588538440512186e-05, "Pretrain/Loss": 2.009967088699341, "Pretrain/Loss (Raw)": 1.9642553329467773, "Pretrain/Step": 11595, "Pretrain/Step Time": 8.47017839178443} +{"Pretrain/Learning Rate": 1.7584484219638513e-05, "Pretrain/Loss": 2.0083789825439453, "Pretrain/Loss (Raw)": 1.7256698608398438, "Pretrain/Step": 11596, "Pretrain/Step Time": 8.469968605786562} +{"Pretrain/Learning Rate": 1.758043021258601e-05, "Pretrain/Loss": 2.0062389373779297, "Pretrain/Loss (Raw)": 1.8224905729293823, "Pretrain/Step": 11597, "Pretrain/Step Time": 8.463745802640915} +{"Pretrain/Learning Rate": 1.7576376419471574e-05, "Pretrain/Loss": 2.007014036178589, "Pretrain/Loss (Raw)": 2.1162197589874268, "Pretrain/Step": 11598, "Pretrain/Step Time": 8.46363795362413} +{"Pretrain/Learning Rate": 1.7572322840412085e-05, "Pretrain/Loss": 2.0053884983062744, "Pretrain/Loss (Raw)": 1.990788221359253, "Pretrain/Step": 11599, "Pretrain/Step Time": 8.467988513410091} +{"Pretrain/Learning Rate": 1.7568269475524433e-05, "Pretrain/Loss": 2.0061988830566406, "Pretrain/Loss (Raw)": 2.1675376892089844, "Pretrain/Step": 11600, "Pretrain/Step Time": 8.467288130894303} +{"Pretrain/Learning Rate": 1.7564216324925495e-05, "Pretrain/Loss": 2.0035974979400635, "Pretrain/Loss (Raw)": 1.7008090019226074, "Pretrain/Step": 11601, "Pretrain/Step Time": 8.470004657283425} +{"Pretrain/Learning Rate": 1.7560163388732134e-05, "Pretrain/Loss": 2.000847101211548, "Pretrain/Loss (Raw)": 1.737716794013977, "Pretrain/Step": 11602, "Pretrain/Step Time": 8.469768349081278} +{"Pretrain/Learning Rate": 1.755611066706122e-05, "Pretrain/Loss": 2.0004045963287354, "Pretrain/Loss (Raw)": 1.9401326179504395, "Pretrain/Step": 11603, "Pretrain/Step Time": 8.469109192490578} +{"Pretrain/Learning Rate": 1.7552058160029605e-05, "Pretrain/Loss": 1.9994410276412964, "Pretrain/Loss (Raw)": 1.961876392364502, "Pretrain/Step": 11604, "Pretrain/Step Time": 8.467827687039971} +{"Pretrain/Learning Rate": 1.754800586775414e-05, "Pretrain/Loss": 2.000042676925659, "Pretrain/Loss (Raw)": 1.9083489179611206, "Pretrain/Step": 11605, "Pretrain/Step Time": 8.470005741342902} +{"Pretrain/Learning Rate": 1.754395379035168e-05, "Pretrain/Loss": 1.99924635887146, "Pretrain/Loss (Raw)": 1.7681753635406494, "Pretrain/Step": 11606, "Pretrain/Step Time": 8.463982271030545} +{"Pretrain/Learning Rate": 1.7539901927939048e-05, "Pretrain/Loss": 1.9998160600662231, "Pretrain/Loss (Raw)": 2.1046407222747803, "Pretrain/Step": 11607, "Pretrain/Step Time": 8.465979428961873} +{"Pretrain/Learning Rate": 1.7535850280633087e-05, "Pretrain/Loss": 1.9998042583465576, "Pretrain/Loss (Raw)": 2.1304922103881836, "Pretrain/Step": 11608, "Pretrain/Step Time": 8.464924681931734} +{"Pretrain/Learning Rate": 1.753179884855063e-05, "Pretrain/Loss": 1.9994726181030273, "Pretrain/Loss (Raw)": 2.0022079944610596, "Pretrain/Step": 11609, "Pretrain/Step Time": 8.459549486637115} +{"Pretrain/Learning Rate": 1.752774763180848e-05, "Pretrain/Loss": 2.001802444458008, "Pretrain/Loss (Raw)": 2.022280216217041, "Pretrain/Step": 11610, "Pretrain/Step Time": 8.466050261631608} +{"Pretrain/Learning Rate": 1.7523696630523457e-05, "Pretrain/Loss": 2.0009899139404297, "Pretrain/Loss (Raw)": 1.9694583415985107, "Pretrain/Step": 11611, "Pretrain/Step Time": 8.463916063308716} +{"Pretrain/Learning Rate": 1.7519645844812373e-05, "Pretrain/Loss": 2.002047300338745, "Pretrain/Loss (Raw)": 2.077596426010132, "Pretrain/Step": 11612, "Pretrain/Step Time": 8.454570475965738} +{"Pretrain/Learning Rate": 1.751559527479203e-05, "Pretrain/Loss": 2.0040712356567383, "Pretrain/Loss (Raw)": 2.151630163192749, "Pretrain/Step": 11613, "Pretrain/Step Time": 8.451805900782347} +{"Pretrain/Learning Rate": 1.7511544920579226e-05, "Pretrain/Loss": 2.0042104721069336, "Pretrain/Loss (Raw)": 2.1176934242248535, "Pretrain/Step": 11614, "Pretrain/Step Time": 8.454685078933835} +{"Pretrain/Learning Rate": 1.750749478229074e-05, "Pretrain/Loss": 2.003757953643799, "Pretrain/Loss (Raw)": 2.0072736740112305, "Pretrain/Step": 11615, "Pretrain/Step Time": 8.454707412049174} +{"Pretrain/Learning Rate": 1.7503444860043356e-05, "Pretrain/Loss": 2.004173755645752, "Pretrain/Loss (Raw)": 2.132615566253662, "Pretrain/Step": 11616, "Pretrain/Step Time": 8.461982183158398} +{"Pretrain/Learning Rate": 1.7499395153953856e-05, "Pretrain/Loss": 2.004941940307617, "Pretrain/Loss (Raw)": 2.039217472076416, "Pretrain/Step": 11617, "Pretrain/Step Time": 8.460175035521388} +{"Pretrain/Learning Rate": 1.7495345664139013e-05, "Pretrain/Loss": 2.0041685104370117, "Pretrain/Loss (Raw)": 2.0084762573242188, "Pretrain/Step": 11618, "Pretrain/Step Time": 8.457140520215034} +{"Pretrain/Learning Rate": 1.7491296390715592e-05, "Pretrain/Loss": 2.005067825317383, "Pretrain/Loss (Raw)": 2.1982004642486572, "Pretrain/Step": 11619, "Pretrain/Step Time": 8.45445167273283} +{"Pretrain/Learning Rate": 1.748724733380034e-05, "Pretrain/Loss": 2.0044522285461426, "Pretrain/Loss (Raw)": 1.8637588024139404, "Pretrain/Step": 11620, "Pretrain/Step Time": 8.454112926498055} +{"Pretrain/Learning Rate": 1.7483198493510015e-05, "Pretrain/Loss": 2.004683017730713, "Pretrain/Loss (Raw)": 2.040224075317383, "Pretrain/Step": 11621, "Pretrain/Step Time": 8.456088181585073} +{"Pretrain/Learning Rate": 1.7479149869961357e-05, "Pretrain/Loss": 2.0076308250427246, "Pretrain/Loss (Raw)": 2.194352626800537, "Pretrain/Step": 11622, "Pretrain/Step Time": 8.456731921061873} +{"Pretrain/Learning Rate": 1.7475101463271122e-05, "Pretrain/Loss": 2.0061862468719482, "Pretrain/Loss (Raw)": 2.1009159088134766, "Pretrain/Step": 11623, "Pretrain/Step Time": 8.45865779556334} +{"Pretrain/Learning Rate": 1.7471053273556027e-05, "Pretrain/Loss": 2.005779266357422, "Pretrain/Loss (Raw)": 2.0054523944854736, "Pretrain/Step": 11624, "Pretrain/Step Time": 8.458995942026377} +{"Pretrain/Learning Rate": 1.7467005300932803e-05, "Pretrain/Loss": 2.0044615268707275, "Pretrain/Loss (Raw)": 2.070202589035034, "Pretrain/Step": 11625, "Pretrain/Step Time": 8.457411734387279} +{"Pretrain/Learning Rate": 1.7462957545518167e-05, "Pretrain/Loss": 2.0008957386016846, "Pretrain/Loss (Raw)": 1.6250889301300049, "Pretrain/Step": 11626, "Pretrain/Step Time": 8.454491972923279} +{"Pretrain/Learning Rate": 1.7458910007428842e-05, "Pretrain/Loss": 2.0008225440979004, "Pretrain/Loss (Raw)": 2.1008105278015137, "Pretrain/Step": 11627, "Pretrain/Step Time": 8.460547940805554} +{"Pretrain/Learning Rate": 1.7454862686781524e-05, "Pretrain/Loss": 2.002194881439209, "Pretrain/Loss (Raw)": 2.1065070629119873, "Pretrain/Step": 11628, "Pretrain/Step Time": 8.458409363403916} +{"Pretrain/Learning Rate": 1.7450815583692935e-05, "Pretrain/Loss": 2.0020766258239746, "Pretrain/Loss (Raw)": 1.773128867149353, "Pretrain/Step": 11629, "Pretrain/Step Time": 8.446713540703058} +{"Pretrain/Learning Rate": 1.7446768698279748e-05, "Pretrain/Loss": 2.00327730178833, "Pretrain/Loss (Raw)": 2.210536241531372, "Pretrain/Step": 11630, "Pretrain/Step Time": 8.448796898126602} +{"Pretrain/Learning Rate": 1.744272203065867e-05, "Pretrain/Loss": 2.0069680213928223, "Pretrain/Loss (Raw)": 2.5627424716949463, "Pretrain/Step": 11631, "Pretrain/Step Time": 8.445475097745657} +{"Pretrain/Learning Rate": 1.743867558094636e-05, "Pretrain/Loss": 2.0054636001586914, "Pretrain/Loss (Raw)": 1.9760514497756958, "Pretrain/Step": 11632, "Pretrain/Step Time": 8.452019656077027} +{"Pretrain/Learning Rate": 1.7434629349259518e-05, "Pretrain/Loss": 2.0050201416015625, "Pretrain/Loss (Raw)": 1.948182463645935, "Pretrain/Step": 11633, "Pretrain/Step Time": 8.448468118906021} +{"Pretrain/Learning Rate": 1.74305833357148e-05, "Pretrain/Loss": 2.0047523975372314, "Pretrain/Loss (Raw)": 1.949695348739624, "Pretrain/Step": 11634, "Pretrain/Step Time": 8.444750482216477} +{"Pretrain/Learning Rate": 1.742653754042888e-05, "Pretrain/Loss": 2.0079023838043213, "Pretrain/Loss (Raw)": 2.0322835445404053, "Pretrain/Step": 11635, "Pretrain/Step Time": 8.44632000848651} +{"Pretrain/Learning Rate": 1.7422491963518406e-05, "Pretrain/Loss": 2.004394054412842, "Pretrain/Loss (Raw)": 2.0018744468688965, "Pretrain/Step": 11636, "Pretrain/Step Time": 8.441241391003132} +{"Pretrain/Learning Rate": 1.741844660510004e-05, "Pretrain/Loss": 2.0046565532684326, "Pretrain/Loss (Raw)": 2.1406033039093018, "Pretrain/Step": 11637, "Pretrain/Step Time": 8.438513867557049} +{"Pretrain/Learning Rate": 1.741440146529042e-05, "Pretrain/Loss": 2.003188133239746, "Pretrain/Loss (Raw)": 2.057173728942871, "Pretrain/Step": 11638, "Pretrain/Step Time": 8.44022086635232} +{"Pretrain/Learning Rate": 1.7410356544206185e-05, "Pretrain/Loss": 2.003037929534912, "Pretrain/Loss (Raw)": 1.9308041334152222, "Pretrain/Step": 11639, "Pretrain/Step Time": 8.437467815354466} +{"Pretrain/Learning Rate": 1.7406311841963966e-05, "Pretrain/Loss": 2.003434181213379, "Pretrain/Loss (Raw)": 2.135631561279297, "Pretrain/Step": 11640, "Pretrain/Step Time": 8.436231235042214} +{"Pretrain/Learning Rate": 1.7402267358680395e-05, "Pretrain/Loss": 2.0053048133850098, "Pretrain/Loss (Raw)": 2.416621446609497, "Pretrain/Step": 11641, "Pretrain/Step Time": 8.443658545613289} +{"Pretrain/Learning Rate": 1.7398223094472094e-05, "Pretrain/Loss": 2.0054335594177246, "Pretrain/Loss (Raw)": 2.0520172119140625, "Pretrain/Step": 11642, "Pretrain/Step Time": 8.442423341795802} +{"Pretrain/Learning Rate": 1.7394179049455665e-05, "Pretrain/Loss": 2.0052928924560547, "Pretrain/Loss (Raw)": 2.0375800132751465, "Pretrain/Step": 11643, "Pretrain/Step Time": 8.442009158432484} +{"Pretrain/Learning Rate": 1.739013522374772e-05, "Pretrain/Loss": 2.0022988319396973, "Pretrain/Loss (Raw)": 1.7880144119262695, "Pretrain/Step": 11644, "Pretrain/Step Time": 8.439886812120676} +{"Pretrain/Learning Rate": 1.738609161746486e-05, "Pretrain/Loss": 2.001882553100586, "Pretrain/Loss (Raw)": 2.064185857772827, "Pretrain/Step": 11645, "Pretrain/Step Time": 8.432821756228805} +{"Pretrain/Learning Rate": 1.7382048230723686e-05, "Pretrain/Loss": 2.001518487930298, "Pretrain/Loss (Raw)": 1.8051869869232178, "Pretrain/Step": 11646, "Pretrain/Step Time": 8.435926496982574} +{"Pretrain/Learning Rate": 1.7378005063640783e-05, "Pretrain/Loss": 2.0013818740844727, "Pretrain/Loss (Raw)": 1.915228009223938, "Pretrain/Step": 11647, "Pretrain/Step Time": 8.437309490516782} +{"Pretrain/Learning Rate": 1.7373962116332727e-05, "Pretrain/Loss": 2.0046164989471436, "Pretrain/Loss (Raw)": 2.3450045585632324, "Pretrain/Step": 11648, "Pretrain/Step Time": 8.437287298962474} +{"Pretrain/Learning Rate": 1.7369919388916096e-05, "Pretrain/Loss": 2.0058212280273438, "Pretrain/Loss (Raw)": 2.0228936672210693, "Pretrain/Step": 11649, "Pretrain/Step Time": 8.4416787866503} +{"Pretrain/Learning Rate": 1.736587688150746e-05, "Pretrain/Loss": 2.0023956298828125, "Pretrain/Loss (Raw)": 1.4580192565917969, "Pretrain/Step": 11650, "Pretrain/Step Time": 8.43898255750537} +{"Pretrain/Learning Rate": 1.736183459422338e-05, "Pretrain/Loss": 2.00199031829834, "Pretrain/Loss (Raw)": 2.1102466583251953, "Pretrain/Step": 11651, "Pretrain/Step Time": 8.435790682211518} +{"Pretrain/Learning Rate": 1.7357792527180428e-05, "Pretrain/Loss": 2.0032567977905273, "Pretrain/Loss (Raw)": 2.1961777210235596, "Pretrain/Step": 11652, "Pretrain/Step Time": 8.435438668355346} +{"Pretrain/Learning Rate": 1.735375068049513e-05, "Pretrain/Loss": 2.0000510215759277, "Pretrain/Loss (Raw)": 2.0968399047851562, "Pretrain/Step": 11653, "Pretrain/Step Time": 8.431191828101873} +{"Pretrain/Learning Rate": 1.734970905428404e-05, "Pretrain/Loss": 1.9994595050811768, "Pretrain/Loss (Raw)": 2.0276496410369873, "Pretrain/Step": 11654, "Pretrain/Step Time": 8.426732789725065} +{"Pretrain/Learning Rate": 1.7345667648663698e-05, "Pretrain/Loss": 2.0013492107391357, "Pretrain/Loss (Raw)": 2.157939910888672, "Pretrain/Step": 11655, "Pretrain/Step Time": 8.42728377878666} +{"Pretrain/Learning Rate": 1.7341626463750635e-05, "Pretrain/Loss": 1.9984869956970215, "Pretrain/Loss (Raw)": 1.9578733444213867, "Pretrain/Step": 11656, "Pretrain/Step Time": 8.431408043950796} +{"Pretrain/Learning Rate": 1.733758549966138e-05, "Pretrain/Loss": 2.0021233558654785, "Pretrain/Loss (Raw)": 2.1294057369232178, "Pretrain/Step": 11657, "Pretrain/Step Time": 8.43016549013555} +{"Pretrain/Learning Rate": 1.7333544756512437e-05, "Pretrain/Loss": 2.0008153915405273, "Pretrain/Loss (Raw)": 2.0989418029785156, "Pretrain/Step": 11658, "Pretrain/Step Time": 8.431248782202601} +{"Pretrain/Learning Rate": 1.732950423442033e-05, "Pretrain/Loss": 2.0014123916625977, "Pretrain/Loss (Raw)": 2.1930348873138428, "Pretrain/Step": 11659, "Pretrain/Step Time": 8.435093397274613} +{"Pretrain/Learning Rate": 1.7325463933501558e-05, "Pretrain/Loss": 1.9994709491729736, "Pretrain/Loss (Raw)": 1.9306561946868896, "Pretrain/Step": 11660, "Pretrain/Step Time": 8.429356375709176} +{"Pretrain/Learning Rate": 1.7321423853872623e-05, "Pretrain/Loss": 1.9986926317214966, "Pretrain/Loss (Raw)": 2.0027167797088623, "Pretrain/Step": 11661, "Pretrain/Step Time": 8.425271719694138} +{"Pretrain/Learning Rate": 1.7317383995650026e-05, "Pretrain/Loss": 1.997625708580017, "Pretrain/Loss (Raw)": 1.857455849647522, "Pretrain/Step": 11662, "Pretrain/Step Time": 8.42834104783833} +{"Pretrain/Learning Rate": 1.7313344358950238e-05, "Pretrain/Loss": 2.000060558319092, "Pretrain/Loss (Raw)": 2.133066415786743, "Pretrain/Step": 11663, "Pretrain/Step Time": 8.422939913347363} +{"Pretrain/Learning Rate": 1.7309304943889747e-05, "Pretrain/Loss": 1.9978837966918945, "Pretrain/Loss (Raw)": 1.8773661851882935, "Pretrain/Step": 11664, "Pretrain/Step Time": 8.42527369223535} +{"Pretrain/Learning Rate": 1.7305265750585025e-05, "Pretrain/Loss": 1.9979805946350098, "Pretrain/Loss (Raw)": 2.0170936584472656, "Pretrain/Step": 11665, "Pretrain/Step Time": 8.427826594561338} +{"Pretrain/Learning Rate": 1.7301226779152548e-05, "Pretrain/Loss": 1.9986207485198975, "Pretrain/Loss (Raw)": 1.9906302690505981, "Pretrain/Step": 11666, "Pretrain/Step Time": 8.43154969625175} +{"Pretrain/Learning Rate": 1.7297188029708767e-05, "Pretrain/Loss": 2.000101089477539, "Pretrain/Loss (Raw)": 2.3097288608551025, "Pretrain/Step": 11667, "Pretrain/Step Time": 8.429732199758291} +{"Pretrain/Learning Rate": 1.7293149502370135e-05, "Pretrain/Loss": 1.9970557689666748, "Pretrain/Loss (Raw)": 1.7992404699325562, "Pretrain/Step": 11668, "Pretrain/Step Time": 8.432843331247568} +{"Pretrain/Learning Rate": 1.7289111197253106e-05, "Pretrain/Loss": 1.997839093208313, "Pretrain/Loss (Raw)": 2.1250815391540527, "Pretrain/Step": 11669, "Pretrain/Step Time": 8.42972002364695} +{"Pretrain/Learning Rate": 1.728507311447412e-05, "Pretrain/Loss": 1.996971845626831, "Pretrain/Loss (Raw)": 2.0054025650024414, "Pretrain/Step": 11670, "Pretrain/Step Time": 8.429082436487079} +{"Pretrain/Learning Rate": 1.728103525414961e-05, "Pretrain/Loss": 1.9980989694595337, "Pretrain/Loss (Raw)": 1.9814280271530151, "Pretrain/Step": 11671, "Pretrain/Step Time": 8.430076876655221} +{"Pretrain/Learning Rate": 1.7276997616396005e-05, "Pretrain/Loss": 1.9988577365875244, "Pretrain/Loss (Raw)": 2.1447246074676514, "Pretrain/Step": 11672, "Pretrain/Step Time": 8.42801583558321} +{"Pretrain/Learning Rate": 1.727296020132974e-05, "Pretrain/Loss": 1.9987362623214722, "Pretrain/Loss (Raw)": 1.9492063522338867, "Pretrain/Step": 11673, "Pretrain/Step Time": 8.433010630309582} +{"Pretrain/Learning Rate": 1.7268923009067213e-05, "Pretrain/Loss": 2.0000481605529785, "Pretrain/Loss (Raw)": 2.0962367057800293, "Pretrain/Step": 11674, "Pretrain/Step Time": 8.43322879076004} +{"Pretrain/Learning Rate": 1.7264886039724842e-05, "Pretrain/Loss": 2.0011706352233887, "Pretrain/Loss (Raw)": 1.9854744672775269, "Pretrain/Step": 11675, "Pretrain/Step Time": 8.430658107623458} +{"Pretrain/Learning Rate": 1.726084929341903e-05, "Pretrain/Loss": 2.001286029815674, "Pretrain/Loss (Raw)": 2.0151968002319336, "Pretrain/Step": 11676, "Pretrain/Step Time": 8.427081594243646} +{"Pretrain/Learning Rate": 1.7256812770266168e-05, "Pretrain/Loss": 2.0023117065429688, "Pretrain/Loss (Raw)": 2.110215425491333, "Pretrain/Step": 11677, "Pretrain/Step Time": 8.42550796829164} +{"Pretrain/Learning Rate": 1.725277647038266e-05, "Pretrain/Loss": 2.0069899559020996, "Pretrain/Loss (Raw)": 1.9405261278152466, "Pretrain/Step": 11678, "Pretrain/Step Time": 8.421574594452977} +{"Pretrain/Learning Rate": 1.7248740393884875e-05, "Pretrain/Loss": 2.007878303527832, "Pretrain/Loss (Raw)": 2.024027109146118, "Pretrain/Step": 11679, "Pretrain/Step Time": 8.419606324285269} +{"Pretrain/Learning Rate": 1.7244704540889194e-05, "Pretrain/Loss": 2.0081658363342285, "Pretrain/Loss (Raw)": 2.213313102722168, "Pretrain/Step": 11680, "Pretrain/Step Time": 8.419127283617854} +{"Pretrain/Learning Rate": 1.7240668911511994e-05, "Pretrain/Loss": 2.0104405879974365, "Pretrain/Loss (Raw)": 2.261843681335449, "Pretrain/Step": 11681, "Pretrain/Step Time": 8.421572532504797} +{"Pretrain/Learning Rate": 1.723663350586964e-05, "Pretrain/Loss": 2.007809638977051, "Pretrain/Loss (Raw)": 1.7396854162216187, "Pretrain/Step": 11682, "Pretrain/Step Time": 8.425419203937054} +{"Pretrain/Learning Rate": 1.723259832407848e-05, "Pretrain/Loss": 2.0062737464904785, "Pretrain/Loss (Raw)": 1.791815161705017, "Pretrain/Step": 11683, "Pretrain/Step Time": 8.428567379713058} +{"Pretrain/Learning Rate": 1.7228563366254873e-05, "Pretrain/Loss": 2.005387306213379, "Pretrain/Loss (Raw)": 1.8960676193237305, "Pretrain/Step": 11684, "Pretrain/Step Time": 8.425483245402575} +{"Pretrain/Learning Rate": 1.7224528632515163e-05, "Pretrain/Loss": 2.0060505867004395, "Pretrain/Loss (Raw)": 1.9768341779708862, "Pretrain/Step": 11685, "Pretrain/Step Time": 8.425449389964342} +{"Pretrain/Learning Rate": 1.7220494122975688e-05, "Pretrain/Loss": 2.0037240982055664, "Pretrain/Loss (Raw)": 1.6433712244033813, "Pretrain/Step": 11686, "Pretrain/Step Time": 8.423894917592406} +{"Pretrain/Learning Rate": 1.721645983775278e-05, "Pretrain/Loss": 2.0041885375976562, "Pretrain/Loss (Raw)": 1.8514080047607422, "Pretrain/Step": 11687, "Pretrain/Step Time": 8.422392085194588} +{"Pretrain/Learning Rate": 1.7212425776962777e-05, "Pretrain/Loss": 2.005449056625366, "Pretrain/Loss (Raw)": 2.133868932723999, "Pretrain/Step": 11688, "Pretrain/Step Time": 8.420401247218251} +{"Pretrain/Learning Rate": 1.7208391940721976e-05, "Pretrain/Loss": 2.004005193710327, "Pretrain/Loss (Raw)": 1.9516675472259521, "Pretrain/Step": 11689, "Pretrain/Step Time": 8.426949927583337} +{"Pretrain/Learning Rate": 1.7204358329146696e-05, "Pretrain/Loss": 2.0026698112487793, "Pretrain/Loss (Raw)": 1.8906030654907227, "Pretrain/Step": 11690, "Pretrain/Step Time": 8.422656385228038} +{"Pretrain/Learning Rate": 1.7200324942353255e-05, "Pretrain/Loss": 2.002601146697998, "Pretrain/Loss (Raw)": 1.98947274684906, "Pretrain/Step": 11691, "Pretrain/Step Time": 8.427405044436455} +{"Pretrain/Learning Rate": 1.7196291780457945e-05, "Pretrain/Loss": 2.000105857849121, "Pretrain/Loss (Raw)": 2.0912647247314453, "Pretrain/Step": 11692, "Pretrain/Step Time": 8.425343373790383} +{"Pretrain/Learning Rate": 1.7192258843577063e-05, "Pretrain/Loss": 1.999152421951294, "Pretrain/Loss (Raw)": 1.8658995628356934, "Pretrain/Step": 11693, "Pretrain/Step Time": 8.42199356853962} +{"Pretrain/Learning Rate": 1.718822613182689e-05, "Pretrain/Loss": 1.9979838132858276, "Pretrain/Loss (Raw)": 1.9766845703125, "Pretrain/Step": 11694, "Pretrain/Step Time": 8.417428057640791} +{"Pretrain/Learning Rate": 1.718419364532371e-05, "Pretrain/Loss": 2.0004260540008545, "Pretrain/Loss (Raw)": 2.171391487121582, "Pretrain/Step": 11695, "Pretrain/Step Time": 8.413806619122624} +{"Pretrain/Learning Rate": 1.7180161384183793e-05, "Pretrain/Loss": 1.9986523389816284, "Pretrain/Loss (Raw)": 1.778337836265564, "Pretrain/Step": 11696, "Pretrain/Step Time": 8.417030315846205} +{"Pretrain/Learning Rate": 1.717612934852341e-05, "Pretrain/Loss": 2.003300666809082, "Pretrain/Loss (Raw)": 1.9998942613601685, "Pretrain/Step": 11697, "Pretrain/Step Time": 8.41759773157537} +{"Pretrain/Learning Rate": 1.717209753845883e-05, "Pretrain/Loss": 2.00518798828125, "Pretrain/Loss (Raw)": 2.1105949878692627, "Pretrain/Step": 11698, "Pretrain/Step Time": 8.424749255180359} +{"Pretrain/Learning Rate": 1.7168065954106294e-05, "Pretrain/Loss": 2.0060014724731445, "Pretrain/Loss (Raw)": 2.0561535358428955, "Pretrain/Step": 11699, "Pretrain/Step Time": 8.423231331631541} +{"Pretrain/Learning Rate": 1.7164034595582055e-05, "Pretrain/Loss": 2.0049831867218018, "Pretrain/Loss (Raw)": 1.8695000410079956, "Pretrain/Step": 11700, "Pretrain/Step Time": 8.42819718271494} +{"Pretrain/Learning Rate": 1.716000346300235e-05, "Pretrain/Loss": 2.0067787170410156, "Pretrain/Loss (Raw)": 2.000507116317749, "Pretrain/Step": 11701, "Pretrain/Step Time": 8.425480864942074} +{"Pretrain/Learning Rate": 1.7155972556483424e-05, "Pretrain/Loss": 2.0083742141723633, "Pretrain/Loss (Raw)": 2.155400514602661, "Pretrain/Step": 11702, "Pretrain/Step Time": 8.42379087768495} +{"Pretrain/Learning Rate": 1.7151941876141502e-05, "Pretrain/Loss": 2.007929801940918, "Pretrain/Loss (Raw)": 2.001328706741333, "Pretrain/Step": 11703, "Pretrain/Step Time": 8.420451700687408} +{"Pretrain/Learning Rate": 1.71479114220928e-05, "Pretrain/Loss": 2.007129192352295, "Pretrain/Loss (Raw)": 1.8643561601638794, "Pretrain/Step": 11704, "Pretrain/Step Time": 8.420380298048258} +{"Pretrain/Learning Rate": 1.714388119445354e-05, "Pretrain/Loss": 2.0067036151885986, "Pretrain/Loss (Raw)": 2.0948657989501953, "Pretrain/Step": 11705, "Pretrain/Step Time": 8.42302686534822} +{"Pretrain/Learning Rate": 1.713985119333992e-05, "Pretrain/Loss": 2.007876396179199, "Pretrain/Loss (Raw)": 2.0701050758361816, "Pretrain/Step": 11706, "Pretrain/Step Time": 8.423054605722427} +{"Pretrain/Learning Rate": 1.7135821418868154e-05, "Pretrain/Loss": 2.0084924697875977, "Pretrain/Loss (Raw)": 1.9612025022506714, "Pretrain/Step": 11707, "Pretrain/Step Time": 8.425825336948037} +{"Pretrain/Learning Rate": 1.7131791871154433e-05, "Pretrain/Loss": 2.0103678703308105, "Pretrain/Loss (Raw)": 2.0466291904449463, "Pretrain/Step": 11708, "Pretrain/Step Time": 8.423747589811683} +{"Pretrain/Learning Rate": 1.7127762550314953e-05, "Pretrain/Loss": 2.0133228302001953, "Pretrain/Loss (Raw)": 2.4661495685577393, "Pretrain/Step": 11709, "Pretrain/Step Time": 8.422015340998769} +{"Pretrain/Learning Rate": 1.712373345646588e-05, "Pretrain/Loss": 2.015299081802368, "Pretrain/Loss (Raw)": 2.1587438583374023, "Pretrain/Step": 11710, "Pretrain/Step Time": 8.424189975485206} +{"Pretrain/Learning Rate": 1.7119704589723405e-05, "Pretrain/Loss": 2.0155839920043945, "Pretrain/Loss (Raw)": 2.123322010040283, "Pretrain/Step": 11711, "Pretrain/Step Time": 8.41445942595601} +{"Pretrain/Learning Rate": 1.7115675950203692e-05, "Pretrain/Loss": 2.016512870788574, "Pretrain/Loss (Raw)": 2.0916335582733154, "Pretrain/Step": 11712, "Pretrain/Step Time": 8.41703737154603} +{"Pretrain/Learning Rate": 1.7111647538022903e-05, "Pretrain/Loss": 2.0155086517333984, "Pretrain/Loss (Raw)": 1.8173447847366333, "Pretrain/Step": 11713, "Pretrain/Step Time": 8.415626108646393} +{"Pretrain/Learning Rate": 1.7107619353297206e-05, "Pretrain/Loss": 2.016568422317505, "Pretrain/Loss (Raw)": 2.148240327835083, "Pretrain/Step": 11714, "Pretrain/Step Time": 8.426680395379663} +{"Pretrain/Learning Rate": 1.7103591396142736e-05, "Pretrain/Loss": 2.0161447525024414, "Pretrain/Loss (Raw)": 1.9049289226531982, "Pretrain/Step": 11715, "Pretrain/Step Time": 8.424042902886868} +{"Pretrain/Learning Rate": 1.7099563666675645e-05, "Pretrain/Loss": 2.0151619911193848, "Pretrain/Loss (Raw)": 2.013305187225342, "Pretrain/Step": 11716, "Pretrain/Step Time": 8.426105106249452} +{"Pretrain/Learning Rate": 1.709553616501206e-05, "Pretrain/Loss": 2.0159902572631836, "Pretrain/Loss (Raw)": 1.9843037128448486, "Pretrain/Step": 11717, "Pretrain/Step Time": 8.42530514858663} +{"Pretrain/Learning Rate": 1.7091508891268117e-05, "Pretrain/Loss": 2.0164971351623535, "Pretrain/Loss (Raw)": 1.9940153360366821, "Pretrain/Step": 11718, "Pretrain/Step Time": 8.426343217492104} +{"Pretrain/Learning Rate": 1.708748184555994e-05, "Pretrain/Loss": 2.015503406524658, "Pretrain/Loss (Raw)": 1.872207760810852, "Pretrain/Step": 11719, "Pretrain/Step Time": 8.427213413640857} +{"Pretrain/Learning Rate": 1.7083455028003648e-05, "Pretrain/Loss": 2.014594316482544, "Pretrain/Loss (Raw)": 1.8847883939743042, "Pretrain/Step": 11720, "Pretrain/Step Time": 8.427841007709503} +{"Pretrain/Learning Rate": 1.7079428438715353e-05, "Pretrain/Loss": 2.0170459747314453, "Pretrain/Loss (Raw)": 2.3157360553741455, "Pretrain/Step": 11721, "Pretrain/Step Time": 8.430326275527477} +{"Pretrain/Learning Rate": 1.7075402077811148e-05, "Pretrain/Loss": 2.015044689178467, "Pretrain/Loss (Raw)": 1.9367843866348267, "Pretrain/Step": 11722, "Pretrain/Step Time": 8.424750795587897} +{"Pretrain/Learning Rate": 1.7071375945407143e-05, "Pretrain/Loss": 2.0156216621398926, "Pretrain/Loss (Raw)": 2.038086414337158, "Pretrain/Step": 11723, "Pretrain/Step Time": 8.427361153066158} +{"Pretrain/Learning Rate": 1.7067350041619416e-05, "Pretrain/Loss": 2.017629623413086, "Pretrain/Loss (Raw)": 1.9827144145965576, "Pretrain/Step": 11724, "Pretrain/Step Time": 8.427973324432969} +{"Pretrain/Learning Rate": 1.7063324366564064e-05, "Pretrain/Loss": 2.0193428993225098, "Pretrain/Loss (Raw)": 2.041762590408325, "Pretrain/Step": 11725, "Pretrain/Step Time": 8.428115522488952} +{"Pretrain/Learning Rate": 1.7059298920357163e-05, "Pretrain/Loss": 2.019176959991455, "Pretrain/Loss (Raw)": 2.0949926376342773, "Pretrain/Step": 11726, "Pretrain/Step Time": 8.42726370319724} +{"Pretrain/Learning Rate": 1.7055273703114777e-05, "Pretrain/Loss": 2.019681930541992, "Pretrain/Loss (Raw)": 2.0554304122924805, "Pretrain/Step": 11727, "Pretrain/Step Time": 8.423139683902264} +{"Pretrain/Learning Rate": 1.705124871495297e-05, "Pretrain/Loss": 2.017673969268799, "Pretrain/Loss (Raw)": 1.9104989767074585, "Pretrain/Step": 11728, "Pretrain/Step Time": 8.425179898738861} +{"Pretrain/Learning Rate": 1.70472239559878e-05, "Pretrain/Loss": 2.0218887329101562, "Pretrain/Loss (Raw)": 2.2403297424316406, "Pretrain/Step": 11729, "Pretrain/Step Time": 8.42333517409861} +{"Pretrain/Learning Rate": 1.7043199426335325e-05, "Pretrain/Loss": 2.024958372116089, "Pretrain/Loss (Raw)": 2.1306073665618896, "Pretrain/Step": 11730, "Pretrain/Step Time": 8.430691661313176} +{"Pretrain/Learning Rate": 1.703917512611159e-05, "Pretrain/Loss": 2.0260262489318848, "Pretrain/Loss (Raw)": 2.0768165588378906, "Pretrain/Step": 11731, "Pretrain/Step Time": 8.434737008064985} +{"Pretrain/Learning Rate": 1.7035151055432623e-05, "Pretrain/Loss": 2.0255494117736816, "Pretrain/Loss (Raw)": 1.9008315801620483, "Pretrain/Step": 11732, "Pretrain/Step Time": 8.43195616826415} +{"Pretrain/Learning Rate": 1.7031127214414462e-05, "Pretrain/Loss": 2.025905132293701, "Pretrain/Loss (Raw)": 1.9538933038711548, "Pretrain/Step": 11733, "Pretrain/Step Time": 8.431105859577656} +{"Pretrain/Learning Rate": 1.7027103603173127e-05, "Pretrain/Loss": 2.026500940322876, "Pretrain/Loss (Raw)": 1.8444480895996094, "Pretrain/Step": 11734, "Pretrain/Step Time": 8.43469519726932} +{"Pretrain/Learning Rate": 1.702308022182464e-05, "Pretrain/Loss": 2.0241730213165283, "Pretrain/Loss (Raw)": 1.8066762685775757, "Pretrain/Step": 11735, "Pretrain/Step Time": 8.435174202546477} +{"Pretrain/Learning Rate": 1.701905707048501e-05, "Pretrain/Loss": 2.02311372756958, "Pretrain/Loss (Raw)": 1.9948810338974, "Pretrain/Step": 11736, "Pretrain/Step Time": 8.434880387037992} +{"Pretrain/Learning Rate": 1.7015034149270253e-05, "Pretrain/Loss": 2.024265766143799, "Pretrain/Loss (Raw)": 2.1496968269348145, "Pretrain/Step": 11737, "Pretrain/Step Time": 8.438561376184225} +{"Pretrain/Learning Rate": 1.7011011458296348e-05, "Pretrain/Loss": 2.0247397422790527, "Pretrain/Loss (Raw)": 2.0829432010650635, "Pretrain/Step": 11738, "Pretrain/Step Time": 8.43267122283578} +{"Pretrain/Learning Rate": 1.7006988997679297e-05, "Pretrain/Loss": 2.0246775150299072, "Pretrain/Loss (Raw)": 1.961473822593689, "Pretrain/Step": 11739, "Pretrain/Step Time": 8.435138121247292} +{"Pretrain/Learning Rate": 1.7002966767535083e-05, "Pretrain/Loss": 2.024611473083496, "Pretrain/Loss (Raw)": 2.069171190261841, "Pretrain/Step": 11740, "Pretrain/Step Time": 8.434642605483532} +{"Pretrain/Learning Rate": 1.6998944767979685e-05, "Pretrain/Loss": 2.02443790435791, "Pretrain/Loss (Raw)": 2.1294121742248535, "Pretrain/Step": 11741, "Pretrain/Step Time": 8.43350613489747} +{"Pretrain/Learning Rate": 1.6994922999129083e-05, "Pretrain/Loss": 2.022756338119507, "Pretrain/Loss (Raw)": 1.9024502038955688, "Pretrain/Step": 11742, "Pretrain/Step Time": 8.439344648271799} +{"Pretrain/Learning Rate": 1.6990901461099223e-05, "Pretrain/Loss": 2.0217549800872803, "Pretrain/Loss (Raw)": 1.879101037979126, "Pretrain/Step": 11743, "Pretrain/Step Time": 8.43745794519782} +{"Pretrain/Learning Rate": 1.6986880154006074e-05, "Pretrain/Loss": 2.0211846828460693, "Pretrain/Loss (Raw)": 2.059587240219116, "Pretrain/Step": 11744, "Pretrain/Step Time": 8.432508986443281} +{"Pretrain/Learning Rate": 1.698285907796559e-05, "Pretrain/Loss": 2.0199294090270996, "Pretrain/Loss (Raw)": 1.8785817623138428, "Pretrain/Step": 11745, "Pretrain/Step Time": 8.43152230978012} +{"Pretrain/Learning Rate": 1.6978838233093707e-05, "Pretrain/Loss": 2.0212085247039795, "Pretrain/Loss (Raw)": 2.172168731689453, "Pretrain/Step": 11746, "Pretrain/Step Time": 8.439377138391137} +{"Pretrain/Learning Rate": 1.6974817619506378e-05, "Pretrain/Loss": 2.0186452865600586, "Pretrain/Loss (Raw)": 1.8701294660568237, "Pretrain/Step": 11747, "Pretrain/Step Time": 8.442090146243572} +{"Pretrain/Learning Rate": 1.6970797237319518e-05, "Pretrain/Loss": 2.0190539360046387, "Pretrain/Loss (Raw)": 1.916038990020752, "Pretrain/Step": 11748, "Pretrain/Step Time": 8.444034026935697} +{"Pretrain/Learning Rate": 1.6966777086649067e-05, "Pretrain/Loss": 2.018510580062866, "Pretrain/Loss (Raw)": 1.9706774950027466, "Pretrain/Step": 11749, "Pretrain/Step Time": 8.443164475262165} +{"Pretrain/Learning Rate": 1.6962757167610926e-05, "Pretrain/Loss": 2.0160107612609863, "Pretrain/Loss (Raw)": 1.8743932247161865, "Pretrain/Step": 11750, "Pretrain/Step Time": 8.439077774062753} +{"Pretrain/Learning Rate": 1.6958737480321022e-05, "Pretrain/Loss": 2.016317844390869, "Pretrain/Loss (Raw)": 2.1402289867401123, "Pretrain/Step": 11751, "Pretrain/Step Time": 8.437260963022709} +{"Pretrain/Learning Rate": 1.695471802489526e-05, "Pretrain/Loss": 2.017009735107422, "Pretrain/Loss (Raw)": 2.0939786434173584, "Pretrain/Step": 11752, "Pretrain/Step Time": 8.43693993985653} +{"Pretrain/Learning Rate": 1.695069880144952e-05, "Pretrain/Loss": 2.0158464908599854, "Pretrain/Loss (Raw)": 1.9213387966156006, "Pretrain/Step": 11753, "Pretrain/Step Time": 8.438214370980859} +{"Pretrain/Learning Rate": 1.6946679810099713e-05, "Pretrain/Loss": 2.0188708305358887, "Pretrain/Loss (Raw)": 2.0121846199035645, "Pretrain/Step": 11754, "Pretrain/Step Time": 8.442119292914867} +{"Pretrain/Learning Rate": 1.694266105096171e-05, "Pretrain/Loss": 2.01853084564209, "Pretrain/Loss (Raw)": 2.0573103427886963, "Pretrain/Step": 11755, "Pretrain/Step Time": 8.436835400760174} +{"Pretrain/Learning Rate": 1.6938642524151403e-05, "Pretrain/Loss": 2.016475200653076, "Pretrain/Loss (Raw)": 1.8433680534362793, "Pretrain/Step": 11756, "Pretrain/Step Time": 8.437924284487963} +{"Pretrain/Learning Rate": 1.6934624229784658e-05, "Pretrain/Loss": 2.019191265106201, "Pretrain/Loss (Raw)": 2.120811939239502, "Pretrain/Step": 11757, "Pretrain/Step Time": 8.437560357153416} +{"Pretrain/Learning Rate": 1.693060616797733e-05, "Pretrain/Loss": 2.0176162719726562, "Pretrain/Loss (Raw)": 2.008925676345825, "Pretrain/Step": 11758, "Pretrain/Step Time": 8.442891320213675} +{"Pretrain/Learning Rate": 1.6926588338845287e-05, "Pretrain/Loss": 2.012420415878296, "Pretrain/Loss (Raw)": 1.8976765871047974, "Pretrain/Step": 11759, "Pretrain/Step Time": 8.445375483483076} +{"Pretrain/Learning Rate": 1.692257074250438e-05, "Pretrain/Loss": 2.013756275177002, "Pretrain/Loss (Raw)": 2.14704966545105, "Pretrain/Step": 11760, "Pretrain/Step Time": 8.436749340966344} +{"Pretrain/Learning Rate": 1.6918553379070445e-05, "Pretrain/Loss": 2.012737512588501, "Pretrain/Loss (Raw)": 1.8177820444107056, "Pretrain/Step": 11761, "Pretrain/Step Time": 8.43681052327156} +{"Pretrain/Learning Rate": 1.6914536248659336e-05, "Pretrain/Loss": 2.0135412216186523, "Pretrain/Loss (Raw)": 2.0525403022766113, "Pretrain/Step": 11762, "Pretrain/Step Time": 8.442416280508041} +{"Pretrain/Learning Rate": 1.691051935138687e-05, "Pretrain/Loss": 2.014702081680298, "Pretrain/Loss (Raw)": 2.1808788776397705, "Pretrain/Step": 11763, "Pretrain/Step Time": 8.441568380221725} +{"Pretrain/Learning Rate": 1.6906502687368873e-05, "Pretrain/Loss": 2.0146372318267822, "Pretrain/Loss (Raw)": 1.993582010269165, "Pretrain/Step": 11764, "Pretrain/Step Time": 8.438925873488188} +{"Pretrain/Learning Rate": 1.6902486256721166e-05, "Pretrain/Loss": 2.013831615447998, "Pretrain/Loss (Raw)": 2.0374679565429688, "Pretrain/Step": 11765, "Pretrain/Step Time": 8.443891920149326} +{"Pretrain/Learning Rate": 1.689847005955956e-05, "Pretrain/Loss": 2.0144450664520264, "Pretrain/Loss (Raw)": 2.135719060897827, "Pretrain/Step": 11766, "Pretrain/Step Time": 8.44033551029861} +{"Pretrain/Learning Rate": 1.6894454095999865e-05, "Pretrain/Loss": 2.0149431228637695, "Pretrain/Loss (Raw)": 1.9945204257965088, "Pretrain/Step": 11767, "Pretrain/Step Time": 8.43551285378635} +{"Pretrain/Learning Rate": 1.6890438366157866e-05, "Pretrain/Loss": 2.0157718658447266, "Pretrain/Loss (Raw)": 2.241750717163086, "Pretrain/Step": 11768, "Pretrain/Step Time": 8.440890369936824} +{"Pretrain/Learning Rate": 1.688642287014936e-05, "Pretrain/Loss": 2.01308012008667, "Pretrain/Loss (Raw)": 2.0720531940460205, "Pretrain/Step": 11769, "Pretrain/Step Time": 8.432462206110358} +{"Pretrain/Learning Rate": 1.688240760809013e-05, "Pretrain/Loss": 2.0142550468444824, "Pretrain/Loss (Raw)": 2.202406644821167, "Pretrain/Step": 11770, "Pretrain/Step Time": 8.436086116358638} +{"Pretrain/Learning Rate": 1.6878392580095954e-05, "Pretrain/Loss": 2.012321949005127, "Pretrain/Loss (Raw)": 1.790158987045288, "Pretrain/Step": 11771, "Pretrain/Step Time": 8.436162682250142} +{"Pretrain/Learning Rate": 1.6874377786282602e-05, "Pretrain/Loss": 2.0131702423095703, "Pretrain/Loss (Raw)": 1.8965849876403809, "Pretrain/Step": 11772, "Pretrain/Step Time": 8.439430978149176} +{"Pretrain/Learning Rate": 1.6870363226765844e-05, "Pretrain/Loss": 2.0137104988098145, "Pretrain/Loss (Raw)": 2.1333463191986084, "Pretrain/Step": 11773, "Pretrain/Step Time": 8.44101887382567} +{"Pretrain/Learning Rate": 1.686634890166143e-05, "Pretrain/Loss": 2.0150399208068848, "Pretrain/Loss (Raw)": 1.9753682613372803, "Pretrain/Step": 11774, "Pretrain/Step Time": 8.441475806757808} +{"Pretrain/Learning Rate": 1.6862334811085105e-05, "Pretrain/Loss": 2.016667604446411, "Pretrain/Loss (Raw)": 2.12355899810791, "Pretrain/Step": 11775, "Pretrain/Step Time": 8.440898582339287} +{"Pretrain/Learning Rate": 1.6858320955152623e-05, "Pretrain/Loss": 2.016737937927246, "Pretrain/Loss (Raw)": 2.354032278060913, "Pretrain/Step": 11776, "Pretrain/Step Time": 8.438302431255579} +{"Pretrain/Learning Rate": 1.685430733397972e-05, "Pretrain/Loss": 2.0168325901031494, "Pretrain/Loss (Raw)": 2.034977912902832, "Pretrain/Step": 11777, "Pretrain/Step Time": 8.437491606920958} +{"Pretrain/Learning Rate": 1.6850293947682123e-05, "Pretrain/Loss": 2.020685911178589, "Pretrain/Loss (Raw)": 1.951248288154602, "Pretrain/Step": 11778, "Pretrain/Step Time": 8.437207913026214} +{"Pretrain/Learning Rate": 1.6846280796375553e-05, "Pretrain/Loss": 2.0205698013305664, "Pretrain/Loss (Raw)": 2.0954058170318604, "Pretrain/Step": 11779, "Pretrain/Step Time": 8.443117113783956} +{"Pretrain/Learning Rate": 1.6842267880175723e-05, "Pretrain/Loss": 2.019524335861206, "Pretrain/Loss (Raw)": 2.062349319458008, "Pretrain/Step": 11780, "Pretrain/Step Time": 8.442941904067993} +{"Pretrain/Learning Rate": 1.683825519919835e-05, "Pretrain/Loss": 2.0181188583374023, "Pretrain/Loss (Raw)": 1.9169155359268188, "Pretrain/Step": 11781, "Pretrain/Step Time": 8.440658874809742} +{"Pretrain/Learning Rate": 1.683424275355914e-05, "Pretrain/Loss": 2.018441677093506, "Pretrain/Loss (Raw)": 2.0689823627471924, "Pretrain/Step": 11782, "Pretrain/Step Time": 8.44791784696281} +{"Pretrain/Learning Rate": 1.6830230543373783e-05, "Pretrain/Loss": 2.0176806449890137, "Pretrain/Loss (Raw)": 2.0605132579803467, "Pretrain/Step": 11783, "Pretrain/Step Time": 8.446734678000212} +{"Pretrain/Learning Rate": 1.6826218568757963e-05, "Pretrain/Loss": 2.017430067062378, "Pretrain/Loss (Raw)": 1.9258267879486084, "Pretrain/Step": 11784, "Pretrain/Step Time": 8.441331325098872} +{"Pretrain/Learning Rate": 1.682220682982737e-05, "Pretrain/Loss": 2.016575813293457, "Pretrain/Loss (Raw)": 2.020036458969116, "Pretrain/Step": 11785, "Pretrain/Step Time": 8.439395323395729} +{"Pretrain/Learning Rate": 1.681819532669768e-05, "Pretrain/Loss": 2.0147833824157715, "Pretrain/Loss (Raw)": 1.8695212602615356, "Pretrain/Step": 11786, "Pretrain/Step Time": 8.443290146067739} +{"Pretrain/Learning Rate": 1.6814184059484558e-05, "Pretrain/Loss": 2.0122382640838623, "Pretrain/Loss (Raw)": 1.8672593832015991, "Pretrain/Step": 11787, "Pretrain/Step Time": 8.440680276602507} +{"Pretrain/Learning Rate": 1.6810173028303674e-05, "Pretrain/Loss": 2.012303590774536, "Pretrain/Loss (Raw)": 1.9390246868133545, "Pretrain/Step": 11788, "Pretrain/Step Time": 8.443161249160767} +{"Pretrain/Learning Rate": 1.6806162233270673e-05, "Pretrain/Loss": 2.0110785961151123, "Pretrain/Loss (Raw)": 1.8458918333053589, "Pretrain/Step": 11789, "Pretrain/Step Time": 8.44220926426351} +{"Pretrain/Learning Rate": 1.680215167450121e-05, "Pretrain/Loss": 2.01358699798584, "Pretrain/Loss (Raw)": 2.178555965423584, "Pretrain/Step": 11790, "Pretrain/Step Time": 8.442782314494252} +{"Pretrain/Learning Rate": 1.679814135211092e-05, "Pretrain/Loss": 2.011807680130005, "Pretrain/Loss (Raw)": 1.9053003787994385, "Pretrain/Step": 11791, "Pretrain/Step Time": 8.444942232221365} +{"Pretrain/Learning Rate": 1.679413126621544e-05, "Pretrain/Loss": 2.0122971534729004, "Pretrain/Loss (Raw)": 1.9400349855422974, "Pretrain/Step": 11792, "Pretrain/Step Time": 8.443816164508462} +{"Pretrain/Learning Rate": 1.679012141693041e-05, "Pretrain/Loss": 2.0123302936553955, "Pretrain/Loss (Raw)": 2.021320343017578, "Pretrain/Step": 11793, "Pretrain/Step Time": 8.438596967607737} +{"Pretrain/Learning Rate": 1.6786111804371433e-05, "Pretrain/Loss": 2.012392282485962, "Pretrain/Loss (Raw)": 1.9985672235488892, "Pretrain/Step": 11794, "Pretrain/Step Time": 8.43872876279056} +{"Pretrain/Learning Rate": 1.6782102428654134e-05, "Pretrain/Loss": 2.0089235305786133, "Pretrain/Loss (Raw)": 1.8657512664794922, "Pretrain/Step": 11795, "Pretrain/Step Time": 8.442789603024721} +{"Pretrain/Learning Rate": 1.677809328989412e-05, "Pretrain/Loss": 2.009838581085205, "Pretrain/Loss (Raw)": 1.9163291454315186, "Pretrain/Step": 11796, "Pretrain/Step Time": 8.438895361497998} +{"Pretrain/Learning Rate": 1.6774084388206986e-05, "Pretrain/Loss": 2.0094375610351562, "Pretrain/Loss (Raw)": 2.073755979537964, "Pretrain/Step": 11797, "Pretrain/Step Time": 8.44065934792161} +{"Pretrain/Learning Rate": 1.677007572370834e-05, "Pretrain/Loss": 2.0090298652648926, "Pretrain/Loss (Raw)": 1.953229546546936, "Pretrain/Step": 11798, "Pretrain/Step Time": 8.442729393020272} +{"Pretrain/Learning Rate": 1.6766067296513755e-05, "Pretrain/Loss": 2.0085370540618896, "Pretrain/Loss (Raw)": 1.9183448553085327, "Pretrain/Step": 11799, "Pretrain/Step Time": 8.441697901114821} +{"Pretrain/Learning Rate": 1.6762059106738814e-05, "Pretrain/Loss": 2.00818133354187, "Pretrain/Loss (Raw)": 2.0991971492767334, "Pretrain/Step": 11800, "Pretrain/Step Time": 8.43944251537323} +{"Pretrain/Learning Rate": 1.6758051154499088e-05, "Pretrain/Loss": 2.0089073181152344, "Pretrain/Loss (Raw)": 2.042147159576416, "Pretrain/Step": 11801, "Pretrain/Step Time": 8.438011707738042} +{"Pretrain/Learning Rate": 1.6754043439910143e-05, "Pretrain/Loss": 2.007502317428589, "Pretrain/Loss (Raw)": 1.9163752794265747, "Pretrain/Step": 11802, "Pretrain/Step Time": 8.43752027861774} +{"Pretrain/Learning Rate": 1.675003596308755e-05, "Pretrain/Loss": 2.0096023082733154, "Pretrain/Loss (Raw)": 2.2542920112609863, "Pretrain/Step": 11803, "Pretrain/Step Time": 8.440930180251598} +{"Pretrain/Learning Rate": 1.674602872414685e-05, "Pretrain/Loss": 2.009399890899658, "Pretrain/Loss (Raw)": 1.9892929792404175, "Pretrain/Step": 11804, "Pretrain/Step Time": 8.440519215539098} +{"Pretrain/Learning Rate": 1.6742021723203592e-05, "Pretrain/Loss": 2.009852886199951, "Pretrain/Loss (Raw)": 2.1681571006774902, "Pretrain/Step": 11805, "Pretrain/Step Time": 8.44347558170557} +{"Pretrain/Learning Rate": 1.673801496037332e-05, "Pretrain/Loss": 2.0137171745300293, "Pretrain/Loss (Raw)": 2.43517804145813, "Pretrain/Step": 11806, "Pretrain/Step Time": 8.438756711781025} +{"Pretrain/Learning Rate": 1.673400843577156e-05, "Pretrain/Loss": 2.014887809753418, "Pretrain/Loss (Raw)": 2.173861026763916, "Pretrain/Step": 11807, "Pretrain/Step Time": 8.441624896600842} +{"Pretrain/Learning Rate": 1.673000214951384e-05, "Pretrain/Loss": 2.0130715370178223, "Pretrain/Loss (Raw)": 1.9808229207992554, "Pretrain/Step": 11808, "Pretrain/Step Time": 8.443236246705055} +{"Pretrain/Learning Rate": 1.6725996101715678e-05, "Pretrain/Loss": 2.010700225830078, "Pretrain/Loss (Raw)": 1.9583477973937988, "Pretrain/Step": 11809, "Pretrain/Step Time": 8.440866600722075} +{"Pretrain/Learning Rate": 1.6721990292492585e-05, "Pretrain/Loss": 2.013887882232666, "Pretrain/Loss (Raw)": 2.147683620452881, "Pretrain/Step": 11810, "Pretrain/Step Time": 8.43650784343481} +{"Pretrain/Learning Rate": 1.671798472196007e-05, "Pretrain/Loss": 2.014803409576416, "Pretrain/Loss (Raw)": 1.909006118774414, "Pretrain/Step": 11811, "Pretrain/Step Time": 8.440604323521256} +{"Pretrain/Learning Rate": 1.6713979390233624e-05, "Pretrain/Loss": 2.016028881072998, "Pretrain/Loss (Raw)": 2.0529019832611084, "Pretrain/Step": 11812, "Pretrain/Step Time": 8.43916480988264} +{"Pretrain/Learning Rate": 1.6709974297428738e-05, "Pretrain/Loss": 2.0142619609832764, "Pretrain/Loss (Raw)": 1.7506911754608154, "Pretrain/Step": 11813, "Pretrain/Step Time": 8.43986720778048} +{"Pretrain/Learning Rate": 1.67059694436609e-05, "Pretrain/Loss": 2.017390012741089, "Pretrain/Loss (Raw)": 2.043774127960205, "Pretrain/Step": 11814, "Pretrain/Step Time": 8.442329926416278} +{"Pretrain/Learning Rate": 1.670196482904559e-05, "Pretrain/Loss": 2.0174121856689453, "Pretrain/Loss (Raw)": 1.8542213439941406, "Pretrain/Step": 11815, "Pretrain/Step Time": 8.440864372998476} +{"Pretrain/Learning Rate": 1.669796045369828e-05, "Pretrain/Loss": 2.01540470123291, "Pretrain/Loss (Raw)": 1.8769387006759644, "Pretrain/Step": 11816, "Pretrain/Step Time": 8.440309120342135} +{"Pretrain/Learning Rate": 1.6693956317734414e-05, "Pretrain/Loss": 2.017019748687744, "Pretrain/Loss (Raw)": 2.158400058746338, "Pretrain/Step": 11817, "Pretrain/Step Time": 8.436576856300235} +{"Pretrain/Learning Rate": 1.668995242126947e-05, "Pretrain/Loss": 2.0185792446136475, "Pretrain/Loss (Raw)": 2.090195894241333, "Pretrain/Step": 11818, "Pretrain/Step Time": 8.4396289922297} +{"Pretrain/Learning Rate": 1.6685948764418887e-05, "Pretrain/Loss": 2.018899917602539, "Pretrain/Loss (Raw)": 2.0305259227752686, "Pretrain/Step": 11819, "Pretrain/Step Time": 8.436908388510346} +{"Pretrain/Learning Rate": 1.668194534729811e-05, "Pretrain/Loss": 2.0170583724975586, "Pretrain/Loss (Raw)": 1.8555611371994019, "Pretrain/Step": 11820, "Pretrain/Step Time": 8.439551193267107} +{"Pretrain/Learning Rate": 1.6677942170022582e-05, "Pretrain/Loss": 2.018357753753662, "Pretrain/Loss (Raw)": 2.032215118408203, "Pretrain/Step": 11821, "Pretrain/Step Time": 8.440876301378012} +{"Pretrain/Learning Rate": 1.667393923270772e-05, "Pretrain/Loss": 2.0192599296569824, "Pretrain/Loss (Raw)": 2.0921671390533447, "Pretrain/Step": 11822, "Pretrain/Step Time": 8.442536262795329} +{"Pretrain/Learning Rate": 1.666993653546895e-05, "Pretrain/Loss": 2.0173208713531494, "Pretrain/Loss (Raw)": 1.9231760501861572, "Pretrain/Step": 11823, "Pretrain/Step Time": 8.442496104165912} +{"Pretrain/Learning Rate": 1.6665934078421687e-05, "Pretrain/Loss": 2.0190839767456055, "Pretrain/Loss (Raw)": 2.0040299892425537, "Pretrain/Step": 11824, "Pretrain/Step Time": 8.44122746028006} +{"Pretrain/Learning Rate": 1.666193186168134e-05, "Pretrain/Loss": 2.0206384658813477, "Pretrain/Loss (Raw)": 2.1988699436187744, "Pretrain/Step": 11825, "Pretrain/Step Time": 8.44382943958044} +{"Pretrain/Learning Rate": 1.6657929885363317e-05, "Pretrain/Loss": 2.0193207263946533, "Pretrain/Loss (Raw)": 1.941901445388794, "Pretrain/Step": 11826, "Pretrain/Step Time": 8.433745309710503} +{"Pretrain/Learning Rate": 1.6653928149582996e-05, "Pretrain/Loss": 2.020035982131958, "Pretrain/Loss (Raw)": 2.1477200984954834, "Pretrain/Step": 11827, "Pretrain/Step Time": 8.434496162459254} +{"Pretrain/Learning Rate": 1.664992665445577e-05, "Pretrain/Loss": 2.0223469734191895, "Pretrain/Loss (Raw)": 2.165295124053955, "Pretrain/Step": 11828, "Pretrain/Step Time": 8.432440368458629} +{"Pretrain/Learning Rate": 1.664592540009703e-05, "Pretrain/Loss": 2.023297071456909, "Pretrain/Loss (Raw)": 2.1221377849578857, "Pretrain/Step": 11829, "Pretrain/Step Time": 8.43303532525897} +{"Pretrain/Learning Rate": 1.664192438662214e-05, "Pretrain/Loss": 2.0216219425201416, "Pretrain/Loss (Raw)": 1.9409770965576172, "Pretrain/Step": 11830, "Pretrain/Step Time": 8.43314565345645} +{"Pretrain/Learning Rate": 1.663792361414647e-05, "Pretrain/Loss": 2.0200095176696777, "Pretrain/Loss (Raw)": 1.7949402332305908, "Pretrain/Step": 11831, "Pretrain/Step Time": 8.433978766202927} +{"Pretrain/Learning Rate": 1.663392308278538e-05, "Pretrain/Loss": 2.0193910598754883, "Pretrain/Loss (Raw)": 1.7851890325546265, "Pretrain/Step": 11832, "Pretrain/Step Time": 8.434934532269835} +{"Pretrain/Learning Rate": 1.6629922792654213e-05, "Pretrain/Loss": 2.019899368286133, "Pretrain/Loss (Raw)": 2.159946918487549, "Pretrain/Step": 11833, "Pretrain/Step Time": 8.428553380072117} +{"Pretrain/Learning Rate": 1.6625922743868325e-05, "Pretrain/Loss": 2.020099401473999, "Pretrain/Loss (Raw)": 2.095689535140991, "Pretrain/Step": 11834, "Pretrain/Step Time": 8.429264785721898} +{"Pretrain/Learning Rate": 1.662192293654305e-05, "Pretrain/Loss": 2.01741361618042, "Pretrain/Loss (Raw)": 1.6174147129058838, "Pretrain/Step": 11835, "Pretrain/Step Time": 8.428780354559422} +{"Pretrain/Learning Rate": 1.661792337079372e-05, "Pretrain/Loss": 2.017904281616211, "Pretrain/Loss (Raw)": 2.109447717666626, "Pretrain/Step": 11836, "Pretrain/Step Time": 8.430593373253942} +{"Pretrain/Learning Rate": 1.661392404673567e-05, "Pretrain/Loss": 2.013674259185791, "Pretrain/Loss (Raw)": 1.9246957302093506, "Pretrain/Step": 11837, "Pretrain/Step Time": 8.433415990322828} +{"Pretrain/Learning Rate": 1.66099249644842e-05, "Pretrain/Loss": 2.013543128967285, "Pretrain/Loss (Raw)": 2.141957998275757, "Pretrain/Step": 11838, "Pretrain/Step Time": 8.431089555844665} +{"Pretrain/Learning Rate": 1.660592612415463e-05, "Pretrain/Loss": 2.0134124755859375, "Pretrain/Loss (Raw)": 2.1065919399261475, "Pretrain/Step": 11839, "Pretrain/Step Time": 8.4372294023633} +{"Pretrain/Learning Rate": 1.660192752586226e-05, "Pretrain/Loss": 2.0125651359558105, "Pretrain/Loss (Raw)": 1.9832013845443726, "Pretrain/Step": 11840, "Pretrain/Step Time": 8.434325646609068} +{"Pretrain/Learning Rate": 1.6597929169722392e-05, "Pretrain/Loss": 2.0147316455841064, "Pretrain/Loss (Raw)": 2.0946407318115234, "Pretrain/Step": 11841, "Pretrain/Step Time": 8.43286107480526} +{"Pretrain/Learning Rate": 1.659393105585032e-05, "Pretrain/Loss": 2.0133814811706543, "Pretrain/Loss (Raw)": 1.9754217863082886, "Pretrain/Step": 11842, "Pretrain/Step Time": 8.43067136220634} +{"Pretrain/Learning Rate": 1.658993318436131e-05, "Pretrain/Loss": 2.013472557067871, "Pretrain/Loss (Raw)": 1.9166009426116943, "Pretrain/Step": 11843, "Pretrain/Step Time": 8.428677076473832} +{"Pretrain/Learning Rate": 1.6585935555370656e-05, "Pretrain/Loss": 2.011760950088501, "Pretrain/Loss (Raw)": 1.7942204475402832, "Pretrain/Step": 11844, "Pretrain/Step Time": 8.427855491638184} +{"Pretrain/Learning Rate": 1.6581938168993612e-05, "Pretrain/Loss": 2.0116586685180664, "Pretrain/Loss (Raw)": 1.9712148904800415, "Pretrain/Step": 11845, "Pretrain/Step Time": 8.432922905310988} +{"Pretrain/Learning Rate": 1.657794102534545e-05, "Pretrain/Loss": 2.012831687927246, "Pretrain/Loss (Raw)": 2.1441433429718018, "Pretrain/Step": 11846, "Pretrain/Step Time": 8.433963894844055} +{"Pretrain/Learning Rate": 1.6573944124541424e-05, "Pretrain/Loss": 2.0126349925994873, "Pretrain/Loss (Raw)": 1.8470224142074585, "Pretrain/Step": 11847, "Pretrain/Step Time": 8.432629128918052} +{"Pretrain/Learning Rate": 1.6569947466696774e-05, "Pretrain/Loss": 2.0159826278686523, "Pretrain/Loss (Raw)": 2.313281774520874, "Pretrain/Step": 11848, "Pretrain/Step Time": 8.431427737697959} +{"Pretrain/Learning Rate": 1.6565951051926748e-05, "Pretrain/Loss": 2.0132007598876953, "Pretrain/Loss (Raw)": 1.9596621990203857, "Pretrain/Step": 11849, "Pretrain/Step Time": 8.43014406785369} +{"Pretrain/Learning Rate": 1.6561954880346576e-05, "Pretrain/Loss": 2.0144760608673096, "Pretrain/Loss (Raw)": 2.100031614303589, "Pretrain/Step": 11850, "Pretrain/Step Time": 8.430763844400644} +{"Pretrain/Learning Rate": 1.655795895207149e-05, "Pretrain/Loss": 2.0149450302124023, "Pretrain/Loss (Raw)": 2.0980913639068604, "Pretrain/Step": 11851, "Pretrain/Step Time": 8.433623533695936} +{"Pretrain/Learning Rate": 1.6553963267216706e-05, "Pretrain/Loss": 2.0143229961395264, "Pretrain/Loss (Raw)": 1.9031403064727783, "Pretrain/Step": 11852, "Pretrain/Step Time": 8.432282596826553} +{"Pretrain/Learning Rate": 1.6549967825897438e-05, "Pretrain/Loss": 2.013296127319336, "Pretrain/Loss (Raw)": 1.9102907180786133, "Pretrain/Step": 11853, "Pretrain/Step Time": 8.438242154195905} +{"Pretrain/Learning Rate": 1.6545972628228884e-05, "Pretrain/Loss": 2.012653350830078, "Pretrain/Loss (Raw)": 2.012730121612549, "Pretrain/Step": 11854, "Pretrain/Step Time": 8.435807198286057} +{"Pretrain/Learning Rate": 1.6541977674326252e-05, "Pretrain/Loss": 2.0144097805023193, "Pretrain/Loss (Raw)": 2.2802340984344482, "Pretrain/Step": 11855, "Pretrain/Step Time": 8.439442006871104} +{"Pretrain/Learning Rate": 1.6537982964304734e-05, "Pretrain/Loss": 2.014749050140381, "Pretrain/Loss (Raw)": 1.9539204835891724, "Pretrain/Step": 11856, "Pretrain/Step Time": 8.43502190336585} +{"Pretrain/Learning Rate": 1.6533988498279517e-05, "Pretrain/Loss": 2.01289701461792, "Pretrain/Loss (Raw)": 2.0032906532287598, "Pretrain/Step": 11857, "Pretrain/Step Time": 8.430333904922009} +{"Pretrain/Learning Rate": 1.652999427636577e-05, "Pretrain/Loss": 2.01153302192688, "Pretrain/Loss (Raw)": 1.9560192823410034, "Pretrain/Step": 11858, "Pretrain/Step Time": 8.42835957184434} +{"Pretrain/Learning Rate": 1.652600029867866e-05, "Pretrain/Loss": 2.0101609230041504, "Pretrain/Loss (Raw)": 1.9011682271957397, "Pretrain/Step": 11859, "Pretrain/Step Time": 8.42635983042419} +{"Pretrain/Learning Rate": 1.6522006565333365e-05, "Pretrain/Loss": 2.0124900341033936, "Pretrain/Loss (Raw)": 2.1989872455596924, "Pretrain/Step": 11860, "Pretrain/Step Time": 8.429026635363698} +{"Pretrain/Learning Rate": 1.651801307644503e-05, "Pretrain/Loss": 2.0124974250793457, "Pretrain/Loss (Raw)": 1.9548053741455078, "Pretrain/Step": 11861, "Pretrain/Step Time": 8.433522114530206} +{"Pretrain/Learning Rate": 1.6514019832128813e-05, "Pretrain/Loss": 2.0114245414733887, "Pretrain/Loss (Raw)": 1.7071553468704224, "Pretrain/Step": 11862, "Pretrain/Step Time": 8.434379594400525} +{"Pretrain/Learning Rate": 1.6510026832499848e-05, "Pretrain/Loss": 2.011716842651367, "Pretrain/Loss (Raw)": 1.8440532684326172, "Pretrain/Step": 11863, "Pretrain/Step Time": 8.432314733043313} +{"Pretrain/Learning Rate": 1.6506034077673278e-05, "Pretrain/Loss": 2.014044761657715, "Pretrain/Loss (Raw)": 2.2928671836853027, "Pretrain/Step": 11864, "Pretrain/Step Time": 8.43321026302874} +{"Pretrain/Learning Rate": 1.650204156776422e-05, "Pretrain/Loss": 2.0125904083251953, "Pretrain/Loss (Raw)": 1.963548183441162, "Pretrain/Step": 11865, "Pretrain/Step Time": 8.427246510982513} +{"Pretrain/Learning Rate": 1.649804930288781e-05, "Pretrain/Loss": 2.0098137855529785, "Pretrain/Loss (Raw)": 1.7275172472000122, "Pretrain/Step": 11866, "Pretrain/Step Time": 8.426651906222105} +{"Pretrain/Learning Rate": 1.6494057283159154e-05, "Pretrain/Loss": 2.0106072425842285, "Pretrain/Loss (Raw)": 2.063037395477295, "Pretrain/Step": 11867, "Pretrain/Step Time": 8.424733750522137} +{"Pretrain/Learning Rate": 1.649006550869336e-05, "Pretrain/Loss": 2.0103907585144043, "Pretrain/Loss (Raw)": 2.0414679050445557, "Pretrain/Step": 11868, "Pretrain/Step Time": 8.427285877987742} +{"Pretrain/Learning Rate": 1.6486073979605524e-05, "Pretrain/Loss": 2.0085201263427734, "Pretrain/Loss (Raw)": 1.889995813369751, "Pretrain/Step": 11869, "Pretrain/Step Time": 8.431751076132059} +{"Pretrain/Learning Rate": 1.6482082696010744e-05, "Pretrain/Loss": 2.0089831352233887, "Pretrain/Loss (Raw)": 1.9617011547088623, "Pretrain/Step": 11870, "Pretrain/Step Time": 8.423114670440555} +{"Pretrain/Learning Rate": 1.6478091658024107e-05, "Pretrain/Loss": 2.0092334747314453, "Pretrain/Loss (Raw)": 1.911144733428955, "Pretrain/Step": 11871, "Pretrain/Step Time": 8.426388658583164} +{"Pretrain/Learning Rate": 1.6474100865760685e-05, "Pretrain/Loss": 2.0085721015930176, "Pretrain/Loss (Raw)": 1.9749027490615845, "Pretrain/Step": 11872, "Pretrain/Step Time": 8.424607323482633} +{"Pretrain/Learning Rate": 1.6470110319335562e-05, "Pretrain/Loss": 2.0099406242370605, "Pretrain/Loss (Raw)": 2.05377459526062, "Pretrain/Step": 11873, "Pretrain/Step Time": 8.424328178167343} +{"Pretrain/Learning Rate": 1.646612001886379e-05, "Pretrain/Loss": 2.006450653076172, "Pretrain/Loss (Raw)": 1.7254647016525269, "Pretrain/Step": 11874, "Pretrain/Step Time": 8.417164821177721} +{"Pretrain/Learning Rate": 1.6462129964460434e-05, "Pretrain/Loss": 2.007941246032715, "Pretrain/Loss (Raw)": 2.060934543609619, "Pretrain/Step": 11875, "Pretrain/Step Time": 8.418135797604918} +{"Pretrain/Learning Rate": 1.6458140156240537e-05, "Pretrain/Loss": 2.006845235824585, "Pretrain/Loss (Raw)": 1.7757408618927002, "Pretrain/Step": 11876, "Pretrain/Step Time": 8.419881224632263} +{"Pretrain/Learning Rate": 1.6454150594319145e-05, "Pretrain/Loss": 2.0056872367858887, "Pretrain/Loss (Raw)": 1.8224217891693115, "Pretrain/Step": 11877, "Pretrain/Step Time": 8.424145940691233} +{"Pretrain/Learning Rate": 1.6450161278811307e-05, "Pretrain/Loss": 2.0078444480895996, "Pretrain/Loss (Raw)": 2.1505308151245117, "Pretrain/Step": 11878, "Pretrain/Step Time": 8.425605919212103} +{"Pretrain/Learning Rate": 1.6446172209832035e-05, "Pretrain/Loss": 2.007702350616455, "Pretrain/Loss (Raw)": 2.122051239013672, "Pretrain/Step": 11879, "Pretrain/Step Time": 8.429260769858956} +{"Pretrain/Learning Rate": 1.6442183387496357e-05, "Pretrain/Loss": 2.00628924369812, "Pretrain/Loss (Raw)": 1.9130868911743164, "Pretrain/Step": 11880, "Pretrain/Step Time": 8.425209868699312} +{"Pretrain/Learning Rate": 1.6438194811919286e-05, "Pretrain/Loss": 2.0066676139831543, "Pretrain/Loss (Raw)": 1.9697591066360474, "Pretrain/Step": 11881, "Pretrain/Step Time": 8.424592360854149} +{"Pretrain/Learning Rate": 1.6434206483215833e-05, "Pretrain/Loss": 2.007479190826416, "Pretrain/Loss (Raw)": 2.1160786151885986, "Pretrain/Step": 11882, "Pretrain/Step Time": 8.421429360285401} +{"Pretrain/Learning Rate": 1.6430218401501006e-05, "Pretrain/Loss": 2.0074462890625, "Pretrain/Loss (Raw)": 2.0531179904937744, "Pretrain/Step": 11883, "Pretrain/Step Time": 8.427283763885498} +{"Pretrain/Learning Rate": 1.6426230566889784e-05, "Pretrain/Loss": 2.0085878372192383, "Pretrain/Loss (Raw)": 1.9894541501998901, "Pretrain/Step": 11884, "Pretrain/Step Time": 8.428543420508504} +{"Pretrain/Learning Rate": 1.6422242979497162e-05, "Pretrain/Loss": 2.006375551223755, "Pretrain/Loss (Raw)": 1.8376697301864624, "Pretrain/Step": 11885, "Pretrain/Step Time": 8.431424230337143} +{"Pretrain/Learning Rate": 1.6418255639438113e-05, "Pretrain/Loss": 2.0070996284484863, "Pretrain/Loss (Raw)": 2.1015806198120117, "Pretrain/Step": 11886, "Pretrain/Step Time": 8.428357122465968} +{"Pretrain/Learning Rate": 1.641426854682761e-05, "Pretrain/Loss": 2.0076820850372314, "Pretrain/Loss (Raw)": 1.9722474813461304, "Pretrain/Step": 11887, "Pretrain/Step Time": 8.43073507770896} +{"Pretrain/Learning Rate": 1.6410281701780626e-05, "Pretrain/Loss": 2.007871150970459, "Pretrain/Loss (Raw)": 2.171231269836426, "Pretrain/Step": 11888, "Pretrain/Step Time": 8.430392449721694} +{"Pretrain/Learning Rate": 1.640629510441211e-05, "Pretrain/Loss": 2.0128424167633057, "Pretrain/Loss (Raw)": 2.454131841659546, "Pretrain/Step": 11889, "Pretrain/Step Time": 8.427611455321312} +{"Pretrain/Learning Rate": 1.6402308754837022e-05, "Pretrain/Loss": 2.0105466842651367, "Pretrain/Loss (Raw)": 1.7586805820465088, "Pretrain/Step": 11890, "Pretrain/Step Time": 8.425441034138203} +{"Pretrain/Learning Rate": 1.6398322653170296e-05, "Pretrain/Loss": 2.007058620452881, "Pretrain/Loss (Raw)": 1.734401822090149, "Pretrain/Step": 11891, "Pretrain/Step Time": 8.425672683864832} +{"Pretrain/Learning Rate": 1.6394336799526872e-05, "Pretrain/Loss": 2.0072951316833496, "Pretrain/Loss (Raw)": 2.0238609313964844, "Pretrain/Step": 11892, "Pretrain/Step Time": 8.429442927241325} +{"Pretrain/Learning Rate": 1.639035119402168e-05, "Pretrain/Loss": 2.0066239833831787, "Pretrain/Loss (Raw)": 1.951555848121643, "Pretrain/Step": 11893, "Pretrain/Step Time": 8.428881712257862} +{"Pretrain/Learning Rate": 1.638636583676964e-05, "Pretrain/Loss": 2.0052218437194824, "Pretrain/Loss (Raw)": 1.956275463104248, "Pretrain/Step": 11894, "Pretrain/Step Time": 8.430145842954516} +{"Pretrain/Learning Rate": 1.6382380727885677e-05, "Pretrain/Loss": 2.0063538551330566, "Pretrain/Loss (Raw)": 2.1394035816192627, "Pretrain/Step": 11895, "Pretrain/Step Time": 8.435352949425578} +{"Pretrain/Learning Rate": 1.637839586748468e-05, "Pretrain/Loss": 2.00453519821167, "Pretrain/Loss (Raw)": 2.0089304447174072, "Pretrain/Step": 11896, "Pretrain/Step Time": 8.435552403330803} +{"Pretrain/Learning Rate": 1.6374411255681568e-05, "Pretrain/Loss": 2.0029916763305664, "Pretrain/Loss (Raw)": 1.874518632888794, "Pretrain/Step": 11897, "Pretrain/Step Time": 8.433925142511725} +{"Pretrain/Learning Rate": 1.6370426892591224e-05, "Pretrain/Loss": 2.0017709732055664, "Pretrain/Loss (Raw)": 2.0461342334747314, "Pretrain/Step": 11898, "Pretrain/Step Time": 8.430890740826726} +{"Pretrain/Learning Rate": 1.6366442778328537e-05, "Pretrain/Loss": 2.004581928253174, "Pretrain/Loss (Raw)": 2.149970769882202, "Pretrain/Step": 11899, "Pretrain/Step Time": 8.432164715602994} +{"Pretrain/Learning Rate": 1.6362458913008387e-05, "Pretrain/Loss": 2.0032567977905273, "Pretrain/Loss (Raw)": 1.7269611358642578, "Pretrain/Step": 11900, "Pretrain/Step Time": 8.42850518040359} +{"Pretrain/Learning Rate": 1.6358475296745644e-05, "Pretrain/Loss": 2.0024073123931885, "Pretrain/Loss (Raw)": 2.0246224403381348, "Pretrain/Step": 11901, "Pretrain/Step Time": 8.427738070487976} +{"Pretrain/Learning Rate": 1.6354491929655176e-05, "Pretrain/Loss": 2.0027449131011963, "Pretrain/Loss (Raw)": 2.0185699462890625, "Pretrain/Step": 11902, "Pretrain/Step Time": 8.426242807880044} +{"Pretrain/Learning Rate": 1.6350508811851838e-05, "Pretrain/Loss": 2.00142765045166, "Pretrain/Loss (Raw)": 1.954984426498413, "Pretrain/Step": 11903, "Pretrain/Step Time": 8.427596844732761} +{"Pretrain/Learning Rate": 1.634652594345048e-05, "Pretrain/Loss": 1.9992396831512451, "Pretrain/Loss (Raw)": 2.0739524364471436, "Pretrain/Step": 11904, "Pretrain/Step Time": 8.4280273206532} +{"Pretrain/Learning Rate": 1.634254332456594e-05, "Pretrain/Loss": 1.9982335567474365, "Pretrain/Loss (Raw)": 1.9061836004257202, "Pretrain/Step": 11905, "Pretrain/Step Time": 8.423826906830072} +{"Pretrain/Learning Rate": 1.6338560955313076e-05, "Pretrain/Loss": 1.9994463920593262, "Pretrain/Loss (Raw)": 2.106503963470459, "Pretrain/Step": 11906, "Pretrain/Step Time": 8.423789558932185} +{"Pretrain/Learning Rate": 1.633457883580669e-05, "Pretrain/Loss": 1.9985742568969727, "Pretrain/Loss (Raw)": 1.9837549924850464, "Pretrain/Step": 11907, "Pretrain/Step Time": 8.422131888568401} +{"Pretrain/Learning Rate": 1.6330596966161614e-05, "Pretrain/Loss": 1.9988653659820557, "Pretrain/Loss (Raw)": 2.099618434906006, "Pretrain/Step": 11908, "Pretrain/Step Time": 8.418647438287735} +{"Pretrain/Learning Rate": 1.6326615346492662e-05, "Pretrain/Loss": 2.000063896179199, "Pretrain/Loss (Raw)": 2.0703136920928955, "Pretrain/Step": 11909, "Pretrain/Step Time": 8.42535650730133} +{"Pretrain/Learning Rate": 1.6322633976914644e-05, "Pretrain/Loss": 1.998288869857788, "Pretrain/Loss (Raw)": 1.8418124914169312, "Pretrain/Step": 11910, "Pretrain/Step Time": 8.422302857041359} +{"Pretrain/Learning Rate": 1.6318652857542365e-05, "Pretrain/Loss": 1.9988096952438354, "Pretrain/Loss (Raw)": 2.1271698474884033, "Pretrain/Step": 11911, "Pretrain/Step Time": 8.424131704494357} +{"Pretrain/Learning Rate": 1.6314671988490603e-05, "Pretrain/Loss": 1.999773383140564, "Pretrain/Loss (Raw)": 2.0491600036621094, "Pretrain/Step": 11912, "Pretrain/Step Time": 8.423698630183935} +{"Pretrain/Learning Rate": 1.6310691369874153e-05, "Pretrain/Loss": 1.9980868101119995, "Pretrain/Loss (Raw)": 1.8041727542877197, "Pretrain/Step": 11913, "Pretrain/Step Time": 8.423932235687971} +{"Pretrain/Learning Rate": 1.6306711001807793e-05, "Pretrain/Loss": 1.9993468523025513, "Pretrain/Loss (Raw)": 2.030799627304077, "Pretrain/Step": 11914, "Pretrain/Step Time": 8.42537321522832} +{"Pretrain/Learning Rate": 1.6302730884406288e-05, "Pretrain/Loss": 1.9999784231185913, "Pretrain/Loss (Raw)": 1.948091983795166, "Pretrain/Step": 11915, "Pretrain/Step Time": 8.424035901203752} +{"Pretrain/Learning Rate": 1.6298751017784415e-05, "Pretrain/Loss": 2.0017740726470947, "Pretrain/Loss (Raw)": 2.1688554286956787, "Pretrain/Step": 11916, "Pretrain/Step Time": 8.423207562416792} +{"Pretrain/Learning Rate": 1.629477140205692e-05, "Pretrain/Loss": 2.002870559692383, "Pretrain/Loss (Raw)": 1.9862580299377441, "Pretrain/Step": 11917, "Pretrain/Step Time": 8.423630835488439} +{"Pretrain/Learning Rate": 1.6290792037338552e-05, "Pretrain/Loss": 2.000452995300293, "Pretrain/Loss (Raw)": 1.8691128492355347, "Pretrain/Step": 11918, "Pretrain/Step Time": 8.423775600269437} +{"Pretrain/Learning Rate": 1.6286812923744053e-05, "Pretrain/Loss": 2.0014538764953613, "Pretrain/Loss (Raw)": 2.033400535583496, "Pretrain/Step": 11919, "Pretrain/Step Time": 8.420776022598147} +{"Pretrain/Learning Rate": 1.628283406138817e-05, "Pretrain/Loss": 2.002406120300293, "Pretrain/Loss (Raw)": 2.0619404315948486, "Pretrain/Step": 11920, "Pretrain/Step Time": 8.42079327814281} +{"Pretrain/Learning Rate": 1.627885545038562e-05, "Pretrain/Loss": 2.002486228942871, "Pretrain/Loss (Raw)": 2.0315778255462646, "Pretrain/Step": 11921, "Pretrain/Step Time": 8.422170482575893} +{"Pretrain/Learning Rate": 1.627487709085112e-05, "Pretrain/Loss": 2.0023326873779297, "Pretrain/Loss (Raw)": 1.9789072275161743, "Pretrain/Step": 11922, "Pretrain/Step Time": 8.422509090974927} +{"Pretrain/Learning Rate": 1.6270898982899392e-05, "Pretrain/Loss": 2.002284049987793, "Pretrain/Loss (Raw)": 1.8594917058944702, "Pretrain/Step": 11923, "Pretrain/Step Time": 8.417334597557783} +{"Pretrain/Learning Rate": 1.6266921126645133e-05, "Pretrain/Loss": 2.0025689601898193, "Pretrain/Loss (Raw)": 1.9528199434280396, "Pretrain/Step": 11924, "Pretrain/Step Time": 8.422220442444086} +{"Pretrain/Learning Rate": 1.626294352220305e-05, "Pretrain/Loss": 2.000059127807617, "Pretrain/Loss (Raw)": 1.7524996995925903, "Pretrain/Step": 11925, "Pretrain/Step Time": 8.420628560706973} +{"Pretrain/Learning Rate": 1.6258966169687833e-05, "Pretrain/Loss": 2.0015029907226562, "Pretrain/Loss (Raw)": 2.1380443572998047, "Pretrain/Step": 11926, "Pretrain/Step Time": 8.420391105115414} +{"Pretrain/Learning Rate": 1.625498906921416e-05, "Pretrain/Loss": 2.003539562225342, "Pretrain/Loss (Raw)": 2.1790289878845215, "Pretrain/Step": 11927, "Pretrain/Step Time": 8.4207384865731} +{"Pretrain/Learning Rate": 1.6251012220896716e-05, "Pretrain/Loss": 2.0024378299713135, "Pretrain/Loss (Raw)": 1.9581737518310547, "Pretrain/Step": 11928, "Pretrain/Step Time": 8.423501811921597} +{"Pretrain/Learning Rate": 1.624703562485017e-05, "Pretrain/Loss": 2.0020642280578613, "Pretrain/Loss (Raw)": 1.9943304061889648, "Pretrain/Step": 11929, "Pretrain/Step Time": 8.418754482641816} +{"Pretrain/Learning Rate": 1.6243059281189173e-05, "Pretrain/Loss": 2.003084897994995, "Pretrain/Loss (Raw)": 2.0470168590545654, "Pretrain/Step": 11930, "Pretrain/Step Time": 8.419436611235142} +{"Pretrain/Learning Rate": 1.6239083190028398e-05, "Pretrain/Loss": 2.001516580581665, "Pretrain/Loss (Raw)": 2.0535364151000977, "Pretrain/Step": 11931, "Pretrain/Step Time": 8.416837129741907} +{"Pretrain/Learning Rate": 1.623510735148248e-05, "Pretrain/Loss": 2.001796007156372, "Pretrain/Loss (Raw)": 2.0250632762908936, "Pretrain/Step": 11932, "Pretrain/Step Time": 8.414173113182187} +{"Pretrain/Learning Rate": 1.6231131765666057e-05, "Pretrain/Loss": 1.9955990314483643, "Pretrain/Loss (Raw)": 1.3749626874923706, "Pretrain/Step": 11933, "Pretrain/Step Time": 8.416690429672599} +{"Pretrain/Learning Rate": 1.6227156432693773e-05, "Pretrain/Loss": 1.9897018671035767, "Pretrain/Loss (Raw)": 1.6803280115127563, "Pretrain/Step": 11934, "Pretrain/Step Time": 8.419611914083362} +{"Pretrain/Learning Rate": 1.6223181352680245e-05, "Pretrain/Loss": 1.9877989292144775, "Pretrain/Loss (Raw)": 1.9302793741226196, "Pretrain/Step": 11935, "Pretrain/Step Time": 8.414798786863685} +{"Pretrain/Learning Rate": 1.6219206525740105e-05, "Pretrain/Loss": 1.9897711277008057, "Pretrain/Loss (Raw)": 2.2332820892333984, "Pretrain/Step": 11936, "Pretrain/Step Time": 8.41258592903614} +{"Pretrain/Learning Rate": 1.6215231951987948e-05, "Pretrain/Loss": 1.9902188777923584, "Pretrain/Loss (Raw)": 2.0156564712524414, "Pretrain/Step": 11937, "Pretrain/Step Time": 8.419260188937187} +{"Pretrain/Learning Rate": 1.621125763153838e-05, "Pretrain/Loss": 1.9898536205291748, "Pretrain/Loss (Raw)": 2.1009132862091064, "Pretrain/Step": 11938, "Pretrain/Step Time": 8.417609840631485} +{"Pretrain/Learning Rate": 1.620728356450601e-05, "Pretrain/Loss": 1.9908549785614014, "Pretrain/Loss (Raw)": 2.0371782779693604, "Pretrain/Step": 11939, "Pretrain/Step Time": 8.414695724844933} +{"Pretrain/Learning Rate": 1.6203309751005414e-05, "Pretrain/Loss": 1.990466833114624, "Pretrain/Loss (Raw)": 2.0032272338867188, "Pretrain/Step": 11940, "Pretrain/Step Time": 8.41635524481535} +{"Pretrain/Learning Rate": 1.6199336191151183e-05, "Pretrain/Loss": 1.9932682514190674, "Pretrain/Loss (Raw)": 2.1092681884765625, "Pretrain/Step": 11941, "Pretrain/Step Time": 8.419733429327607} +{"Pretrain/Learning Rate": 1.619536288505789e-05, "Pretrain/Loss": 1.9901416301727295, "Pretrain/Loss (Raw)": 1.6435750722885132, "Pretrain/Step": 11942, "Pretrain/Step Time": 8.42013137973845} +{"Pretrain/Learning Rate": 1.6191389832840103e-05, "Pretrain/Loss": 1.9906996488571167, "Pretrain/Loss (Raw)": 1.9256486892700195, "Pretrain/Step": 11943, "Pretrain/Step Time": 8.422282725572586} +{"Pretrain/Learning Rate": 1.6187417034612375e-05, "Pretrain/Loss": 1.9927618503570557, "Pretrain/Loss (Raw)": 2.1408910751342773, "Pretrain/Step": 11944, "Pretrain/Step Time": 8.419267948716879} +{"Pretrain/Learning Rate": 1.618344449048927e-05, "Pretrain/Loss": 1.9923579692840576, "Pretrain/Loss (Raw)": 2.1067116260528564, "Pretrain/Step": 11945, "Pretrain/Step Time": 8.421311363577843} +{"Pretrain/Learning Rate": 1.6179472200585323e-05, "Pretrain/Loss": 1.9900968074798584, "Pretrain/Loss (Raw)": 1.8007690906524658, "Pretrain/Step": 11946, "Pretrain/Step Time": 8.419268809258938} +{"Pretrain/Learning Rate": 1.6175500165015084e-05, "Pretrain/Loss": 1.988645315170288, "Pretrain/Loss (Raw)": 1.8447321653366089, "Pretrain/Step": 11947, "Pretrain/Step Time": 8.418238807469606} +{"Pretrain/Learning Rate": 1.617152838389307e-05, "Pretrain/Loss": 1.9902443885803223, "Pretrain/Loss (Raw)": 2.060232162475586, "Pretrain/Step": 11948, "Pretrain/Step Time": 8.41853447444737} +{"Pretrain/Learning Rate": 1.6167556857333814e-05, "Pretrain/Loss": 1.9894587993621826, "Pretrain/Loss (Raw)": 1.9316686391830444, "Pretrain/Step": 11949, "Pretrain/Step Time": 8.419419856742024} +{"Pretrain/Learning Rate": 1.6163585585451827e-05, "Pretrain/Loss": 1.986814260482788, "Pretrain/Loss (Raw)": 1.7536660432815552, "Pretrain/Step": 11950, "Pretrain/Step Time": 8.420648511499166} +{"Pretrain/Learning Rate": 1.615961456836162e-05, "Pretrain/Loss": 1.9871926307678223, "Pretrain/Loss (Raw)": 1.9716200828552246, "Pretrain/Step": 11951, "Pretrain/Step Time": 8.418576506897807} +{"Pretrain/Learning Rate": 1.6155643806177705e-05, "Pretrain/Loss": 1.9879963397979736, "Pretrain/Loss (Raw)": 2.1068971157073975, "Pretrain/Step": 11952, "Pretrain/Step Time": 8.414407340809703} +{"Pretrain/Learning Rate": 1.6151673299014556e-05, "Pretrain/Loss": 1.987518548965454, "Pretrain/Loss (Raw)": 2.137700080871582, "Pretrain/Step": 11953, "Pretrain/Step Time": 8.41381256468594} +{"Pretrain/Learning Rate": 1.614770304698667e-05, "Pretrain/Loss": 1.9875013828277588, "Pretrain/Loss (Raw)": 1.939715027809143, "Pretrain/Step": 11954, "Pretrain/Step Time": 8.417195919901133} +{"Pretrain/Learning Rate": 1.6143733050208525e-05, "Pretrain/Loss": 1.987741470336914, "Pretrain/Loss (Raw)": 2.1784720420837402, "Pretrain/Step": 11955, "Pretrain/Step Time": 8.41883241198957} +{"Pretrain/Learning Rate": 1.61397633087946e-05, "Pretrain/Loss": 1.986872911453247, "Pretrain/Loss (Raw)": 2.0540871620178223, "Pretrain/Step": 11956, "Pretrain/Step Time": 8.419585533440113} +{"Pretrain/Learning Rate": 1.6135793822859355e-05, "Pretrain/Loss": 1.9846923351287842, "Pretrain/Loss (Raw)": 1.843025803565979, "Pretrain/Step": 11957, "Pretrain/Step Time": 8.421896826475859} +{"Pretrain/Learning Rate": 1.6131824592517242e-05, "Pretrain/Loss": 1.9846398830413818, "Pretrain/Loss (Raw)": 1.9342784881591797, "Pretrain/Step": 11958, "Pretrain/Step Time": 8.427337927743793} +{"Pretrain/Learning Rate": 1.6127855617882714e-05, "Pretrain/Loss": 1.986611247062683, "Pretrain/Loss (Raw)": 2.047279119491577, "Pretrain/Step": 11959, "Pretrain/Step Time": 8.428892705589533} +{"Pretrain/Learning Rate": 1.6123886899070218e-05, "Pretrain/Loss": 1.9889668226242065, "Pretrain/Loss (Raw)": 2.086690664291382, "Pretrain/Step": 11960, "Pretrain/Step Time": 8.428496517241001} +{"Pretrain/Learning Rate": 1.6119918436194182e-05, "Pretrain/Loss": 1.9859716892242432, "Pretrain/Loss (Raw)": 1.776584267616272, "Pretrain/Step": 11961, "Pretrain/Step Time": 8.428946187719703} +{"Pretrain/Learning Rate": 1.6115950229369044e-05, "Pretrain/Loss": 1.9854360818862915, "Pretrain/Loss (Raw)": 2.0271167755126953, "Pretrain/Step": 11962, "Pretrain/Step Time": 8.428134797140956} +{"Pretrain/Learning Rate": 1.6111982278709213e-05, "Pretrain/Loss": 1.9891085624694824, "Pretrain/Loss (Raw)": 2.0875022411346436, "Pretrain/Step": 11963, "Pretrain/Step Time": 8.430130038410425} +{"Pretrain/Learning Rate": 1.610801458432911e-05, "Pretrain/Loss": 1.9858978986740112, "Pretrain/Loss (Raw)": 1.698472499847412, "Pretrain/Step": 11964, "Pretrain/Step Time": 8.429282383993268} +{"Pretrain/Learning Rate": 1.6104047146343138e-05, "Pretrain/Loss": 1.9860477447509766, "Pretrain/Loss (Raw)": 1.9438822269439697, "Pretrain/Step": 11965, "Pretrain/Step Time": 8.43136290833354} +{"Pretrain/Learning Rate": 1.6100079964865694e-05, "Pretrain/Loss": 1.9860823154449463, "Pretrain/Loss (Raw)": 2.146393060684204, "Pretrain/Step": 11966, "Pretrain/Step Time": 8.432377194985747} +{"Pretrain/Learning Rate": 1.609611304001118e-05, "Pretrain/Loss": 1.9861056804656982, "Pretrain/Loss (Raw)": 2.1095731258392334, "Pretrain/Step": 11967, "Pretrain/Step Time": 8.429819347336888} +{"Pretrain/Learning Rate": 1.6092146371893956e-05, "Pretrain/Loss": 1.983589768409729, "Pretrain/Loss (Raw)": 1.6611578464508057, "Pretrain/Step": 11968, "Pretrain/Step Time": 8.429592682048678} +{"Pretrain/Learning Rate": 1.608817996062842e-05, "Pretrain/Loss": 1.9833073616027832, "Pretrain/Loss (Raw)": 2.058504104614258, "Pretrain/Step": 11969, "Pretrain/Step Time": 8.431821629405022} +{"Pretrain/Learning Rate": 1.6084213806328928e-05, "Pretrain/Loss": 1.9833879470825195, "Pretrain/Loss (Raw)": 1.9857282638549805, "Pretrain/Step": 11970, "Pretrain/Step Time": 8.427321562543511} +{"Pretrain/Learning Rate": 1.6080247909109848e-05, "Pretrain/Loss": 1.9820274114608765, "Pretrain/Loss (Raw)": 1.7424657344818115, "Pretrain/Step": 11971, "Pretrain/Step Time": 8.427947638556361} +{"Pretrain/Learning Rate": 1.607628226908553e-05, "Pretrain/Loss": 1.9833862781524658, "Pretrain/Loss (Raw)": 1.9681395292282104, "Pretrain/Step": 11972, "Pretrain/Step Time": 8.427787909284234} +{"Pretrain/Learning Rate": 1.607231688637032e-05, "Pretrain/Loss": 1.9817872047424316, "Pretrain/Loss (Raw)": 1.766525149345398, "Pretrain/Step": 11973, "Pretrain/Step Time": 8.425702877342701} +{"Pretrain/Learning Rate": 1.606835176107856e-05, "Pretrain/Loss": 1.9821792840957642, "Pretrain/Loss (Raw)": 2.1943423748016357, "Pretrain/Step": 11974, "Pretrain/Step Time": 8.425294626504183} +{"Pretrain/Learning Rate": 1.6064386893324585e-05, "Pretrain/Loss": 1.984688639640808, "Pretrain/Loss (Raw)": 2.1682209968566895, "Pretrain/Step": 11975, "Pretrain/Step Time": 8.428197452798486} +{"Pretrain/Learning Rate": 1.6060422283222708e-05, "Pretrain/Loss": 1.9825177192687988, "Pretrain/Loss (Raw)": 2.0353922843933105, "Pretrain/Step": 11976, "Pretrain/Step Time": 8.428802322596312} +{"Pretrain/Learning Rate": 1.6056457930887254e-05, "Pretrain/Loss": 1.983034610748291, "Pretrain/Loss (Raw)": 2.025836229324341, "Pretrain/Step": 11977, "Pretrain/Step Time": 8.432053307071328} +{"Pretrain/Learning Rate": 1.6052493836432533e-05, "Pretrain/Loss": 1.9837114810943604, "Pretrain/Loss (Raw)": 2.1866774559020996, "Pretrain/Step": 11978, "Pretrain/Step Time": 8.430411256849766} +{"Pretrain/Learning Rate": 1.6048529999972843e-05, "Pretrain/Loss": 1.9840997457504272, "Pretrain/Loss (Raw)": 2.1477839946746826, "Pretrain/Step": 11979, "Pretrain/Step Time": 8.429730746895075} +{"Pretrain/Learning Rate": 1.6044566421622487e-05, "Pretrain/Loss": 1.9848004579544067, "Pretrain/Loss (Raw)": 1.992822289466858, "Pretrain/Step": 11980, "Pretrain/Step Time": 8.433516206219792} +{"Pretrain/Learning Rate": 1.6040603101495738e-05, "Pretrain/Loss": 1.9843926429748535, "Pretrain/Loss (Raw)": 1.8580936193466187, "Pretrain/Step": 11981, "Pretrain/Step Time": 8.432010667398572} +{"Pretrain/Learning Rate": 1.6036640039706883e-05, "Pretrain/Loss": 1.982546329498291, "Pretrain/Loss (Raw)": 1.7764114141464233, "Pretrain/Step": 11982, "Pretrain/Step Time": 8.433272330090404} +{"Pretrain/Learning Rate": 1.6032677236370192e-05, "Pretrain/Loss": 1.9810187816619873, "Pretrain/Loss (Raw)": 2.0847010612487793, "Pretrain/Step": 11983, "Pretrain/Step Time": 8.432476872578263} +{"Pretrain/Learning Rate": 1.6028714691599934e-05, "Pretrain/Loss": 1.9808199405670166, "Pretrain/Loss (Raw)": 1.9284614324569702, "Pretrain/Step": 11984, "Pretrain/Step Time": 8.435055719688535} +{"Pretrain/Learning Rate": 1.6024752405510367e-05, "Pretrain/Loss": 1.9820787906646729, "Pretrain/Loss (Raw)": 2.164421796798706, "Pretrain/Step": 11985, "Pretrain/Step Time": 8.438705429434776} +{"Pretrain/Learning Rate": 1.6020790378215732e-05, "Pretrain/Loss": 1.9821465015411377, "Pretrain/Loss (Raw)": 1.9646990299224854, "Pretrain/Step": 11986, "Pretrain/Step Time": 8.432889696210623} +{"Pretrain/Learning Rate": 1.6016828609830277e-05, "Pretrain/Loss": 1.9849369525909424, "Pretrain/Loss (Raw)": 2.25834321975708, "Pretrain/Step": 11987, "Pretrain/Step Time": 8.436283830553293} +{"Pretrain/Learning Rate": 1.6012867100468238e-05, "Pretrain/Loss": 1.9818183183670044, "Pretrain/Loss (Raw)": 1.7997982501983643, "Pretrain/Step": 11988, "Pretrain/Step Time": 8.437268825247884} +{"Pretrain/Learning Rate": 1.6008905850243838e-05, "Pretrain/Loss": 1.981788158416748, "Pretrain/Loss (Raw)": 1.9509541988372803, "Pretrain/Step": 11989, "Pretrain/Step Time": 8.437991853803396} +{"Pretrain/Learning Rate": 1.6004944859271303e-05, "Pretrain/Loss": 1.9829890727996826, "Pretrain/Loss (Raw)": 1.8608767986297607, "Pretrain/Step": 11990, "Pretrain/Step Time": 8.435752920806408} +{"Pretrain/Learning Rate": 1.600098412766484e-05, "Pretrain/Loss": 1.983328104019165, "Pretrain/Loss (Raw)": 1.887444019317627, "Pretrain/Step": 11991, "Pretrain/Step Time": 8.437433123588562} +{"Pretrain/Learning Rate": 1.5997023655538658e-05, "Pretrain/Loss": 1.978867769241333, "Pretrain/Loss (Raw)": 1.721940517425537, "Pretrain/Step": 11992, "Pretrain/Step Time": 8.439444379881024} +{"Pretrain/Learning Rate": 1.599306344300695e-05, "Pretrain/Loss": 1.9793275594711304, "Pretrain/Loss (Raw)": 2.022402286529541, "Pretrain/Step": 11993, "Pretrain/Step Time": 8.440527573227882} +{"Pretrain/Learning Rate": 1.5989103490183903e-05, "Pretrain/Loss": 1.981478214263916, "Pretrain/Loss (Raw)": 2.0028185844421387, "Pretrain/Step": 11994, "Pretrain/Step Time": 8.442541241645813} +{"Pretrain/Learning Rate": 1.5985143797183715e-05, "Pretrain/Loss": 1.9810535907745361, "Pretrain/Loss (Raw)": 2.0086669921875, "Pretrain/Step": 11995, "Pretrain/Step Time": 8.440690398216248} +{"Pretrain/Learning Rate": 1.598118436412055e-05, "Pretrain/Loss": 1.9809744358062744, "Pretrain/Loss (Raw)": 2.0313377380371094, "Pretrain/Step": 11996, "Pretrain/Step Time": 8.443112837150693} +{"Pretrain/Learning Rate": 1.5977225191108568e-05, "Pretrain/Loss": 1.9822092056274414, "Pretrain/Loss (Raw)": 2.048048496246338, "Pretrain/Step": 11997, "Pretrain/Step Time": 8.44065690971911} +{"Pretrain/Learning Rate": 1.597326627826194e-05, "Pretrain/Loss": 1.9819682836532593, "Pretrain/Loss (Raw)": 1.930859088897705, "Pretrain/Step": 11998, "Pretrain/Step Time": 8.44595380872488} +{"Pretrain/Learning Rate": 1.5969307625694814e-05, "Pretrain/Loss": 1.9833040237426758, "Pretrain/Loss (Raw)": 2.082111120223999, "Pretrain/Step": 11999, "Pretrain/Step Time": 8.440845273435116} +{"Pretrain/Learning Rate": 1.5965349233521344e-05, "Pretrain/Loss": 1.9837979078292847, "Pretrain/Loss (Raw)": 2.0381264686584473, "Pretrain/Step": 12000, "Pretrain/Step Time": 8.44279895350337} +{"Pretrain/Learning Rate": 1.5961391101855656e-05, "Pretrain/Loss": 1.9840251207351685, "Pretrain/Loss (Raw)": 2.0828516483306885, "Pretrain/Step": 12001, "Pretrain/Step Time": 8.444017890840769} +{"Pretrain/Learning Rate": 1.595743323081188e-05, "Pretrain/Loss": 1.985095500946045, "Pretrain/Loss (Raw)": 1.862480640411377, "Pretrain/Step": 12002, "Pretrain/Step Time": 8.444297052919865} +{"Pretrain/Learning Rate": 1.5953475620504144e-05, "Pretrain/Loss": 1.9856904745101929, "Pretrain/Loss (Raw)": 2.1370890140533447, "Pretrain/Step": 12003, "Pretrain/Step Time": 8.443223159760237} +{"Pretrain/Learning Rate": 1.5949518271046558e-05, "Pretrain/Loss": 1.9875984191894531, "Pretrain/Loss (Raw)": 2.0199646949768066, "Pretrain/Step": 12004, "Pretrain/Step Time": 8.440368175506592} +{"Pretrain/Learning Rate": 1.5945561182553237e-05, "Pretrain/Loss": 1.990177869796753, "Pretrain/Loss (Raw)": 2.1525938510894775, "Pretrain/Step": 12005, "Pretrain/Step Time": 8.437271855771542} +{"Pretrain/Learning Rate": 1.594160435513828e-05, "Pretrain/Loss": 1.9897668361663818, "Pretrain/Loss (Raw)": 2.097913980484009, "Pretrain/Step": 12006, "Pretrain/Step Time": 8.440310049802065} +{"Pretrain/Learning Rate": 1.5937647788915767e-05, "Pretrain/Loss": 1.9893403053283691, "Pretrain/Loss (Raw)": 2.0674471855163574, "Pretrain/Step": 12007, "Pretrain/Step Time": 8.43907910771668} +{"Pretrain/Learning Rate": 1.5933691483999798e-05, "Pretrain/Loss": 1.9891502857208252, "Pretrain/Loss (Raw)": 1.8887794017791748, "Pretrain/Step": 12008, "Pretrain/Step Time": 8.444303702563047} +{"Pretrain/Learning Rate": 1.592973544050444e-05, "Pretrain/Loss": 1.9914377927780151, "Pretrain/Loss (Raw)": 2.262547492980957, "Pretrain/Step": 12009, "Pretrain/Step Time": 8.443795865401626} +{"Pretrain/Learning Rate": 1.5925779658543764e-05, "Pretrain/Loss": 1.9905390739440918, "Pretrain/Loss (Raw)": 2.001044273376465, "Pretrain/Step": 12010, "Pretrain/Step Time": 8.443427566438913} +{"Pretrain/Learning Rate": 1.5921824138231843e-05, "Pretrain/Loss": 1.9913679361343384, "Pretrain/Loss (Raw)": 2.159207344055176, "Pretrain/Step": 12011, "Pretrain/Step Time": 8.44098242558539} +{"Pretrain/Learning Rate": 1.5917868879682718e-05, "Pretrain/Loss": 1.992222547531128, "Pretrain/Loss (Raw)": 2.0988502502441406, "Pretrain/Step": 12012, "Pretrain/Step Time": 8.439611351117492} +{"Pretrain/Learning Rate": 1.591391388301044e-05, "Pretrain/Loss": 1.993029236793518, "Pretrain/Loss (Raw)": 1.9409290552139282, "Pretrain/Step": 12013, "Pretrain/Step Time": 8.437788866460323} +{"Pretrain/Learning Rate": 1.5909959148329052e-05, "Pretrain/Loss": 1.9929931163787842, "Pretrain/Loss (Raw)": 2.0969653129577637, "Pretrain/Step": 12014, "Pretrain/Step Time": 8.44502106308937} +{"Pretrain/Learning Rate": 1.5906004675752583e-05, "Pretrain/Loss": 1.993788242340088, "Pretrain/Loss (Raw)": 2.0740017890930176, "Pretrain/Step": 12015, "Pretrain/Step Time": 8.440382555127144} +{"Pretrain/Learning Rate": 1.5902050465395065e-05, "Pretrain/Loss": 1.9931514263153076, "Pretrain/Loss (Raw)": 2.0897464752197266, "Pretrain/Step": 12016, "Pretrain/Step Time": 8.44267632625997} +{"Pretrain/Learning Rate": 1.5898096517370498e-05, "Pretrain/Loss": 1.9885963201522827, "Pretrain/Loss (Raw)": 1.8710625171661377, "Pretrain/Step": 12017, "Pretrain/Step Time": 8.444214655086398} +{"Pretrain/Learning Rate": 1.5894142831792906e-05, "Pretrain/Loss": 1.9899802207946777, "Pretrain/Loss (Raw)": 1.9358221292495728, "Pretrain/Step": 12018, "Pretrain/Step Time": 8.441849110648036} +{"Pretrain/Learning Rate": 1.5890189408776283e-05, "Pretrain/Loss": 1.9906022548675537, "Pretrain/Loss (Raw)": 1.814008116722107, "Pretrain/Step": 12019, "Pretrain/Step Time": 8.442167732864618} +{"Pretrain/Learning Rate": 1.588623624843463e-05, "Pretrain/Loss": 1.990206241607666, "Pretrain/Loss (Raw)": 1.973177433013916, "Pretrain/Step": 12020, "Pretrain/Step Time": 8.442229960113764} +{"Pretrain/Learning Rate": 1.5882283350881934e-05, "Pretrain/Loss": 1.9900822639465332, "Pretrain/Loss (Raw)": 1.9356956481933594, "Pretrain/Step": 12021, "Pretrain/Step Time": 8.437876770272851} +{"Pretrain/Learning Rate": 1.5878330716232163e-05, "Pretrain/Loss": 1.9907395839691162, "Pretrain/Loss (Raw)": 2.0404129028320312, "Pretrain/Step": 12022, "Pretrain/Step Time": 8.43960571102798} +{"Pretrain/Learning Rate": 1.5874378344599296e-05, "Pretrain/Loss": 1.9899487495422363, "Pretrain/Loss (Raw)": 2.03816294670105, "Pretrain/Step": 12023, "Pretrain/Step Time": 8.441914789378643} +{"Pretrain/Learning Rate": 1.58704262360973e-05, "Pretrain/Loss": 1.9899829626083374, "Pretrain/Loss (Raw)": 2.0133235454559326, "Pretrain/Step": 12024, "Pretrain/Step Time": 8.440627880394459} +{"Pretrain/Learning Rate": 1.5866474390840125e-05, "Pretrain/Loss": 1.9916467666625977, "Pretrain/Loss (Raw)": 2.0874850749969482, "Pretrain/Step": 12025, "Pretrain/Step Time": 8.442263355478644} +{"Pretrain/Learning Rate": 1.5862522808941726e-05, "Pretrain/Loss": 1.9917033910751343, "Pretrain/Loss (Raw)": 2.0533804893493652, "Pretrain/Step": 12026, "Pretrain/Step Time": 8.441149884834886} +{"Pretrain/Learning Rate": 1.5858571490516036e-05, "Pretrain/Loss": 1.990511417388916, "Pretrain/Loss (Raw)": 1.9973804950714111, "Pretrain/Step": 12027, "Pretrain/Step Time": 8.441582404077053} +{"Pretrain/Learning Rate": 1.5854620435676994e-05, "Pretrain/Loss": 1.9933949708938599, "Pretrain/Loss (Raw)": 2.096069574356079, "Pretrain/Step": 12028, "Pretrain/Step Time": 8.443453727290034} +{"Pretrain/Learning Rate": 1.5850669644538522e-05, "Pretrain/Loss": 1.99277663230896, "Pretrain/Loss (Raw)": 1.9454792737960815, "Pretrain/Step": 12029, "Pretrain/Step Time": 8.445034610107541} +{"Pretrain/Learning Rate": 1.584671911721454e-05, "Pretrain/Loss": 1.9944603443145752, "Pretrain/Loss (Raw)": 2.234092950820923, "Pretrain/Step": 12030, "Pretrain/Step Time": 8.44891950674355} +{"Pretrain/Learning Rate": 1.584276885381897e-05, "Pretrain/Loss": 1.994323968887329, "Pretrain/Loss (Raw)": 1.937516212463379, "Pretrain/Step": 12031, "Pretrain/Step Time": 8.448370158672333} +{"Pretrain/Learning Rate": 1.58388188544657e-05, "Pretrain/Loss": 1.991999626159668, "Pretrain/Loss (Raw)": 1.7764538526535034, "Pretrain/Step": 12032, "Pretrain/Step Time": 8.44980463013053} +{"Pretrain/Learning Rate": 1.5834869119268624e-05, "Pretrain/Loss": 1.9917346239089966, "Pretrain/Loss (Raw)": 1.8722518682479858, "Pretrain/Step": 12033, "Pretrain/Step Time": 8.450482986867428} +{"Pretrain/Learning Rate": 1.583091964834164e-05, "Pretrain/Loss": 1.9905097484588623, "Pretrain/Loss (Raw)": 1.9497100114822388, "Pretrain/Step": 12034, "Pretrain/Step Time": 8.448582749813795} +{"Pretrain/Learning Rate": 1.5826970441798623e-05, "Pretrain/Loss": 1.9918431043624878, "Pretrain/Loss (Raw)": 2.154421329498291, "Pretrain/Step": 12035, "Pretrain/Step Time": 8.448869599029422} +{"Pretrain/Learning Rate": 1.5823021499753455e-05, "Pretrain/Loss": 1.9905835390090942, "Pretrain/Loss (Raw)": 1.938398838043213, "Pretrain/Step": 12036, "Pretrain/Step Time": 8.454992989078164} +{"Pretrain/Learning Rate": 1.581907282231998e-05, "Pretrain/Loss": 1.9885121583938599, "Pretrain/Loss (Raw)": 1.8051804304122925, "Pretrain/Step": 12037, "Pretrain/Step Time": 8.45660818554461} +{"Pretrain/Learning Rate": 1.5815124409612075e-05, "Pretrain/Loss": 1.9887816905975342, "Pretrain/Loss (Raw)": 1.8763017654418945, "Pretrain/Step": 12038, "Pretrain/Step Time": 8.457264704629779} +{"Pretrain/Learning Rate": 1.5811176261743582e-05, "Pretrain/Loss": 1.9886715412139893, "Pretrain/Loss (Raw)": 2.113077163696289, "Pretrain/Step": 12039, "Pretrain/Step Time": 8.457727378234267} +{"Pretrain/Learning Rate": 1.5807228378828343e-05, "Pretrain/Loss": 1.9876350164413452, "Pretrain/Loss (Raw)": 1.9164913892745972, "Pretrain/Step": 12040, "Pretrain/Step Time": 8.457281706854701} +{"Pretrain/Learning Rate": 1.5803280760980187e-05, "Pretrain/Loss": 1.9885177612304688, "Pretrain/Loss (Raw)": 1.9171664714813232, "Pretrain/Step": 12041, "Pretrain/Step Time": 8.460282122716308} +{"Pretrain/Learning Rate": 1.579933340831296e-05, "Pretrain/Loss": 1.9877054691314697, "Pretrain/Loss (Raw)": 1.926828384399414, "Pretrain/Step": 12042, "Pretrain/Step Time": 8.455550717189908} +{"Pretrain/Learning Rate": 1.579538632094046e-05, "Pretrain/Loss": 1.9862685203552246, "Pretrain/Loss (Raw)": 1.7641578912734985, "Pretrain/Step": 12043, "Pretrain/Step Time": 8.458160109817982} +{"Pretrain/Learning Rate": 1.5791439498976507e-05, "Pretrain/Loss": 1.98395836353302, "Pretrain/Loss (Raw)": 1.873162865638733, "Pretrain/Step": 12044, "Pretrain/Step Time": 8.456656021997333} +{"Pretrain/Learning Rate": 1.5787492942534908e-05, "Pretrain/Loss": 1.9853334426879883, "Pretrain/Loss (Raw)": 2.1622564792633057, "Pretrain/Step": 12045, "Pretrain/Step Time": 8.458742586895823} +{"Pretrain/Learning Rate": 1.578354665172945e-05, "Pretrain/Loss": 1.9877265691757202, "Pretrain/Loss (Raw)": 2.175438642501831, "Pretrain/Step": 12046, "Pretrain/Step Time": 8.459622830152512} +{"Pretrain/Learning Rate": 1.5779600626673935e-05, "Pretrain/Loss": 1.9876034259796143, "Pretrain/Loss (Raw)": 2.017646074295044, "Pretrain/Step": 12047, "Pretrain/Step Time": 8.458344539627433} +{"Pretrain/Learning Rate": 1.577565486748213e-05, "Pretrain/Loss": 1.9879322052001953, "Pretrain/Loss (Raw)": 2.104027509689331, "Pretrain/Step": 12048, "Pretrain/Step Time": 8.456596460193396} +{"Pretrain/Learning Rate": 1.5771709374267814e-05, "Pretrain/Loss": 1.9863580465316772, "Pretrain/Loss (Raw)": 1.8300760984420776, "Pretrain/Step": 12049, "Pretrain/Step Time": 8.453265590593219} +{"Pretrain/Learning Rate": 1.5767764147144754e-05, "Pretrain/Loss": 1.9907913208007812, "Pretrain/Loss (Raw)": 2.5463712215423584, "Pretrain/Step": 12050, "Pretrain/Step Time": 8.451955942437053} +{"Pretrain/Learning Rate": 1.5763819186226704e-05, "Pretrain/Loss": 1.9905624389648438, "Pretrain/Loss (Raw)": 1.8301897048950195, "Pretrain/Step": 12051, "Pretrain/Step Time": 8.456014389172196} +{"Pretrain/Learning Rate": 1.575987449162743e-05, "Pretrain/Loss": 1.9924532175064087, "Pretrain/Loss (Raw)": 2.1948347091674805, "Pretrain/Step": 12052, "Pretrain/Step Time": 8.45402142778039} +{"Pretrain/Learning Rate": 1.575593006346065e-05, "Pretrain/Loss": 1.9942059516906738, "Pretrain/Loss (Raw)": 1.9768623113632202, "Pretrain/Step": 12053, "Pretrain/Step Time": 8.453886041417718} +{"Pretrain/Learning Rate": 1.5751985901840116e-05, "Pretrain/Loss": 1.9945766925811768, "Pretrain/Loss (Raw)": 2.185490369796753, "Pretrain/Step": 12054, "Pretrain/Step Time": 8.455962926149368} +{"Pretrain/Learning Rate": 1.5748042006879545e-05, "Pretrain/Loss": 1.9935954809188843, "Pretrain/Loss (Raw)": 2.0534181594848633, "Pretrain/Step": 12055, "Pretrain/Step Time": 8.457640124484897} +{"Pretrain/Learning Rate": 1.5744098378692657e-05, "Pretrain/Loss": 1.9933632612228394, "Pretrain/Loss (Raw)": 1.9284747838974, "Pretrain/Step": 12056, "Pretrain/Step Time": 8.456712942570448} +{"Pretrain/Learning Rate": 1.5740155017393167e-05, "Pretrain/Loss": 1.9920297861099243, "Pretrain/Loss (Raw)": 1.8236346244812012, "Pretrain/Step": 12057, "Pretrain/Step Time": 8.460648529231548} +{"Pretrain/Learning Rate": 1.5736211923094778e-05, "Pretrain/Loss": 1.9933574199676514, "Pretrain/Loss (Raw)": 2.2169601917266846, "Pretrain/Step": 12058, "Pretrain/Step Time": 8.45847175270319} +{"Pretrain/Learning Rate": 1.5732269095911198e-05, "Pretrain/Loss": 1.9916713237762451, "Pretrain/Loss (Raw)": 1.8377082347869873, "Pretrain/Step": 12059, "Pretrain/Step Time": 8.458231057971716} +{"Pretrain/Learning Rate": 1.5728326535956097e-05, "Pretrain/Loss": 1.993417501449585, "Pretrain/Loss (Raw)": 2.248575448989868, "Pretrain/Step": 12060, "Pretrain/Step Time": 8.46245482377708} +{"Pretrain/Learning Rate": 1.5724384243343165e-05, "Pretrain/Loss": 1.999000072479248, "Pretrain/Loss (Raw)": 2.089543104171753, "Pretrain/Step": 12061, "Pretrain/Step Time": 8.460104461759329} +{"Pretrain/Learning Rate": 1.5720442218186073e-05, "Pretrain/Loss": 2.0015363693237305, "Pretrain/Loss (Raw)": 2.0049707889556885, "Pretrain/Step": 12062, "Pretrain/Step Time": 8.46398051455617} +{"Pretrain/Learning Rate": 1.571650046059849e-05, "Pretrain/Loss": 2.000760078430176, "Pretrain/Loss (Raw)": 1.8309112787246704, "Pretrain/Step": 12063, "Pretrain/Step Time": 8.467321753501892} +{"Pretrain/Learning Rate": 1.5712558970694077e-05, "Pretrain/Loss": 1.997930884361267, "Pretrain/Loss (Raw)": 1.8711464405059814, "Pretrain/Step": 12064, "Pretrain/Step Time": 8.467131836339831} +{"Pretrain/Learning Rate": 1.5708617748586472e-05, "Pretrain/Loss": 1.9968513250350952, "Pretrain/Loss (Raw)": 1.8774700164794922, "Pretrain/Step": 12065, "Pretrain/Step Time": 8.460459230467677} +{"Pretrain/Learning Rate": 1.5704676794389328e-05, "Pretrain/Loss": 1.9966715574264526, "Pretrain/Loss (Raw)": 2.077908754348755, "Pretrain/Step": 12066, "Pretrain/Step Time": 8.460786949843168} +{"Pretrain/Learning Rate": 1.570073610821627e-05, "Pretrain/Loss": 1.9965343475341797, "Pretrain/Loss (Raw)": 2.0196096897125244, "Pretrain/Step": 12067, "Pretrain/Step Time": 8.461309904232621} +{"Pretrain/Learning Rate": 1.5696795690180936e-05, "Pretrain/Loss": 1.9980638027191162, "Pretrain/Loss (Raw)": 2.1989872455596924, "Pretrain/Step": 12068, "Pretrain/Step Time": 8.464041650295258} +{"Pretrain/Learning Rate": 1.5692855540396938e-05, "Pretrain/Loss": 1.9988629817962646, "Pretrain/Loss (Raw)": 2.2115697860717773, "Pretrain/Step": 12069, "Pretrain/Step Time": 8.462716814130545} +{"Pretrain/Learning Rate": 1.5688915658977893e-05, "Pretrain/Loss": 2.0001025199890137, "Pretrain/Loss (Raw)": 1.8022323846817017, "Pretrain/Step": 12070, "Pretrain/Step Time": 8.457834174856544} +{"Pretrain/Learning Rate": 1.5684976046037397e-05, "Pretrain/Loss": 2.0008602142333984, "Pretrain/Loss (Raw)": 2.0226101875305176, "Pretrain/Step": 12071, "Pretrain/Step Time": 8.456082921475172} +{"Pretrain/Learning Rate": 1.568103670168905e-05, "Pretrain/Loss": 1.9990650415420532, "Pretrain/Loss (Raw)": 1.9111407995224, "Pretrain/Step": 12072, "Pretrain/Step Time": 8.465395210310817} +{"Pretrain/Learning Rate": 1.5677097626046444e-05, "Pretrain/Loss": 1.9951565265655518, "Pretrain/Loss (Raw)": 1.6064178943634033, "Pretrain/Step": 12073, "Pretrain/Step Time": 8.464066276326776} +{"Pretrain/Learning Rate": 1.567315881922315e-05, "Pretrain/Loss": 1.9964735507965088, "Pretrain/Loss (Raw)": 1.9693437814712524, "Pretrain/Step": 12074, "Pretrain/Step Time": 8.464702462777495} +{"Pretrain/Learning Rate": 1.566922028133275e-05, "Pretrain/Loss": 1.9967550039291382, "Pretrain/Loss (Raw)": 1.8807601928710938, "Pretrain/Step": 12075, "Pretrain/Step Time": 8.464949170127511} +{"Pretrain/Learning Rate": 1.5665282012488808e-05, "Pretrain/Loss": 1.9954519271850586, "Pretrain/Loss (Raw)": 1.8934203386306763, "Pretrain/Step": 12076, "Pretrain/Step Time": 8.463329378515482} +{"Pretrain/Learning Rate": 1.5661344012804874e-05, "Pretrain/Loss": 1.9971470832824707, "Pretrain/Loss (Raw)": 2.148660898208618, "Pretrain/Step": 12077, "Pretrain/Step Time": 8.466543655842543} +{"Pretrain/Learning Rate": 1.5657406282394503e-05, "Pretrain/Loss": 1.9982891082763672, "Pretrain/Loss (Raw)": 1.8998342752456665, "Pretrain/Step": 12078, "Pretrain/Step Time": 8.462267640978098} +{"Pretrain/Learning Rate": 1.5653468821371238e-05, "Pretrain/Loss": 1.9955997467041016, "Pretrain/Loss (Raw)": 1.6273977756500244, "Pretrain/Step": 12079, "Pretrain/Step Time": 8.469653151929379} +{"Pretrain/Learning Rate": 1.5649531629848612e-05, "Pretrain/Loss": 1.9936251640319824, "Pretrain/Loss (Raw)": 1.8541460037231445, "Pretrain/Step": 12080, "Pretrain/Step Time": 8.473850464448333} +{"Pretrain/Learning Rate": 1.5645594707940147e-05, "Pretrain/Loss": 1.9924871921539307, "Pretrain/Loss (Raw)": 1.9920562505722046, "Pretrain/Step": 12081, "Pretrain/Step Time": 8.469573086127639} +{"Pretrain/Learning Rate": 1.564165805575936e-05, "Pretrain/Loss": 1.992645025253296, "Pretrain/Loss (Raw)": 1.9598987102508545, "Pretrain/Step": 12082, "Pretrain/Step Time": 8.469787692651153} +{"Pretrain/Learning Rate": 1.5637721673419774e-05, "Pretrain/Loss": 1.9911963939666748, "Pretrain/Loss (Raw)": 1.9930444955825806, "Pretrain/Step": 12083, "Pretrain/Step Time": 8.471067177131772} +{"Pretrain/Learning Rate": 1.5633785561034876e-05, "Pretrain/Loss": 1.9927940368652344, "Pretrain/Loss (Raw)": 2.258592367172241, "Pretrain/Step": 12084, "Pretrain/Step Time": 8.467016339302063} +{"Pretrain/Learning Rate": 1.5629849718718177e-05, "Pretrain/Loss": 1.9944392442703247, "Pretrain/Loss (Raw)": 2.053610324859619, "Pretrain/Step": 12085, "Pretrain/Step Time": 8.467939032241702} +{"Pretrain/Learning Rate": 1.5625914146583152e-05, "Pretrain/Loss": 1.9959566593170166, "Pretrain/Loss (Raw)": 2.12850284576416, "Pretrain/Step": 12086, "Pretrain/Step Time": 8.466488255187869} +{"Pretrain/Learning Rate": 1.5621978844743282e-05, "Pretrain/Loss": 1.9944086074829102, "Pretrain/Loss (Raw)": 1.8491264581680298, "Pretrain/Step": 12087, "Pretrain/Step Time": 8.463390581309795} +{"Pretrain/Learning Rate": 1.561804381331204e-05, "Pretrain/Loss": 1.993096113204956, "Pretrain/Loss (Raw)": 1.918704628944397, "Pretrain/Step": 12088, "Pretrain/Step Time": 8.465337105095387} +{"Pretrain/Learning Rate": 1.561410905240289e-05, "Pretrain/Loss": 1.994492530822754, "Pretrain/Loss (Raw)": 1.955327033996582, "Pretrain/Step": 12089, "Pretrain/Step Time": 8.466485425829887} +{"Pretrain/Learning Rate": 1.56101745621293e-05, "Pretrain/Loss": 1.9947459697723389, "Pretrain/Loss (Raw)": 2.0595362186431885, "Pretrain/Step": 12090, "Pretrain/Step Time": 8.469129908829927} +{"Pretrain/Learning Rate": 1.5606240342604697e-05, "Pretrain/Loss": 1.9948333501815796, "Pretrain/Loss (Raw)": 2.0987014770507812, "Pretrain/Step": 12091, "Pretrain/Step Time": 8.467817725613713} +{"Pretrain/Learning Rate": 1.5602306393942533e-05, "Pretrain/Loss": 1.9981131553649902, "Pretrain/Loss (Raw)": 2.118279457092285, "Pretrain/Step": 12092, "Pretrain/Step Time": 8.46545092947781} +{"Pretrain/Learning Rate": 1.5598372716256237e-05, "Pretrain/Loss": 1.9969488382339478, "Pretrain/Loss (Raw)": 1.7948520183563232, "Pretrain/Step": 12093, "Pretrain/Step Time": 8.468718318268657} +{"Pretrain/Learning Rate": 1.559443930965924e-05, "Pretrain/Loss": 1.9960730075836182, "Pretrain/Loss (Raw)": 2.0342912673950195, "Pretrain/Step": 12094, "Pretrain/Step Time": 8.468958307057619} +{"Pretrain/Learning Rate": 1.5590506174264956e-05, "Pretrain/Loss": 1.994541883468628, "Pretrain/Loss (Raw)": 1.9135879278182983, "Pretrain/Step": 12095, "Pretrain/Step Time": 8.473207775503397} +{"Pretrain/Learning Rate": 1.5586573310186793e-05, "Pretrain/Loss": 1.9997010231018066, "Pretrain/Loss (Raw)": 2.3215229511260986, "Pretrain/Step": 12096, "Pretrain/Step Time": 8.473056403920054} +{"Pretrain/Learning Rate": 1.558264071753815e-05, "Pretrain/Loss": 2.00058650970459, "Pretrain/Loss (Raw)": 2.171841859817505, "Pretrain/Step": 12097, "Pretrain/Step Time": 8.473290763795376} +{"Pretrain/Learning Rate": 1.5578708396432425e-05, "Pretrain/Loss": 2.0006093978881836, "Pretrain/Loss (Raw)": 1.9886834621429443, "Pretrain/Step": 12098, "Pretrain/Step Time": 8.472511280328035} +{"Pretrain/Learning Rate": 1.5574776346982994e-05, "Pretrain/Loss": 2.0041332244873047, "Pretrain/Loss (Raw)": 2.1935057640075684, "Pretrain/Step": 12099, "Pretrain/Step Time": 8.471934359520674} +{"Pretrain/Learning Rate": 1.5570844569303255e-05, "Pretrain/Loss": 2.005018472671509, "Pretrain/Loss (Raw)": 2.0814414024353027, "Pretrain/Step": 12100, "Pretrain/Step Time": 8.47118136100471} +{"Pretrain/Learning Rate": 1.556691306350656e-05, "Pretrain/Loss": 2.006441593170166, "Pretrain/Loss (Raw)": 1.9487096071243286, "Pretrain/Step": 12101, "Pretrain/Step Time": 8.466906288638711} +{"Pretrain/Learning Rate": 1.5562981829706273e-05, "Pretrain/Loss": 2.0044941902160645, "Pretrain/Loss (Raw)": 1.9450533390045166, "Pretrain/Step": 12102, "Pretrain/Step Time": 8.466275304555893} +{"Pretrain/Learning Rate": 1.5559050868015757e-05, "Pretrain/Loss": 2.0012011528015137, "Pretrain/Loss (Raw)": 1.7467248439788818, "Pretrain/Step": 12103, "Pretrain/Step Time": 8.4692991245538} +{"Pretrain/Learning Rate": 1.5555120178548356e-05, "Pretrain/Loss": 2.001659631729126, "Pretrain/Loss (Raw)": 2.0940589904785156, "Pretrain/Step": 12104, "Pretrain/Step Time": 8.468649007380009} +{"Pretrain/Learning Rate": 1.55511897614174e-05, "Pretrain/Loss": 2.0028088092803955, "Pretrain/Loss (Raw)": 2.1729416847229004, "Pretrain/Step": 12105, "Pretrain/Step Time": 8.46294210664928} +{"Pretrain/Learning Rate": 1.5547259616736233e-05, "Pretrain/Loss": 1.9982261657714844, "Pretrain/Loss (Raw)": 1.6000863313674927, "Pretrain/Step": 12106, "Pretrain/Step Time": 8.469172950834036} +{"Pretrain/Learning Rate": 1.5543329744618167e-05, "Pretrain/Loss": 1.9983423948287964, "Pretrain/Loss (Raw)": 2.1626758575439453, "Pretrain/Step": 12107, "Pretrain/Step Time": 8.467923855409026} +{"Pretrain/Learning Rate": 1.5539400145176523e-05, "Pretrain/Loss": 1.9986884593963623, "Pretrain/Loss (Raw)": 2.037128448486328, "Pretrain/Step": 12108, "Pretrain/Step Time": 8.464997032657266} +{"Pretrain/Learning Rate": 1.5535470818524602e-05, "Pretrain/Loss": 1.9995646476745605, "Pretrain/Loss (Raw)": 1.970229983329773, "Pretrain/Step": 12109, "Pretrain/Step Time": 8.459257742390037} +{"Pretrain/Learning Rate": 1.553154176477571e-05, "Pretrain/Loss": 2.0046961307525635, "Pretrain/Loss (Raw)": 2.4332528114318848, "Pretrain/Step": 12110, "Pretrain/Step Time": 8.458541713654995} +{"Pretrain/Learning Rate": 1.5527612984043145e-05, "Pretrain/Loss": 2.0037384033203125, "Pretrain/Loss (Raw)": 1.962092399597168, "Pretrain/Step": 12111, "Pretrain/Step Time": 8.460792053490877} +{"Pretrain/Learning Rate": 1.5523684476440174e-05, "Pretrain/Loss": 2.0034589767456055, "Pretrain/Loss (Raw)": 1.892706036567688, "Pretrain/Step": 12112, "Pretrain/Step Time": 8.462306225672364} +{"Pretrain/Learning Rate": 1.551975624208008e-05, "Pretrain/Loss": 2.001584529876709, "Pretrain/Loss (Raw)": 1.924500584602356, "Pretrain/Step": 12113, "Pretrain/Step Time": 8.460995178669691} +{"Pretrain/Learning Rate": 1.5515828281076135e-05, "Pretrain/Loss": 2.001063823699951, "Pretrain/Loss (Raw)": 1.8980330228805542, "Pretrain/Step": 12114, "Pretrain/Step Time": 8.463618785142899} +{"Pretrain/Learning Rate": 1.551190059354159e-05, "Pretrain/Loss": 1.9988359212875366, "Pretrain/Loss (Raw)": 1.9731900691986084, "Pretrain/Step": 12115, "Pretrain/Step Time": 8.45850982144475} +{"Pretrain/Learning Rate": 1.5507973179589712e-05, "Pretrain/Loss": 2.0010855197906494, "Pretrain/Loss (Raw)": 2.087747573852539, "Pretrain/Step": 12116, "Pretrain/Step Time": 8.456386923789978} +{"Pretrain/Learning Rate": 1.5504046039333732e-05, "Pretrain/Loss": 2.00226092338562, "Pretrain/Loss (Raw)": 2.101391077041626, "Pretrain/Step": 12117, "Pretrain/Step Time": 8.449524546042085} +{"Pretrain/Learning Rate": 1.5500119172886885e-05, "Pretrain/Loss": 2.0020930767059326, "Pretrain/Loss (Raw)": 1.8393902778625488, "Pretrain/Step": 12118, "Pretrain/Step Time": 8.451223196461797} +{"Pretrain/Learning Rate": 1.5496192580362405e-05, "Pretrain/Loss": 2.001269578933716, "Pretrain/Loss (Raw)": 1.7820415496826172, "Pretrain/Step": 12119, "Pretrain/Step Time": 8.45424504764378} +{"Pretrain/Learning Rate": 1.5492266261873518e-05, "Pretrain/Loss": 2.002730131149292, "Pretrain/Loss (Raw)": 1.908902883529663, "Pretrain/Step": 12120, "Pretrain/Step Time": 8.45423368550837} +{"Pretrain/Learning Rate": 1.548834021753343e-05, "Pretrain/Loss": 2.0016250610351562, "Pretrain/Loss (Raw)": 1.880960464477539, "Pretrain/Step": 12121, "Pretrain/Step Time": 8.456666143611073} +{"Pretrain/Learning Rate": 1.5484414447455348e-05, "Pretrain/Loss": 2.0003139972686768, "Pretrain/Loss (Raw)": 1.834981083869934, "Pretrain/Step": 12122, "Pretrain/Step Time": 8.454948192462325} +{"Pretrain/Learning Rate": 1.5480488951752463e-05, "Pretrain/Loss": 1.9987776279449463, "Pretrain/Loss (Raw)": 1.8120144605636597, "Pretrain/Step": 12123, "Pretrain/Step Time": 8.460032381117344} +{"Pretrain/Learning Rate": 1.5476563730537967e-05, "Pretrain/Loss": 1.9969854354858398, "Pretrain/Loss (Raw)": 1.8019264936447144, "Pretrain/Step": 12124, "Pretrain/Step Time": 8.458229660987854} +{"Pretrain/Learning Rate": 1.5472638783925048e-05, "Pretrain/Loss": 1.9989758729934692, "Pretrain/Loss (Raw)": 2.302837371826172, "Pretrain/Step": 12125, "Pretrain/Step Time": 8.455126162618399} +{"Pretrain/Learning Rate": 1.546871411202687e-05, "Pretrain/Loss": 1.9973859786987305, "Pretrain/Loss (Raw)": 1.7273503541946411, "Pretrain/Step": 12126, "Pretrain/Step Time": 8.452506098896265} +{"Pretrain/Learning Rate": 1.5464789714956602e-05, "Pretrain/Loss": 1.9955792427062988, "Pretrain/Loss (Raw)": 1.8508474826812744, "Pretrain/Step": 12127, "Pretrain/Step Time": 8.455351507291198} +{"Pretrain/Learning Rate": 1.54608655928274e-05, "Pretrain/Loss": 1.9966639280319214, "Pretrain/Loss (Raw)": 2.1769745349884033, "Pretrain/Step": 12128, "Pretrain/Step Time": 8.45495474152267} +{"Pretrain/Learning Rate": 1.545694174575241e-05, "Pretrain/Loss": 1.9972349405288696, "Pretrain/Loss (Raw)": 2.1559391021728516, "Pretrain/Step": 12129, "Pretrain/Step Time": 8.45434762723744} +{"Pretrain/Learning Rate": 1.5453018173844786e-05, "Pretrain/Loss": 1.997145414352417, "Pretrain/Loss (Raw)": 1.85100519657135, "Pretrain/Step": 12130, "Pretrain/Step Time": 8.450789323076606} +{"Pretrain/Learning Rate": 1.5449094877217652e-05, "Pretrain/Loss": 1.9970461130142212, "Pretrain/Loss (Raw)": 2.1243982315063477, "Pretrain/Step": 12131, "Pretrain/Step Time": 8.457617200911045} +{"Pretrain/Learning Rate": 1.544517185598413e-05, "Pretrain/Loss": 1.995934009552002, "Pretrain/Loss (Raw)": 1.877616286277771, "Pretrain/Step": 12132, "Pretrain/Step Time": 8.457110073417425} +{"Pretrain/Learning Rate": 1.544124911025734e-05, "Pretrain/Loss": 1.9949347972869873, "Pretrain/Loss (Raw)": 2.024688720703125, "Pretrain/Step": 12133, "Pretrain/Step Time": 8.459125138819218} +{"Pretrain/Learning Rate": 1.5437326640150395e-05, "Pretrain/Loss": 1.9920828342437744, "Pretrain/Loss (Raw)": 1.7328598499298096, "Pretrain/Step": 12134, "Pretrain/Step Time": 8.455024741590023} +{"Pretrain/Learning Rate": 1.54334044457764e-05, "Pretrain/Loss": 1.991138219833374, "Pretrain/Loss (Raw)": 1.9465386867523193, "Pretrain/Step": 12135, "Pretrain/Step Time": 8.456659629940987} +{"Pretrain/Learning Rate": 1.5429482527248444e-05, "Pretrain/Loss": 1.9922468662261963, "Pretrain/Loss (Raw)": 2.0306966304779053, "Pretrain/Step": 12136, "Pretrain/Step Time": 8.454543562605977} +{"Pretrain/Learning Rate": 1.542556088467961e-05, "Pretrain/Loss": 1.9892525672912598, "Pretrain/Loss (Raw)": 1.8792691230773926, "Pretrain/Step": 12137, "Pretrain/Step Time": 8.45677848905325} +{"Pretrain/Learning Rate": 1.5421639518182975e-05, "Pretrain/Loss": 1.98482346534729, "Pretrain/Loss (Raw)": 1.434108018875122, "Pretrain/Step": 12138, "Pretrain/Step Time": 8.457995314151049} +{"Pretrain/Learning Rate": 1.5417718427871618e-05, "Pretrain/Loss": 1.9839119911193848, "Pretrain/Loss (Raw)": 2.042567253112793, "Pretrain/Step": 12139, "Pretrain/Step Time": 8.456639368087053} +{"Pretrain/Learning Rate": 1.541379761385859e-05, "Pretrain/Loss": 1.9827502965927124, "Pretrain/Loss (Raw)": 1.9501336812973022, "Pretrain/Step": 12140, "Pretrain/Step Time": 8.456473244354129} +{"Pretrain/Learning Rate": 1.540987707625695e-05, "Pretrain/Loss": 1.981753945350647, "Pretrain/Loss (Raw)": 1.8133960962295532, "Pretrain/Step": 12141, "Pretrain/Step Time": 8.4547304417938} +{"Pretrain/Learning Rate": 1.5405956815179746e-05, "Pretrain/Loss": 1.980506181716919, "Pretrain/Loss (Raw)": 1.9372533559799194, "Pretrain/Step": 12142, "Pretrain/Step Time": 8.446627356112003} +{"Pretrain/Learning Rate": 1.5402036830740012e-05, "Pretrain/Loss": 1.9811747074127197, "Pretrain/Loss (Raw)": 2.1595752239227295, "Pretrain/Step": 12143, "Pretrain/Step Time": 8.451225150376558} +{"Pretrain/Learning Rate": 1.5398117123050788e-05, "Pretrain/Loss": 1.9806814193725586, "Pretrain/Loss (Raw)": 2.0266122817993164, "Pretrain/Step": 12144, "Pretrain/Step Time": 8.449907375499606} +{"Pretrain/Learning Rate": 1.5394197692225077e-05, "Pretrain/Loss": 1.9806444644927979, "Pretrain/Loss (Raw)": 1.866324782371521, "Pretrain/Step": 12145, "Pretrain/Step Time": 8.448335567489266} +{"Pretrain/Learning Rate": 1.5390278538375907e-05, "Pretrain/Loss": 1.9809588193893433, "Pretrain/Loss (Raw)": 1.9760648012161255, "Pretrain/Step": 12146, "Pretrain/Step Time": 8.449014350771904} +{"Pretrain/Learning Rate": 1.538635966161628e-05, "Pretrain/Loss": 1.9817296266555786, "Pretrain/Loss (Raw)": 1.9126604795455933, "Pretrain/Step": 12147, "Pretrain/Step Time": 8.447278957813978} +{"Pretrain/Learning Rate": 1.5382441062059193e-05, "Pretrain/Loss": 1.9801671504974365, "Pretrain/Loss (Raw)": 1.7731809616088867, "Pretrain/Step": 12148, "Pretrain/Step Time": 8.45073065534234} +{"Pretrain/Learning Rate": 1.5378522739817647e-05, "Pretrain/Loss": 1.9779398441314697, "Pretrain/Loss (Raw)": 1.6505974531173706, "Pretrain/Step": 12149, "Pretrain/Step Time": 8.451143145561218} +{"Pretrain/Learning Rate": 1.537460469500461e-05, "Pretrain/Loss": 1.977629542350769, "Pretrain/Loss (Raw)": 2.0007073879241943, "Pretrain/Step": 12150, "Pretrain/Step Time": 8.45146126486361} +{"Pretrain/Learning Rate": 1.537068692773306e-05, "Pretrain/Loss": 1.981184959411621, "Pretrain/Loss (Raw)": 2.4932475090026855, "Pretrain/Step": 12151, "Pretrain/Step Time": 8.445683110505342} +{"Pretrain/Learning Rate": 1.5366769438115962e-05, "Pretrain/Loss": 1.9809244871139526, "Pretrain/Loss (Raw)": 1.9799869060516357, "Pretrain/Step": 12152, "Pretrain/Step Time": 8.446566948667169} +{"Pretrain/Learning Rate": 1.5362852226266282e-05, "Pretrain/Loss": 1.9815011024475098, "Pretrain/Loss (Raw)": 2.1612863540649414, "Pretrain/Step": 12153, "Pretrain/Step Time": 8.444761838763952} +{"Pretrain/Learning Rate": 1.5358935292296967e-05, "Pretrain/Loss": 1.9816813468933105, "Pretrain/Loss (Raw)": 2.0764646530151367, "Pretrain/Step": 12154, "Pretrain/Step Time": 8.44654305651784} +{"Pretrain/Learning Rate": 1.535501863632095e-05, "Pretrain/Loss": 1.9810144901275635, "Pretrain/Loss (Raw)": 1.9120275974273682, "Pretrain/Step": 12155, "Pretrain/Step Time": 8.446214204654098} +{"Pretrain/Learning Rate": 1.535110225845117e-05, "Pretrain/Loss": 1.9807701110839844, "Pretrain/Loss (Raw)": 2.06478214263916, "Pretrain/Step": 12156, "Pretrain/Step Time": 8.446706073358655} +{"Pretrain/Learning Rate": 1.5347186158800554e-05, "Pretrain/Loss": 1.980150580406189, "Pretrain/Loss (Raw)": 1.8661811351776123, "Pretrain/Step": 12157, "Pretrain/Step Time": 8.445218527689576} +{"Pretrain/Learning Rate": 1.5343270337482023e-05, "Pretrain/Loss": 1.9785182476043701, "Pretrain/Loss (Raw)": 2.025151491165161, "Pretrain/Step": 12158, "Pretrain/Step Time": 8.445925360545516} +{"Pretrain/Learning Rate": 1.533935479460849e-05, "Pretrain/Loss": 1.9796202182769775, "Pretrain/Loss (Raw)": 2.078568935394287, "Pretrain/Step": 12159, "Pretrain/Step Time": 8.442621948197484} +{"Pretrain/Learning Rate": 1.5335439530292843e-05, "Pretrain/Loss": 1.9818185567855835, "Pretrain/Loss (Raw)": 2.057844400405884, "Pretrain/Step": 12160, "Pretrain/Step Time": 8.443227564916015} +{"Pretrain/Learning Rate": 1.5331524544647985e-05, "Pretrain/Loss": 1.9824931621551514, "Pretrain/Loss (Raw)": 1.9585868120193481, "Pretrain/Step": 12161, "Pretrain/Step Time": 8.441241743043065} +{"Pretrain/Learning Rate": 1.5327609837786803e-05, "Pretrain/Loss": 1.984336256980896, "Pretrain/Loss (Raw)": 2.185633897781372, "Pretrain/Step": 12162, "Pretrain/Step Time": 8.446131370961666} +{"Pretrain/Learning Rate": 1.532369540982217e-05, "Pretrain/Loss": 1.9808531999588013, "Pretrain/Loss (Raw)": 1.7086001634597778, "Pretrain/Step": 12163, "Pretrain/Step Time": 8.446572542190552} +{"Pretrain/Learning Rate": 1.5319781260866967e-05, "Pretrain/Loss": 1.9815244674682617, "Pretrain/Loss (Raw)": 2.024317979812622, "Pretrain/Step": 12164, "Pretrain/Step Time": 8.44465614296496} +{"Pretrain/Learning Rate": 1.5315867391034037e-05, "Pretrain/Loss": 1.9839614629745483, "Pretrain/Loss (Raw)": 2.117121934890747, "Pretrain/Step": 12165, "Pretrain/Step Time": 8.44235324114561} +{"Pretrain/Learning Rate": 1.531195380043625e-05, "Pretrain/Loss": 1.9851901531219482, "Pretrain/Loss (Raw)": 2.0335693359375, "Pretrain/Step": 12166, "Pretrain/Step Time": 8.43928649649024} +{"Pretrain/Learning Rate": 1.5308040489186443e-05, "Pretrain/Loss": 1.984591007232666, "Pretrain/Loss (Raw)": 2.0363826751708984, "Pretrain/Step": 12167, "Pretrain/Step Time": 8.439271442592144} +{"Pretrain/Learning Rate": 1.5304127457397455e-05, "Pretrain/Loss": 1.9844920635223389, "Pretrain/Loss (Raw)": 1.9038227796554565, "Pretrain/Step": 12168, "Pretrain/Step Time": 8.438624884933233} +{"Pretrain/Learning Rate": 1.5300214705182113e-05, "Pretrain/Loss": 1.984438180923462, "Pretrain/Loss (Raw)": 1.9102628231048584, "Pretrain/Step": 12169, "Pretrain/Step Time": 8.43527447246015} +{"Pretrain/Learning Rate": 1.5296302232653252e-05, "Pretrain/Loss": 1.9868414402008057, "Pretrain/Loss (Raw)": 2.2344443798065186, "Pretrain/Step": 12170, "Pretrain/Step Time": 8.442918768152595} +{"Pretrain/Learning Rate": 1.529239003992367e-05, "Pretrain/Loss": 1.9895446300506592, "Pretrain/Loss (Raw)": 2.110172748565674, "Pretrain/Step": 12171, "Pretrain/Step Time": 8.4391301702708} +{"Pretrain/Learning Rate": 1.528847812710618e-05, "Pretrain/Loss": 1.9889326095581055, "Pretrain/Loss (Raw)": 1.7948379516601562, "Pretrain/Step": 12172, "Pretrain/Step Time": 8.441149139776826} +{"Pretrain/Learning Rate": 1.5284566494313574e-05, "Pretrain/Loss": 1.9862897396087646, "Pretrain/Loss (Raw)": 1.823960542678833, "Pretrain/Step": 12173, "Pretrain/Step Time": 8.438402423635125} +{"Pretrain/Learning Rate": 1.5280655141658645e-05, "Pretrain/Loss": 1.9860141277313232, "Pretrain/Loss (Raw)": 2.140167236328125, "Pretrain/Step": 12174, "Pretrain/Step Time": 8.439237838611007} +{"Pretrain/Learning Rate": 1.527674406925418e-05, "Pretrain/Loss": 1.986443042755127, "Pretrain/Loss (Raw)": 2.07255220413208, "Pretrain/Step": 12175, "Pretrain/Step Time": 8.445547968149185} +{"Pretrain/Learning Rate": 1.5272833277212936e-05, "Pretrain/Loss": 1.9859435558319092, "Pretrain/Loss (Raw)": 2.0400800704956055, "Pretrain/Step": 12176, "Pretrain/Step Time": 8.444615840911865} +{"Pretrain/Learning Rate": 1.5268922765647693e-05, "Pretrain/Loss": 1.9862754344940186, "Pretrain/Loss (Raw)": 1.872541904449463, "Pretrain/Step": 12177, "Pretrain/Step Time": 8.448526049032807} +{"Pretrain/Learning Rate": 1.5265012534671198e-05, "Pretrain/Loss": 1.9830780029296875, "Pretrain/Loss (Raw)": 2.137108087539673, "Pretrain/Step": 12178, "Pretrain/Step Time": 8.444980731233954} +{"Pretrain/Learning Rate": 1.5261102584396203e-05, "Pretrain/Loss": 1.9838510751724243, "Pretrain/Loss (Raw)": 1.9291622638702393, "Pretrain/Step": 12179, "Pretrain/Step Time": 8.44333298318088} +{"Pretrain/Learning Rate": 1.5257192914935455e-05, "Pretrain/Loss": 1.9820687770843506, "Pretrain/Loss (Raw)": 1.9666895866394043, "Pretrain/Step": 12180, "Pretrain/Step Time": 8.442006142809987} +{"Pretrain/Learning Rate": 1.525328352640168e-05, "Pretrain/Loss": 1.9823226928710938, "Pretrain/Loss (Raw)": 2.009373426437378, "Pretrain/Step": 12181, "Pretrain/Step Time": 8.444057211279869} +{"Pretrain/Learning Rate": 1.5249374418907597e-05, "Pretrain/Loss": 1.9821054935455322, "Pretrain/Loss (Raw)": 2.1576807498931885, "Pretrain/Step": 12182, "Pretrain/Step Time": 8.439687952399254} +{"Pretrain/Learning Rate": 1.5245465592565933e-05, "Pretrain/Loss": 1.9815584421157837, "Pretrain/Loss (Raw)": 1.9834011793136597, "Pretrain/Step": 12183, "Pretrain/Step Time": 8.436100097373128} +{"Pretrain/Learning Rate": 1.5241557047489394e-05, "Pretrain/Loss": 1.9815435409545898, "Pretrain/Loss (Raw)": 1.9265583753585815, "Pretrain/Step": 12184, "Pretrain/Step Time": 8.443589076399803} +{"Pretrain/Learning Rate": 1.5237648783790682e-05, "Pretrain/Loss": 1.9838407039642334, "Pretrain/Loss (Raw)": 2.117669105529785, "Pretrain/Step": 12185, "Pretrain/Step Time": 8.438517659902573} +{"Pretrain/Learning Rate": 1.5233740801582478e-05, "Pretrain/Loss": 1.979832649230957, "Pretrain/Loss (Raw)": 1.7039353847503662, "Pretrain/Step": 12186, "Pretrain/Step Time": 8.443635823205113} +{"Pretrain/Learning Rate": 1.5229833100977476e-05, "Pretrain/Loss": 1.9816794395446777, "Pretrain/Loss (Raw)": 2.0741004943847656, "Pretrain/Step": 12187, "Pretrain/Step Time": 8.442569609731436} +{"Pretrain/Learning Rate": 1.5225925682088346e-05, "Pretrain/Loss": 1.9808156490325928, "Pretrain/Loss (Raw)": 2.1379997730255127, "Pretrain/Step": 12188, "Pretrain/Step Time": 8.440679581835866} +{"Pretrain/Learning Rate": 1.5222018545027761e-05, "Pretrain/Loss": 1.9815616607666016, "Pretrain/Loss (Raw)": 2.1850218772888184, "Pretrain/Step": 12189, "Pretrain/Step Time": 8.438625279814005} +{"Pretrain/Learning Rate": 1.5218111689908382e-05, "Pretrain/Loss": 1.9799602031707764, "Pretrain/Loss (Raw)": 1.8000062704086304, "Pretrain/Step": 12190, "Pretrain/Step Time": 8.436516553163528} +{"Pretrain/Learning Rate": 1.521420511684285e-05, "Pretrain/Loss": 1.9796314239501953, "Pretrain/Loss (Raw)": 1.7888180017471313, "Pretrain/Step": 12191, "Pretrain/Step Time": 8.43507468700409} +{"Pretrain/Learning Rate": 1.521029882594382e-05, "Pretrain/Loss": 1.9817469120025635, "Pretrain/Loss (Raw)": 2.1419360637664795, "Pretrain/Step": 12192, "Pretrain/Step Time": 8.440367287024856} +{"Pretrain/Learning Rate": 1.5206392817323918e-05, "Pretrain/Loss": 1.983328938484192, "Pretrain/Loss (Raw)": 2.0799505710601807, "Pretrain/Step": 12193, "Pretrain/Step Time": 8.44113645516336} +{"Pretrain/Learning Rate": 1.5202487091095776e-05, "Pretrain/Loss": 1.9840130805969238, "Pretrain/Loss (Raw)": 2.1655020713806152, "Pretrain/Step": 12194, "Pretrain/Step Time": 8.438136786222458} +{"Pretrain/Learning Rate": 1.5198581647372018e-05, "Pretrain/Loss": 1.9842981100082397, "Pretrain/Loss (Raw)": 2.0560789108276367, "Pretrain/Step": 12195, "Pretrain/Step Time": 8.43679234571755} +{"Pretrain/Learning Rate": 1.5194676486265242e-05, "Pretrain/Loss": 1.9822157621383667, "Pretrain/Loss (Raw)": 1.9324456453323364, "Pretrain/Step": 12196, "Pretrain/Step Time": 8.438445838168263} +{"Pretrain/Learning Rate": 1.5190771607888061e-05, "Pretrain/Loss": 1.9816845655441284, "Pretrain/Loss (Raw)": 2.1435773372650146, "Pretrain/Step": 12197, "Pretrain/Step Time": 8.43309567682445} +{"Pretrain/Learning Rate": 1.5186867012353062e-05, "Pretrain/Loss": 1.9841630458831787, "Pretrain/Loss (Raw)": 2.1194674968719482, "Pretrain/Step": 12198, "Pretrain/Step Time": 8.442861750721931} +{"Pretrain/Learning Rate": 1.5182962699772835e-05, "Pretrain/Loss": 1.9846371412277222, "Pretrain/Loss (Raw)": 2.083317279815674, "Pretrain/Step": 12199, "Pretrain/Step Time": 8.44381270930171} +{"Pretrain/Learning Rate": 1.5179058670259963e-05, "Pretrain/Loss": 1.9840425252914429, "Pretrain/Loss (Raw)": 1.8350105285644531, "Pretrain/Step": 12200, "Pretrain/Step Time": 8.441361043602228} +{"Pretrain/Learning Rate": 1.5175154923927007e-05, "Pretrain/Loss": 1.9870294332504272, "Pretrain/Loss (Raw)": 1.9887418746948242, "Pretrain/Step": 12201, "Pretrain/Step Time": 8.44132374227047} +{"Pretrain/Learning Rate": 1.5171251460886531e-05, "Pretrain/Loss": 1.9872620105743408, "Pretrain/Loss (Raw)": 1.9991108179092407, "Pretrain/Step": 12202, "Pretrain/Step Time": 8.442999217659235} +{"Pretrain/Learning Rate": 1.5167348281251092e-05, "Pretrain/Loss": 1.988721489906311, "Pretrain/Loss (Raw)": 2.0675854682922363, "Pretrain/Step": 12203, "Pretrain/Step Time": 8.44330508634448} +{"Pretrain/Learning Rate": 1.5163445385133234e-05, "Pretrain/Loss": 1.988639235496521, "Pretrain/Loss (Raw)": 1.8828884363174438, "Pretrain/Step": 12204, "Pretrain/Step Time": 8.444235181435943} +{"Pretrain/Learning Rate": 1.5159542772645492e-05, "Pretrain/Loss": 1.9878621101379395, "Pretrain/Loss (Raw)": 2.0491952896118164, "Pretrain/Step": 12205, "Pretrain/Step Time": 8.438023831695318} +{"Pretrain/Learning Rate": 1.5155640443900403e-05, "Pretrain/Loss": 1.9880363941192627, "Pretrain/Loss (Raw)": 1.9221376180648804, "Pretrain/Step": 12206, "Pretrain/Step Time": 8.444287575781345} +{"Pretrain/Learning Rate": 1.5151738399010479e-05, "Pretrain/Loss": 1.9904403686523438, "Pretrain/Loss (Raw)": 1.9351199865341187, "Pretrain/Step": 12207, "Pretrain/Step Time": 8.436238840222359} +{"Pretrain/Learning Rate": 1.5147836638088233e-05, "Pretrain/Loss": 1.9946017265319824, "Pretrain/Loss (Raw)": 2.3867974281311035, "Pretrain/Step": 12208, "Pretrain/Step Time": 8.438997711986303} +{"Pretrain/Learning Rate": 1.5143935161246176e-05, "Pretrain/Loss": 1.9935486316680908, "Pretrain/Loss (Raw)": 1.8572403192520142, "Pretrain/Step": 12209, "Pretrain/Step Time": 8.440800866112113} +{"Pretrain/Learning Rate": 1.5140033968596794e-05, "Pretrain/Loss": 1.9929534196853638, "Pretrain/Loss (Raw)": 1.883719801902771, "Pretrain/Step": 12210, "Pretrain/Step Time": 8.43874841183424} +{"Pretrain/Learning Rate": 1.5136133060252594e-05, "Pretrain/Loss": 1.9936237335205078, "Pretrain/Loss (Raw)": 2.0788345336914062, "Pretrain/Step": 12211, "Pretrain/Step Time": 8.43718390353024} +{"Pretrain/Learning Rate": 1.5132232436326032e-05, "Pretrain/Loss": 1.9922163486480713, "Pretrain/Loss (Raw)": 2.0784711837768555, "Pretrain/Step": 12212, "Pretrain/Step Time": 8.43944076448679} +{"Pretrain/Learning Rate": 1.5128332096929595e-05, "Pretrain/Loss": 1.9915741682052612, "Pretrain/Loss (Raw)": 1.971397042274475, "Pretrain/Step": 12213, "Pretrain/Step Time": 8.435089303180575} +{"Pretrain/Learning Rate": 1.5124432042175744e-05, "Pretrain/Loss": 1.99056077003479, "Pretrain/Loss (Raw)": 1.9987974166870117, "Pretrain/Step": 12214, "Pretrain/Step Time": 8.430713741108775} +{"Pretrain/Learning Rate": 1.5120532272176929e-05, "Pretrain/Loss": 1.9918169975280762, "Pretrain/Loss (Raw)": 2.0099313259124756, "Pretrain/Step": 12215, "Pretrain/Step Time": 8.43886061757803} +{"Pretrain/Learning Rate": 1.5116632787045613e-05, "Pretrain/Loss": 1.9918614625930786, "Pretrain/Loss (Raw)": 1.9243699312210083, "Pretrain/Step": 12216, "Pretrain/Step Time": 8.442401234060526} +{"Pretrain/Learning Rate": 1.5112733586894212e-05, "Pretrain/Loss": 1.9962934255599976, "Pretrain/Loss (Raw)": 2.5226192474365234, "Pretrain/Step": 12217, "Pretrain/Step Time": 8.440600702539086} +{"Pretrain/Learning Rate": 1.510883467183517e-05, "Pretrain/Loss": 1.996263027191162, "Pretrain/Loss (Raw)": 2.0556511878967285, "Pretrain/Step": 12218, "Pretrain/Step Time": 8.436372762545943} +{"Pretrain/Learning Rate": 1.510493604198091e-05, "Pretrain/Loss": 1.996608018875122, "Pretrain/Loss (Raw)": 2.142859697341919, "Pretrain/Step": 12219, "Pretrain/Step Time": 8.440361801534891} +{"Pretrain/Learning Rate": 1.5101037697443852e-05, "Pretrain/Loss": 1.9963321685791016, "Pretrain/Loss (Raw)": 2.0829923152923584, "Pretrain/Step": 12220, "Pretrain/Step Time": 8.440969295799732} +{"Pretrain/Learning Rate": 1.5097139638336382e-05, "Pretrain/Loss": 1.997161865234375, "Pretrain/Loss (Raw)": 1.9010276794433594, "Pretrain/Step": 12221, "Pretrain/Step Time": 8.433210803195834} +{"Pretrain/Learning Rate": 1.509324186477091e-05, "Pretrain/Loss": 1.997009038925171, "Pretrain/Loss (Raw)": 2.0147342681884766, "Pretrain/Step": 12222, "Pretrain/Step Time": 8.434794632717967} +{"Pretrain/Learning Rate": 1.5089344376859832e-05, "Pretrain/Loss": 1.9982205629348755, "Pretrain/Loss (Raw)": 2.068668842315674, "Pretrain/Step": 12223, "Pretrain/Step Time": 8.42637911811471} +{"Pretrain/Learning Rate": 1.5085447174715514e-05, "Pretrain/Loss": 1.9948927164077759, "Pretrain/Loss (Raw)": 1.8955562114715576, "Pretrain/Step": 12224, "Pretrain/Step Time": 8.431974733248353} +{"Pretrain/Learning Rate": 1.5081550258450338e-05, "Pretrain/Loss": 1.9934918880462646, "Pretrain/Loss (Raw)": 1.992530107498169, "Pretrain/Step": 12225, "Pretrain/Step Time": 8.431019764393568} +{"Pretrain/Learning Rate": 1.5077653628176672e-05, "Pretrain/Loss": 1.9952032566070557, "Pretrain/Loss (Raw)": 2.207737922668457, "Pretrain/Step": 12226, "Pretrain/Step Time": 8.430372579023242} +{"Pretrain/Learning Rate": 1.5073757284006868e-05, "Pretrain/Loss": 1.9927480220794678, "Pretrain/Loss (Raw)": 1.8792331218719482, "Pretrain/Step": 12227, "Pretrain/Step Time": 8.431427426636219} +{"Pretrain/Learning Rate": 1.5069861226053278e-05, "Pretrain/Loss": 1.9926426410675049, "Pretrain/Loss (Raw)": 2.0679776668548584, "Pretrain/Step": 12228, "Pretrain/Step Time": 8.433616809546947} +{"Pretrain/Learning Rate": 1.5065965454428233e-05, "Pretrain/Loss": 1.9917024374008179, "Pretrain/Loss (Raw)": 1.8283458948135376, "Pretrain/Step": 12229, "Pretrain/Step Time": 8.43723295815289} +{"Pretrain/Learning Rate": 1.5062069969244075e-05, "Pretrain/Loss": 1.9911363124847412, "Pretrain/Loss (Raw)": 1.872602939605713, "Pretrain/Step": 12230, "Pretrain/Step Time": 8.437517773360014} +{"Pretrain/Learning Rate": 1.5058174770613121e-05, "Pretrain/Loss": 1.9901427030563354, "Pretrain/Loss (Raw)": 1.619539499282837, "Pretrain/Step": 12231, "Pretrain/Step Time": 8.4328353703022} +{"Pretrain/Learning Rate": 1.505427985864769e-05, "Pretrain/Loss": 1.9887014627456665, "Pretrain/Loss (Raw)": 1.9095765352249146, "Pretrain/Step": 12232, "Pretrain/Step Time": 8.438918869942427} +{"Pretrain/Learning Rate": 1.505038523346009e-05, "Pretrain/Loss": 1.9853686094284058, "Pretrain/Loss (Raw)": 1.746330976486206, "Pretrain/Step": 12233, "Pretrain/Step Time": 8.44257671199739} +{"Pretrain/Learning Rate": 1.5046490895162618e-05, "Pretrain/Loss": 1.9876055717468262, "Pretrain/Loss (Raw)": 1.8864195346832275, "Pretrain/Step": 12234, "Pretrain/Step Time": 8.439344741404057} +{"Pretrain/Learning Rate": 1.5042596843867563e-05, "Pretrain/Loss": 1.985321044921875, "Pretrain/Loss (Raw)": 1.87026047706604, "Pretrain/Step": 12235, "Pretrain/Step Time": 8.438563702628016} +{"Pretrain/Learning Rate": 1.5038703079687205e-05, "Pretrain/Loss": 1.983472466468811, "Pretrain/Loss (Raw)": 1.8005162477493286, "Pretrain/Step": 12236, "Pretrain/Step Time": 8.43894568644464} +{"Pretrain/Learning Rate": 1.5034809602733824e-05, "Pretrain/Loss": 1.986078143119812, "Pretrain/Loss (Raw)": 2.3037424087524414, "Pretrain/Step": 12237, "Pretrain/Step Time": 8.443172520026565} +{"Pretrain/Learning Rate": 1.5030916413119684e-05, "Pretrain/Loss": 1.9828249216079712, "Pretrain/Loss (Raw)": 2.0168397426605225, "Pretrain/Step": 12238, "Pretrain/Step Time": 8.444075766950846} +{"Pretrain/Learning Rate": 1.5027023510957045e-05, "Pretrain/Loss": 1.9811482429504395, "Pretrain/Loss (Raw)": 1.7474921941757202, "Pretrain/Step": 12239, "Pretrain/Step Time": 8.44264523871243} +{"Pretrain/Learning Rate": 1.5023130896358145e-05, "Pretrain/Loss": 1.9829868078231812, "Pretrain/Loss (Raw)": 2.128023386001587, "Pretrain/Step": 12240, "Pretrain/Step Time": 8.438576562330127} +{"Pretrain/Learning Rate": 1.5019238569435235e-05, "Pretrain/Loss": 1.9836173057556152, "Pretrain/Loss (Raw)": 2.0052082538604736, "Pretrain/Step": 12241, "Pretrain/Step Time": 8.440288744866848} +{"Pretrain/Learning Rate": 1.5015346530300544e-05, "Pretrain/Loss": 1.981550931930542, "Pretrain/Loss (Raw)": 1.6335346698760986, "Pretrain/Step": 12242, "Pretrain/Step Time": 8.439551720395684} +{"Pretrain/Learning Rate": 1.50114547790663e-05, "Pretrain/Loss": 1.9814817905426025, "Pretrain/Loss (Raw)": 1.9643381834030151, "Pretrain/Step": 12243, "Pretrain/Step Time": 8.440966730937362} +{"Pretrain/Learning Rate": 1.5007563315844719e-05, "Pretrain/Loss": 1.9792767763137817, "Pretrain/Loss (Raw)": 1.8055185079574585, "Pretrain/Step": 12244, "Pretrain/Step Time": 8.441124299541116} +{"Pretrain/Learning Rate": 1.5003672140748e-05, "Pretrain/Loss": 1.9800500869750977, "Pretrain/Loss (Raw)": 2.2003657817840576, "Pretrain/Step": 12245, "Pretrain/Step Time": 8.441278476268053} +{"Pretrain/Learning Rate": 1.499978125388835e-05, "Pretrain/Loss": 1.9800370931625366, "Pretrain/Loss (Raw)": 1.83773934841156, "Pretrain/Step": 12246, "Pretrain/Step Time": 8.442544041201472} +{"Pretrain/Learning Rate": 1.4995890655377956e-05, "Pretrain/Loss": 1.9818193912506104, "Pretrain/Loss (Raw)": 2.0101749897003174, "Pretrain/Step": 12247, "Pretrain/Step Time": 8.439440505579114} +{"Pretrain/Learning Rate": 1.4992000345329002e-05, "Pretrain/Loss": 1.9817934036254883, "Pretrain/Loss (Raw)": 1.905577540397644, "Pretrain/Step": 12248, "Pretrain/Step Time": 8.442194623872638} +{"Pretrain/Learning Rate": 1.4988110323853671e-05, "Pretrain/Loss": 1.9838199615478516, "Pretrain/Loss (Raw)": 2.1403470039367676, "Pretrain/Step": 12249, "Pretrain/Step Time": 8.44082847982645} +{"Pretrain/Learning Rate": 1.4984220591064113e-05, "Pretrain/Loss": 1.9830410480499268, "Pretrain/Loss (Raw)": 1.7352977991104126, "Pretrain/Step": 12250, "Pretrain/Step Time": 8.444108977913857} +{"Pretrain/Learning Rate": 1.4980331147072493e-05, "Pretrain/Loss": 1.98574697971344, "Pretrain/Loss (Raw)": 2.1583588123321533, "Pretrain/Step": 12251, "Pretrain/Step Time": 8.440586319193244} +{"Pretrain/Learning Rate": 1.4976441991990964e-05, "Pretrain/Loss": 1.9877527952194214, "Pretrain/Loss (Raw)": 2.05867862701416, "Pretrain/Step": 12252, "Pretrain/Step Time": 8.438917690888047} +{"Pretrain/Learning Rate": 1.497255312593166e-05, "Pretrain/Loss": 1.987154245376587, "Pretrain/Loss (Raw)": 2.22621488571167, "Pretrain/Step": 12253, "Pretrain/Step Time": 8.445600889623165} +{"Pretrain/Learning Rate": 1.4968664549006728e-05, "Pretrain/Loss": 1.9895715713500977, "Pretrain/Loss (Raw)": 2.0367698669433594, "Pretrain/Step": 12254, "Pretrain/Step Time": 8.447716508060694} +{"Pretrain/Learning Rate": 1.4964776261328272e-05, "Pretrain/Loss": 1.9894258975982666, "Pretrain/Loss (Raw)": 1.8322023153305054, "Pretrain/Step": 12255, "Pretrain/Step Time": 8.445551432669163} +{"Pretrain/Learning Rate": 1.4960888263008421e-05, "Pretrain/Loss": 1.988903284072876, "Pretrain/Loss (Raw)": 2.1100683212280273, "Pretrain/Step": 12256, "Pretrain/Step Time": 8.445039708167315} +{"Pretrain/Learning Rate": 1.4957000554159279e-05, "Pretrain/Loss": 1.9842920303344727, "Pretrain/Loss (Raw)": 1.56569504737854, "Pretrain/Step": 12257, "Pretrain/Step Time": 8.445602545514703} +{"Pretrain/Learning Rate": 1.4953113134892946e-05, "Pretrain/Loss": 1.985661506652832, "Pretrain/Loss (Raw)": 2.0263280868530273, "Pretrain/Step": 12258, "Pretrain/Step Time": 8.446872025728226} +{"Pretrain/Learning Rate": 1.4949226005321517e-05, "Pretrain/Loss": 1.9855425357818604, "Pretrain/Loss (Raw)": 2.109135150909424, "Pretrain/Step": 12259, "Pretrain/Step Time": 8.43887952156365} +{"Pretrain/Learning Rate": 1.4945339165557068e-05, "Pretrain/Loss": 1.9888389110565186, "Pretrain/Loss (Raw)": 2.299581289291382, "Pretrain/Step": 12260, "Pretrain/Step Time": 8.4419995713979} +{"Pretrain/Learning Rate": 1.4941452615711676e-05, "Pretrain/Loss": 1.9885317087173462, "Pretrain/Loss (Raw)": 1.985358715057373, "Pretrain/Step": 12261, "Pretrain/Step Time": 8.43156835064292} +{"Pretrain/Learning Rate": 1.4937566355897406e-05, "Pretrain/Loss": 1.990966558456421, "Pretrain/Loss (Raw)": 2.0445189476013184, "Pretrain/Step": 12262, "Pretrain/Step Time": 8.435755053535104} +{"Pretrain/Learning Rate": 1.4933680386226317e-05, "Pretrain/Loss": 1.991852045059204, "Pretrain/Loss (Raw)": 2.059889554977417, "Pretrain/Step": 12263, "Pretrain/Step Time": 8.432120613753796} +{"Pretrain/Learning Rate": 1.4929794706810462e-05, "Pretrain/Loss": 1.9928593635559082, "Pretrain/Loss (Raw)": 2.159632444381714, "Pretrain/Step": 12264, "Pretrain/Step Time": 8.435856632888317} +{"Pretrain/Learning Rate": 1.4925909317761871e-05, "Pretrain/Loss": 1.9939531087875366, "Pretrain/Loss (Raw)": 2.019254446029663, "Pretrain/Step": 12265, "Pretrain/Step Time": 8.434645688161254} +{"Pretrain/Learning Rate": 1.4922024219192587e-05, "Pretrain/Loss": 1.9986385107040405, "Pretrain/Loss (Raw)": 2.0338568687438965, "Pretrain/Step": 12266, "Pretrain/Step Time": 8.434918278828263} +{"Pretrain/Learning Rate": 1.491813941121463e-05, "Pretrain/Loss": 1.9966645240783691, "Pretrain/Loss (Raw)": 1.7898756265640259, "Pretrain/Step": 12267, "Pretrain/Step Time": 8.437842041254044} +{"Pretrain/Learning Rate": 1.4914254893940014e-05, "Pretrain/Loss": 1.9948463439941406, "Pretrain/Loss (Raw)": 1.7174222469329834, "Pretrain/Step": 12268, "Pretrain/Step Time": 8.4365742392838} +{"Pretrain/Learning Rate": 1.491037066748075e-05, "Pretrain/Loss": 1.9956765174865723, "Pretrain/Loss (Raw)": 1.919645071029663, "Pretrain/Step": 12269, "Pretrain/Step Time": 8.439061269164085} +{"Pretrain/Learning Rate": 1.4906486731948838e-05, "Pretrain/Loss": 1.9933136701583862, "Pretrain/Loss (Raw)": 1.6348127126693726, "Pretrain/Step": 12270, "Pretrain/Step Time": 8.437849009409547} +{"Pretrain/Learning Rate": 1.490260308745626e-05, "Pretrain/Loss": 1.9906178712844849, "Pretrain/Loss (Raw)": 1.8145180940628052, "Pretrain/Step": 12271, "Pretrain/Step Time": 8.433857111260295} +{"Pretrain/Learning Rate": 1.4898719734115004e-05, "Pretrain/Loss": 1.9910873174667358, "Pretrain/Loss (Raw)": 2.086700916290283, "Pretrain/Step": 12272, "Pretrain/Step Time": 8.435632752254605} +{"Pretrain/Learning Rate": 1.4894836672037043e-05, "Pretrain/Loss": 1.9924468994140625, "Pretrain/Loss (Raw)": 2.0403504371643066, "Pretrain/Step": 12273, "Pretrain/Step Time": 8.435180973261595} +{"Pretrain/Learning Rate": 1.4890953901334347e-05, "Pretrain/Loss": 1.994576096534729, "Pretrain/Loss (Raw)": 2.248608112335205, "Pretrain/Step": 12274, "Pretrain/Step Time": 8.434538954868913} +{"Pretrain/Learning Rate": 1.488707142211887e-05, "Pretrain/Loss": 1.9942054748535156, "Pretrain/Loss (Raw)": 1.8652098178863525, "Pretrain/Step": 12275, "Pretrain/Step Time": 8.437405664473772} +{"Pretrain/Learning Rate": 1.4883189234502557e-05, "Pretrain/Loss": 1.9955575466156006, "Pretrain/Loss (Raw)": 1.9462581872940063, "Pretrain/Step": 12276, "Pretrain/Step Time": 8.432784451171756} +{"Pretrain/Learning Rate": 1.4879307338597347e-05, "Pretrain/Loss": 1.9954075813293457, "Pretrain/Loss (Raw)": 1.631389856338501, "Pretrain/Step": 12277, "Pretrain/Step Time": 8.437852857634425} +{"Pretrain/Learning Rate": 1.4875425734515181e-05, "Pretrain/Loss": 1.9945553541183472, "Pretrain/Loss (Raw)": 1.8916172981262207, "Pretrain/Step": 12278, "Pretrain/Step Time": 8.435473894700408} +{"Pretrain/Learning Rate": 1.4871544422367972e-05, "Pretrain/Loss": 1.990952491760254, "Pretrain/Loss (Raw)": 2.0320992469787598, "Pretrain/Step": 12279, "Pretrain/Step Time": 8.440695544704795} +{"Pretrain/Learning Rate": 1.4867663402267645e-05, "Pretrain/Loss": 1.9907985925674438, "Pretrain/Loss (Raw)": 1.9602857828140259, "Pretrain/Step": 12280, "Pretrain/Step Time": 8.435294447466731} +{"Pretrain/Learning Rate": 1.4863782674326096e-05, "Pretrain/Loss": 1.9882802963256836, "Pretrain/Loss (Raw)": 1.838930606842041, "Pretrain/Step": 12281, "Pretrain/Step Time": 8.444567162543535} +{"Pretrain/Learning Rate": 1.4859902238655226e-05, "Pretrain/Loss": 1.9895493984222412, "Pretrain/Loss (Raw)": 2.2389156818389893, "Pretrain/Step": 12282, "Pretrain/Step Time": 8.444124368950725} +{"Pretrain/Learning Rate": 1.4856022095366931e-05, "Pretrain/Loss": 1.9897876977920532, "Pretrain/Loss (Raw)": 1.9425278902053833, "Pretrain/Step": 12283, "Pretrain/Step Time": 8.443961517885327} +{"Pretrain/Learning Rate": 1.4852142244573086e-05, "Pretrain/Loss": 1.9895143508911133, "Pretrain/Loss (Raw)": 2.029796600341797, "Pretrain/Step": 12284, "Pretrain/Step Time": 8.44841823913157} +{"Pretrain/Learning Rate": 1.4848262686385572e-05, "Pretrain/Loss": 1.989671230316162, "Pretrain/Loss (Raw)": 1.8862580060958862, "Pretrain/Step": 12285, "Pretrain/Step Time": 8.448168663308024} +{"Pretrain/Learning Rate": 1.4844383420916238e-05, "Pretrain/Loss": 1.990993618965149, "Pretrain/Loss (Raw)": 2.1944098472595215, "Pretrain/Step": 12286, "Pretrain/Step Time": 8.442137368023396} +{"Pretrain/Learning Rate": 1.4840504448276953e-05, "Pretrain/Loss": 1.9900305271148682, "Pretrain/Loss (Raw)": 1.9553163051605225, "Pretrain/Step": 12287, "Pretrain/Step Time": 8.443428257480264} +{"Pretrain/Learning Rate": 1.483662576857956e-05, "Pretrain/Loss": 1.98799467086792, "Pretrain/Loss (Raw)": 1.7972477674484253, "Pretrain/Step": 12288, "Pretrain/Step Time": 8.44027521647513} +{"Pretrain/Learning Rate": 1.4832747381935897e-05, "Pretrain/Loss": 1.9907433986663818, "Pretrain/Loss (Raw)": 2.3104124069213867, "Pretrain/Step": 12289, "Pretrain/Step Time": 8.444543857127428} +{"Pretrain/Learning Rate": 1.4828869288457797e-05, "Pretrain/Loss": 1.9868426322937012, "Pretrain/Loss (Raw)": 1.686352014541626, "Pretrain/Step": 12290, "Pretrain/Step Time": 8.442148450762033} +{"Pretrain/Learning Rate": 1.482499148825708e-05, "Pretrain/Loss": 1.98921799659729, "Pretrain/Loss (Raw)": 2.0126607418060303, "Pretrain/Step": 12291, "Pretrain/Step Time": 8.440465241670609} +{"Pretrain/Learning Rate": 1.4821113981445561e-05, "Pretrain/Loss": 1.989728569984436, "Pretrain/Loss (Raw)": 2.089647054672241, "Pretrain/Step": 12292, "Pretrain/Step Time": 8.439607946202159} +{"Pretrain/Learning Rate": 1.4817236768135045e-05, "Pretrain/Loss": 1.9893391132354736, "Pretrain/Loss (Raw)": 2.0672690868377686, "Pretrain/Step": 12293, "Pretrain/Step Time": 8.43626113049686} +{"Pretrain/Learning Rate": 1.4813359848437325e-05, "Pretrain/Loss": 1.9876108169555664, "Pretrain/Loss (Raw)": 1.8123456239700317, "Pretrain/Step": 12294, "Pretrain/Step Time": 8.435660662129521} +{"Pretrain/Learning Rate": 1.4809483222464201e-05, "Pretrain/Loss": 1.986753225326538, "Pretrain/Loss (Raw)": 1.9266197681427002, "Pretrain/Step": 12295, "Pretrain/Step Time": 8.438427910208702} +{"Pretrain/Learning Rate": 1.480560689032744e-05, "Pretrain/Loss": 1.9876006841659546, "Pretrain/Loss (Raw)": 2.01229190826416, "Pretrain/Step": 12296, "Pretrain/Step Time": 8.440405016764998} +{"Pretrain/Learning Rate": 1.4801730852138814e-05, "Pretrain/Loss": 1.9905123710632324, "Pretrain/Loss (Raw)": 2.2829623222351074, "Pretrain/Step": 12297, "Pretrain/Step Time": 8.442152380943298} +{"Pretrain/Learning Rate": 1.4797855108010092e-05, "Pretrain/Loss": 1.9888970851898193, "Pretrain/Loss (Raw)": 2.027676820755005, "Pretrain/Step": 12298, "Pretrain/Step Time": 8.433634893968701} +{"Pretrain/Learning Rate": 1.4793979658053026e-05, "Pretrain/Loss": 1.9878631830215454, "Pretrain/Loss (Raw)": 1.977851390838623, "Pretrain/Step": 12299, "Pretrain/Step Time": 8.43556509166956} +{"Pretrain/Learning Rate": 1.4790104502379365e-05, "Pretrain/Loss": 1.9904890060424805, "Pretrain/Loss (Raw)": 2.1309406757354736, "Pretrain/Step": 12300, "Pretrain/Step Time": 8.443914635106921} +{"Pretrain/Learning Rate": 1.478622964110084e-05, "Pretrain/Loss": 1.9912184476852417, "Pretrain/Loss (Raw)": 1.9173219203948975, "Pretrain/Step": 12301, "Pretrain/Step Time": 8.444808211177588} +{"Pretrain/Learning Rate": 1.4782355074329182e-05, "Pretrain/Loss": 1.9924288988113403, "Pretrain/Loss (Raw)": 2.2950971126556396, "Pretrain/Step": 12302, "Pretrain/Step Time": 8.44211982935667} +{"Pretrain/Learning Rate": 1.4778480802176115e-05, "Pretrain/Loss": 1.992348313331604, "Pretrain/Loss (Raw)": 2.0622618198394775, "Pretrain/Step": 12303, "Pretrain/Step Time": 8.435071965679526} +{"Pretrain/Learning Rate": 1.4774606824753357e-05, "Pretrain/Loss": 1.990901231765747, "Pretrain/Loss (Raw)": 1.8548321723937988, "Pretrain/Step": 12304, "Pretrain/Step Time": 8.435576874762774} +{"Pretrain/Learning Rate": 1.477073314217259e-05, "Pretrain/Loss": 1.9925928115844727, "Pretrain/Loss (Raw)": 2.0890679359436035, "Pretrain/Step": 12305, "Pretrain/Step Time": 8.434881515800953} +{"Pretrain/Learning Rate": 1.4766859754545525e-05, "Pretrain/Loss": 1.9903315305709839, "Pretrain/Loss (Raw)": 1.8476665019989014, "Pretrain/Step": 12306, "Pretrain/Step Time": 8.43639980070293} +{"Pretrain/Learning Rate": 1.4762986661983844e-05, "Pretrain/Loss": 1.9924083948135376, "Pretrain/Loss (Raw)": 2.1950175762176514, "Pretrain/Step": 12307, "Pretrain/Step Time": 8.437873467803001} +{"Pretrain/Learning Rate": 1.4759113864599231e-05, "Pretrain/Loss": 1.9925973415374756, "Pretrain/Loss (Raw)": 1.9908543825149536, "Pretrain/Step": 12308, "Pretrain/Step Time": 8.437557194381952} +{"Pretrain/Learning Rate": 1.4755241362503345e-05, "Pretrain/Loss": 1.9909937381744385, "Pretrain/Loss (Raw)": 1.8041185140609741, "Pretrain/Step": 12309, "Pretrain/Step Time": 8.432833082973957} +{"Pretrain/Learning Rate": 1.4751369155807854e-05, "Pretrain/Loss": 1.9898827075958252, "Pretrain/Loss (Raw)": 2.015454053878784, "Pretrain/Step": 12310, "Pretrain/Step Time": 8.43700797483325} +{"Pretrain/Learning Rate": 1.4747497244624403e-05, "Pretrain/Loss": 1.9907852411270142, "Pretrain/Loss (Raw)": 2.098951578140259, "Pretrain/Step": 12311, "Pretrain/Step Time": 8.440785428509116} +{"Pretrain/Learning Rate": 1.4743625629064647e-05, "Pretrain/Loss": 1.9912734031677246, "Pretrain/Loss (Raw)": 1.9890109300613403, "Pretrain/Step": 12312, "Pretrain/Step Time": 8.435386028140783} +{"Pretrain/Learning Rate": 1.473975430924022e-05, "Pretrain/Loss": 1.9916497468948364, "Pretrain/Loss (Raw)": 2.1658520698547363, "Pretrain/Step": 12313, "Pretrain/Step Time": 8.43329225666821} +{"Pretrain/Learning Rate": 1.4735883285262739e-05, "Pretrain/Loss": 1.9924461841583252, "Pretrain/Loss (Raw)": 1.8058749437332153, "Pretrain/Step": 12314, "Pretrain/Step Time": 8.432214848697186} +{"Pretrain/Learning Rate": 1.4732012557243826e-05, "Pretrain/Loss": 1.9923264980316162, "Pretrain/Loss (Raw)": 2.058786153793335, "Pretrain/Step": 12315, "Pretrain/Step Time": 8.437086423859} +{"Pretrain/Learning Rate": 1.4728142125295094e-05, "Pretrain/Loss": 1.9925751686096191, "Pretrain/Loss (Raw)": 2.169828414916992, "Pretrain/Step": 12316, "Pretrain/Step Time": 8.43588613346219} +{"Pretrain/Learning Rate": 1.4724271989528143e-05, "Pretrain/Loss": 1.991308331489563, "Pretrain/Loss (Raw)": 2.0228781700134277, "Pretrain/Step": 12317, "Pretrain/Step Time": 8.44217157177627} +{"Pretrain/Learning Rate": 1.472040215005457e-05, "Pretrain/Loss": 1.9931058883666992, "Pretrain/Loss (Raw)": 2.0300748348236084, "Pretrain/Step": 12318, "Pretrain/Step Time": 8.444014167413116} +{"Pretrain/Learning Rate": 1.471653260698595e-05, "Pretrain/Loss": 1.9932833909988403, "Pretrain/Loss (Raw)": 1.8115439414978027, "Pretrain/Step": 12319, "Pretrain/Step Time": 8.444101398810744} +{"Pretrain/Learning Rate": 1.4712663360433862e-05, "Pretrain/Loss": 1.9916553497314453, "Pretrain/Loss (Raw)": 1.9335405826568604, "Pretrain/Step": 12320, "Pretrain/Step Time": 8.438538456335664} +{"Pretrain/Learning Rate": 1.4708794410509874e-05, "Pretrain/Loss": 1.9905556440353394, "Pretrain/Loss (Raw)": 1.9392019510269165, "Pretrain/Step": 12321, "Pretrain/Step Time": 8.440680855885148} +{"Pretrain/Learning Rate": 1.4704925757325543e-05, "Pretrain/Loss": 1.9898748397827148, "Pretrain/Loss (Raw)": 2.0783565044403076, "Pretrain/Step": 12322, "Pretrain/Step Time": 8.44094175286591} +{"Pretrain/Learning Rate": 1.4701057400992427e-05, "Pretrain/Loss": 1.989956021308899, "Pretrain/Loss (Raw)": 2.0664713382720947, "Pretrain/Step": 12323, "Pretrain/Step Time": 8.43932718411088} +{"Pretrain/Learning Rate": 1.4697189341622056e-05, "Pretrain/Loss": 1.9918748140335083, "Pretrain/Loss (Raw)": 2.178046226501465, "Pretrain/Step": 12324, "Pretrain/Step Time": 8.438031263649464} +{"Pretrain/Learning Rate": 1.4693321579325966e-05, "Pretrain/Loss": 1.9914393424987793, "Pretrain/Loss (Raw)": 2.087843656539917, "Pretrain/Step": 12325, "Pretrain/Step Time": 8.439783833920956} +{"Pretrain/Learning Rate": 1.4689454114215684e-05, "Pretrain/Loss": 1.9913954734802246, "Pretrain/Loss (Raw)": 2.113839626312256, "Pretrain/Step": 12326, "Pretrain/Step Time": 8.432746337726712} +{"Pretrain/Learning Rate": 1.4685586946402725e-05, "Pretrain/Loss": 1.9919687509536743, "Pretrain/Loss (Raw)": 2.1567037105560303, "Pretrain/Step": 12327, "Pretrain/Step Time": 8.431886196136475} +{"Pretrain/Learning Rate": 1.4681720075998595e-05, "Pretrain/Loss": 1.9941911697387695, "Pretrain/Loss (Raw)": 2.119464159011841, "Pretrain/Step": 12328, "Pretrain/Step Time": 8.431197991594672} +{"Pretrain/Learning Rate": 1.4677853503114791e-05, "Pretrain/Loss": 1.9949791431427002, "Pretrain/Loss (Raw)": 2.0896246433258057, "Pretrain/Step": 12329, "Pretrain/Step Time": 8.430131027475} +{"Pretrain/Learning Rate": 1.4673987227862806e-05, "Pretrain/Loss": 1.9958291053771973, "Pretrain/Loss (Raw)": 2.107905864715576, "Pretrain/Step": 12330, "Pretrain/Step Time": 8.429137071594596} +{"Pretrain/Learning Rate": 1.467012125035412e-05, "Pretrain/Loss": 1.9956276416778564, "Pretrain/Loss (Raw)": 2.0418031215667725, "Pretrain/Step": 12331, "Pretrain/Step Time": 8.426724491640925} +{"Pretrain/Learning Rate": 1.4666255570700202e-05, "Pretrain/Loss": 1.9984731674194336, "Pretrain/Loss (Raw)": 2.2470998764038086, "Pretrain/Step": 12332, "Pretrain/Step Time": 8.427960697561502} +{"Pretrain/Learning Rate": 1.4662390189012525e-05, "Pretrain/Loss": 1.9973706007003784, "Pretrain/Loss (Raw)": 1.9080772399902344, "Pretrain/Step": 12333, "Pretrain/Step Time": 8.434253171086311} +{"Pretrain/Learning Rate": 1.4658525105402537e-05, "Pretrain/Loss": 1.9977025985717773, "Pretrain/Loss (Raw)": 1.964624047279358, "Pretrain/Step": 12334, "Pretrain/Step Time": 8.430270336568356} +{"Pretrain/Learning Rate": 1.465466031998169e-05, "Pretrain/Loss": 1.9983799457550049, "Pretrain/Loss (Raw)": 2.021811008453369, "Pretrain/Step": 12335, "Pretrain/Step Time": 8.434001913294196} +{"Pretrain/Learning Rate": 1.4650795832861414e-05, "Pretrain/Loss": 1.9973335266113281, "Pretrain/Loss (Raw)": 2.2528698444366455, "Pretrain/Step": 12336, "Pretrain/Step Time": 8.430160401389003} +{"Pretrain/Learning Rate": 1.464693164415315e-05, "Pretrain/Loss": 1.9981001615524292, "Pretrain/Loss (Raw)": 1.9553803205490112, "Pretrain/Step": 12337, "Pretrain/Step Time": 8.429923424497247} +{"Pretrain/Learning Rate": 1.464306775396831e-05, "Pretrain/Loss": 1.9969491958618164, "Pretrain/Loss (Raw)": 1.736390233039856, "Pretrain/Step": 12338, "Pretrain/Step Time": 8.42869502492249} +{"Pretrain/Learning Rate": 1.4639204162418313e-05, "Pretrain/Loss": 1.9948054552078247, "Pretrain/Loss (Raw)": 1.8044352531433105, "Pretrain/Step": 12339, "Pretrain/Step Time": 8.433817185461521} +{"Pretrain/Learning Rate": 1.463534086961456e-05, "Pretrain/Loss": 1.9929828643798828, "Pretrain/Loss (Raw)": 1.845166802406311, "Pretrain/Step": 12340, "Pretrain/Step Time": 8.431007407605648} +{"Pretrain/Learning Rate": 1.4631477875668442e-05, "Pretrain/Loss": 1.9926342964172363, "Pretrain/Loss (Raw)": 1.9267990589141846, "Pretrain/Step": 12341, "Pretrain/Step Time": 8.434404779225588} +{"Pretrain/Learning Rate": 1.4627615180691353e-05, "Pretrain/Loss": 1.991753101348877, "Pretrain/Loss (Raw)": 1.8859928846359253, "Pretrain/Step": 12342, "Pretrain/Step Time": 8.432397058233619} +{"Pretrain/Learning Rate": 1.462375278479467e-05, "Pretrain/Loss": 1.990796685218811, "Pretrain/Loss (Raw)": 1.8875024318695068, "Pretrain/Step": 12343, "Pretrain/Step Time": 8.43129281513393} +{"Pretrain/Learning Rate": 1.461989068808976e-05, "Pretrain/Loss": 1.9883006811141968, "Pretrain/Loss (Raw)": 1.6048848628997803, "Pretrain/Step": 12344, "Pretrain/Step Time": 8.433771401643753} +{"Pretrain/Learning Rate": 1.4616028890687982e-05, "Pretrain/Loss": 1.9854977130889893, "Pretrain/Loss (Raw)": 2.1638412475585938, "Pretrain/Step": 12345, "Pretrain/Step Time": 8.435705456882715} +{"Pretrain/Learning Rate": 1.4612167392700694e-05, "Pretrain/Loss": 1.9835174083709717, "Pretrain/Loss (Raw)": 1.8021825551986694, "Pretrain/Step": 12346, "Pretrain/Step Time": 8.436656663194299} +{"Pretrain/Learning Rate": 1.4608306194239236e-05, "Pretrain/Loss": 1.9797157049179077, "Pretrain/Loss (Raw)": 1.6562412977218628, "Pretrain/Step": 12347, "Pretrain/Step Time": 8.434298733249307} +{"Pretrain/Learning Rate": 1.4604445295414938e-05, "Pretrain/Loss": 1.978217601776123, "Pretrain/Loss (Raw)": 1.8912380933761597, "Pretrain/Step": 12348, "Pretrain/Step Time": 8.43378751911223} +{"Pretrain/Learning Rate": 1.460058469633914e-05, "Pretrain/Loss": 1.9790802001953125, "Pretrain/Loss (Raw)": 2.011425256729126, "Pretrain/Step": 12349, "Pretrain/Step Time": 8.443212904036045} +{"Pretrain/Learning Rate": 1.4596724397123147e-05, "Pretrain/Loss": 1.9787237644195557, "Pretrain/Loss (Raw)": 1.9691088199615479, "Pretrain/Step": 12350, "Pretrain/Step Time": 8.441076047718525} +{"Pretrain/Learning Rate": 1.4592864397878269e-05, "Pretrain/Loss": 1.9791016578674316, "Pretrain/Loss (Raw)": 2.1170358657836914, "Pretrain/Step": 12351, "Pretrain/Step Time": 8.447104377672076} +{"Pretrain/Learning Rate": 1.4589004698715816e-05, "Pretrain/Loss": 1.980224370956421, "Pretrain/Loss (Raw)": 2.03928804397583, "Pretrain/Step": 12352, "Pretrain/Step Time": 8.440990941599011} +{"Pretrain/Learning Rate": 1.4585145299747066e-05, "Pretrain/Loss": 1.9799567461013794, "Pretrain/Loss (Raw)": 1.9582730531692505, "Pretrain/Step": 12353, "Pretrain/Step Time": 8.444592608138919} +{"Pretrain/Learning Rate": 1.4581286201083317e-05, "Pretrain/Loss": 1.9780185222625732, "Pretrain/Loss (Raw)": 1.9596381187438965, "Pretrain/Step": 12354, "Pretrain/Step Time": 8.441155914217234} +{"Pretrain/Learning Rate": 1.4577427402835825e-05, "Pretrain/Loss": 1.9789365530014038, "Pretrain/Loss (Raw)": 1.996737003326416, "Pretrain/Step": 12355, "Pretrain/Step Time": 8.440737241879106} +{"Pretrain/Learning Rate": 1.4573568905115875e-05, "Pretrain/Loss": 1.978440523147583, "Pretrain/Loss (Raw)": 2.004484176635742, "Pretrain/Step": 12356, "Pretrain/Step Time": 8.440718803554773} +{"Pretrain/Learning Rate": 1.4569710708034718e-05, "Pretrain/Loss": 1.9801616668701172, "Pretrain/Loss (Raw)": 2.048654794692993, "Pretrain/Step": 12357, "Pretrain/Step Time": 8.442592445760965} +{"Pretrain/Learning Rate": 1.456585281170359e-05, "Pretrain/Loss": 1.9811861515045166, "Pretrain/Loss (Raw)": 2.0037288665771484, "Pretrain/Step": 12358, "Pretrain/Step Time": 8.44350217282772} +{"Pretrain/Learning Rate": 1.4561995216233747e-05, "Pretrain/Loss": 1.9842244386672974, "Pretrain/Loss (Raw)": 2.008441925048828, "Pretrain/Step": 12359, "Pretrain/Step Time": 8.44356663711369} +{"Pretrain/Learning Rate": 1.4558137921736408e-05, "Pretrain/Loss": 1.9863685369491577, "Pretrain/Loss (Raw)": 2.1840298175811768, "Pretrain/Step": 12360, "Pretrain/Step Time": 8.445144567638636} +{"Pretrain/Learning Rate": 1.455428092832281e-05, "Pretrain/Loss": 1.9877996444702148, "Pretrain/Loss (Raw)": 1.9295045137405396, "Pretrain/Step": 12361, "Pretrain/Step Time": 8.444994512945414} +{"Pretrain/Learning Rate": 1.455042423610416e-05, "Pretrain/Loss": 1.989734172821045, "Pretrain/Loss (Raw)": 2.1340324878692627, "Pretrain/Step": 12362, "Pretrain/Step Time": 8.446984503418207} +{"Pretrain/Learning Rate": 1.4546567845191644e-05, "Pretrain/Loss": 1.9903483390808105, "Pretrain/Loss (Raw)": 1.9488842487335205, "Pretrain/Step": 12363, "Pretrain/Step Time": 8.443365436047316} +{"Pretrain/Learning Rate": 1.4542711755696492e-05, "Pretrain/Loss": 1.9930481910705566, "Pretrain/Loss (Raw)": 2.146097421646118, "Pretrain/Step": 12364, "Pretrain/Step Time": 8.446367414668202} +{"Pretrain/Learning Rate": 1.453885596772986e-05, "Pretrain/Loss": 1.9898580312728882, "Pretrain/Loss (Raw)": 1.8954073190689087, "Pretrain/Step": 12365, "Pretrain/Step Time": 8.441585533320904} +{"Pretrain/Learning Rate": 1.4535000481402955e-05, "Pretrain/Loss": 1.9899356365203857, "Pretrain/Loss (Raw)": 2.0267655849456787, "Pretrain/Step": 12366, "Pretrain/Step Time": 8.447920383885503} +{"Pretrain/Learning Rate": 1.4531145296826932e-05, "Pretrain/Loss": 1.9913990497589111, "Pretrain/Loss (Raw)": 1.9348047971725464, "Pretrain/Step": 12367, "Pretrain/Step Time": 8.446367280557752} +{"Pretrain/Learning Rate": 1.4527290414112942e-05, "Pretrain/Loss": 1.989446759223938, "Pretrain/Loss (Raw)": 1.8781449794769287, "Pretrain/Step": 12368, "Pretrain/Step Time": 8.446746302768588} +{"Pretrain/Learning Rate": 1.4523435833372162e-05, "Pretrain/Loss": 1.9867887496948242, "Pretrain/Loss (Raw)": 1.6649821996688843, "Pretrain/Step": 12369, "Pretrain/Step Time": 8.44883119687438} +{"Pretrain/Learning Rate": 1.4519581554715716e-05, "Pretrain/Loss": 1.988746166229248, "Pretrain/Loss (Raw)": 1.884075403213501, "Pretrain/Step": 12370, "Pretrain/Step Time": 8.448836965486407} +{"Pretrain/Learning Rate": 1.4515727578254756e-05, "Pretrain/Loss": 1.987884759902954, "Pretrain/Loss (Raw)": 1.8540840148925781, "Pretrain/Step": 12371, "Pretrain/Step Time": 8.446739124134183} +{"Pretrain/Learning Rate": 1.4511873904100401e-05, "Pretrain/Loss": 1.9863859415054321, "Pretrain/Loss (Raw)": 1.6136748790740967, "Pretrain/Step": 12372, "Pretrain/Step Time": 8.448638543486595} +{"Pretrain/Learning Rate": 1.4508020532363759e-05, "Pretrain/Loss": 1.9831398725509644, "Pretrain/Loss (Raw)": 1.7848706245422363, "Pretrain/Step": 12373, "Pretrain/Step Time": 8.448370216414332} +{"Pretrain/Learning Rate": 1.4504167463155954e-05, "Pretrain/Loss": 1.9853105545043945, "Pretrain/Loss (Raw)": 2.115570306777954, "Pretrain/Step": 12374, "Pretrain/Step Time": 8.444797487929463} +{"Pretrain/Learning Rate": 1.4500314696588077e-05, "Pretrain/Loss": 1.9851428270339966, "Pretrain/Loss (Raw)": 1.9887055158615112, "Pretrain/Step": 12375, "Pretrain/Step Time": 8.443360636010766} +{"Pretrain/Learning Rate": 1.4496462232771229e-05, "Pretrain/Loss": 1.9842755794525146, "Pretrain/Loss (Raw)": 1.7945728302001953, "Pretrain/Step": 12376, "Pretrain/Step Time": 8.444423155859113} +{"Pretrain/Learning Rate": 1.4492610071816493e-05, "Pretrain/Loss": 1.9837757349014282, "Pretrain/Loss (Raw)": 2.0763778686523438, "Pretrain/Step": 12377, "Pretrain/Step Time": 8.442210542038083} +{"Pretrain/Learning Rate": 1.4488758213834924e-05, "Pretrain/Loss": 1.985685110092163, "Pretrain/Loss (Raw)": 1.9796944856643677, "Pretrain/Step": 12378, "Pretrain/Step Time": 8.444570595398545} +{"Pretrain/Learning Rate": 1.4484906658937617e-05, "Pretrain/Loss": 1.9859261512756348, "Pretrain/Loss (Raw)": 2.1892170906066895, "Pretrain/Step": 12379, "Pretrain/Step Time": 8.448310855776072} +{"Pretrain/Learning Rate": 1.44810554072356e-05, "Pretrain/Loss": 1.9850913286209106, "Pretrain/Loss (Raw)": 1.9518126249313354, "Pretrain/Step": 12380, "Pretrain/Step Time": 8.454260865226388} +{"Pretrain/Learning Rate": 1.4477204458839943e-05, "Pretrain/Loss": 1.9842989444732666, "Pretrain/Loss (Raw)": 2.1248106956481934, "Pretrain/Step": 12381, "Pretrain/Step Time": 8.45228386297822} +{"Pretrain/Learning Rate": 1.4473353813861684e-05, "Pretrain/Loss": 1.9846909046173096, "Pretrain/Loss (Raw)": 2.0869297981262207, "Pretrain/Step": 12382, "Pretrain/Step Time": 8.448245991021395} +{"Pretrain/Learning Rate": 1.4469503472411833e-05, "Pretrain/Loss": 1.9861364364624023, "Pretrain/Loss (Raw)": 2.017216444015503, "Pretrain/Step": 12383, "Pretrain/Step Time": 8.449245715513825} +{"Pretrain/Learning Rate": 1.4465653434601434e-05, "Pretrain/Loss": 1.9838359355926514, "Pretrain/Loss (Raw)": 1.8156042098999023, "Pretrain/Step": 12384, "Pretrain/Step Time": 8.452427167445421} +{"Pretrain/Learning Rate": 1.4461803700541485e-05, "Pretrain/Loss": 1.9878125190734863, "Pretrain/Loss (Raw)": 2.0747156143188477, "Pretrain/Step": 12385, "Pretrain/Step Time": 8.452605137601495} +{"Pretrain/Learning Rate": 1.4457954270343005e-05, "Pretrain/Loss": 1.9883602857589722, "Pretrain/Loss (Raw)": 2.0964343547821045, "Pretrain/Step": 12386, "Pretrain/Step Time": 8.451083101332188} +{"Pretrain/Learning Rate": 1.4454105144116984e-05, "Pretrain/Loss": 1.9873650074005127, "Pretrain/Loss (Raw)": 1.9817460775375366, "Pretrain/Step": 12387, "Pretrain/Step Time": 8.451879052445292} +{"Pretrain/Learning Rate": 1.4450256321974407e-05, "Pretrain/Loss": 1.9827626943588257, "Pretrain/Loss (Raw)": 1.7104732990264893, "Pretrain/Step": 12388, "Pretrain/Step Time": 8.451514173299074} +{"Pretrain/Learning Rate": 1.444640780402624e-05, "Pretrain/Loss": 1.9824326038360596, "Pretrain/Loss (Raw)": 1.9431086778640747, "Pretrain/Step": 12389, "Pretrain/Step Time": 8.452593974769115} +{"Pretrain/Learning Rate": 1.4442559590383476e-05, "Pretrain/Loss": 1.9811677932739258, "Pretrain/Loss (Raw)": 1.8826245069503784, "Pretrain/Step": 12390, "Pretrain/Step Time": 8.448690289631486} +{"Pretrain/Learning Rate": 1.4438711681157063e-05, "Pretrain/Loss": 1.982860803604126, "Pretrain/Loss (Raw)": 2.276577949523926, "Pretrain/Step": 12391, "Pretrain/Step Time": 8.449029743671417} +{"Pretrain/Learning Rate": 1.4434864076457943e-05, "Pretrain/Loss": 1.9812448024749756, "Pretrain/Loss (Raw)": 1.9528013467788696, "Pretrain/Step": 12392, "Pretrain/Step Time": 8.451323606073856} +{"Pretrain/Learning Rate": 1.4431016776397077e-05, "Pretrain/Loss": 1.9825680255889893, "Pretrain/Loss (Raw)": 2.188636302947998, "Pretrain/Step": 12393, "Pretrain/Step Time": 8.449520155787468} +{"Pretrain/Learning Rate": 1.4427169781085386e-05, "Pretrain/Loss": 1.9826316833496094, "Pretrain/Loss (Raw)": 2.041999340057373, "Pretrain/Step": 12394, "Pretrain/Step Time": 8.45266186259687} +{"Pretrain/Learning Rate": 1.4423323090633809e-05, "Pretrain/Loss": 1.9824782609939575, "Pretrain/Loss (Raw)": 1.7702258825302124, "Pretrain/Step": 12395, "Pretrain/Step Time": 8.453111574053764} +{"Pretrain/Learning Rate": 1.4419476705153256e-05, "Pretrain/Loss": 1.984322190284729, "Pretrain/Loss (Raw)": 1.9534616470336914, "Pretrain/Step": 12396, "Pretrain/Step Time": 8.45740157365799} +{"Pretrain/Learning Rate": 1.4415630624754622e-05, "Pretrain/Loss": 1.984196424484253, "Pretrain/Loss (Raw)": 1.9035249948501587, "Pretrain/Step": 12397, "Pretrain/Step Time": 8.461769746616483} +{"Pretrain/Learning Rate": 1.4411784849548826e-05, "Pretrain/Loss": 1.9869476556777954, "Pretrain/Loss (Raw)": 1.9869815111160278, "Pretrain/Step": 12398, "Pretrain/Step Time": 8.462025674059987} +{"Pretrain/Learning Rate": 1.4407939379646743e-05, "Pretrain/Loss": 1.9884474277496338, "Pretrain/Loss (Raw)": 2.006481647491455, "Pretrain/Step": 12399, "Pretrain/Step Time": 8.46654967032373} +{"Pretrain/Learning Rate": 1.4404094215159269e-05, "Pretrain/Loss": 1.9874204397201538, "Pretrain/Loss (Raw)": 1.955260157585144, "Pretrain/Step": 12400, "Pretrain/Step Time": 8.46618908084929} +{"Pretrain/Learning Rate": 1.440024935619727e-05, "Pretrain/Loss": 1.9863920211791992, "Pretrain/Loss (Raw)": 1.9087146520614624, "Pretrain/Step": 12401, "Pretrain/Step Time": 8.467787081375718} +{"Pretrain/Learning Rate": 1.4396404802871596e-05, "Pretrain/Loss": 1.985339641571045, "Pretrain/Loss (Raw)": 2.113884449005127, "Pretrain/Step": 12402, "Pretrain/Step Time": 8.466720027849078} +{"Pretrain/Learning Rate": 1.4392560555293127e-05, "Pretrain/Loss": 1.9867212772369385, "Pretrain/Loss (Raw)": 2.0420708656311035, "Pretrain/Step": 12403, "Pretrain/Step Time": 8.46673071756959} +{"Pretrain/Learning Rate": 1.4388716613572683e-05, "Pretrain/Loss": 1.988708734512329, "Pretrain/Loss (Raw)": 2.2006564140319824, "Pretrain/Step": 12404, "Pretrain/Step Time": 8.467124607414007} +{"Pretrain/Learning Rate": 1.438487297782113e-05, "Pretrain/Loss": 1.990657925605774, "Pretrain/Loss (Raw)": 1.880873680114746, "Pretrain/Step": 12405, "Pretrain/Step Time": 8.463174125179648} +{"Pretrain/Learning Rate": 1.438102964814928e-05, "Pretrain/Loss": 1.9911288022994995, "Pretrain/Loss (Raw)": 1.951895833015442, "Pretrain/Step": 12406, "Pretrain/Step Time": 8.463287755846977} +{"Pretrain/Learning Rate": 1.4377186624667944e-05, "Pretrain/Loss": 1.9905760288238525, "Pretrain/Loss (Raw)": 1.961340308189392, "Pretrain/Step": 12407, "Pretrain/Step Time": 8.455932023003697} +{"Pretrain/Learning Rate": 1.4373343907487951e-05, "Pretrain/Loss": 1.9905130863189697, "Pretrain/Loss (Raw)": 1.9522454738616943, "Pretrain/Step": 12408, "Pretrain/Step Time": 8.463186325505376} +{"Pretrain/Learning Rate": 1.436950149672009e-05, "Pretrain/Loss": 1.9905931949615479, "Pretrain/Loss (Raw)": 1.8491889238357544, "Pretrain/Step": 12409, "Pretrain/Step Time": 8.456142509356141} +{"Pretrain/Learning Rate": 1.4365659392475162e-05, "Pretrain/Loss": 1.9888821840286255, "Pretrain/Loss (Raw)": 2.0198898315429688, "Pretrain/Step": 12410, "Pretrain/Step Time": 8.45963772945106} +{"Pretrain/Learning Rate": 1.4361817594863953e-05, "Pretrain/Loss": 1.9897074699401855, "Pretrain/Loss (Raw)": 2.048158884048462, "Pretrain/Step": 12411, "Pretrain/Step Time": 8.458588352426887} +{"Pretrain/Learning Rate": 1.4357976103997226e-05, "Pretrain/Loss": 1.9882302284240723, "Pretrain/Loss (Raw)": 1.840721845626831, "Pretrain/Step": 12412, "Pretrain/Step Time": 8.455624898895621} +{"Pretrain/Learning Rate": 1.4354134919985762e-05, "Pretrain/Loss": 1.9872171878814697, "Pretrain/Loss (Raw)": 1.7565679550170898, "Pretrain/Step": 12413, "Pretrain/Step Time": 8.459126269444823} +{"Pretrain/Learning Rate": 1.4350294042940304e-05, "Pretrain/Loss": 1.9858481884002686, "Pretrain/Loss (Raw)": 2.019188404083252, "Pretrain/Step": 12414, "Pretrain/Step Time": 8.458484336733818} +{"Pretrain/Learning Rate": 1.4346453472971621e-05, "Pretrain/Loss": 1.9855780601501465, "Pretrain/Loss (Raw)": 1.9207402467727661, "Pretrain/Step": 12415, "Pretrain/Step Time": 8.459573114290833} +{"Pretrain/Learning Rate": 1.4342613210190443e-05, "Pretrain/Loss": 1.9877091646194458, "Pretrain/Loss (Raw)": 2.070051431655884, "Pretrain/Step": 12416, "Pretrain/Step Time": 8.459258958697319} +{"Pretrain/Learning Rate": 1.4338773254707488e-05, "Pretrain/Loss": 1.9835753440856934, "Pretrain/Loss (Raw)": 1.7812613248825073, "Pretrain/Step": 12417, "Pretrain/Step Time": 8.458129251375794} +{"Pretrain/Learning Rate": 1.43349336066335e-05, "Pretrain/Loss": 1.9869693517684937, "Pretrain/Loss (Raw)": 2.120774507522583, "Pretrain/Step": 12418, "Pretrain/Step Time": 8.462200727313757} +{"Pretrain/Learning Rate": 1.4331094266079176e-05, "Pretrain/Loss": 1.9881808757781982, "Pretrain/Loss (Raw)": 2.1677474975585938, "Pretrain/Step": 12419, "Pretrain/Step Time": 8.460953833535314} +{"Pretrain/Learning Rate": 1.4327255233155234e-05, "Pretrain/Loss": 1.9870150089263916, "Pretrain/Loss (Raw)": 1.9404182434082031, "Pretrain/Step": 12420, "Pretrain/Step Time": 8.464865364134312} +{"Pretrain/Learning Rate": 1.4323416507972365e-05, "Pretrain/Loss": 1.9860739707946777, "Pretrain/Loss (Raw)": 1.946806788444519, "Pretrain/Step": 12421, "Pretrain/Step Time": 8.464948950335383} +{"Pretrain/Learning Rate": 1.4319578090641245e-05, "Pretrain/Loss": 1.9895384311676025, "Pretrain/Loss (Raw)": 2.255805253982544, "Pretrain/Step": 12422, "Pretrain/Step Time": 8.466226276010275} +{"Pretrain/Learning Rate": 1.431573998127257e-05, "Pretrain/Loss": 1.9894070625305176, "Pretrain/Loss (Raw)": 1.909796118736267, "Pretrain/Step": 12423, "Pretrain/Step Time": 8.467604821547866} +{"Pretrain/Learning Rate": 1.4311902179976993e-05, "Pretrain/Loss": 1.9927048683166504, "Pretrain/Loss (Raw)": 2.4344139099121094, "Pretrain/Step": 12424, "Pretrain/Step Time": 8.466516906395555} +{"Pretrain/Learning Rate": 1.4308064686865191e-05, "Pretrain/Loss": 1.9926354885101318, "Pretrain/Loss (Raw)": 2.2740795612335205, "Pretrain/Step": 12425, "Pretrain/Step Time": 8.467222720384598} +{"Pretrain/Learning Rate": 1.4304227502047807e-05, "Pretrain/Loss": 1.9914802312850952, "Pretrain/Loss (Raw)": 1.8798155784606934, "Pretrain/Step": 12426, "Pretrain/Step Time": 8.471562702208757} +{"Pretrain/Learning Rate": 1.4300390625635474e-05, "Pretrain/Loss": 1.9914675951004028, "Pretrain/Loss (Raw)": 1.9762340784072876, "Pretrain/Step": 12427, "Pretrain/Step Time": 8.473025847226381} +{"Pretrain/Learning Rate": 1.4296554057738842e-05, "Pretrain/Loss": 1.9903278350830078, "Pretrain/Loss (Raw)": 1.9850608110427856, "Pretrain/Step": 12428, "Pretrain/Step Time": 8.470894888043404} +{"Pretrain/Learning Rate": 1.429271779846852e-05, "Pretrain/Loss": 1.9894746541976929, "Pretrain/Loss (Raw)": 1.8080929517745972, "Pretrain/Step": 12429, "Pretrain/Step Time": 8.476857805624604} +{"Pretrain/Learning Rate": 1.428888184793514e-05, "Pretrain/Loss": 1.98833429813385, "Pretrain/Loss (Raw)": 2.149139642715454, "Pretrain/Step": 12430, "Pretrain/Step Time": 8.473986657336354} +{"Pretrain/Learning Rate": 1.4285046206249303e-05, "Pretrain/Loss": 1.987133264541626, "Pretrain/Loss (Raw)": 1.9085289239883423, "Pretrain/Step": 12431, "Pretrain/Step Time": 8.474717484787107} +{"Pretrain/Learning Rate": 1.4281210873521594e-05, "Pretrain/Loss": 1.9891654253005981, "Pretrain/Loss (Raw)": 2.1149516105651855, "Pretrain/Step": 12432, "Pretrain/Step Time": 8.477841474115849} +{"Pretrain/Learning Rate": 1.4277375849862623e-05, "Pretrain/Loss": 1.9872419834136963, "Pretrain/Loss (Raw)": 1.8428553342819214, "Pretrain/Step": 12433, "Pretrain/Step Time": 8.479853443801403} +{"Pretrain/Learning Rate": 1.427354113538295e-05, "Pretrain/Loss": 1.991138219833374, "Pretrain/Loss (Raw)": 2.3463938236236572, "Pretrain/Step": 12434, "Pretrain/Step Time": 8.484776198863983} +{"Pretrain/Learning Rate": 1.426970673019317e-05, "Pretrain/Loss": 1.9907972812652588, "Pretrain/Loss (Raw)": 2.1513891220092773, "Pretrain/Step": 12435, "Pretrain/Step Time": 8.480098159983754} +{"Pretrain/Learning Rate": 1.4265872634403829e-05, "Pretrain/Loss": 1.991220235824585, "Pretrain/Loss (Raw)": 2.0449860095977783, "Pretrain/Step": 12436, "Pretrain/Step Time": 8.482271017506719} +{"Pretrain/Learning Rate": 1.4262038848125475e-05, "Pretrain/Loss": 1.9920979738235474, "Pretrain/Loss (Raw)": 1.9164676666259766, "Pretrain/Step": 12437, "Pretrain/Step Time": 8.485171416774392} +{"Pretrain/Learning Rate": 1.425820537146867e-05, "Pretrain/Loss": 1.993234634399414, "Pretrain/Loss (Raw)": 2.1609511375427246, "Pretrain/Step": 12438, "Pretrain/Step Time": 8.480931492522359} +{"Pretrain/Learning Rate": 1.425437220454393e-05, "Pretrain/Loss": 1.9925172328948975, "Pretrain/Loss (Raw)": 2.0071213245391846, "Pretrain/Step": 12439, "Pretrain/Step Time": 8.481673397123814} +{"Pretrain/Learning Rate": 1.4250539347461806e-05, "Pretrain/Loss": 1.9929548501968384, "Pretrain/Loss (Raw)": 2.045018196105957, "Pretrain/Step": 12440, "Pretrain/Step Time": 8.480900801718235} +{"Pretrain/Learning Rate": 1.4246706800332799e-05, "Pretrain/Loss": 1.9909918308258057, "Pretrain/Loss (Raw)": 1.9145874977111816, "Pretrain/Step": 12441, "Pretrain/Step Time": 8.485394744202495} +{"Pretrain/Learning Rate": 1.424287456326741e-05, "Pretrain/Loss": 1.9918254613876343, "Pretrain/Loss (Raw)": 1.91258704662323, "Pretrain/Step": 12442, "Pretrain/Step Time": 8.482893448323011} +{"Pretrain/Learning Rate": 1.4239042636376162e-05, "Pretrain/Loss": 1.990344524383545, "Pretrain/Loss (Raw)": 1.8692114353179932, "Pretrain/Step": 12443, "Pretrain/Step Time": 8.48217954300344} +{"Pretrain/Learning Rate": 1.4235211019769523e-05, "Pretrain/Loss": 1.9871892929077148, "Pretrain/Loss (Raw)": 1.7659763097763062, "Pretrain/Step": 12444, "Pretrain/Step Time": 8.49280782788992} +{"Pretrain/Learning Rate": 1.4231379713557997e-05, "Pretrain/Loss": 1.9856632947921753, "Pretrain/Loss (Raw)": 1.8275370597839355, "Pretrain/Step": 12445, "Pretrain/Step Time": 8.489064687862992} +{"Pretrain/Learning Rate": 1.4227548717852044e-05, "Pretrain/Loss": 1.9850645065307617, "Pretrain/Loss (Raw)": 1.9534491300582886, "Pretrain/Step": 12446, "Pretrain/Step Time": 8.485881866887212} +{"Pretrain/Learning Rate": 1.4223718032762118e-05, "Pretrain/Loss": 1.985577940940857, "Pretrain/Loss (Raw)": 1.8772423267364502, "Pretrain/Step": 12447, "Pretrain/Step Time": 8.485253751277924} +{"Pretrain/Learning Rate": 1.4219887658398698e-05, "Pretrain/Loss": 1.9831297397613525, "Pretrain/Loss (Raw)": 1.6201825141906738, "Pretrain/Step": 12448, "Pretrain/Step Time": 8.486689262092113} +{"Pretrain/Learning Rate": 1.4216057594872206e-05, "Pretrain/Loss": 1.9825971126556396, "Pretrain/Loss (Raw)": 1.8710182905197144, "Pretrain/Step": 12449, "Pretrain/Step Time": 8.487093672156334} +{"Pretrain/Learning Rate": 1.4212227842293101e-05, "Pretrain/Loss": 1.982419490814209, "Pretrain/Loss (Raw)": 2.0556302070617676, "Pretrain/Step": 12450, "Pretrain/Step Time": 8.489635553210974} +{"Pretrain/Learning Rate": 1.4208398400771805e-05, "Pretrain/Loss": 1.983008861541748, "Pretrain/Loss (Raw)": 2.141896963119507, "Pretrain/Step": 12451, "Pretrain/Step Time": 8.490043757483363} +{"Pretrain/Learning Rate": 1.4204569270418722e-05, "Pretrain/Loss": 1.9800138473510742, "Pretrain/Loss (Raw)": 1.7946833372116089, "Pretrain/Step": 12452, "Pretrain/Step Time": 8.48722174577415} +{"Pretrain/Learning Rate": 1.420074045134428e-05, "Pretrain/Loss": 1.9772917032241821, "Pretrain/Loss (Raw)": 1.7394229173660278, "Pretrain/Step": 12453, "Pretrain/Step Time": 8.486969796940684} +{"Pretrain/Learning Rate": 1.4196911943658869e-05, "Pretrain/Loss": 1.9765487909317017, "Pretrain/Loss (Raw)": 2.0187463760375977, "Pretrain/Step": 12454, "Pretrain/Step Time": 8.484951781108975} +{"Pretrain/Learning Rate": 1.4193083747472893e-05, "Pretrain/Loss": 1.9765374660491943, "Pretrain/Loss (Raw)": 2.1552462577819824, "Pretrain/Step": 12455, "Pretrain/Step Time": 8.485943390056491} +{"Pretrain/Learning Rate": 1.4189255862896722e-05, "Pretrain/Loss": 1.9744694232940674, "Pretrain/Loss (Raw)": 1.854769229888916, "Pretrain/Step": 12456, "Pretrain/Step Time": 8.488965053111315} +{"Pretrain/Learning Rate": 1.4185428290040745e-05, "Pretrain/Loss": 1.9743937253952026, "Pretrain/Loss (Raw)": 2.079925298690796, "Pretrain/Step": 12457, "Pretrain/Step Time": 8.493052527308464} +{"Pretrain/Learning Rate": 1.4181601029015318e-05, "Pretrain/Loss": 1.9747838973999023, "Pretrain/Loss (Raw)": 2.157844066619873, "Pretrain/Step": 12458, "Pretrain/Step Time": 8.492370104417205} +{"Pretrain/Learning Rate": 1.4177774079930791e-05, "Pretrain/Loss": 1.973630428314209, "Pretrain/Loss (Raw)": 1.8941539525985718, "Pretrain/Step": 12459, "Pretrain/Step Time": 8.496475042775273} +{"Pretrain/Learning Rate": 1.4173947442897528e-05, "Pretrain/Loss": 1.9715538024902344, "Pretrain/Loss (Raw)": 1.9812997579574585, "Pretrain/Step": 12460, "Pretrain/Step Time": 8.497403802350163} +{"Pretrain/Learning Rate": 1.4170121118025853e-05, "Pretrain/Loss": 1.9734517335891724, "Pretrain/Loss (Raw)": 2.1510121822357178, "Pretrain/Step": 12461, "Pretrain/Step Time": 8.498574052006006} +{"Pretrain/Learning Rate": 1.4166295105426106e-05, "Pretrain/Loss": 1.9756157398223877, "Pretrain/Loss (Raw)": 2.241612434387207, "Pretrain/Step": 12462, "Pretrain/Step Time": 8.500338423997164} +{"Pretrain/Learning Rate": 1.4162469405208602e-05, "Pretrain/Loss": 1.976233959197998, "Pretrain/Loss (Raw)": 2.1009488105773926, "Pretrain/Step": 12463, "Pretrain/Step Time": 8.497749110683799} +{"Pretrain/Learning Rate": 1.4158644017483647e-05, "Pretrain/Loss": 1.9745659828186035, "Pretrain/Loss (Raw)": 2.039386749267578, "Pretrain/Step": 12464, "Pretrain/Step Time": 8.498302267864347} +{"Pretrain/Learning Rate": 1.4154818942361555e-05, "Pretrain/Loss": 1.9756033420562744, "Pretrain/Loss (Raw)": 2.0881478786468506, "Pretrain/Step": 12465, "Pretrain/Step Time": 8.496393648907542} +{"Pretrain/Learning Rate": 1.4150994179952606e-05, "Pretrain/Loss": 1.9785457849502563, "Pretrain/Loss (Raw)": 2.113027811050415, "Pretrain/Step": 12466, "Pretrain/Step Time": 8.498491361737251} +{"Pretrain/Learning Rate": 1.4147169730367102e-05, "Pretrain/Loss": 1.9804086685180664, "Pretrain/Loss (Raw)": 2.042875051498413, "Pretrain/Step": 12467, "Pretrain/Step Time": 8.492286520078778} +{"Pretrain/Learning Rate": 1.4143345593715307e-05, "Pretrain/Loss": 1.9798394441604614, "Pretrain/Loss (Raw)": 1.772310733795166, "Pretrain/Step": 12468, "Pretrain/Step Time": 8.491507276892662} +{"Pretrain/Learning Rate": 1.4139521770107478e-05, "Pretrain/Loss": 1.9803513288497925, "Pretrain/Loss (Raw)": 1.9923181533813477, "Pretrain/Step": 12469, "Pretrain/Step Time": 8.487712478265166} +{"Pretrain/Learning Rate": 1.4135698259653893e-05, "Pretrain/Loss": 1.9817630052566528, "Pretrain/Loss (Raw)": 2.0666871070861816, "Pretrain/Step": 12470, "Pretrain/Step Time": 8.488797195255756} +{"Pretrain/Learning Rate": 1.4131875062464778e-05, "Pretrain/Loss": 1.9844233989715576, "Pretrain/Loss (Raw)": 2.228029489517212, "Pretrain/Step": 12471, "Pretrain/Step Time": 8.484679583460093} +{"Pretrain/Learning Rate": 1.4128052178650409e-05, "Pretrain/Loss": 1.9868555068969727, "Pretrain/Loss (Raw)": 1.9161959886550903, "Pretrain/Step": 12472, "Pretrain/Step Time": 8.478539695963264} +{"Pretrain/Learning Rate": 1.4124229608320965e-05, "Pretrain/Loss": 1.986580729484558, "Pretrain/Loss (Raw)": 2.128666400909424, "Pretrain/Step": 12473, "Pretrain/Step Time": 8.479059344157577} +{"Pretrain/Learning Rate": 1.4120407351586707e-05, "Pretrain/Loss": 1.987198829650879, "Pretrain/Loss (Raw)": 1.881294846534729, "Pretrain/Step": 12474, "Pretrain/Step Time": 8.485824765637517} +{"Pretrain/Learning Rate": 1.4116585408557833e-05, "Pretrain/Loss": 1.990399956703186, "Pretrain/Loss (Raw)": 2.065990686416626, "Pretrain/Step": 12475, "Pretrain/Step Time": 8.483188649639487} +{"Pretrain/Learning Rate": 1.4112763779344537e-05, "Pretrain/Loss": 1.991684913635254, "Pretrain/Loss (Raw)": 2.0557126998901367, "Pretrain/Step": 12476, "Pretrain/Step Time": 8.482857497408986} +{"Pretrain/Learning Rate": 1.4108942464057032e-05, "Pretrain/Loss": 1.98981773853302, "Pretrain/Loss (Raw)": 1.7724334001541138, "Pretrain/Step": 12477, "Pretrain/Step Time": 8.475468683987856} +{"Pretrain/Learning Rate": 1.4105121462805483e-05, "Pretrain/Loss": 1.9849334955215454, "Pretrain/Loss (Raw)": 1.343920350074768, "Pretrain/Step": 12478, "Pretrain/Step Time": 8.484342344105244} +{"Pretrain/Learning Rate": 1.4101300775700088e-05, "Pretrain/Loss": 1.983420968055725, "Pretrain/Loss (Raw)": 1.9234377145767212, "Pretrain/Step": 12479, "Pretrain/Step Time": 8.47940351255238} +{"Pretrain/Learning Rate": 1.4097480402851e-05, "Pretrain/Loss": 1.9842333793640137, "Pretrain/Loss (Raw)": 2.143280267715454, "Pretrain/Step": 12480, "Pretrain/Step Time": 8.480814803391695} +{"Pretrain/Learning Rate": 1.409366034436837e-05, "Pretrain/Loss": 1.9827470779418945, "Pretrain/Loss (Raw)": 1.7680153846740723, "Pretrain/Step": 12481, "Pretrain/Step Time": 8.476935738697648} +{"Pretrain/Learning Rate": 1.4089840600362363e-05, "Pretrain/Loss": 1.9811832904815674, "Pretrain/Loss (Raw)": 1.7594865560531616, "Pretrain/Step": 12482, "Pretrain/Step Time": 8.481028268113732} +{"Pretrain/Learning Rate": 1.4086021170943103e-05, "Pretrain/Loss": 1.983483076095581, "Pretrain/Loss (Raw)": 2.291109800338745, "Pretrain/Step": 12483, "Pretrain/Step Time": 8.480052029713988} +{"Pretrain/Learning Rate": 1.4082202056220739e-05, "Pretrain/Loss": 1.9824327230453491, "Pretrain/Loss (Raw)": 1.8700437545776367, "Pretrain/Step": 12484, "Pretrain/Step Time": 8.48215926811099} +{"Pretrain/Learning Rate": 1.4078383256305382e-05, "Pretrain/Loss": 1.9806418418884277, "Pretrain/Loss (Raw)": 1.819408655166626, "Pretrain/Step": 12485, "Pretrain/Step Time": 8.476594410836697} +{"Pretrain/Learning Rate": 1.4074564771307133e-05, "Pretrain/Loss": 1.981536865234375, "Pretrain/Loss (Raw)": 2.118293046951294, "Pretrain/Step": 12486, "Pretrain/Step Time": 8.476252380758524} +{"Pretrain/Learning Rate": 1.4070746601336118e-05, "Pretrain/Loss": 1.978773832321167, "Pretrain/Loss (Raw)": 1.654775619506836, "Pretrain/Step": 12487, "Pretrain/Step Time": 8.474592886865139} +{"Pretrain/Learning Rate": 1.406692874650241e-05, "Pretrain/Loss": 1.9782893657684326, "Pretrain/Loss (Raw)": 2.1220195293426514, "Pretrain/Step": 12488, "Pretrain/Step Time": 8.469176802784204} +{"Pretrain/Learning Rate": 1.4063111206916116e-05, "Pretrain/Loss": 1.9781074523925781, "Pretrain/Loss (Raw)": 1.9062093496322632, "Pretrain/Step": 12489, "Pretrain/Step Time": 8.469311999157071} +{"Pretrain/Learning Rate": 1.40592939826873e-05, "Pretrain/Loss": 1.9764759540557861, "Pretrain/Loss (Raw)": 1.9252115488052368, "Pretrain/Step": 12490, "Pretrain/Step Time": 8.466713678091764} +{"Pretrain/Learning Rate": 1.4055477073926015e-05, "Pretrain/Loss": 1.9751207828521729, "Pretrain/Loss (Raw)": 1.7754104137420654, "Pretrain/Step": 12491, "Pretrain/Step Time": 8.471663443371654} +{"Pretrain/Learning Rate": 1.4051660480742348e-05, "Pretrain/Loss": 1.9745291471481323, "Pretrain/Loss (Raw)": 2.070377826690674, "Pretrain/Step": 12492, "Pretrain/Step Time": 8.468664152547717} +{"Pretrain/Learning Rate": 1.4047844203246321e-05, "Pretrain/Loss": 1.9758656024932861, "Pretrain/Loss (Raw)": 2.0664689540863037, "Pretrain/Step": 12493, "Pretrain/Step Time": 8.471865493804216} +{"Pretrain/Learning Rate": 1.4044028241547996e-05, "Pretrain/Loss": 1.9788329601287842, "Pretrain/Loss (Raw)": 2.4065821170806885, "Pretrain/Step": 12494, "Pretrain/Step Time": 8.469860633835196} +{"Pretrain/Learning Rate": 1.4040212595757394e-05, "Pretrain/Loss": 1.978294849395752, "Pretrain/Loss (Raw)": 1.8659236431121826, "Pretrain/Step": 12495, "Pretrain/Step Time": 8.47219941392541} +{"Pretrain/Learning Rate": 1.4036397265984524e-05, "Pretrain/Loss": 1.9780057668685913, "Pretrain/Loss (Raw)": 1.8411600589752197, "Pretrain/Step": 12496, "Pretrain/Step Time": 8.471642961725593} +{"Pretrain/Learning Rate": 1.4032582252339422e-05, "Pretrain/Loss": 1.9810444116592407, "Pretrain/Loss (Raw)": 2.0539166927337646, "Pretrain/Step": 12497, "Pretrain/Step Time": 8.468719705939293} +{"Pretrain/Learning Rate": 1.4028767554932068e-05, "Pretrain/Loss": 1.981914758682251, "Pretrain/Loss (Raw)": 1.9954745769500732, "Pretrain/Step": 12498, "Pretrain/Step Time": 8.4710323382169} +{"Pretrain/Learning Rate": 1.402495317387248e-05, "Pretrain/Loss": 1.982059121131897, "Pretrain/Loss (Raw)": 1.8725841045379639, "Pretrain/Step": 12499, "Pretrain/Step Time": 8.470585344359279} +{"Pretrain/Learning Rate": 1.4021139109270625e-05, "Pretrain/Loss": 1.9846864938735962, "Pretrain/Loss (Raw)": 1.9499669075012207, "Pretrain/Step": 12500, "Pretrain/Step Time": 8.46952517516911} +{"Pretrain/Learning Rate": 1.4017325361236478e-05, "Pretrain/Loss": 1.9856057167053223, "Pretrain/Loss (Raw)": 1.9025260210037231, "Pretrain/Step": 12501, "Pretrain/Step Time": 8.474504061043262} +{"Pretrain/Learning Rate": 1.4013511929880019e-05, "Pretrain/Loss": 1.9829157590866089, "Pretrain/Loss (Raw)": 1.7712513208389282, "Pretrain/Step": 12502, "Pretrain/Step Time": 8.474349152296782} +{"Pretrain/Learning Rate": 1.400969881531119e-05, "Pretrain/Loss": 1.985053539276123, "Pretrain/Loss (Raw)": 2.2623586654663086, "Pretrain/Step": 12503, "Pretrain/Step Time": 8.475019671022892} +{"Pretrain/Learning Rate": 1.400588601763996e-05, "Pretrain/Loss": 1.9887831211090088, "Pretrain/Loss (Raw)": 2.271955728530884, "Pretrain/Step": 12504, "Pretrain/Step Time": 8.47322491183877} +{"Pretrain/Learning Rate": 1.4002073536976256e-05, "Pretrain/Loss": 1.988487720489502, "Pretrain/Loss (Raw)": 2.0385661125183105, "Pretrain/Step": 12505, "Pretrain/Step Time": 8.474999597296119} +{"Pretrain/Learning Rate": 1.3998261373429997e-05, "Pretrain/Loss": 1.9886715412139893, "Pretrain/Loss (Raw)": 2.0032119750976562, "Pretrain/Step": 12506, "Pretrain/Step Time": 8.471433974802494} +{"Pretrain/Learning Rate": 1.3994449527111126e-05, "Pretrain/Loss": 1.985217809677124, "Pretrain/Loss (Raw)": 1.7471470832824707, "Pretrain/Step": 12507, "Pretrain/Step Time": 8.469199560582638} +{"Pretrain/Learning Rate": 1.3990637998129536e-05, "Pretrain/Loss": 1.9851104021072388, "Pretrain/Loss (Raw)": 1.9380689859390259, "Pretrain/Step": 12508, "Pretrain/Step Time": 8.465365989133716} +{"Pretrain/Learning Rate": 1.3986826786595145e-05, "Pretrain/Loss": 1.9843363761901855, "Pretrain/Loss (Raw)": 2.025749683380127, "Pretrain/Step": 12509, "Pretrain/Step Time": 8.464652817696333} +{"Pretrain/Learning Rate": 1.398301589261784e-05, "Pretrain/Loss": 1.985204815864563, "Pretrain/Loss (Raw)": 2.1980674266815186, "Pretrain/Step": 12510, "Pretrain/Step Time": 8.467993499711156} +{"Pretrain/Learning Rate": 1.3979205316307497e-05, "Pretrain/Loss": 1.9863770008087158, "Pretrain/Loss (Raw)": 2.167264699935913, "Pretrain/Step": 12511, "Pretrain/Step Time": 8.468442363664508} +{"Pretrain/Learning Rate": 1.397539505777401e-05, "Pretrain/Loss": 1.9871242046356201, "Pretrain/Loss (Raw)": 1.9112435579299927, "Pretrain/Step": 12512, "Pretrain/Step Time": 8.4638680703938} +{"Pretrain/Learning Rate": 1.3971585117127222e-05, "Pretrain/Loss": 1.9855320453643799, "Pretrain/Loss (Raw)": 1.8709187507629395, "Pretrain/Step": 12513, "Pretrain/Step Time": 8.468382289633155} +{"Pretrain/Learning Rate": 1.3967775494477017e-05, "Pretrain/Loss": 1.9862700700759888, "Pretrain/Loss (Raw)": 2.1909000873565674, "Pretrain/Step": 12514, "Pretrain/Step Time": 8.467720352113247} +{"Pretrain/Learning Rate": 1.3963966189933226e-05, "Pretrain/Loss": 1.9861664772033691, "Pretrain/Loss (Raw)": 1.9684946537017822, "Pretrain/Step": 12515, "Pretrain/Step Time": 8.46679736673832} +{"Pretrain/Learning Rate": 1.3960157203605678e-05, "Pretrain/Loss": 1.9890775680541992, "Pretrain/Loss (Raw)": 2.0830798149108887, "Pretrain/Step": 12516, "Pretrain/Step Time": 8.467123206704855} +{"Pretrain/Learning Rate": 1.395634853560423e-05, "Pretrain/Loss": 1.9897809028625488, "Pretrain/Loss (Raw)": 2.0331368446350098, "Pretrain/Step": 12517, "Pretrain/Step Time": 8.467709455639124} +{"Pretrain/Learning Rate": 1.3952540186038671e-05, "Pretrain/Loss": 1.99005126953125, "Pretrain/Loss (Raw)": 1.9172158241271973, "Pretrain/Step": 12518, "Pretrain/Step Time": 8.469159230589867} +{"Pretrain/Learning Rate": 1.394873215501884e-05, "Pretrain/Loss": 1.9878042936325073, "Pretrain/Loss (Raw)": 1.9889893531799316, "Pretrain/Step": 12519, "Pretrain/Step Time": 8.46763881854713} +{"Pretrain/Learning Rate": 1.3944924442654517e-05, "Pretrain/Loss": 1.9891736507415771, "Pretrain/Loss (Raw)": 2.128087282180786, "Pretrain/Step": 12520, "Pretrain/Step Time": 8.463231470435858} +{"Pretrain/Learning Rate": 1.3941117049055513e-05, "Pretrain/Loss": 1.987700343132019, "Pretrain/Loss (Raw)": 2.000040054321289, "Pretrain/Step": 12521, "Pretrain/Step Time": 8.461095418781042} +{"Pretrain/Learning Rate": 1.3937309974331605e-05, "Pretrain/Loss": 1.9891998767852783, "Pretrain/Loss (Raw)": 2.2339272499084473, "Pretrain/Step": 12522, "Pretrain/Step Time": 8.462293425574899} +{"Pretrain/Learning Rate": 1.3933503218592552e-05, "Pretrain/Loss": 1.9905388355255127, "Pretrain/Loss (Raw)": 1.9416170120239258, "Pretrain/Step": 12523, "Pretrain/Step Time": 8.461884967982769} +{"Pretrain/Learning Rate": 1.3929696781948149e-05, "Pretrain/Loss": 1.9904520511627197, "Pretrain/Loss (Raw)": 1.9423669576644897, "Pretrain/Step": 12524, "Pretrain/Step Time": 8.460212860256433} +{"Pretrain/Learning Rate": 1.3925890664508117e-05, "Pretrain/Loss": 1.99114191532135, "Pretrain/Loss (Raw)": 1.9918289184570312, "Pretrain/Step": 12525, "Pretrain/Step Time": 8.457612900063396} +{"Pretrain/Learning Rate": 1.3922084866382237e-05, "Pretrain/Loss": 1.9903380870819092, "Pretrain/Loss (Raw)": 1.8840750455856323, "Pretrain/Step": 12526, "Pretrain/Step Time": 8.458048513159156} +{"Pretrain/Learning Rate": 1.3918279387680227e-05, "Pretrain/Loss": 1.9915046691894531, "Pretrain/Loss (Raw)": 2.155806303024292, "Pretrain/Step": 12527, "Pretrain/Step Time": 8.456129727885127} +{"Pretrain/Learning Rate": 1.3914474228511809e-05, "Pretrain/Loss": 1.9925365447998047, "Pretrain/Loss (Raw)": 2.087341785430908, "Pretrain/Step": 12528, "Pretrain/Step Time": 8.456912569701672} +{"Pretrain/Learning Rate": 1.3910669388986724e-05, "Pretrain/Loss": 1.99264395236969, "Pretrain/Loss (Raw)": 1.9224697351455688, "Pretrain/Step": 12529, "Pretrain/Step Time": 8.455216327682137} +{"Pretrain/Learning Rate": 1.3906864869214659e-05, "Pretrain/Loss": 1.9929490089416504, "Pretrain/Loss (Raw)": 2.152923107147217, "Pretrain/Step": 12530, "Pretrain/Step Time": 8.455095885321498} +{"Pretrain/Learning Rate": 1.3903060669305334e-05, "Pretrain/Loss": 1.992952585220337, "Pretrain/Loss (Raw)": 2.042532444000244, "Pretrain/Step": 12531, "Pretrain/Step Time": 8.453099580481648} +{"Pretrain/Learning Rate": 1.3899256789368434e-05, "Pretrain/Loss": 1.990539312362671, "Pretrain/Loss (Raw)": 1.8917651176452637, "Pretrain/Step": 12532, "Pretrain/Step Time": 8.45336046256125} +{"Pretrain/Learning Rate": 1.3895453229513627e-05, "Pretrain/Loss": 1.9916046857833862, "Pretrain/Loss (Raw)": 2.0172369480133057, "Pretrain/Step": 12533, "Pretrain/Step Time": 8.452265098690987} +{"Pretrain/Learning Rate": 1.3891649989850608e-05, "Pretrain/Loss": 1.9913914203643799, "Pretrain/Loss (Raw)": 1.9245859384536743, "Pretrain/Step": 12534, "Pretrain/Step Time": 8.451500359922647} +{"Pretrain/Learning Rate": 1.3887847070489021e-05, "Pretrain/Loss": 1.9919058084487915, "Pretrain/Loss (Raw)": 2.0271971225738525, "Pretrain/Step": 12535, "Pretrain/Step Time": 8.459299581125379} +{"Pretrain/Learning Rate": 1.388404447153854e-05, "Pretrain/Loss": 1.9933273792266846, "Pretrain/Loss (Raw)": 2.134195327758789, "Pretrain/Step": 12536, "Pretrain/Step Time": 8.455938499420881} +{"Pretrain/Learning Rate": 1.38802421931088e-05, "Pretrain/Loss": 1.9937338829040527, "Pretrain/Loss (Raw)": 1.901216745376587, "Pretrain/Step": 12537, "Pretrain/Step Time": 8.455621702596545} +{"Pretrain/Learning Rate": 1.387644023530943e-05, "Pretrain/Loss": 1.9917240142822266, "Pretrain/Loss (Raw)": 1.7626240253448486, "Pretrain/Step": 12538, "Pretrain/Step Time": 8.452006550505757} +{"Pretrain/Learning Rate": 1.387263859825007e-05, "Pretrain/Loss": 1.9918817281723022, "Pretrain/Loss (Raw)": 2.068354606628418, "Pretrain/Step": 12539, "Pretrain/Step Time": 8.452154941856861} +{"Pretrain/Learning Rate": 1.3868837282040326e-05, "Pretrain/Loss": 1.9910236597061157, "Pretrain/Loss (Raw)": 1.730886459350586, "Pretrain/Step": 12540, "Pretrain/Step Time": 8.449130471795797} +{"Pretrain/Learning Rate": 1.386503628678982e-05, "Pretrain/Loss": 1.9918270111083984, "Pretrain/Loss (Raw)": 1.8594136238098145, "Pretrain/Step": 12541, "Pretrain/Step Time": 8.447415690869093} +{"Pretrain/Learning Rate": 1.3861235612608142e-05, "Pretrain/Loss": 1.9913303852081299, "Pretrain/Loss (Raw)": 1.955596685409546, "Pretrain/Step": 12542, "Pretrain/Step Time": 8.452780248597264} +{"Pretrain/Learning Rate": 1.3857435259604876e-05, "Pretrain/Loss": 1.9911737442016602, "Pretrain/Loss (Raw)": 1.9006984233856201, "Pretrain/Step": 12543, "Pretrain/Step Time": 8.451740201562643} +{"Pretrain/Learning Rate": 1.3853635227889616e-05, "Pretrain/Loss": 1.990949034690857, "Pretrain/Loss (Raw)": 2.0412936210632324, "Pretrain/Step": 12544, "Pretrain/Step Time": 8.451990325003862} +{"Pretrain/Learning Rate": 1.3849835517571918e-05, "Pretrain/Loss": 1.992396593093872, "Pretrain/Loss (Raw)": 1.9665496349334717, "Pretrain/Step": 12545, "Pretrain/Step Time": 8.453700635582209} +{"Pretrain/Learning Rate": 1.3846036128761364e-05, "Pretrain/Loss": 1.992219090461731, "Pretrain/Loss (Raw)": 2.098046064376831, "Pretrain/Step": 12546, "Pretrain/Step Time": 8.447016971185803} +{"Pretrain/Learning Rate": 1.3842237061567492e-05, "Pretrain/Loss": 1.9904649257659912, "Pretrain/Loss (Raw)": 1.9432299137115479, "Pretrain/Step": 12547, "Pretrain/Step Time": 8.452494038268924} +{"Pretrain/Learning Rate": 1.3838438316099841e-05, "Pretrain/Loss": 1.990662932395935, "Pretrain/Loss (Raw)": 1.965762734413147, "Pretrain/Step": 12548, "Pretrain/Step Time": 8.44599481485784} +{"Pretrain/Learning Rate": 1.3834639892467962e-05, "Pretrain/Loss": 1.9915038347244263, "Pretrain/Loss (Raw)": 2.054431438446045, "Pretrain/Step": 12549, "Pretrain/Step Time": 8.445434900000691} +{"Pretrain/Learning Rate": 1.3830841790781362e-05, "Pretrain/Loss": 1.9951064586639404, "Pretrain/Loss (Raw)": 2.7169413566589355, "Pretrain/Step": 12550, "Pretrain/Step Time": 8.44356476701796} +{"Pretrain/Learning Rate": 1.3827044011149573e-05, "Pretrain/Loss": 1.9939056634902954, "Pretrain/Loss (Raw)": 1.7560968399047852, "Pretrain/Step": 12551, "Pretrain/Step Time": 8.440848169848323} +{"Pretrain/Learning Rate": 1.3823246553682096e-05, "Pretrain/Loss": 1.9922490119934082, "Pretrain/Loss (Raw)": 2.2223589420318604, "Pretrain/Step": 12552, "Pretrain/Step Time": 8.441746514290571} +{"Pretrain/Learning Rate": 1.381944941848841e-05, "Pretrain/Loss": 1.9891092777252197, "Pretrain/Loss (Raw)": 1.8721827268600464, "Pretrain/Step": 12553, "Pretrain/Step Time": 8.438973790034652} +{"Pretrain/Learning Rate": 1.3815652605678033e-05, "Pretrain/Loss": 1.9902092218399048, "Pretrain/Loss (Raw)": 2.020618200302124, "Pretrain/Step": 12554, "Pretrain/Step Time": 8.436176905408502} +{"Pretrain/Learning Rate": 1.381185611536042e-05, "Pretrain/Loss": 1.9890801906585693, "Pretrain/Loss (Raw)": 1.8317296504974365, "Pretrain/Step": 12555, "Pretrain/Step Time": 8.4355803206563} +{"Pretrain/Learning Rate": 1.3808059947645066e-05, "Pretrain/Loss": 1.9889206886291504, "Pretrain/Loss (Raw)": 1.964636206626892, "Pretrain/Step": 12556, "Pretrain/Step Time": 8.42870812676847} +{"Pretrain/Learning Rate": 1.3804264102641395e-05, "Pretrain/Loss": 1.9911001920700073, "Pretrain/Loss (Raw)": 2.087062358856201, "Pretrain/Step": 12557, "Pretrain/Step Time": 8.425938731059432} +{"Pretrain/Learning Rate": 1.3800468580458887e-05, "Pretrain/Loss": 1.9896639585494995, "Pretrain/Loss (Raw)": 1.9653136730194092, "Pretrain/Step": 12558, "Pretrain/Step Time": 8.429750563576818} +{"Pretrain/Learning Rate": 1.3796673381206967e-05, "Pretrain/Loss": 1.9897688627243042, "Pretrain/Loss (Raw)": 1.9219378232955933, "Pretrain/Step": 12559, "Pretrain/Step Time": 8.43805332109332} +{"Pretrain/Learning Rate": 1.3792878504995066e-05, "Pretrain/Loss": 1.9887192249298096, "Pretrain/Loss (Raw)": 1.9806069135665894, "Pretrain/Step": 12560, "Pretrain/Step Time": 8.435287814587355} +{"Pretrain/Learning Rate": 1.3789083951932625e-05, "Pretrain/Loss": 1.990835189819336, "Pretrain/Loss (Raw)": 2.1137032508850098, "Pretrain/Step": 12561, "Pretrain/Step Time": 8.4333791192621} +{"Pretrain/Learning Rate": 1.378528972212903e-05, "Pretrain/Loss": 1.98829185962677, "Pretrain/Loss (Raw)": 2.020850658416748, "Pretrain/Step": 12562, "Pretrain/Step Time": 8.430574795231223} +{"Pretrain/Learning Rate": 1.3781495815693712e-05, "Pretrain/Loss": 1.9889857769012451, "Pretrain/Loss (Raw)": 2.2402184009552, "Pretrain/Step": 12563, "Pretrain/Step Time": 8.430881233885884} +{"Pretrain/Learning Rate": 1.3777702232736055e-05, "Pretrain/Loss": 1.9893499612808228, "Pretrain/Loss (Raw)": 2.091585636138916, "Pretrain/Step": 12564, "Pretrain/Step Time": 8.430951595306396} +{"Pretrain/Learning Rate": 1.3773908973365435e-05, "Pretrain/Loss": 1.990342140197754, "Pretrain/Loss (Raw)": 2.0434696674346924, "Pretrain/Step": 12565, "Pretrain/Step Time": 8.429217698052526} +{"Pretrain/Learning Rate": 1.3770116037691241e-05, "Pretrain/Loss": 1.9891799688339233, "Pretrain/Loss (Raw)": 2.0121922492980957, "Pretrain/Step": 12566, "Pretrain/Step Time": 8.427372766658664} +{"Pretrain/Learning Rate": 1.3766323425822828e-05, "Pretrain/Loss": 1.9879846572875977, "Pretrain/Loss (Raw)": 1.8541183471679688, "Pretrain/Step": 12567, "Pretrain/Step Time": 8.426669439300895} +{"Pretrain/Learning Rate": 1.3762531137869566e-05, "Pretrain/Loss": 1.988426923751831, "Pretrain/Loss (Raw)": 2.1016499996185303, "Pretrain/Step": 12568, "Pretrain/Step Time": 8.425837617367506} +{"Pretrain/Learning Rate": 1.3758739173940802e-05, "Pretrain/Loss": 1.9883790016174316, "Pretrain/Loss (Raw)": 1.908435583114624, "Pretrain/Step": 12569, "Pretrain/Step Time": 8.423817124217749} +{"Pretrain/Learning Rate": 1.3754947534145857e-05, "Pretrain/Loss": 1.9894427061080933, "Pretrain/Loss (Raw)": 2.0487518310546875, "Pretrain/Step": 12570, "Pretrain/Step Time": 8.422957116737962} +{"Pretrain/Learning Rate": 1.375115621859408e-05, "Pretrain/Loss": 1.9905409812927246, "Pretrain/Loss (Raw)": 2.009758710861206, "Pretrain/Step": 12571, "Pretrain/Step Time": 8.422681907191873} +{"Pretrain/Learning Rate": 1.3747365227394776e-05, "Pretrain/Loss": 1.9913214445114136, "Pretrain/Loss (Raw)": 1.8659000396728516, "Pretrain/Step": 12572, "Pretrain/Step Time": 8.414861526340246} +{"Pretrain/Learning Rate": 1.3743574560657275e-05, "Pretrain/Loss": 1.9932518005371094, "Pretrain/Loss (Raw)": 2.074619770050049, "Pretrain/Step": 12573, "Pretrain/Step Time": 8.414751121774316} +{"Pretrain/Learning Rate": 1.3739784218490864e-05, "Pretrain/Loss": 1.994751214981079, "Pretrain/Loss (Raw)": 2.1453769207000732, "Pretrain/Step": 12574, "Pretrain/Step Time": 8.413873251527548} +{"Pretrain/Learning Rate": 1.3735994201004825e-05, "Pretrain/Loss": 1.9956276416778564, "Pretrain/Loss (Raw)": 1.9894073009490967, "Pretrain/Step": 12575, "Pretrain/Step Time": 8.420025825500488} +{"Pretrain/Learning Rate": 1.3732204508308466e-05, "Pretrain/Loss": 1.9979931116104126, "Pretrain/Loss (Raw)": 1.9229786396026611, "Pretrain/Step": 12576, "Pretrain/Step Time": 8.418218782171607} +{"Pretrain/Learning Rate": 1.3728415140511036e-05, "Pretrain/Loss": 1.9972347021102905, "Pretrain/Loss (Raw)": 1.7739487886428833, "Pretrain/Step": 12577, "Pretrain/Step Time": 8.419935258105397} +{"Pretrain/Learning Rate": 1.3724626097721819e-05, "Pretrain/Loss": 1.9972628355026245, "Pretrain/Loss (Raw)": 2.059237003326416, "Pretrain/Step": 12578, "Pretrain/Step Time": 8.418349865823984} +{"Pretrain/Learning Rate": 1.3720837380050062e-05, "Pretrain/Loss": 1.9953819513320923, "Pretrain/Loss (Raw)": 1.9011296033859253, "Pretrain/Step": 12579, "Pretrain/Step Time": 8.42279035039246} +{"Pretrain/Learning Rate": 1.3717048987604994e-05, "Pretrain/Loss": 1.997377634048462, "Pretrain/Loss (Raw)": 2.0501251220703125, "Pretrain/Step": 12580, "Pretrain/Step Time": 8.423261011019349} +{"Pretrain/Learning Rate": 1.3713260920495874e-05, "Pretrain/Loss": 1.9957916736602783, "Pretrain/Loss (Raw)": 1.5364196300506592, "Pretrain/Step": 12581, "Pretrain/Step Time": 8.424692058935761} +{"Pretrain/Learning Rate": 1.370947317883191e-05, "Pretrain/Loss": 1.9941655397415161, "Pretrain/Loss (Raw)": 1.8106108903884888, "Pretrain/Step": 12582, "Pretrain/Step Time": 8.42318850941956} +{"Pretrain/Learning Rate": 1.3705685762722343e-05, "Pretrain/Loss": 1.9921579360961914, "Pretrain/Loss (Raw)": 1.8982754945755005, "Pretrain/Step": 12583, "Pretrain/Step Time": 8.426837811246514} +{"Pretrain/Learning Rate": 1.3701898672276348e-05, "Pretrain/Loss": 1.9926782846450806, "Pretrain/Loss (Raw)": 1.9213736057281494, "Pretrain/Step": 12584, "Pretrain/Step Time": 8.419565554708242} +{"Pretrain/Learning Rate": 1.3698111907603154e-05, "Pretrain/Loss": 1.9924311637878418, "Pretrain/Loss (Raw)": 2.048304796218872, "Pretrain/Step": 12585, "Pretrain/Step Time": 8.41609936580062} +{"Pretrain/Learning Rate": 1.3694325468811935e-05, "Pretrain/Loss": 1.992098331451416, "Pretrain/Loss (Raw)": 2.115234851837158, "Pretrain/Step": 12586, "Pretrain/Step Time": 8.41570769995451} +{"Pretrain/Learning Rate": 1.3690539356011862e-05, "Pretrain/Loss": 1.9957473278045654, "Pretrain/Loss (Raw)": 2.361194372177124, "Pretrain/Step": 12587, "Pretrain/Step Time": 8.414716126397252} +{"Pretrain/Learning Rate": 1.3686753569312122e-05, "Pretrain/Loss": 1.995217204093933, "Pretrain/Loss (Raw)": 1.9134567975997925, "Pretrain/Step": 12588, "Pretrain/Step Time": 8.413222189992666} +{"Pretrain/Learning Rate": 1.3682968108821858e-05, "Pretrain/Loss": 1.9927997589111328, "Pretrain/Loss (Raw)": 1.8415908813476562, "Pretrain/Step": 12589, "Pretrain/Step Time": 8.410174544900656} +{"Pretrain/Learning Rate": 1.367918297465024e-05, "Pretrain/Loss": 1.9902180433273315, "Pretrain/Loss (Raw)": 1.9111552238464355, "Pretrain/Step": 12590, "Pretrain/Step Time": 8.419221809133887} +{"Pretrain/Learning Rate": 1.36753981669064e-05, "Pretrain/Loss": 1.9902350902557373, "Pretrain/Loss (Raw)": 2.1031315326690674, "Pretrain/Step": 12591, "Pretrain/Step Time": 8.42149548791349} +{"Pretrain/Learning Rate": 1.3671613685699463e-05, "Pretrain/Loss": 1.9905779361724854, "Pretrain/Loss (Raw)": 2.0832595825195312, "Pretrain/Step": 12592, "Pretrain/Step Time": 8.42157636769116} +{"Pretrain/Learning Rate": 1.3667829531138568e-05, "Pretrain/Loss": 1.9905645847320557, "Pretrain/Loss (Raw)": 2.086463689804077, "Pretrain/Step": 12593, "Pretrain/Step Time": 8.425391662865877} +{"Pretrain/Learning Rate": 1.3664045703332811e-05, "Pretrain/Loss": 1.9891133308410645, "Pretrain/Loss (Raw)": 1.9272617101669312, "Pretrain/Step": 12594, "Pretrain/Step Time": 8.4251176007092} +{"Pretrain/Learning Rate": 1.3660262202391314e-05, "Pretrain/Loss": 1.9897485971450806, "Pretrain/Loss (Raw)": 2.124173164367676, "Pretrain/Step": 12595, "Pretrain/Step Time": 8.43391210027039} +{"Pretrain/Learning Rate": 1.3656479028423161e-05, "Pretrain/Loss": 1.9894864559173584, "Pretrain/Loss (Raw)": 1.7387586832046509, "Pretrain/Step": 12596, "Pretrain/Step Time": 8.433577984571457} +{"Pretrain/Learning Rate": 1.365269618153743e-05, "Pretrain/Loss": 1.99041748046875, "Pretrain/Loss (Raw)": 2.1114866733551025, "Pretrain/Step": 12597, "Pretrain/Step Time": 8.436419110745192} +{"Pretrain/Learning Rate": 1.3648913661843216e-05, "Pretrain/Loss": 1.990417718887329, "Pretrain/Loss (Raw)": 2.066723346710205, "Pretrain/Step": 12598, "Pretrain/Step Time": 8.437077017500997} +{"Pretrain/Learning Rate": 1.3645131469449562e-05, "Pretrain/Loss": 1.9883664846420288, "Pretrain/Loss (Raw)": 1.965465784072876, "Pretrain/Step": 12599, "Pretrain/Step Time": 8.43575881049037} +{"Pretrain/Learning Rate": 1.3641349604465547e-05, "Pretrain/Loss": 1.9892504215240479, "Pretrain/Loss (Raw)": 2.029344081878662, "Pretrain/Step": 12600, "Pretrain/Step Time": 8.432762226089835} +{"Pretrain/Learning Rate": 1.3637568067000212e-05, "Pretrain/Loss": 1.991729736328125, "Pretrain/Loss (Raw)": 2.4460341930389404, "Pretrain/Step": 12601, "Pretrain/Step Time": 8.434967461973429} +{"Pretrain/Learning Rate": 1.3633786857162584e-05, "Pretrain/Loss": 1.9932372570037842, "Pretrain/Loss (Raw)": 2.074234962463379, "Pretrain/Step": 12602, "Pretrain/Step Time": 8.426928363740444} +{"Pretrain/Learning Rate": 1.3630005975061705e-05, "Pretrain/Loss": 1.9919943809509277, "Pretrain/Loss (Raw)": 1.9069182872772217, "Pretrain/Step": 12603, "Pretrain/Step Time": 8.425966428592801} +{"Pretrain/Learning Rate": 1.3626225420806577e-05, "Pretrain/Loss": 1.991399884223938, "Pretrain/Loss (Raw)": 1.9796115159988403, "Pretrain/Step": 12604, "Pretrain/Step Time": 8.428886499255896} +{"Pretrain/Learning Rate": 1.3622445194506234e-05, "Pretrain/Loss": 1.9924429655075073, "Pretrain/Loss (Raw)": 1.9059451818466187, "Pretrain/Step": 12605, "Pretrain/Step Time": 8.428295195102692} +{"Pretrain/Learning Rate": 1.3618665296269661e-05, "Pretrain/Loss": 1.9983186721801758, "Pretrain/Loss (Raw)": 2.096006155014038, "Pretrain/Step": 12606, "Pretrain/Step Time": 8.424914233386517} +{"Pretrain/Learning Rate": 1.3614885726205845e-05, "Pretrain/Loss": 2.0021469593048096, "Pretrain/Loss (Raw)": 2.4134721755981445, "Pretrain/Step": 12607, "Pretrain/Step Time": 8.426378428936005} +{"Pretrain/Learning Rate": 1.361110648442378e-05, "Pretrain/Loss": 2.0024571418762207, "Pretrain/Loss (Raw)": 2.1829848289489746, "Pretrain/Step": 12608, "Pretrain/Step Time": 8.428767312318087} +{"Pretrain/Learning Rate": 1.3607327571032421e-05, "Pretrain/Loss": 2.0033912658691406, "Pretrain/Loss (Raw)": 1.887594223022461, "Pretrain/Step": 12609, "Pretrain/Step Time": 8.430015748366714} +{"Pretrain/Learning Rate": 1.3603548986140752e-05, "Pretrain/Loss": 2.0034666061401367, "Pretrain/Loss (Raw)": 1.7691094875335693, "Pretrain/Step": 12610, "Pretrain/Step Time": 8.42781506665051} +{"Pretrain/Learning Rate": 1.359977072985771e-05, "Pretrain/Loss": 2.0013394355773926, "Pretrain/Loss (Raw)": 2.018815040588379, "Pretrain/Step": 12611, "Pretrain/Step Time": 8.43008229881525} +{"Pretrain/Learning Rate": 1.3595992802292235e-05, "Pretrain/Loss": 2.001208543777466, "Pretrain/Loss (Raw)": 1.8533045053482056, "Pretrain/Step": 12612, "Pretrain/Step Time": 8.426412647590041} +{"Pretrain/Learning Rate": 1.3592215203553279e-05, "Pretrain/Loss": 2.0041112899780273, "Pretrain/Loss (Raw)": 2.1909477710723877, "Pretrain/Step": 12613, "Pretrain/Step Time": 8.425254482775927} +{"Pretrain/Learning Rate": 1.3588437933749746e-05, "Pretrain/Loss": 2.0035505294799805, "Pretrain/Loss (Raw)": 2.0465266704559326, "Pretrain/Step": 12614, "Pretrain/Step Time": 8.428276488557458} +{"Pretrain/Learning Rate": 1.3584660992990567e-05, "Pretrain/Loss": 2.0064785480499268, "Pretrain/Loss (Raw)": 2.0295543670654297, "Pretrain/Step": 12615, "Pretrain/Step Time": 8.429260540753603} +{"Pretrain/Learning Rate": 1.3580884381384645e-05, "Pretrain/Loss": 2.0035762786865234, "Pretrain/Loss (Raw)": 1.7505244016647339, "Pretrain/Step": 12616, "Pretrain/Step Time": 8.430223086848855} +{"Pretrain/Learning Rate": 1.3577108099040858e-05, "Pretrain/Loss": 2.0053277015686035, "Pretrain/Loss (Raw)": 2.1304309368133545, "Pretrain/Step": 12617, "Pretrain/Step Time": 8.427818305790424} +{"Pretrain/Learning Rate": 1.3573332146068121e-05, "Pretrain/Loss": 2.0060880184173584, "Pretrain/Loss (Raw)": 2.0224926471710205, "Pretrain/Step": 12618, "Pretrain/Step Time": 8.427633544430137} +{"Pretrain/Learning Rate": 1.3569556522575284e-05, "Pretrain/Loss": 2.008619785308838, "Pretrain/Loss (Raw)": 2.0994701385498047, "Pretrain/Step": 12619, "Pretrain/Step Time": 8.424187744036317} +{"Pretrain/Learning Rate": 1.3565781228671238e-05, "Pretrain/Loss": 2.006897449493408, "Pretrain/Loss (Raw)": 1.8499634265899658, "Pretrain/Step": 12620, "Pretrain/Step Time": 8.42494804225862} +{"Pretrain/Learning Rate": 1.3562006264464828e-05, "Pretrain/Loss": 2.0054526329040527, "Pretrain/Loss (Raw)": 1.8814952373504639, "Pretrain/Step": 12621, "Pretrain/Step Time": 8.428036293014884} +{"Pretrain/Learning Rate": 1.3558231630064894e-05, "Pretrain/Loss": 2.001218318939209, "Pretrain/Loss (Raw)": 1.8645946979522705, "Pretrain/Step": 12622, "Pretrain/Step Time": 8.428850693628192} +{"Pretrain/Learning Rate": 1.3554457325580294e-05, "Pretrain/Loss": 2.0035810470581055, "Pretrain/Loss (Raw)": 2.1683526039123535, "Pretrain/Step": 12623, "Pretrain/Step Time": 8.425390623509884} +{"Pretrain/Learning Rate": 1.3550683351119842e-05, "Pretrain/Loss": 2.003741502761841, "Pretrain/Loss (Raw)": 1.8617035150527954, "Pretrain/Step": 12624, "Pretrain/Step Time": 8.428594106808305} +{"Pretrain/Learning Rate": 1.354690970679237e-05, "Pretrain/Loss": 2.00368332862854, "Pretrain/Loss (Raw)": 2.046477794647217, "Pretrain/Step": 12625, "Pretrain/Step Time": 8.428807310760021} +{"Pretrain/Learning Rate": 1.3543136392706685e-05, "Pretrain/Loss": 2.0078721046447754, "Pretrain/Loss (Raw)": 2.531651258468628, "Pretrain/Step": 12626, "Pretrain/Step Time": 8.428208177909255} +{"Pretrain/Learning Rate": 1.3539363408971578e-05, "Pretrain/Loss": 2.008953094482422, "Pretrain/Loss (Raw)": 2.010953903198242, "Pretrain/Step": 12627, "Pretrain/Step Time": 8.430843016132712} +{"Pretrain/Learning Rate": 1.3535590755695854e-05, "Pretrain/Loss": 2.0090208053588867, "Pretrain/Loss (Raw)": 1.9586260318756104, "Pretrain/Step": 12628, "Pretrain/Step Time": 8.429821630939841} +{"Pretrain/Learning Rate": 1.353181843298828e-05, "Pretrain/Loss": 2.0091331005096436, "Pretrain/Loss (Raw)": 1.9168857336044312, "Pretrain/Step": 12629, "Pretrain/Step Time": 8.427027765661478} +{"Pretrain/Learning Rate": 1.3528046440957648e-05, "Pretrain/Loss": 2.0117011070251465, "Pretrain/Loss (Raw)": 2.0999646186828613, "Pretrain/Step": 12630, "Pretrain/Step Time": 8.425716603174806} +{"Pretrain/Learning Rate": 1.3524274779712709e-05, "Pretrain/Loss": 2.010800838470459, "Pretrain/Loss (Raw)": 2.1471314430236816, "Pretrain/Step": 12631, "Pretrain/Step Time": 8.431818049401045} +{"Pretrain/Learning Rate": 1.3520503449362204e-05, "Pretrain/Loss": 2.0082285404205322, "Pretrain/Loss (Raw)": 1.9426918029785156, "Pretrain/Step": 12632, "Pretrain/Step Time": 8.429957551881671} +{"Pretrain/Learning Rate": 1.3516732450014901e-05, "Pretrain/Loss": 2.008314609527588, "Pretrain/Loss (Raw)": 2.04960560798645, "Pretrain/Step": 12633, "Pretrain/Step Time": 8.429054291918874} +{"Pretrain/Learning Rate": 1.3512961781779515e-05, "Pretrain/Loss": 2.0086252689361572, "Pretrain/Loss (Raw)": 2.04293155670166, "Pretrain/Step": 12634, "Pretrain/Step Time": 8.425110215321183} +{"Pretrain/Learning Rate": 1.3509191444764788e-05, "Pretrain/Loss": 2.0091545581817627, "Pretrain/Loss (Raw)": 1.8149217367172241, "Pretrain/Step": 12635, "Pretrain/Step Time": 8.424081282690167} +{"Pretrain/Learning Rate": 1.3505421439079424e-05, "Pretrain/Loss": 2.0083656311035156, "Pretrain/Loss (Raw)": 1.8370819091796875, "Pretrain/Step": 12636, "Pretrain/Step Time": 8.42142315581441} +{"Pretrain/Learning Rate": 1.3501651764832119e-05, "Pretrain/Loss": 2.0094499588012695, "Pretrain/Loss (Raw)": 2.1645517349243164, "Pretrain/Step": 12637, "Pretrain/Step Time": 8.419509125873446} +{"Pretrain/Learning Rate": 1.349788242213159e-05, "Pretrain/Loss": 2.00789737701416, "Pretrain/Loss (Raw)": 1.9993159770965576, "Pretrain/Step": 12638, "Pretrain/Step Time": 8.421371392905712} +{"Pretrain/Learning Rate": 1.3494113411086506e-05, "Pretrain/Loss": 2.00681471824646, "Pretrain/Loss (Raw)": 2.0287115573883057, "Pretrain/Step": 12639, "Pretrain/Step Time": 8.424782620742917} +{"Pretrain/Learning Rate": 1.3490344731805566e-05, "Pretrain/Loss": 2.007725954055786, "Pretrain/Loss (Raw)": 2.027864933013916, "Pretrain/Step": 12640, "Pretrain/Step Time": 8.42476774379611} +{"Pretrain/Learning Rate": 1.3486576384397404e-05, "Pretrain/Loss": 2.0082662105560303, "Pretrain/Loss (Raw)": 1.9400848150253296, "Pretrain/Step": 12641, "Pretrain/Step Time": 8.423176072537899} +{"Pretrain/Learning Rate": 1.3482808368970707e-05, "Pretrain/Loss": 2.006916046142578, "Pretrain/Loss (Raw)": 2.0180885791778564, "Pretrain/Step": 12642, "Pretrain/Step Time": 8.424758840352297} +{"Pretrain/Learning Rate": 1.347904068563411e-05, "Pretrain/Loss": 2.006993055343628, "Pretrain/Loss (Raw)": 1.9783319234848022, "Pretrain/Step": 12643, "Pretrain/Step Time": 8.430767636746168} +{"Pretrain/Learning Rate": 1.347527333449624e-05, "Pretrain/Loss": 2.0048556327819824, "Pretrain/Loss (Raw)": 1.80951726436615, "Pretrain/Step": 12644, "Pretrain/Step Time": 8.432206235826015} +{"Pretrain/Learning Rate": 1.3471506315665755e-05, "Pretrain/Loss": 2.005746364593506, "Pretrain/Loss (Raw)": 2.14713191986084, "Pretrain/Step": 12645, "Pretrain/Step Time": 8.4348778501153} +{"Pretrain/Learning Rate": 1.3467739629251244e-05, "Pretrain/Loss": 2.005767345428467, "Pretrain/Loss (Raw)": 1.9198968410491943, "Pretrain/Step": 12646, "Pretrain/Step Time": 8.432926574721932} +{"Pretrain/Learning Rate": 1.346397327536134e-05, "Pretrain/Loss": 2.005324363708496, "Pretrain/Loss (Raw)": 1.9322969913482666, "Pretrain/Step": 12647, "Pretrain/Step Time": 8.43510177731514} +{"Pretrain/Learning Rate": 1.346020725410464e-05, "Pretrain/Loss": 2.0058529376983643, "Pretrain/Loss (Raw)": 2.1957345008850098, "Pretrain/Step": 12648, "Pretrain/Step Time": 8.43607684224844} +{"Pretrain/Learning Rate": 1.3456441565589717e-05, "Pretrain/Loss": 2.0064492225646973, "Pretrain/Loss (Raw)": 2.0763673782348633, "Pretrain/Step": 12649, "Pretrain/Step Time": 8.440827775746584} +{"Pretrain/Learning Rate": 1.345267620992517e-05, "Pretrain/Loss": 2.0039820671081543, "Pretrain/Loss (Raw)": 1.9181300401687622, "Pretrain/Step": 12650, "Pretrain/Step Time": 8.435816260054708} +{"Pretrain/Learning Rate": 1.3448911187219556e-05, "Pretrain/Loss": 2.0021536350250244, "Pretrain/Loss (Raw)": 1.7075899839401245, "Pretrain/Step": 12651, "Pretrain/Step Time": 8.432682406157255} +{"Pretrain/Learning Rate": 1.3445146497581457e-05, "Pretrain/Loss": 2.001765489578247, "Pretrain/Loss (Raw)": 1.8926624059677124, "Pretrain/Step": 12652, "Pretrain/Step Time": 8.43340688943863} +{"Pretrain/Learning Rate": 1.3441382141119401e-05, "Pretrain/Loss": 2.0043869018554688, "Pretrain/Loss (Raw)": 2.3273661136627197, "Pretrain/Step": 12653, "Pretrain/Step Time": 8.429069707170129} +{"Pretrain/Learning Rate": 1.3437618117941953e-05, "Pretrain/Loss": 2.0063669681549072, "Pretrain/Loss (Raw)": 2.1375293731689453, "Pretrain/Step": 12654, "Pretrain/Step Time": 8.437552673742175} +{"Pretrain/Learning Rate": 1.3433854428157636e-05, "Pretrain/Loss": 2.0055418014526367, "Pretrain/Loss (Raw)": 2.0502192974090576, "Pretrain/Step": 12655, "Pretrain/Step Time": 8.434924870729446} +{"Pretrain/Learning Rate": 1.3430091071874961e-05, "Pretrain/Loss": 2.005404233932495, "Pretrain/Loss (Raw)": 2.0697193145751953, "Pretrain/Step": 12656, "Pretrain/Step Time": 8.43542568013072} +{"Pretrain/Learning Rate": 1.3426328049202469e-05, "Pretrain/Loss": 2.0079233646392822, "Pretrain/Loss (Raw)": 2.2449257373809814, "Pretrain/Step": 12657, "Pretrain/Step Time": 8.438724713400006} +{"Pretrain/Learning Rate": 1.3422565360248635e-05, "Pretrain/Loss": 2.007322311401367, "Pretrain/Loss (Raw)": 2.0759663581848145, "Pretrain/Step": 12658, "Pretrain/Step Time": 8.442886620759964} +{"Pretrain/Learning Rate": 1.3418803005121977e-05, "Pretrain/Loss": 2.006965160369873, "Pretrain/Loss (Raw)": 1.996804118156433, "Pretrain/Step": 12659, "Pretrain/Step Time": 8.443516271188855} +{"Pretrain/Learning Rate": 1.3415040983930972e-05, "Pretrain/Loss": 2.0052480697631836, "Pretrain/Loss (Raw)": 1.6720161437988281, "Pretrain/Step": 12660, "Pretrain/Step Time": 8.44633130915463} +{"Pretrain/Learning Rate": 1.3411279296784079e-05, "Pretrain/Loss": 2.0042927265167236, "Pretrain/Loss (Raw)": 1.894920825958252, "Pretrain/Step": 12661, "Pretrain/Step Time": 8.446422478184104} +{"Pretrain/Learning Rate": 1.340751794378979e-05, "Pretrain/Loss": 2.005357503890991, "Pretrain/Loss (Raw)": 2.0608956813812256, "Pretrain/Step": 12662, "Pretrain/Step Time": 8.448400441557169} +{"Pretrain/Learning Rate": 1.3403756925056543e-05, "Pretrain/Loss": 2.00579571723938, "Pretrain/Loss (Raw)": 2.0832672119140625, "Pretrain/Step": 12663, "Pretrain/Step Time": 8.441270761191845} +{"Pretrain/Learning Rate": 1.3399996240692797e-05, "Pretrain/Loss": 2.0040462017059326, "Pretrain/Loss (Raw)": 1.9102720022201538, "Pretrain/Step": 12664, "Pretrain/Step Time": 8.439328903332353} +{"Pretrain/Learning Rate": 1.339623589080698e-05, "Pretrain/Loss": 2.0046725273132324, "Pretrain/Loss (Raw)": 1.981397032737732, "Pretrain/Step": 12665, "Pretrain/Step Time": 8.437315681949258} +{"Pretrain/Learning Rate": 1.3392475875507516e-05, "Pretrain/Loss": 2.0070104598999023, "Pretrain/Loss (Raw)": 2.0618560314178467, "Pretrain/Step": 12666, "Pretrain/Step Time": 8.436667986214161} +{"Pretrain/Learning Rate": 1.3388716194902833e-05, "Pretrain/Loss": 2.0072975158691406, "Pretrain/Loss (Raw)": 2.105090379714966, "Pretrain/Step": 12667, "Pretrain/Step Time": 8.436409916728735} +{"Pretrain/Learning Rate": 1.3384956849101323e-05, "Pretrain/Loss": 2.009859561920166, "Pretrain/Loss (Raw)": 2.058861494064331, "Pretrain/Step": 12668, "Pretrain/Step Time": 8.439884578809142} +{"Pretrain/Learning Rate": 1.3381197838211407e-05, "Pretrain/Loss": 2.0097904205322266, "Pretrain/Loss (Raw)": 1.8505622148513794, "Pretrain/Step": 12669, "Pretrain/Step Time": 8.436428872868419} +{"Pretrain/Learning Rate": 1.3377439162341459e-05, "Pretrain/Loss": 2.0115325450897217, "Pretrain/Loss (Raw)": 2.1785635948181152, "Pretrain/Step": 12670, "Pretrain/Step Time": 8.438242526724935} +{"Pretrain/Learning Rate": 1.3373680821599849e-05, "Pretrain/Loss": 2.0139617919921875, "Pretrain/Loss (Raw)": 2.211663007736206, "Pretrain/Step": 12671, "Pretrain/Step Time": 8.435771649703383} +{"Pretrain/Learning Rate": 1.3369922816094968e-05, "Pretrain/Loss": 2.011199712753296, "Pretrain/Loss (Raw)": 1.68775475025177, "Pretrain/Step": 12672, "Pretrain/Step Time": 8.439118029549718} +{"Pretrain/Learning Rate": 1.3366165145935152e-05, "Pretrain/Loss": 2.01177978515625, "Pretrain/Loss (Raw)": 2.040790557861328, "Pretrain/Step": 12673, "Pretrain/Step Time": 8.438892411068082} +{"Pretrain/Learning Rate": 1.3362407811228775e-05, "Pretrain/Loss": 2.01106595993042, "Pretrain/Loss (Raw)": 2.006680488586426, "Pretrain/Step": 12674, "Pretrain/Step Time": 8.445561541244388} +{"Pretrain/Learning Rate": 1.3358650812084164e-05, "Pretrain/Loss": 2.012115955352783, "Pretrain/Loss (Raw)": 2.0776255130767822, "Pretrain/Step": 12675, "Pretrain/Step Time": 8.44074041582644} +{"Pretrain/Learning Rate": 1.335489414860964e-05, "Pretrain/Loss": 2.012014150619507, "Pretrain/Loss (Raw)": 1.9527323246002197, "Pretrain/Step": 12676, "Pretrain/Step Time": 8.443485913798213} +{"Pretrain/Learning Rate": 1.3351137820913546e-05, "Pretrain/Loss": 2.011005401611328, "Pretrain/Loss (Raw)": 1.9253000020980835, "Pretrain/Step": 12677, "Pretrain/Step Time": 8.442139094695449} +{"Pretrain/Learning Rate": 1.3347381829104167e-05, "Pretrain/Loss": 2.0067291259765625, "Pretrain/Loss (Raw)": 2.1695966720581055, "Pretrain/Step": 12678, "Pretrain/Step Time": 8.447702603414655} +{"Pretrain/Learning Rate": 1.334362617328983e-05, "Pretrain/Loss": 2.0086209774017334, "Pretrain/Loss (Raw)": 1.9982296228408813, "Pretrain/Step": 12679, "Pretrain/Step Time": 8.446175079792738} +{"Pretrain/Learning Rate": 1.3339870853578815e-05, "Pretrain/Loss": 2.009752035140991, "Pretrain/Loss (Raw)": 2.367147207260132, "Pretrain/Step": 12680, "Pretrain/Step Time": 8.445831643417478} +{"Pretrain/Learning Rate": 1.3336115870079396e-05, "Pretrain/Loss": 2.0102896690368652, "Pretrain/Loss (Raw)": 1.9410167932510376, "Pretrain/Step": 12681, "Pretrain/Step Time": 8.4460632763803} +{"Pretrain/Learning Rate": 1.333236122289986e-05, "Pretrain/Loss": 2.0101311206817627, "Pretrain/Loss (Raw)": 2.000319004058838, "Pretrain/Step": 12682, "Pretrain/Step Time": 8.444549776613712} +{"Pretrain/Learning Rate": 1.3328606912148455e-05, "Pretrain/Loss": 2.0107743740081787, "Pretrain/Loss (Raw)": 1.9140559434890747, "Pretrain/Step": 12683, "Pretrain/Step Time": 8.443606110289693} +{"Pretrain/Learning Rate": 1.3324852937933452e-05, "Pretrain/Loss": 2.0136594772338867, "Pretrain/Loss (Raw)": 2.3339245319366455, "Pretrain/Step": 12684, "Pretrain/Step Time": 8.442373428493738} +{"Pretrain/Learning Rate": 1.3321099300363083e-05, "Pretrain/Loss": 2.0135464668273926, "Pretrain/Loss (Raw)": 2.0725796222686768, "Pretrain/Step": 12685, "Pretrain/Step Time": 8.442298751324415} +{"Pretrain/Learning Rate": 1.3317345999545575e-05, "Pretrain/Loss": 2.0123484134674072, "Pretrain/Loss (Raw)": 1.8119639158248901, "Pretrain/Step": 12686, "Pretrain/Step Time": 8.441502584144473} +{"Pretrain/Learning Rate": 1.3313593035589167e-05, "Pretrain/Loss": 2.014073371887207, "Pretrain/Loss (Raw)": 2.1427667140960693, "Pretrain/Step": 12687, "Pretrain/Step Time": 8.435053372755647} +{"Pretrain/Learning Rate": 1.3309840408602057e-05, "Pretrain/Loss": 2.0139057636260986, "Pretrain/Loss (Raw)": 1.9591422080993652, "Pretrain/Step": 12688, "Pretrain/Step Time": 8.438172314316034} +{"Pretrain/Learning Rate": 1.3306088118692467e-05, "Pretrain/Loss": 2.0125222206115723, "Pretrain/Loss (Raw)": 1.9366074800491333, "Pretrain/Step": 12689, "Pretrain/Step Time": 8.441325223073363} +{"Pretrain/Learning Rate": 1.3302336165968582e-05, "Pretrain/Loss": 2.0118424892425537, "Pretrain/Loss (Raw)": 1.9338260889053345, "Pretrain/Step": 12690, "Pretrain/Step Time": 8.439647696912289} +{"Pretrain/Learning Rate": 1.329858455053858e-05, "Pretrain/Loss": 2.0092921257019043, "Pretrain/Loss (Raw)": 1.913778305053711, "Pretrain/Step": 12691, "Pretrain/Step Time": 8.441510703414679} +{"Pretrain/Learning Rate": 1.3294833272510649e-05, "Pretrain/Loss": 2.0089547634124756, "Pretrain/Loss (Raw)": 2.048410177230835, "Pretrain/Step": 12692, "Pretrain/Step Time": 8.448085471987724} +{"Pretrain/Learning Rate": 1.3291082331992944e-05, "Pretrain/Loss": 2.0106589794158936, "Pretrain/Loss (Raw)": 2.26161527633667, "Pretrain/Step": 12693, "Pretrain/Step Time": 8.445876808837056} +{"Pretrain/Learning Rate": 1.3287331729093634e-05, "Pretrain/Loss": 2.0095973014831543, "Pretrain/Loss (Raw)": 1.8763030767440796, "Pretrain/Step": 12694, "Pretrain/Step Time": 8.449858468025923} +{"Pretrain/Learning Rate": 1.3283581463920852e-05, "Pretrain/Loss": 2.0100812911987305, "Pretrain/Loss (Raw)": 1.9160635471343994, "Pretrain/Step": 12695, "Pretrain/Step Time": 8.447503885254264} +{"Pretrain/Learning Rate": 1.3279831536582732e-05, "Pretrain/Loss": 2.0099337100982666, "Pretrain/Loss (Raw)": 2.0827507972717285, "Pretrain/Step": 12696, "Pretrain/Step Time": 8.449034675955772} +{"Pretrain/Learning Rate": 1.3276081947187418e-05, "Pretrain/Loss": 2.0114431381225586, "Pretrain/Loss (Raw)": 2.1016578674316406, "Pretrain/Step": 12697, "Pretrain/Step Time": 8.451791631057858} +{"Pretrain/Learning Rate": 1.327233269584301e-05, "Pretrain/Loss": 2.0122900009155273, "Pretrain/Loss (Raw)": 2.157134532928467, "Pretrain/Step": 12698, "Pretrain/Step Time": 8.45069194957614} +{"Pretrain/Learning Rate": 1.3268583782657626e-05, "Pretrain/Loss": 2.0139353275299072, "Pretrain/Loss (Raw)": 2.220349073410034, "Pretrain/Step": 12699, "Pretrain/Step Time": 8.44733765348792} +{"Pretrain/Learning Rate": 1.326483520773936e-05, "Pretrain/Loss": 2.0154900550842285, "Pretrain/Loss (Raw)": 2.0649051666259766, "Pretrain/Step": 12700, "Pretrain/Step Time": 8.44470820389688} +{"Pretrain/Learning Rate": 1.3261086971196287e-05, "Pretrain/Loss": 2.0143990516662598, "Pretrain/Loss (Raw)": 1.9349620342254639, "Pretrain/Step": 12701, "Pretrain/Step Time": 8.444426072761416} +{"Pretrain/Learning Rate": 1.325733907313651e-05, "Pretrain/Loss": 2.011972427368164, "Pretrain/Loss (Raw)": 1.8348110914230347, "Pretrain/Step": 12702, "Pretrain/Step Time": 8.444594388827682} +{"Pretrain/Learning Rate": 1.3253591513668067e-05, "Pretrain/Loss": 2.0118250846862793, "Pretrain/Loss (Raw)": 1.9705429077148438, "Pretrain/Step": 12703, "Pretrain/Step Time": 8.44202395901084} +{"Pretrain/Learning Rate": 1.3249844292899043e-05, "Pretrain/Loss": 2.01218843460083, "Pretrain/Loss (Raw)": 1.9694792032241821, "Pretrain/Step": 12704, "Pretrain/Step Time": 8.449969427660108} +{"Pretrain/Learning Rate": 1.324609741093748e-05, "Pretrain/Loss": 2.014897584915161, "Pretrain/Loss (Raw)": 2.120723009109497, "Pretrain/Step": 12705, "Pretrain/Step Time": 8.446909833699465} +{"Pretrain/Learning Rate": 1.3242350867891402e-05, "Pretrain/Loss": 2.014491319656372, "Pretrain/Loss (Raw)": 2.0072052478790283, "Pretrain/Step": 12706, "Pretrain/Step Time": 8.449650507420301} +{"Pretrain/Learning Rate": 1.3238604663868854e-05, "Pretrain/Loss": 2.0156707763671875, "Pretrain/Loss (Raw)": 2.052128791809082, "Pretrain/Step": 12707, "Pretrain/Step Time": 8.445676369592547} +{"Pretrain/Learning Rate": 1.323485879897784e-05, "Pretrain/Loss": 2.014878273010254, "Pretrain/Loss (Raw)": 1.9486782550811768, "Pretrain/Step": 12708, "Pretrain/Step Time": 8.447549620643258} +{"Pretrain/Learning Rate": 1.323111327332639e-05, "Pretrain/Loss": 2.018111228942871, "Pretrain/Loss (Raw)": 1.9502651691436768, "Pretrain/Step": 12709, "Pretrain/Step Time": 8.447175500914454} +{"Pretrain/Learning Rate": 1.322736808702249e-05, "Pretrain/Loss": 2.020204544067383, "Pretrain/Loss (Raw)": 2.0785155296325684, "Pretrain/Step": 12710, "Pretrain/Step Time": 8.450270794332027} +{"Pretrain/Learning Rate": 1.3223623240174127e-05, "Pretrain/Loss": 2.019611358642578, "Pretrain/Loss (Raw)": 1.8223811388015747, "Pretrain/Step": 12711, "Pretrain/Step Time": 8.448326908051968} +{"Pretrain/Learning Rate": 1.3219878732889291e-05, "Pretrain/Loss": 2.0200912952423096, "Pretrain/Loss (Raw)": 1.9827862977981567, "Pretrain/Step": 12712, "Pretrain/Step Time": 8.453479869291186} +{"Pretrain/Learning Rate": 1.321613456527594e-05, "Pretrain/Loss": 2.019310235977173, "Pretrain/Loss (Raw)": 1.9483392238616943, "Pretrain/Step": 12713, "Pretrain/Step Time": 8.456837099045515} +{"Pretrain/Learning Rate": 1.3212390737442051e-05, "Pretrain/Loss": 2.0185844898223877, "Pretrain/Loss (Raw)": 2.022312641143799, "Pretrain/Step": 12714, "Pretrain/Step Time": 8.45762132294476} +{"Pretrain/Learning Rate": 1.3208647249495565e-05, "Pretrain/Loss": 2.016946792602539, "Pretrain/Loss (Raw)": 2.1515893936157227, "Pretrain/Step": 12715, "Pretrain/Step Time": 8.453535348176956} +{"Pretrain/Learning Rate": 1.3204904101544413e-05, "Pretrain/Loss": 2.017993450164795, "Pretrain/Loss (Raw)": 2.047419786453247, "Pretrain/Step": 12716, "Pretrain/Step Time": 8.451834090054035} +{"Pretrain/Learning Rate": 1.3201161293696548e-05, "Pretrain/Loss": 2.0202744007110596, "Pretrain/Loss (Raw)": 2.133545160293579, "Pretrain/Step": 12717, "Pretrain/Step Time": 8.453384321182966} +{"Pretrain/Learning Rate": 1.3197418826059869e-05, "Pretrain/Loss": 2.019779682159424, "Pretrain/Loss (Raw)": 1.8478341102600098, "Pretrain/Step": 12718, "Pretrain/Step Time": 8.444697292521596} +{"Pretrain/Learning Rate": 1.3193676698742308e-05, "Pretrain/Loss": 2.0175905227661133, "Pretrain/Loss (Raw)": 1.8229038715362549, "Pretrain/Step": 12719, "Pretrain/Step Time": 8.446824302896857} +{"Pretrain/Learning Rate": 1.3189934911851746e-05, "Pretrain/Loss": 2.017925262451172, "Pretrain/Loss (Raw)": 2.1260905265808105, "Pretrain/Step": 12720, "Pretrain/Step Time": 8.443747380748391} +{"Pretrain/Learning Rate": 1.3186193465496094e-05, "Pretrain/Loss": 2.016599655151367, "Pretrain/Loss (Raw)": 1.9168306589126587, "Pretrain/Step": 12721, "Pretrain/Step Time": 8.444380559027195} +{"Pretrain/Learning Rate": 1.3182452359783226e-05, "Pretrain/Loss": 2.016936779022217, "Pretrain/Loss (Raw)": 1.9703965187072754, "Pretrain/Step": 12722, "Pretrain/Step Time": 8.444213612005115} +{"Pretrain/Learning Rate": 1.3178711594821003e-05, "Pretrain/Loss": 2.0132133960723877, "Pretrain/Loss (Raw)": 1.6475908756256104, "Pretrain/Step": 12723, "Pretrain/Step Time": 8.44607587531209} +{"Pretrain/Learning Rate": 1.3174971170717318e-05, "Pretrain/Loss": 2.0150136947631836, "Pretrain/Loss (Raw)": 1.9691989421844482, "Pretrain/Step": 12724, "Pretrain/Step Time": 8.447156360372901} +{"Pretrain/Learning Rate": 1.3171231087579983e-05, "Pretrain/Loss": 2.0135645866394043, "Pretrain/Loss (Raw)": 1.9260175228118896, "Pretrain/Step": 12725, "Pretrain/Step Time": 8.448242831975222} +{"Pretrain/Learning Rate": 1.3167491345516871e-05, "Pretrain/Loss": 2.0134215354919434, "Pretrain/Loss (Raw)": 2.0483970642089844, "Pretrain/Step": 12726, "Pretrain/Step Time": 8.449491038918495} +{"Pretrain/Learning Rate": 1.3163751944635797e-05, "Pretrain/Loss": 2.013542652130127, "Pretrain/Loss (Raw)": 1.9809788465499878, "Pretrain/Step": 12727, "Pretrain/Step Time": 8.448765641078353} +{"Pretrain/Learning Rate": 1.3160012885044598e-05, "Pretrain/Loss": 2.0139143466949463, "Pretrain/Loss (Raw)": 2.0769131183624268, "Pretrain/Step": 12728, "Pretrain/Step Time": 8.451349092647433} +{"Pretrain/Learning Rate": 1.3156274166851085e-05, "Pretrain/Loss": 2.011125326156616, "Pretrain/Loss (Raw)": 2.089035749435425, "Pretrain/Step": 12729, "Pretrain/Step Time": 8.454672744497657} +{"Pretrain/Learning Rate": 1.3152535790163042e-05, "Pretrain/Loss": 2.0113370418548584, "Pretrain/Loss (Raw)": 2.1013219356536865, "Pretrain/Step": 12730, "Pretrain/Step Time": 8.455753548070788} +{"Pretrain/Learning Rate": 1.314879775508829e-05, "Pretrain/Loss": 2.012392044067383, "Pretrain/Loss (Raw)": 2.041985273361206, "Pretrain/Step": 12731, "Pretrain/Step Time": 8.455654669553041} +{"Pretrain/Learning Rate": 1.3145060061734593e-05, "Pretrain/Loss": 2.0119802951812744, "Pretrain/Loss (Raw)": 1.9268800020217896, "Pretrain/Step": 12732, "Pretrain/Step Time": 8.45371574908495} +{"Pretrain/Learning Rate": 1.3141322710209736e-05, "Pretrain/Loss": 2.015913963317871, "Pretrain/Loss (Raw)": 2.4094653129577637, "Pretrain/Step": 12733, "Pretrain/Step Time": 8.45479467511177} +{"Pretrain/Learning Rate": 1.3137585700621485e-05, "Pretrain/Loss": 2.0144524574279785, "Pretrain/Loss (Raw)": 1.9089373350143433, "Pretrain/Step": 12734, "Pretrain/Step Time": 8.449888234958053} +{"Pretrain/Learning Rate": 1.3133849033077572e-05, "Pretrain/Loss": 2.011475086212158, "Pretrain/Loss (Raw)": 2.032339572906494, "Pretrain/Step": 12735, "Pretrain/Step Time": 8.455608678981662} +{"Pretrain/Learning Rate": 1.3130112707685771e-05, "Pretrain/Loss": 2.011444568634033, "Pretrain/Loss (Raw)": 2.1790997982025146, "Pretrain/Step": 12736, "Pretrain/Step Time": 8.452425980940461} +{"Pretrain/Learning Rate": 1.312637672455379e-05, "Pretrain/Loss": 2.011019706726074, "Pretrain/Loss (Raw)": 1.833212971687317, "Pretrain/Step": 12737, "Pretrain/Step Time": 8.457445196807384} +{"Pretrain/Learning Rate": 1.3122641083789378e-05, "Pretrain/Loss": 2.0144495964050293, "Pretrain/Loss (Raw)": 2.208139657974243, "Pretrain/Step": 12738, "Pretrain/Step Time": 8.457758003845811} +{"Pretrain/Learning Rate": 1.3118905785500238e-05, "Pretrain/Loss": 2.015887498855591, "Pretrain/Loss (Raw)": 2.2028660774230957, "Pretrain/Step": 12739, "Pretrain/Step Time": 8.45974506624043} +{"Pretrain/Learning Rate": 1.3115170829794062e-05, "Pretrain/Loss": 2.017549753189087, "Pretrain/Loss (Raw)": 2.0660669803619385, "Pretrain/Step": 12740, "Pretrain/Step Time": 8.461662735790014} +{"Pretrain/Learning Rate": 1.3111436216778567e-05, "Pretrain/Loss": 2.0173897743225098, "Pretrain/Loss (Raw)": 2.1704633235931396, "Pretrain/Step": 12741, "Pretrain/Step Time": 8.462657960131764} +{"Pretrain/Learning Rate": 1.3107701946561418e-05, "Pretrain/Loss": 2.016584873199463, "Pretrain/Loss (Raw)": 1.943516731262207, "Pretrain/Step": 12742, "Pretrain/Step Time": 8.465641835704446} +{"Pretrain/Learning Rate": 1.3103968019250312e-05, "Pretrain/Loss": 2.016638994216919, "Pretrain/Loss (Raw)": 2.0364623069763184, "Pretrain/Step": 12743, "Pretrain/Step Time": 8.464112071320415} +{"Pretrain/Learning Rate": 1.3100234434952899e-05, "Pretrain/Loss": 2.019650936126709, "Pretrain/Loss (Raw)": 2.1360671520233154, "Pretrain/Step": 12744, "Pretrain/Step Time": 8.459624929353595} +{"Pretrain/Learning Rate": 1.3096501193776829e-05, "Pretrain/Loss": 2.0183920860290527, "Pretrain/Loss (Raw)": 1.9692893028259277, "Pretrain/Step": 12745, "Pretrain/Step Time": 8.468724513426423} +{"Pretrain/Learning Rate": 1.3092768295829765e-05, "Pretrain/Loss": 2.0169196128845215, "Pretrain/Loss (Raw)": 1.8340338468551636, "Pretrain/Step": 12746, "Pretrain/Step Time": 8.47176799736917} +{"Pretrain/Learning Rate": 1.3089035741219325e-05, "Pretrain/Loss": 2.016336441040039, "Pretrain/Loss (Raw)": 2.0248124599456787, "Pretrain/Step": 12747, "Pretrain/Step Time": 8.47071878425777} +{"Pretrain/Learning Rate": 1.308530353005315e-05, "Pretrain/Loss": 2.016831874847412, "Pretrain/Loss (Raw)": 1.913393259048462, "Pretrain/Step": 12748, "Pretrain/Step Time": 8.467329503968358} +{"Pretrain/Learning Rate": 1.3081571662438846e-05, "Pretrain/Loss": 2.018467426300049, "Pretrain/Loss (Raw)": 2.090820074081421, "Pretrain/Step": 12749, "Pretrain/Step Time": 8.465818658471107} +{"Pretrain/Learning Rate": 1.3077840138484015e-05, "Pretrain/Loss": 2.020223379135132, "Pretrain/Loss (Raw)": 2.0893731117248535, "Pretrain/Step": 12750, "Pretrain/Step Time": 8.465300677344203} +{"Pretrain/Learning Rate": 1.3074108958296272e-05, "Pretrain/Loss": 2.022474765777588, "Pretrain/Loss (Raw)": 2.456535816192627, "Pretrain/Step": 12751, "Pretrain/Step Time": 8.467077378183603} +{"Pretrain/Learning Rate": 1.3070378121983174e-05, "Pretrain/Loss": 2.0252280235290527, "Pretrain/Loss (Raw)": 2.214132070541382, "Pretrain/Step": 12752, "Pretrain/Step Time": 8.466818140819669} +{"Pretrain/Learning Rate": 1.3066647629652326e-05, "Pretrain/Loss": 2.024369239807129, "Pretrain/Loss (Raw)": 1.9365378618240356, "Pretrain/Step": 12753, "Pretrain/Step Time": 8.467076249420643} +{"Pretrain/Learning Rate": 1.306291748141128e-05, "Pretrain/Loss": 2.02060866355896, "Pretrain/Loss (Raw)": 2.0502824783325195, "Pretrain/Step": 12754, "Pretrain/Step Time": 8.466417636722326} +{"Pretrain/Learning Rate": 1.3059187677367586e-05, "Pretrain/Loss": 2.0230722427368164, "Pretrain/Loss (Raw)": 2.3262956142425537, "Pretrain/Step": 12755, "Pretrain/Step Time": 8.464224530383945} +{"Pretrain/Learning Rate": 1.3055458217628804e-05, "Pretrain/Loss": 2.0231881141662598, "Pretrain/Loss (Raw)": 1.9734461307525635, "Pretrain/Step": 12756, "Pretrain/Step Time": 8.464340910315514} +{"Pretrain/Learning Rate": 1.3051729102302457e-05, "Pretrain/Loss": 2.023988723754883, "Pretrain/Loss (Raw)": 2.0193867683410645, "Pretrain/Step": 12757, "Pretrain/Step Time": 8.46137836202979} +{"Pretrain/Learning Rate": 1.3048000331496086e-05, "Pretrain/Loss": 2.02401065826416, "Pretrain/Loss (Raw)": 2.102771520614624, "Pretrain/Step": 12758, "Pretrain/Step Time": 8.468325890600681} +{"Pretrain/Learning Rate": 1.3044271905317202e-05, "Pretrain/Loss": 2.0232512950897217, "Pretrain/Loss (Raw)": 2.04992413520813, "Pretrain/Step": 12759, "Pretrain/Step Time": 8.463467847555876} +{"Pretrain/Learning Rate": 1.3040543823873297e-05, "Pretrain/Loss": 2.0232083797454834, "Pretrain/Loss (Raw)": 1.9372040033340454, "Pretrain/Step": 12760, "Pretrain/Step Time": 8.461951527744532} +{"Pretrain/Learning Rate": 1.303681608727189e-05, "Pretrain/Loss": 2.0225465297698975, "Pretrain/Loss (Raw)": 1.964890480041504, "Pretrain/Step": 12761, "Pretrain/Step Time": 8.464109055697918} +{"Pretrain/Learning Rate": 1.3033088695620449e-05, "Pretrain/Loss": 2.0207529067993164, "Pretrain/Loss (Raw)": 1.8133598566055298, "Pretrain/Step": 12762, "Pretrain/Step Time": 8.465698225423694} +{"Pretrain/Learning Rate": 1.3029361649026473e-05, "Pretrain/Loss": 2.022775411605835, "Pretrain/Loss (Raw)": 2.0737881660461426, "Pretrain/Step": 12763, "Pretrain/Step Time": 8.467595856636763} +{"Pretrain/Learning Rate": 1.3025634947597409e-05, "Pretrain/Loss": 2.0268442630767822, "Pretrain/Loss (Raw)": 2.3578925132751465, "Pretrain/Step": 12764, "Pretrain/Step Time": 8.467086547985673} +{"Pretrain/Learning Rate": 1.3021908591440713e-05, "Pretrain/Loss": 2.0260324478149414, "Pretrain/Loss (Raw)": 2.060671329498291, "Pretrain/Step": 12765, "Pretrain/Step Time": 8.464995319023728} +{"Pretrain/Learning Rate": 1.3018182580663846e-05, "Pretrain/Loss": 2.0256547927856445, "Pretrain/Loss (Raw)": 1.950942039489746, "Pretrain/Step": 12766, "Pretrain/Step Time": 8.467404460534453} +{"Pretrain/Learning Rate": 1.3014456915374229e-05, "Pretrain/Loss": 2.025331974029541, "Pretrain/Loss (Raw)": 1.9874106645584106, "Pretrain/Step": 12767, "Pretrain/Step Time": 8.46397008933127} +{"Pretrain/Learning Rate": 1.301073159567931e-05, "Pretrain/Loss": 2.024660587310791, "Pretrain/Loss (Raw)": 1.9419052600860596, "Pretrain/Step": 12768, "Pretrain/Step Time": 8.465997548773885} +{"Pretrain/Learning Rate": 1.300700662168649e-05, "Pretrain/Loss": 2.024925708770752, "Pretrain/Loss (Raw)": 1.9740482568740845, "Pretrain/Step": 12769, "Pretrain/Step Time": 8.464299287647009} +{"Pretrain/Learning Rate": 1.3003281993503175e-05, "Pretrain/Loss": 2.0240206718444824, "Pretrain/Loss (Raw)": 1.9022247791290283, "Pretrain/Step": 12770, "Pretrain/Step Time": 8.467649478465319} +{"Pretrain/Learning Rate": 1.299955771123677e-05, "Pretrain/Loss": 2.0249216556549072, "Pretrain/Loss (Raw)": 2.0936596393585205, "Pretrain/Step": 12771, "Pretrain/Step Time": 8.461516348645091} +{"Pretrain/Learning Rate": 1.2995833774994654e-05, "Pretrain/Loss": 2.027942657470703, "Pretrain/Loss (Raw)": 2.1961827278137207, "Pretrain/Step": 12772, "Pretrain/Step Time": 8.459089782088995} +{"Pretrain/Learning Rate": 1.2992110184884215e-05, "Pretrain/Loss": 2.0264391899108887, "Pretrain/Loss (Raw)": 1.9547075033187866, "Pretrain/Step": 12773, "Pretrain/Step Time": 8.45659257285297} +{"Pretrain/Learning Rate": 1.2988386941012814e-05, "Pretrain/Loss": 2.0279760360717773, "Pretrain/Loss (Raw)": 2.116607427597046, "Pretrain/Step": 12774, "Pretrain/Step Time": 8.46132036857307} +{"Pretrain/Learning Rate": 1.2984664043487799e-05, "Pretrain/Loss": 2.0294065475463867, "Pretrain/Loss (Raw)": 2.11539626121521, "Pretrain/Step": 12775, "Pretrain/Step Time": 8.466948632150888} +{"Pretrain/Learning Rate": 1.2980941492416538e-05, "Pretrain/Loss": 2.029327630996704, "Pretrain/Loss (Raw)": 2.185643196105957, "Pretrain/Step": 12776, "Pretrain/Step Time": 8.463743302971125} +{"Pretrain/Learning Rate": 1.2977219287906345e-05, "Pretrain/Loss": 2.028353214263916, "Pretrain/Loss (Raw)": 1.9516593217849731, "Pretrain/Step": 12777, "Pretrain/Step Time": 8.466256788000464} +{"Pretrain/Learning Rate": 1.2973497430064566e-05, "Pretrain/Loss": 2.0299084186553955, "Pretrain/Loss (Raw)": 2.1171882152557373, "Pretrain/Step": 12778, "Pretrain/Step Time": 8.467229299247265} +{"Pretrain/Learning Rate": 1.2969775918998512e-05, "Pretrain/Loss": 2.0315823554992676, "Pretrain/Loss (Raw)": 1.9218287467956543, "Pretrain/Step": 12779, "Pretrain/Step Time": 8.470406237989664} +{"Pretrain/Learning Rate": 1.2966054754815476e-05, "Pretrain/Loss": 2.03257417678833, "Pretrain/Loss (Raw)": 2.0196146965026855, "Pretrain/Step": 12780, "Pretrain/Step Time": 8.464869236573577} +{"Pretrain/Learning Rate": 1.2962333937622784e-05, "Pretrain/Loss": 2.0296409130096436, "Pretrain/Loss (Raw)": 1.951940655708313, "Pretrain/Step": 12781, "Pretrain/Step Time": 8.467884151265025} +{"Pretrain/Learning Rate": 1.2958613467527691e-05, "Pretrain/Loss": 2.028571605682373, "Pretrain/Loss (Raw)": 2.0006372928619385, "Pretrain/Step": 12782, "Pretrain/Step Time": 8.45667009986937} +{"Pretrain/Learning Rate": 1.2954893344637504e-05, "Pretrain/Loss": 2.0280447006225586, "Pretrain/Loss (Raw)": 1.9828046560287476, "Pretrain/Step": 12783, "Pretrain/Step Time": 8.461088165640831} +{"Pretrain/Learning Rate": 1.2951173569059472e-05, "Pretrain/Loss": 2.028374671936035, "Pretrain/Loss (Raw)": 2.1119346618652344, "Pretrain/Step": 12784, "Pretrain/Step Time": 8.460594106465578} +{"Pretrain/Learning Rate": 1.294745414090085e-05, "Pretrain/Loss": 2.026426315307617, "Pretrain/Loss (Raw)": 1.9955228567123413, "Pretrain/Step": 12785, "Pretrain/Step Time": 8.46211458556354} +{"Pretrain/Learning Rate": 1.2943735060268902e-05, "Pretrain/Loss": 2.025616407394409, "Pretrain/Loss (Raw)": 1.9723141193389893, "Pretrain/Step": 12786, "Pretrain/Step Time": 8.45779181830585} +{"Pretrain/Learning Rate": 1.2940016327270842e-05, "Pretrain/Loss": 2.025529384613037, "Pretrain/Loss (Raw)": 1.9856353998184204, "Pretrain/Step": 12787, "Pretrain/Step Time": 8.458854852244258} +{"Pretrain/Learning Rate": 1.293629794201392e-05, "Pretrain/Loss": 2.02850604057312, "Pretrain/Loss (Raw)": 2.05303692817688, "Pretrain/Step": 12788, "Pretrain/Step Time": 8.460181418806314} +{"Pretrain/Learning Rate": 1.2932579904605333e-05, "Pretrain/Loss": 2.029301166534424, "Pretrain/Loss (Raw)": 1.9967018365859985, "Pretrain/Step": 12789, "Pretrain/Step Time": 8.458943778648973} +{"Pretrain/Learning Rate": 1.2928862215152305e-05, "Pretrain/Loss": 2.0295982360839844, "Pretrain/Loss (Raw)": 2.098945140838623, "Pretrain/Step": 12790, "Pretrain/Step Time": 8.461769565939903} +{"Pretrain/Learning Rate": 1.2925144873762029e-05, "Pretrain/Loss": 2.0292725563049316, "Pretrain/Loss (Raw)": 2.0415594577789307, "Pretrain/Step": 12791, "Pretrain/Step Time": 8.465521467849612} +{"Pretrain/Learning Rate": 1.2921427880541676e-05, "Pretrain/Loss": 2.0298473834991455, "Pretrain/Loss (Raw)": 1.9838569164276123, "Pretrain/Step": 12792, "Pretrain/Step Time": 8.467052267864347} +{"Pretrain/Learning Rate": 1.2917711235598445e-05, "Pretrain/Loss": 2.031538963317871, "Pretrain/Loss (Raw)": 2.1979010105133057, "Pretrain/Step": 12793, "Pretrain/Step Time": 8.469575172290206} +{"Pretrain/Learning Rate": 1.2913994939039486e-05, "Pretrain/Loss": 2.030778408050537, "Pretrain/Loss (Raw)": 1.9645495414733887, "Pretrain/Step": 12794, "Pretrain/Step Time": 8.472414709627628} +{"Pretrain/Learning Rate": 1.2910278990971969e-05, "Pretrain/Loss": 2.030579090118408, "Pretrain/Loss (Raw)": 2.079545021057129, "Pretrain/Step": 12795, "Pretrain/Step Time": 8.471655260771513} +{"Pretrain/Learning Rate": 1.2906563391503038e-05, "Pretrain/Loss": 2.0278239250183105, "Pretrain/Loss (Raw)": 1.7062034606933594, "Pretrain/Step": 12796, "Pretrain/Step Time": 8.46967851370573} +{"Pretrain/Learning Rate": 1.2902848140739816e-05, "Pretrain/Loss": 2.0282442569732666, "Pretrain/Loss (Raw)": 1.9043577909469604, "Pretrain/Step": 12797, "Pretrain/Step Time": 8.470893183723092} +{"Pretrain/Learning Rate": 1.2899133238789445e-05, "Pretrain/Loss": 2.0250258445739746, "Pretrain/Loss (Raw)": 1.7666051387786865, "Pretrain/Step": 12798, "Pretrain/Step Time": 8.468020552769303} +{"Pretrain/Learning Rate": 1.2895418685759034e-05, "Pretrain/Loss": 2.023819923400879, "Pretrain/Loss (Raw)": 2.0573089122772217, "Pretrain/Step": 12799, "Pretrain/Step Time": 8.470660930499434} +{"Pretrain/Learning Rate": 1.2891704481755698e-05, "Pretrain/Loss": 2.026909828186035, "Pretrain/Loss (Raw)": 2.0832579135894775, "Pretrain/Step": 12800, "Pretrain/Step Time": 8.47319782152772} +{"Pretrain/Learning Rate": 1.2887990626886526e-05, "Pretrain/Loss": 2.026885509490967, "Pretrain/Loss (Raw)": 2.0376880168914795, "Pretrain/Step": 12801, "Pretrain/Step Time": 8.47045812010765} +{"Pretrain/Learning Rate": 1.2884277121258597e-05, "Pretrain/Loss": 2.027777671813965, "Pretrain/Loss (Raw)": 2.1208608150482178, "Pretrain/Step": 12802, "Pretrain/Step Time": 8.472883351147175} +{"Pretrain/Learning Rate": 1.288056396497901e-05, "Pretrain/Loss": 2.02813982963562, "Pretrain/Loss (Raw)": 2.123990297317505, "Pretrain/Step": 12803, "Pretrain/Step Time": 8.473676750436425} +{"Pretrain/Learning Rate": 1.2876851158154803e-05, "Pretrain/Loss": 2.0287694931030273, "Pretrain/Loss (Raw)": 2.033325672149658, "Pretrain/Step": 12804, "Pretrain/Step Time": 8.477751228958368} +{"Pretrain/Learning Rate": 1.2873138700893058e-05, "Pretrain/Loss": 2.0288772583007812, "Pretrain/Loss (Raw)": 1.939126968383789, "Pretrain/Step": 12805, "Pretrain/Step Time": 8.47902898862958} +{"Pretrain/Learning Rate": 1.286942659330081e-05, "Pretrain/Loss": 2.027574062347412, "Pretrain/Loss (Raw)": 2.0027801990509033, "Pretrain/Step": 12806, "Pretrain/Step Time": 8.477755246683955} +{"Pretrain/Learning Rate": 1.2865714835485086e-05, "Pretrain/Loss": 2.0267438888549805, "Pretrain/Loss (Raw)": 1.8919439315795898, "Pretrain/Step": 12807, "Pretrain/Step Time": 8.47731702029705} +{"Pretrain/Learning Rate": 1.2862003427552938e-05, "Pretrain/Loss": 2.024547576904297, "Pretrain/Loss (Raw)": 2.086024284362793, "Pretrain/Step": 12808, "Pretrain/Step Time": 8.481219410896301} +{"Pretrain/Learning Rate": 1.2858292369611344e-05, "Pretrain/Loss": 2.0250887870788574, "Pretrain/Loss (Raw)": 2.01031756401062, "Pretrain/Step": 12809, "Pretrain/Step Time": 8.485460173338652} +{"Pretrain/Learning Rate": 1.285458166176734e-05, "Pretrain/Loss": 2.0256690979003906, "Pretrain/Loss (Raw)": 2.074582576751709, "Pretrain/Step": 12810, "Pretrain/Step Time": 8.488156026229262} +{"Pretrain/Learning Rate": 1.2850871304127905e-05, "Pretrain/Loss": 2.025636672973633, "Pretrain/Loss (Raw)": 1.9099278450012207, "Pretrain/Step": 12811, "Pretrain/Step Time": 8.489540806040168} +{"Pretrain/Learning Rate": 1.284716129680004e-05, "Pretrain/Loss": 2.023916721343994, "Pretrain/Loss (Raw)": 2.113720655441284, "Pretrain/Step": 12812, "Pretrain/Step Time": 8.490547617897391} +{"Pretrain/Learning Rate": 1.284345163989071e-05, "Pretrain/Loss": 2.0233566761016846, "Pretrain/Loss (Raw)": 2.000901937484741, "Pretrain/Step": 12813, "Pretrain/Step Time": 8.490241969004273} +{"Pretrain/Learning Rate": 1.2839742333506877e-05, "Pretrain/Loss": 2.025195360183716, "Pretrain/Loss (Raw)": 2.0473411083221436, "Pretrain/Step": 12814, "Pretrain/Step Time": 8.48800141364336} +{"Pretrain/Learning Rate": 1.2836033377755508e-05, "Pretrain/Loss": 2.023895502090454, "Pretrain/Loss (Raw)": 1.9763824939727783, "Pretrain/Step": 12815, "Pretrain/Step Time": 8.486442709341645} +{"Pretrain/Learning Rate": 1.2832324772743531e-05, "Pretrain/Loss": 2.0251071453094482, "Pretrain/Loss (Raw)": 2.1142117977142334, "Pretrain/Step": 12816, "Pretrain/Step Time": 8.488812450319529} +{"Pretrain/Learning Rate": 1.2828616518577902e-05, "Pretrain/Loss": 2.026431083679199, "Pretrain/Loss (Raw)": 2.1060640811920166, "Pretrain/Step": 12817, "Pretrain/Step Time": 8.484916292130947} +{"Pretrain/Learning Rate": 1.2824908615365533e-05, "Pretrain/Loss": 2.0308480262756348, "Pretrain/Loss (Raw)": 2.4991824626922607, "Pretrain/Step": 12818, "Pretrain/Step Time": 8.48723217844963} +{"Pretrain/Learning Rate": 1.2821201063213333e-05, "Pretrain/Loss": 2.0313711166381836, "Pretrain/Loss (Raw)": 1.98076331615448, "Pretrain/Step": 12819, "Pretrain/Step Time": 8.48982759192586} +{"Pretrain/Learning Rate": 1.2817493862228227e-05, "Pretrain/Loss": 2.031959295272827, "Pretrain/Loss (Raw)": 2.123699426651001, "Pretrain/Step": 12820, "Pretrain/Step Time": 8.481074238196015} +{"Pretrain/Learning Rate": 1.2813787012517087e-05, "Pretrain/Loss": 2.029569149017334, "Pretrain/Loss (Raw)": 1.9556963443756104, "Pretrain/Step": 12821, "Pretrain/Step Time": 8.487232316285372} +{"Pretrain/Learning Rate": 1.2810080514186817e-05, "Pretrain/Loss": 2.031482219696045, "Pretrain/Loss (Raw)": 2.121152400970459, "Pretrain/Step": 12822, "Pretrain/Step Time": 8.488273093476892} +{"Pretrain/Learning Rate": 1.2806374367344281e-05, "Pretrain/Loss": 2.0309367179870605, "Pretrain/Loss (Raw)": 1.8462622165679932, "Pretrain/Step": 12823, "Pretrain/Step Time": 8.492968875914812} +{"Pretrain/Learning Rate": 1.2802668572096335e-05, "Pretrain/Loss": 2.029935836791992, "Pretrain/Loss (Raw)": 1.954607605934143, "Pretrain/Step": 12824, "Pretrain/Step Time": 8.493207011371851} +{"Pretrain/Learning Rate": 1.2798963128549851e-05, "Pretrain/Loss": 2.0311293601989746, "Pretrain/Loss (Raw)": 2.2544548511505127, "Pretrain/Step": 12825, "Pretrain/Step Time": 8.489972088485956} +{"Pretrain/Learning Rate": 1.2795258036811658e-05, "Pretrain/Loss": 2.030298948287964, "Pretrain/Loss (Raw)": 2.05082106590271, "Pretrain/Step": 12826, "Pretrain/Step Time": 8.498760329559445} +{"Pretrain/Learning Rate": 1.27915532969886e-05, "Pretrain/Loss": 2.02933406829834, "Pretrain/Loss (Raw)": 2.09684157371521, "Pretrain/Step": 12827, "Pretrain/Step Time": 8.498688535764813} +{"Pretrain/Learning Rate": 1.27878489091875e-05, "Pretrain/Loss": 2.029484748840332, "Pretrain/Loss (Raw)": 2.0841879844665527, "Pretrain/Step": 12828, "Pretrain/Step Time": 8.498282227665186} +{"Pretrain/Learning Rate": 1.2784144873515158e-05, "Pretrain/Loss": 2.0285496711730957, "Pretrain/Loss (Raw)": 1.815302848815918, "Pretrain/Step": 12829, "Pretrain/Step Time": 8.500550566241145} +{"Pretrain/Learning Rate": 1.2780441190078396e-05, "Pretrain/Loss": 2.0296411514282227, "Pretrain/Loss (Raw)": 1.9744845628738403, "Pretrain/Step": 12830, "Pretrain/Step Time": 8.500489171594381} +{"Pretrain/Learning Rate": 1.277673785898399e-05, "Pretrain/Loss": 2.0300393104553223, "Pretrain/Loss (Raw)": 2.0215420722961426, "Pretrain/Step": 12831, "Pretrain/Step Time": 8.495138155296445} +{"Pretrain/Learning Rate": 1.2773034880338736e-05, "Pretrain/Loss": 2.0275659561157227, "Pretrain/Loss (Raw)": 1.6528537273406982, "Pretrain/Step": 12832, "Pretrain/Step Time": 8.492307113483548} +{"Pretrain/Learning Rate": 1.2769332254249405e-05, "Pretrain/Loss": 2.025656223297119, "Pretrain/Loss (Raw)": 1.8763176202774048, "Pretrain/Step": 12833, "Pretrain/Step Time": 8.492291789501905} +{"Pretrain/Learning Rate": 1.2765629980822746e-05, "Pretrain/Loss": 2.0240707397460938, "Pretrain/Loss (Raw)": 1.804237961769104, "Pretrain/Step": 12834, "Pretrain/Step Time": 8.492473488673568} +{"Pretrain/Learning Rate": 1.2761928060165535e-05, "Pretrain/Loss": 2.023440361022949, "Pretrain/Loss (Raw)": 1.9714468717575073, "Pretrain/Step": 12835, "Pretrain/Step Time": 8.495910752564669} +{"Pretrain/Learning Rate": 1.2758226492384486e-05, "Pretrain/Loss": 2.0254483222961426, "Pretrain/Loss (Raw)": 2.205695867538452, "Pretrain/Step": 12836, "Pretrain/Step Time": 8.492992574349046} +{"Pretrain/Learning Rate": 1.2754525277586359e-05, "Pretrain/Loss": 2.026731014251709, "Pretrain/Loss (Raw)": 2.1144378185272217, "Pretrain/Step": 12837, "Pretrain/Step Time": 8.494550893083215} +{"Pretrain/Learning Rate": 1.275082441587786e-05, "Pretrain/Loss": 2.0264010429382324, "Pretrain/Loss (Raw)": 2.036294460296631, "Pretrain/Step": 12838, "Pretrain/Step Time": 8.49466609209776} +{"Pretrain/Learning Rate": 1.27471239073657e-05, "Pretrain/Loss": 2.026660680770874, "Pretrain/Loss (Raw)": 1.8556230068206787, "Pretrain/Step": 12839, "Pretrain/Step Time": 8.493818033486605} +{"Pretrain/Learning Rate": 1.2743423752156589e-05, "Pretrain/Loss": 2.027299165725708, "Pretrain/Loss (Raw)": 2.064493179321289, "Pretrain/Step": 12840, "Pretrain/Step Time": 8.48727940581739} +{"Pretrain/Learning Rate": 1.2739723950357208e-05, "Pretrain/Loss": 2.0277931690216064, "Pretrain/Loss (Raw)": 2.011565923690796, "Pretrain/Step": 12841, "Pretrain/Step Time": 8.489466464146972} +{"Pretrain/Learning Rate": 1.2736024502074252e-05, "Pretrain/Loss": 2.0262184143066406, "Pretrain/Loss (Raw)": 1.8207650184631348, "Pretrain/Step": 12842, "Pretrain/Step Time": 8.48885203897953} +{"Pretrain/Learning Rate": 1.273232540741438e-05, "Pretrain/Loss": 2.0260815620422363, "Pretrain/Loss (Raw)": 2.134056806564331, "Pretrain/Step": 12843, "Pretrain/Step Time": 8.492782663553953} +{"Pretrain/Learning Rate": 1.272862666648425e-05, "Pretrain/Loss": 2.0263760089874268, "Pretrain/Loss (Raw)": 2.0851142406463623, "Pretrain/Step": 12844, "Pretrain/Step Time": 8.491215486079454} +{"Pretrain/Learning Rate": 1.272492827939053e-05, "Pretrain/Loss": 2.0244970321655273, "Pretrain/Loss (Raw)": 1.893019676208496, "Pretrain/Step": 12845, "Pretrain/Step Time": 8.49213689751923} +{"Pretrain/Learning Rate": 1.272123024623984e-05, "Pretrain/Loss": 2.0232181549072266, "Pretrain/Loss (Raw)": 1.6841470003128052, "Pretrain/Step": 12846, "Pretrain/Step Time": 8.491108011454344} +{"Pretrain/Learning Rate": 1.2717532567138829e-05, "Pretrain/Loss": 2.026355743408203, "Pretrain/Loss (Raw)": 2.2245359420776367, "Pretrain/Step": 12847, "Pretrain/Step Time": 8.487679129466414} +{"Pretrain/Learning Rate": 1.2713835242194105e-05, "Pretrain/Loss": 2.0257277488708496, "Pretrain/Loss (Raw)": 2.045720100402832, "Pretrain/Step": 12848, "Pretrain/Step Time": 8.49076921865344} +{"Pretrain/Learning Rate": 1.2710138271512275e-05, "Pretrain/Loss": 2.0271172523498535, "Pretrain/Loss (Raw)": 2.0946617126464844, "Pretrain/Step": 12849, "Pretrain/Step Time": 8.488458413630724} +{"Pretrain/Learning Rate": 1.2706441655199952e-05, "Pretrain/Loss": 2.0279860496520996, "Pretrain/Loss (Raw)": 2.081610918045044, "Pretrain/Step": 12850, "Pretrain/Step Time": 8.485853917896748} +{"Pretrain/Learning Rate": 1.2702745393363711e-05, "Pretrain/Loss": 2.0307366847991943, "Pretrain/Loss (Raw)": 1.9996776580810547, "Pretrain/Step": 12851, "Pretrain/Step Time": 8.479995984584093} +{"Pretrain/Learning Rate": 1.2699049486110142e-05, "Pretrain/Loss": 2.0314137935638428, "Pretrain/Loss (Raw)": 2.055845022201538, "Pretrain/Step": 12852, "Pretrain/Step Time": 8.482886517420411} +{"Pretrain/Learning Rate": 1.2695353933545806e-05, "Pretrain/Loss": 2.0316567420959473, "Pretrain/Loss (Raw)": 1.9571256637573242, "Pretrain/Step": 12853, "Pretrain/Step Time": 8.481154877692461} +{"Pretrain/Learning Rate": 1.2691658735777268e-05, "Pretrain/Loss": 2.0317749977111816, "Pretrain/Loss (Raw)": 2.063540458679199, "Pretrain/Step": 12854, "Pretrain/Step Time": 8.482342390343547} +{"Pretrain/Learning Rate": 1.2687963892911079e-05, "Pretrain/Loss": 2.031867742538452, "Pretrain/Loss (Raw)": 1.992843508720398, "Pretrain/Step": 12855, "Pretrain/Step Time": 8.486601062119007} +{"Pretrain/Learning Rate": 1.268426940505376e-05, "Pretrain/Loss": 2.0324463844299316, "Pretrain/Loss (Raw)": 2.1509768962860107, "Pretrain/Step": 12856, "Pretrain/Step Time": 8.481841377913952} +{"Pretrain/Learning Rate": 1.268057527231186e-05, "Pretrain/Loss": 2.0312752723693848, "Pretrain/Loss (Raw)": 1.9391125440597534, "Pretrain/Step": 12857, "Pretrain/Step Time": 8.486292177811265} +{"Pretrain/Learning Rate": 1.2676881494791876e-05, "Pretrain/Loss": 2.0284085273742676, "Pretrain/Loss (Raw)": 1.7344059944152832, "Pretrain/Step": 12858, "Pretrain/Step Time": 8.486409137025476} +{"Pretrain/Learning Rate": 1.2673188072600339e-05, "Pretrain/Loss": 2.0262985229492188, "Pretrain/Loss (Raw)": 1.7719060182571411, "Pretrain/Step": 12859, "Pretrain/Step Time": 8.485111776739359} +{"Pretrain/Learning Rate": 1.2669495005843734e-05, "Pretrain/Loss": 2.0279788970947266, "Pretrain/Loss (Raw)": 2.1419517993927, "Pretrain/Step": 12860, "Pretrain/Step Time": 8.483518769964576} +{"Pretrain/Learning Rate": 1.2665802294628537e-05, "Pretrain/Loss": 2.0241384506225586, "Pretrain/Loss (Raw)": 1.9178959131240845, "Pretrain/Step": 12861, "Pretrain/Step Time": 8.48483769223094} +{"Pretrain/Learning Rate": 1.2662109939061247e-05, "Pretrain/Loss": 2.0240325927734375, "Pretrain/Loss (Raw)": 1.895377516746521, "Pretrain/Step": 12862, "Pretrain/Step Time": 8.488845618441701} +{"Pretrain/Learning Rate": 1.265841793924831e-05, "Pretrain/Loss": 2.0232133865356445, "Pretrain/Loss (Raw)": 1.927505612373352, "Pretrain/Step": 12863, "Pretrain/Step Time": 8.483636995777488} +{"Pretrain/Learning Rate": 1.26547262952962e-05, "Pretrain/Loss": 2.0228171348571777, "Pretrain/Loss (Raw)": 2.1283645629882812, "Pretrain/Step": 12864, "Pretrain/Step Time": 8.484350685030222} +{"Pretrain/Learning Rate": 1.2651035007311355e-05, "Pretrain/Loss": 2.0232365131378174, "Pretrain/Loss (Raw)": 1.8868846893310547, "Pretrain/Step": 12865, "Pretrain/Step Time": 8.480740020051599} +{"Pretrain/Learning Rate": 1.26473440754002e-05, "Pretrain/Loss": 2.0232760906219482, "Pretrain/Loss (Raw)": 2.2132091522216797, "Pretrain/Step": 12866, "Pretrain/Step Time": 8.481234829872847} +{"Pretrain/Learning Rate": 1.2643653499669178e-05, "Pretrain/Loss": 2.022005081176758, "Pretrain/Loss (Raw)": 2.040193557739258, "Pretrain/Step": 12867, "Pretrain/Step Time": 8.481506492942572} +{"Pretrain/Learning Rate": 1.2639963280224692e-05, "Pretrain/Loss": 2.022881507873535, "Pretrain/Loss (Raw)": 2.1782290935516357, "Pretrain/Step": 12868, "Pretrain/Step Time": 8.48063570074737} +{"Pretrain/Learning Rate": 1.2636273417173155e-05, "Pretrain/Loss": 2.0207552909851074, "Pretrain/Loss (Raw)": 1.898302435874939, "Pretrain/Step": 12869, "Pretrain/Step Time": 8.48709219135344} +{"Pretrain/Learning Rate": 1.2632583910620966e-05, "Pretrain/Loss": 2.019804000854492, "Pretrain/Loss (Raw)": 1.8217822313308716, "Pretrain/Step": 12870, "Pretrain/Step Time": 8.48077368363738} +{"Pretrain/Learning Rate": 1.2628894760674486e-05, "Pretrain/Loss": 2.0190482139587402, "Pretrain/Loss (Raw)": 1.939723014831543, "Pretrain/Step": 12871, "Pretrain/Step Time": 8.48646611906588} +{"Pretrain/Learning Rate": 1.2625205967440115e-05, "Pretrain/Loss": 2.018537998199463, "Pretrain/Loss (Raw)": 2.0707452297210693, "Pretrain/Step": 12872, "Pretrain/Step Time": 8.486099177971482} +{"Pretrain/Learning Rate": 1.2621517531024197e-05, "Pretrain/Loss": 2.0191614627838135, "Pretrain/Loss (Raw)": 2.049069881439209, "Pretrain/Step": 12873, "Pretrain/Step Time": 8.481642438098788} +{"Pretrain/Learning Rate": 1.2617829451533106e-05, "Pretrain/Loss": 2.019376754760742, "Pretrain/Loss (Raw)": 1.8616054058074951, "Pretrain/Step": 12874, "Pretrain/Step Time": 8.48188553005457} +{"Pretrain/Learning Rate": 1.261414172907317e-05, "Pretrain/Loss": 2.0181326866149902, "Pretrain/Loss (Raw)": 1.865578532218933, "Pretrain/Step": 12875, "Pretrain/Step Time": 8.485034672543406} +{"Pretrain/Learning Rate": 1.261045436375072e-05, "Pretrain/Loss": 2.017180919647217, "Pretrain/Loss (Raw)": 1.7915549278259277, "Pretrain/Step": 12876, "Pretrain/Step Time": 8.489295711740851} +{"Pretrain/Learning Rate": 1.2606767355672095e-05, "Pretrain/Loss": 2.015111207962036, "Pretrain/Loss (Raw)": 1.825909972190857, "Pretrain/Step": 12877, "Pretrain/Step Time": 8.488908300176263} +{"Pretrain/Learning Rate": 1.2603080704943582e-05, "Pretrain/Loss": 2.0155417919158936, "Pretrain/Loss (Raw)": 2.144479990005493, "Pretrain/Step": 12878, "Pretrain/Step Time": 8.484856301918626} +{"Pretrain/Learning Rate": 1.2599394411671511e-05, "Pretrain/Loss": 2.0118160247802734, "Pretrain/Loss (Raw)": 1.979659080505371, "Pretrain/Step": 12879, "Pretrain/Step Time": 8.48849119246006} +{"Pretrain/Learning Rate": 1.2595708475962159e-05, "Pretrain/Loss": 2.0099573135375977, "Pretrain/Loss (Raw)": 1.9761906862258911, "Pretrain/Step": 12880, "Pretrain/Step Time": 8.485067065805197} +{"Pretrain/Learning Rate": 1.2592022897921802e-05, "Pretrain/Loss": 2.011692523956299, "Pretrain/Loss (Raw)": 2.158655881881714, "Pretrain/Step": 12881, "Pretrain/Step Time": 8.487158473581076} +{"Pretrain/Learning Rate": 1.2588337677656723e-05, "Pretrain/Loss": 2.0115084648132324, "Pretrain/Loss (Raw)": 2.0267295837402344, "Pretrain/Step": 12882, "Pretrain/Step Time": 8.484824595972896} +{"Pretrain/Learning Rate": 1.2584652815273168e-05, "Pretrain/Loss": 2.0093839168548584, "Pretrain/Loss (Raw)": 2.054344654083252, "Pretrain/Step": 12883, "Pretrain/Step Time": 8.484867861494422} +{"Pretrain/Learning Rate": 1.2580968310877408e-05, "Pretrain/Loss": 2.0099093914031982, "Pretrain/Loss (Raw)": 2.0407142639160156, "Pretrain/Step": 12884, "Pretrain/Step Time": 8.48770365677774} +{"Pretrain/Learning Rate": 1.2577284164575673e-05, "Pretrain/Loss": 2.0094473361968994, "Pretrain/Loss (Raw)": 1.9602280855178833, "Pretrain/Step": 12885, "Pretrain/Step Time": 8.492845678701997} +{"Pretrain/Learning Rate": 1.2573600376474182e-05, "Pretrain/Loss": 2.008208990097046, "Pretrain/Loss (Raw)": 1.9442689418792725, "Pretrain/Step": 12886, "Pretrain/Step Time": 8.488051382824779} +{"Pretrain/Learning Rate": 1.2569916946679172e-05, "Pretrain/Loss": 2.006481170654297, "Pretrain/Loss (Raw)": 1.828788161277771, "Pretrain/Step": 12887, "Pretrain/Step Time": 8.486952140927315} +{"Pretrain/Learning Rate": 1.2566233875296834e-05, "Pretrain/Loss": 2.007432460784912, "Pretrain/Loss (Raw)": 2.0589599609375, "Pretrain/Step": 12888, "Pretrain/Step Time": 8.48416868969798} +{"Pretrain/Learning Rate": 1.2562551162433389e-05, "Pretrain/Loss": 2.008885622024536, "Pretrain/Loss (Raw)": 2.150883197784424, "Pretrain/Step": 12889, "Pretrain/Step Time": 8.490423301234841} +{"Pretrain/Learning Rate": 1.2558868808195013e-05, "Pretrain/Loss": 2.010286569595337, "Pretrain/Loss (Raw)": 1.9926811456680298, "Pretrain/Step": 12890, "Pretrain/Step Time": 8.491054434329271} +{"Pretrain/Learning Rate": 1.2555186812687872e-05, "Pretrain/Loss": 2.0088398456573486, "Pretrain/Loss (Raw)": 1.8886137008666992, "Pretrain/Step": 12891, "Pretrain/Step Time": 8.492154272273183} +{"Pretrain/Learning Rate": 1.2551505176018168e-05, "Pretrain/Loss": 2.0051770210266113, "Pretrain/Loss (Raw)": 1.8890721797943115, "Pretrain/Step": 12892, "Pretrain/Step Time": 8.493541466072202} +{"Pretrain/Learning Rate": 1.2547823898292017e-05, "Pretrain/Loss": 2.0040621757507324, "Pretrain/Loss (Raw)": 1.9179407358169556, "Pretrain/Step": 12893, "Pretrain/Step Time": 8.497299782931805} +{"Pretrain/Learning Rate": 1.2544142979615595e-05, "Pretrain/Loss": 2.0037074089050293, "Pretrain/Loss (Raw)": 1.905526876449585, "Pretrain/Step": 12894, "Pretrain/Step Time": 8.494193524122238} +{"Pretrain/Learning Rate": 1.254046242009502e-05, "Pretrain/Loss": 2.0039305686950684, "Pretrain/Loss (Raw)": 2.0159971714019775, "Pretrain/Step": 12895, "Pretrain/Step Time": 8.496499514207244} +{"Pretrain/Learning Rate": 1.2536782219836438e-05, "Pretrain/Loss": 2.003807306289673, "Pretrain/Loss (Raw)": 1.9261059761047363, "Pretrain/Step": 12896, "Pretrain/Step Time": 8.494695959612727} +{"Pretrain/Learning Rate": 1.2533102378945955e-05, "Pretrain/Loss": 2.003307342529297, "Pretrain/Loss (Raw)": 1.9100866317749023, "Pretrain/Step": 12897, "Pretrain/Step Time": 8.493327513337135} +{"Pretrain/Learning Rate": 1.2529422897529664e-05, "Pretrain/Loss": 2.0043904781341553, "Pretrain/Loss (Raw)": 2.040844202041626, "Pretrain/Step": 12898, "Pretrain/Step Time": 8.492362417280674} +{"Pretrain/Learning Rate": 1.2525743775693683e-05, "Pretrain/Loss": 2.001811981201172, "Pretrain/Loss (Raw)": 1.7636115550994873, "Pretrain/Step": 12899, "Pretrain/Step Time": 8.498771488666534} +{"Pretrain/Learning Rate": 1.252206501354408e-05, "Pretrain/Loss": 1.9998533725738525, "Pretrain/Loss (Raw)": 1.9454830884933472, "Pretrain/Step": 12900, "Pretrain/Step Time": 8.49684745632112} +{"Pretrain/Learning Rate": 1.2518386611186942e-05, "Pretrain/Loss": 2.000215530395508, "Pretrain/Loss (Raw)": 2.0010311603546143, "Pretrain/Step": 12901, "Pretrain/Step Time": 8.498959705233574} +{"Pretrain/Learning Rate": 1.2514708568728328e-05, "Pretrain/Loss": 1.998049020767212, "Pretrain/Loss (Raw)": 1.839325189590454, "Pretrain/Step": 12902, "Pretrain/Step Time": 8.49386184476316} +{"Pretrain/Learning Rate": 1.2511030886274283e-05, "Pretrain/Loss": 1.996622085571289, "Pretrain/Loss (Raw)": 1.9327400922775269, "Pretrain/Step": 12903, "Pretrain/Step Time": 8.48989157564938} +{"Pretrain/Learning Rate": 1.2507353563930865e-05, "Pretrain/Loss": 1.994478702545166, "Pretrain/Loss (Raw)": 1.9112944602966309, "Pretrain/Step": 12904, "Pretrain/Step Time": 8.491818748414516} +{"Pretrain/Learning Rate": 1.2503676601804093e-05, "Pretrain/Loss": 1.9918673038482666, "Pretrain/Loss (Raw)": 1.617402195930481, "Pretrain/Step": 12905, "Pretrain/Step Time": 8.490400779992342} +{"Pretrain/Learning Rate": 1.2500000000000006e-05, "Pretrain/Loss": 1.9916737079620361, "Pretrain/Loss (Raw)": 2.0924112796783447, "Pretrain/Step": 12906, "Pretrain/Step Time": 8.494721375405788} +{"Pretrain/Learning Rate": 1.2496323758624606e-05, "Pretrain/Loss": 1.992061734199524, "Pretrain/Loss (Raw)": 1.9714915752410889, "Pretrain/Step": 12907, "Pretrain/Step Time": 8.490660229697824} +{"Pretrain/Learning Rate": 1.2492647877783887e-05, "Pretrain/Loss": 1.9922196865081787, "Pretrain/Loss (Raw)": 2.0398476123809814, "Pretrain/Step": 12908, "Pretrain/Step Time": 8.49447980709374} +{"Pretrain/Learning Rate": 1.2488972357583858e-05, "Pretrain/Loss": 1.9929583072662354, "Pretrain/Loss (Raw)": 2.04646635055542, "Pretrain/Step": 12909, "Pretrain/Step Time": 8.493906384333968} +{"Pretrain/Learning Rate": 1.2485297198130484e-05, "Pretrain/Loss": 1.9939398765563965, "Pretrain/Loss (Raw)": 2.12626576423645, "Pretrain/Step": 12910, "Pretrain/Step Time": 8.49736886844039} +{"Pretrain/Learning Rate": 1.2481622399529752e-05, "Pretrain/Loss": 1.9939676523208618, "Pretrain/Loss (Raw)": 1.9863712787628174, "Pretrain/Step": 12911, "Pretrain/Step Time": 8.498103400692344} +{"Pretrain/Learning Rate": 1.2477947961887613e-05, "Pretrain/Loss": 1.9933468103408813, "Pretrain/Loss (Raw)": 2.032467842102051, "Pretrain/Step": 12912, "Pretrain/Step Time": 8.49654228053987} +{"Pretrain/Learning Rate": 1.2474273885310007e-05, "Pretrain/Loss": 1.9929702281951904, "Pretrain/Loss (Raw)": 1.9473326206207275, "Pretrain/Step": 12913, "Pretrain/Step Time": 8.49084728769958} +{"Pretrain/Learning Rate": 1.2470600169902894e-05, "Pretrain/Loss": 1.9936188459396362, "Pretrain/Loss (Raw)": 2.0553340911865234, "Pretrain/Step": 12914, "Pretrain/Step Time": 8.493418421596289} +{"Pretrain/Learning Rate": 1.2466926815772182e-05, "Pretrain/Loss": 1.992699146270752, "Pretrain/Loss (Raw)": 1.8679078817367554, "Pretrain/Step": 12915, "Pretrain/Step Time": 8.492694951593876} +{"Pretrain/Learning Rate": 1.2463253823023806e-05, "Pretrain/Loss": 1.991998314857483, "Pretrain/Loss (Raw)": 1.9633246660232544, "Pretrain/Step": 12916, "Pretrain/Step Time": 8.490677405148745} +{"Pretrain/Learning Rate": 1.2459581191763665e-05, "Pretrain/Loss": 1.9925240278244019, "Pretrain/Loss (Raw)": 2.0640060901641846, "Pretrain/Step": 12917, "Pretrain/Step Time": 8.493535535410047} +{"Pretrain/Learning Rate": 1.2455908922097667e-05, "Pretrain/Loss": 1.9929943084716797, "Pretrain/Loss (Raw)": 2.1591265201568604, "Pretrain/Step": 12918, "Pretrain/Step Time": 8.496520798653364} +{"Pretrain/Learning Rate": 1.245223701413169e-05, "Pretrain/Loss": 1.990161418914795, "Pretrain/Loss (Raw)": 1.678951382637024, "Pretrain/Step": 12919, "Pretrain/Step Time": 8.4947120975703} +{"Pretrain/Learning Rate": 1.2448565467971608e-05, "Pretrain/Loss": 1.9914233684539795, "Pretrain/Loss (Raw)": 2.145395517349243, "Pretrain/Step": 12920, "Pretrain/Step Time": 8.495990647003055} +{"Pretrain/Learning Rate": 1.24448942837233e-05, "Pretrain/Loss": 1.9904322624206543, "Pretrain/Loss (Raw)": 2.0710246562957764, "Pretrain/Step": 12921, "Pretrain/Step Time": 8.497031325474381} +{"Pretrain/Learning Rate": 1.2441223461492601e-05, "Pretrain/Loss": 1.9900047779083252, "Pretrain/Loss (Raw)": 1.9098341464996338, "Pretrain/Step": 12922, "Pretrain/Step Time": 8.496016178280115} +{"Pretrain/Learning Rate": 1.2437553001385386e-05, "Pretrain/Loss": 1.9911433458328247, "Pretrain/Loss (Raw)": 2.2252979278564453, "Pretrain/Step": 12923, "Pretrain/Step Time": 8.498852236196399} +{"Pretrain/Learning Rate": 1.2433882903507472e-05, "Pretrain/Loss": 1.9947538375854492, "Pretrain/Loss (Raw)": 2.1683311462402344, "Pretrain/Step": 12924, "Pretrain/Step Time": 8.495304178446531} +{"Pretrain/Learning Rate": 1.2430213167964674e-05, "Pretrain/Loss": 1.995396614074707, "Pretrain/Loss (Raw)": 1.9866458177566528, "Pretrain/Step": 12925, "Pretrain/Step Time": 8.500345300883055} +{"Pretrain/Learning Rate": 1.242654379486283e-05, "Pretrain/Loss": 1.9968984127044678, "Pretrain/Loss (Raw)": 1.958843469619751, "Pretrain/Step": 12926, "Pretrain/Step Time": 8.500115398317575} +{"Pretrain/Learning Rate": 1.2422874784307723e-05, "Pretrain/Loss": 1.9956398010253906, "Pretrain/Loss (Raw)": 1.8961944580078125, "Pretrain/Step": 12927, "Pretrain/Step Time": 8.497308425605297} +{"Pretrain/Learning Rate": 1.2419206136405162e-05, "Pretrain/Loss": 1.9956153631210327, "Pretrain/Loss (Raw)": 2.080134868621826, "Pretrain/Step": 12928, "Pretrain/Step Time": 8.495159525424242} +{"Pretrain/Learning Rate": 1.2415537851260925e-05, "Pretrain/Loss": 1.9955925941467285, "Pretrain/Loss (Raw)": 2.034773111343384, "Pretrain/Step": 12929, "Pretrain/Step Time": 8.494179060682654} +{"Pretrain/Learning Rate": 1.2411869928980773e-05, "Pretrain/Loss": 1.9939992427825928, "Pretrain/Loss (Raw)": 1.9169210195541382, "Pretrain/Step": 12930, "Pretrain/Step Time": 8.488403093069792} +{"Pretrain/Learning Rate": 1.2408202369670487e-05, "Pretrain/Loss": 1.9921846389770508, "Pretrain/Loss (Raw)": 1.8917008638381958, "Pretrain/Step": 12931, "Pretrain/Step Time": 8.491006061434746} +{"Pretrain/Learning Rate": 1.2404535173435802e-05, "Pretrain/Loss": 1.992119550704956, "Pretrain/Loss (Raw)": 2.0249974727630615, "Pretrain/Step": 12932, "Pretrain/Step Time": 8.485093044117093} +{"Pretrain/Learning Rate": 1.2400868340382474e-05, "Pretrain/Loss": 1.9923901557922363, "Pretrain/Loss (Raw)": 1.9737786054611206, "Pretrain/Step": 12933, "Pretrain/Step Time": 8.487811146304011} +{"Pretrain/Learning Rate": 1.2397201870616223e-05, "Pretrain/Loss": 1.9908475875854492, "Pretrain/Loss (Raw)": 1.8053035736083984, "Pretrain/Step": 12934, "Pretrain/Step Time": 8.483376760035753} +{"Pretrain/Learning Rate": 1.2393535764242764e-05, "Pretrain/Loss": 1.9943538904190063, "Pretrain/Loss (Raw)": 2.3407721519470215, "Pretrain/Step": 12935, "Pretrain/Step Time": 8.484032213687897} +{"Pretrain/Learning Rate": 1.2389870021367825e-05, "Pretrain/Loss": 1.995337724685669, "Pretrain/Loss (Raw)": 2.2119545936584473, "Pretrain/Step": 12936, "Pretrain/Step Time": 8.480835171416402} +{"Pretrain/Learning Rate": 1.2386204642097082e-05, "Pretrain/Loss": 1.997341275215149, "Pretrain/Loss (Raw)": 2.2667582035064697, "Pretrain/Step": 12937, "Pretrain/Step Time": 8.477178826928139} +{"Pretrain/Learning Rate": 1.238253962653625e-05, "Pretrain/Loss": 1.9922819137573242, "Pretrain/Loss (Raw)": 1.4269938468933105, "Pretrain/Step": 12938, "Pretrain/Step Time": 8.482810689136386} +{"Pretrain/Learning Rate": 1.2378874974790988e-05, "Pretrain/Loss": 1.9909968376159668, "Pretrain/Loss (Raw)": 1.745452642440796, "Pretrain/Step": 12939, "Pretrain/Step Time": 8.481958512216806} +{"Pretrain/Learning Rate": 1.2375210686966962e-05, "Pretrain/Loss": 1.990262508392334, "Pretrain/Loss (Raw)": 2.019709348678589, "Pretrain/Step": 12940, "Pretrain/Step Time": 8.483001517131925} +{"Pretrain/Learning Rate": 1.2371546763169847e-05, "Pretrain/Loss": 1.9876770973205566, "Pretrain/Loss (Raw)": 1.6699761152267456, "Pretrain/Step": 12941, "Pretrain/Step Time": 8.485569532960653} +{"Pretrain/Learning Rate": 1.2367883203505267e-05, "Pretrain/Loss": 1.9867165088653564, "Pretrain/Loss (Raw)": 1.9243757724761963, "Pretrain/Step": 12942, "Pretrain/Step Time": 8.488104742020369} +{"Pretrain/Learning Rate": 1.2364220008078877e-05, "Pretrain/Loss": 1.987796425819397, "Pretrain/Loss (Raw)": 2.1146132946014404, "Pretrain/Step": 12943, "Pretrain/Step Time": 8.485917890444398} +{"Pretrain/Learning Rate": 1.2360557176996302e-05, "Pretrain/Loss": 1.9883079528808594, "Pretrain/Loss (Raw)": 2.17969012260437, "Pretrain/Step": 12944, "Pretrain/Step Time": 8.482922203838825} +{"Pretrain/Learning Rate": 1.2356894710363135e-05, "Pretrain/Loss": 1.986363410949707, "Pretrain/Loss (Raw)": 1.8571631908416748, "Pretrain/Step": 12945, "Pretrain/Step Time": 8.481031194329262} +{"Pretrain/Learning Rate": 1.235323260828501e-05, "Pretrain/Loss": 1.9814140796661377, "Pretrain/Loss (Raw)": 1.8656728267669678, "Pretrain/Step": 12946, "Pretrain/Step Time": 8.477287439629436} +{"Pretrain/Learning Rate": 1.2349570870867495e-05, "Pretrain/Loss": 1.979754090309143, "Pretrain/Loss (Raw)": 1.768282413482666, "Pretrain/Step": 12947, "Pretrain/Step Time": 8.477222222834826} +{"Pretrain/Learning Rate": 1.2345909498216193e-05, "Pretrain/Loss": 1.9788199663162231, "Pretrain/Loss (Raw)": 2.0041236877441406, "Pretrain/Step": 12948, "Pretrain/Step Time": 8.476942988112569} +{"Pretrain/Learning Rate": 1.2342248490436676e-05, "Pretrain/Loss": 1.979671597480774, "Pretrain/Loss (Raw)": 2.0647122859954834, "Pretrain/Step": 12949, "Pretrain/Step Time": 8.475145196542144} +{"Pretrain/Learning Rate": 1.2338587847634487e-05, "Pretrain/Loss": 1.9776611328125, "Pretrain/Loss (Raw)": 1.8637932538986206, "Pretrain/Step": 12950, "Pretrain/Step Time": 8.476302493363619} +{"Pretrain/Learning Rate": 1.2334927569915204e-05, "Pretrain/Loss": 1.9783793687820435, "Pretrain/Loss (Raw)": 1.9382147789001465, "Pretrain/Step": 12951, "Pretrain/Step Time": 8.471877137199044} +{"Pretrain/Learning Rate": 1.2331267657384344e-05, "Pretrain/Loss": 1.9801602363586426, "Pretrain/Loss (Raw)": 2.182553291320801, "Pretrain/Step": 12952, "Pretrain/Step Time": 8.46803012676537} +{"Pretrain/Learning Rate": 1.2327608110147462e-05, "Pretrain/Loss": 1.9815293550491333, "Pretrain/Loss (Raw)": 2.429704189300537, "Pretrain/Step": 12953, "Pretrain/Step Time": 8.468264071270823} +{"Pretrain/Learning Rate": 1.2323948928310064e-05, "Pretrain/Loss": 1.9819929599761963, "Pretrain/Loss (Raw)": 2.110170841217041, "Pretrain/Step": 12954, "Pretrain/Step Time": 8.466721529141068} +{"Pretrain/Learning Rate": 1.2320290111977656e-05, "Pretrain/Loss": 1.9804096221923828, "Pretrain/Loss (Raw)": 1.8941699266433716, "Pretrain/Step": 12955, "Pretrain/Step Time": 8.466020638123155} +{"Pretrain/Learning Rate": 1.231663166125575e-05, "Pretrain/Loss": 1.9809387922286987, "Pretrain/Loss (Raw)": 2.1519222259521484, "Pretrain/Step": 12956, "Pretrain/Step Time": 8.477753762155771} +{"Pretrain/Learning Rate": 1.2312973576249823e-05, "Pretrain/Loss": 1.9838299751281738, "Pretrain/Loss (Raw)": 2.1853864192962646, "Pretrain/Step": 12957, "Pretrain/Step Time": 8.47451407648623} +{"Pretrain/Learning Rate": 1.2309315857065368e-05, "Pretrain/Loss": 1.9830607175827026, "Pretrain/Loss (Raw)": 1.8760054111480713, "Pretrain/Step": 12958, "Pretrain/Step Time": 8.479624353349209} +{"Pretrain/Learning Rate": 1.2305658503807843e-05, "Pretrain/Loss": 1.983355164527893, "Pretrain/Loss (Raw)": 2.059224843978882, "Pretrain/Step": 12959, "Pretrain/Step Time": 8.482864867895842} +{"Pretrain/Learning Rate": 1.2302001516582699e-05, "Pretrain/Loss": 1.9870010614395142, "Pretrain/Loss (Raw)": 2.1195273399353027, "Pretrain/Step": 12960, "Pretrain/Step Time": 8.479030285030603} +{"Pretrain/Learning Rate": 1.2298344895495394e-05, "Pretrain/Loss": 1.9882110357284546, "Pretrain/Loss (Raw)": 2.0311989784240723, "Pretrain/Step": 12961, "Pretrain/Step Time": 8.47963166050613} +{"Pretrain/Learning Rate": 1.2294688640651355e-05, "Pretrain/Loss": 1.9880428314208984, "Pretrain/Loss (Raw)": 1.7826988697052002, "Pretrain/Step": 12962, "Pretrain/Step Time": 8.479285392910242} +{"Pretrain/Learning Rate": 1.229103275215602e-05, "Pretrain/Loss": 1.9874769449234009, "Pretrain/Loss (Raw)": 1.899031162261963, "Pretrain/Step": 12963, "Pretrain/Step Time": 8.474640384316444} +{"Pretrain/Learning Rate": 1.2287377230114797e-05, "Pretrain/Loss": 1.9856759309768677, "Pretrain/Loss (Raw)": 1.975152850151062, "Pretrain/Step": 12964, "Pretrain/Step Time": 8.47855043783784} +{"Pretrain/Learning Rate": 1.228372207463308e-05, "Pretrain/Loss": 1.9856067895889282, "Pretrain/Loss (Raw)": 2.105602264404297, "Pretrain/Step": 12965, "Pretrain/Step Time": 8.480039432644844} +{"Pretrain/Learning Rate": 1.2280067285816282e-05, "Pretrain/Loss": 1.984722375869751, "Pretrain/Loss (Raw)": 1.9230766296386719, "Pretrain/Step": 12966, "Pretrain/Step Time": 8.481557192280889} +{"Pretrain/Learning Rate": 1.2276412863769767e-05, "Pretrain/Loss": 1.9851794242858887, "Pretrain/Loss (Raw)": 1.9141250848770142, "Pretrain/Step": 12967, "Pretrain/Step Time": 8.480456439778209} +{"Pretrain/Learning Rate": 1.2272758808598928e-05, "Pretrain/Loss": 1.9861352443695068, "Pretrain/Loss (Raw)": 2.186850070953369, "Pretrain/Step": 12968, "Pretrain/Step Time": 8.486275900155306} +{"Pretrain/Learning Rate": 1.2269105120409116e-05, "Pretrain/Loss": 1.9868299961090088, "Pretrain/Loss (Raw)": 2.100498676300049, "Pretrain/Step": 12969, "Pretrain/Step Time": 8.483154257759452} +{"Pretrain/Learning Rate": 1.2265451799305674e-05, "Pretrain/Loss": 1.9879560470581055, "Pretrain/Loss (Raw)": 1.9648785591125488, "Pretrain/Step": 12970, "Pretrain/Step Time": 8.485181733965874} +{"Pretrain/Learning Rate": 1.2261798845393962e-05, "Pretrain/Loss": 1.984445571899414, "Pretrain/Loss (Raw)": 1.684712290763855, "Pretrain/Step": 12971, "Pretrain/Step Time": 8.484526356682181} +{"Pretrain/Learning Rate": 1.225814625877929e-05, "Pretrain/Loss": 1.98280930519104, "Pretrain/Loss (Raw)": 1.875686764717102, "Pretrain/Step": 12972, "Pretrain/Step Time": 8.489688716828823} +{"Pretrain/Learning Rate": 1.2254494039566997e-05, "Pretrain/Loss": 1.9833054542541504, "Pretrain/Loss (Raw)": 1.9565374851226807, "Pretrain/Step": 12973, "Pretrain/Step Time": 8.485457014292479} +{"Pretrain/Learning Rate": 1.2250842187862385e-05, "Pretrain/Loss": 1.9856781959533691, "Pretrain/Loss (Raw)": 1.9878531694412231, "Pretrain/Step": 12974, "Pretrain/Step Time": 8.489660134539008} +{"Pretrain/Learning Rate": 1.2247190703770742e-05, "Pretrain/Loss": 1.9840892553329468, "Pretrain/Loss (Raw)": 2.0211434364318848, "Pretrain/Step": 12975, "Pretrain/Step Time": 8.489434340968728} +{"Pretrain/Learning Rate": 1.2243539587397373e-05, "Pretrain/Loss": 1.9833091497421265, "Pretrain/Loss (Raw)": 1.9458658695220947, "Pretrain/Step": 12976, "Pretrain/Step Time": 8.487976035103202} +{"Pretrain/Learning Rate": 1.2239888838847546e-05, "Pretrain/Loss": 1.98403000831604, "Pretrain/Loss (Raw)": 2.186938524246216, "Pretrain/Step": 12977, "Pretrain/Step Time": 8.491303516551852} +{"Pretrain/Learning Rate": 1.2236238458226532e-05, "Pretrain/Loss": 1.9832427501678467, "Pretrain/Loss (Raw)": 1.9808361530303955, "Pretrain/Step": 12978, "Pretrain/Step Time": 8.492670573294163} +{"Pretrain/Learning Rate": 1.2232588445639572e-05, "Pretrain/Loss": 1.9826610088348389, "Pretrain/Loss (Raw)": 1.9252073764801025, "Pretrain/Step": 12979, "Pretrain/Step Time": 8.487294271588326} +{"Pretrain/Learning Rate": 1.2228938801191936e-05, "Pretrain/Loss": 1.981754183769226, "Pretrain/Loss (Raw)": 1.9397765398025513, "Pretrain/Step": 12980, "Pretrain/Step Time": 8.489555925130844} +{"Pretrain/Learning Rate": 1.2225289524988845e-05, "Pretrain/Loss": 1.9818538427352905, "Pretrain/Loss (Raw)": 1.9698888063430786, "Pretrain/Step": 12981, "Pretrain/Step Time": 8.492674581706524} +{"Pretrain/Learning Rate": 1.2221640617135516e-05, "Pretrain/Loss": 1.9796115159988403, "Pretrain/Loss (Raw)": 1.776521921157837, "Pretrain/Step": 12982, "Pretrain/Step Time": 8.490044463425875} +{"Pretrain/Learning Rate": 1.2217992077737181e-05, "Pretrain/Loss": 1.9786440134048462, "Pretrain/Loss (Raw)": 1.868996500968933, "Pretrain/Step": 12983, "Pretrain/Step Time": 8.48651278577745} +{"Pretrain/Learning Rate": 1.2214343906899022e-05, "Pretrain/Loss": 1.9779105186462402, "Pretrain/Loss (Raw)": 2.0570998191833496, "Pretrain/Step": 12984, "Pretrain/Step Time": 8.490798437967896} +{"Pretrain/Learning Rate": 1.2210696104726258e-05, "Pretrain/Loss": 1.9808838367462158, "Pretrain/Loss (Raw)": 2.319697618484497, "Pretrain/Step": 12985, "Pretrain/Step Time": 8.478449910879135} +{"Pretrain/Learning Rate": 1.2207048671324043e-05, "Pretrain/Loss": 1.9810469150543213, "Pretrain/Loss (Raw)": 1.755277395248413, "Pretrain/Step": 12986, "Pretrain/Step Time": 8.479611372575164} +{"Pretrain/Learning Rate": 1.2203401606797568e-05, "Pretrain/Loss": 1.9844403266906738, "Pretrain/Loss (Raw)": 2.2062408924102783, "Pretrain/Step": 12987, "Pretrain/Step Time": 8.485363299027085} +{"Pretrain/Learning Rate": 1.219975491125199e-05, "Pretrain/Loss": 1.9849317073822021, "Pretrain/Loss (Raw)": 2.204864978790283, "Pretrain/Step": 12988, "Pretrain/Step Time": 8.486727967858315} +{"Pretrain/Learning Rate": 1.2196108584792445e-05, "Pretrain/Loss": 1.9855543375015259, "Pretrain/Loss (Raw)": 1.9975866079330444, "Pretrain/Step": 12989, "Pretrain/Step Time": 8.484047345817089} +{"Pretrain/Learning Rate": 1.2192462627524096e-05, "Pretrain/Loss": 1.9867557287216187, "Pretrain/Loss (Raw)": 2.049164056777954, "Pretrain/Step": 12990, "Pretrain/Step Time": 8.485489225015044} +{"Pretrain/Learning Rate": 1.2188817039552045e-05, "Pretrain/Loss": 1.9886693954467773, "Pretrain/Loss (Raw)": 2.1724493503570557, "Pretrain/Step": 12991, "Pretrain/Step Time": 8.487402986735106} +{"Pretrain/Learning Rate": 1.2185171820981433e-05, "Pretrain/Loss": 1.986190915107727, "Pretrain/Loss (Raw)": 1.8111257553100586, "Pretrain/Step": 12992, "Pretrain/Step Time": 8.489455433562398} +{"Pretrain/Learning Rate": 1.2181526971917359e-05, "Pretrain/Loss": 1.9884510040283203, "Pretrain/Loss (Raw)": 2.176173686981201, "Pretrain/Step": 12993, "Pretrain/Step Time": 8.485290871933103} +{"Pretrain/Learning Rate": 1.2177882492464906e-05, "Pretrain/Loss": 1.9865972995758057, "Pretrain/Loss (Raw)": 1.9759297370910645, "Pretrain/Step": 12994, "Pretrain/Step Time": 8.484962621703744} +{"Pretrain/Learning Rate": 1.2174238382729186e-05, "Pretrain/Loss": 1.9895045757293701, "Pretrain/Loss (Raw)": 2.412315607070923, "Pretrain/Step": 12995, "Pretrain/Step Time": 8.481295539066195} +{"Pretrain/Learning Rate": 1.2170594642815247e-05, "Pretrain/Loss": 1.988373875617981, "Pretrain/Loss (Raw)": 2.0335147380828857, "Pretrain/Step": 12996, "Pretrain/Step Time": 8.4790383502841} +{"Pretrain/Learning Rate": 1.216695127282818e-05, "Pretrain/Loss": 1.9901944398880005, "Pretrain/Loss (Raw)": 2.1313223838806152, "Pretrain/Step": 12997, "Pretrain/Step Time": 8.478611517697573} +{"Pretrain/Learning Rate": 1.2163308272873025e-05, "Pretrain/Loss": 1.9905496835708618, "Pretrain/Loss (Raw)": 1.867260217666626, "Pretrain/Step": 12998, "Pretrain/Step Time": 8.480521632358432} +{"Pretrain/Learning Rate": 1.2159665643054819e-05, "Pretrain/Loss": 1.9917501211166382, "Pretrain/Loss (Raw)": 2.0933849811553955, "Pretrain/Step": 12999, "Pretrain/Step Time": 8.475120525807142} +{"Pretrain/Learning Rate": 1.215602338347861e-05, "Pretrain/Loss": 1.9904899597167969, "Pretrain/Loss (Raw)": 1.9094599485397339, "Pretrain/Step": 13000, "Pretrain/Step Time": 8.477148549631238} +{"Pretrain/Learning Rate": 1.2152381494249402e-05, "Pretrain/Loss": 1.9906550645828247, "Pretrain/Loss (Raw)": 2.0701889991760254, "Pretrain/Step": 13001, "Pretrain/Step Time": 8.474774308502674} +{"Pretrain/Learning Rate": 1.2148739975472229e-05, "Pretrain/Loss": 1.995097279548645, "Pretrain/Loss (Raw)": 2.430194139480591, "Pretrain/Step": 13002, "Pretrain/Step Time": 8.470810264348984} +{"Pretrain/Learning Rate": 1.2145098827252078e-05, "Pretrain/Loss": 1.9962077140808105, "Pretrain/Loss (Raw)": 2.0077097415924072, "Pretrain/Step": 13003, "Pretrain/Step Time": 8.478153768926859} +{"Pretrain/Learning Rate": 1.214145804969393e-05, "Pretrain/Loss": 1.9991474151611328, "Pretrain/Loss (Raw)": 2.167863607406616, "Pretrain/Step": 13004, "Pretrain/Step Time": 8.477893222123384} +{"Pretrain/Learning Rate": 1.2137817642902782e-05, "Pretrain/Loss": 2.0011885166168213, "Pretrain/Loss (Raw)": 2.0871529579162598, "Pretrain/Step": 13005, "Pretrain/Step Time": 8.472672522068024} +{"Pretrain/Learning Rate": 1.2134177606983588e-05, "Pretrain/Loss": 2.0002682209014893, "Pretrain/Loss (Raw)": 2.026688575744629, "Pretrain/Step": 13006, "Pretrain/Step Time": 8.47536956332624} +{"Pretrain/Learning Rate": 1.2130537942041322e-05, "Pretrain/Loss": 2.0004563331604004, "Pretrain/Loss (Raw)": 2.0037245750427246, "Pretrain/Step": 13007, "Pretrain/Step Time": 8.47925778105855} +{"Pretrain/Learning Rate": 1.2126898648180923e-05, "Pretrain/Loss": 2.000580310821533, "Pretrain/Loss (Raw)": 1.9920709133148193, "Pretrain/Step": 13008, "Pretrain/Step Time": 8.477247655391693} +{"Pretrain/Learning Rate": 1.2123259725507317e-05, "Pretrain/Loss": 1.9961739778518677, "Pretrain/Loss (Raw)": 1.594648838043213, "Pretrain/Step": 13009, "Pretrain/Step Time": 8.480942118912935} +{"Pretrain/Learning Rate": 1.2119621174125448e-05, "Pretrain/Loss": 1.9954614639282227, "Pretrain/Loss (Raw)": 1.9355345964431763, "Pretrain/Step": 13010, "Pretrain/Step Time": 8.480048375204206} +{"Pretrain/Learning Rate": 1.2115982994140213e-05, "Pretrain/Loss": 1.9956823587417603, "Pretrain/Loss (Raw)": 2.082608222961426, "Pretrain/Step": 13011, "Pretrain/Step Time": 8.478659531101584} +{"Pretrain/Learning Rate": 1.2112345185656534e-05, "Pretrain/Loss": 1.9942516088485718, "Pretrain/Loss (Raw)": 1.8575788736343384, "Pretrain/Step": 13012, "Pretrain/Step Time": 8.477707590907812} +{"Pretrain/Learning Rate": 1.21087077487793e-05, "Pretrain/Loss": 1.9936470985412598, "Pretrain/Loss (Raw)": 1.882840871810913, "Pretrain/Step": 13013, "Pretrain/Step Time": 8.475656434893608} +{"Pretrain/Learning Rate": 1.2105070683613376e-05, "Pretrain/Loss": 1.9917316436767578, "Pretrain/Loss (Raw)": 1.6991019248962402, "Pretrain/Step": 13014, "Pretrain/Step Time": 8.479179291054606} +{"Pretrain/Learning Rate": 1.2101433990263662e-05, "Pretrain/Loss": 1.9921034574508667, "Pretrain/Loss (Raw)": 1.8763824701309204, "Pretrain/Step": 13015, "Pretrain/Step Time": 8.477813055738807} +{"Pretrain/Learning Rate": 1.2097797668834996e-05, "Pretrain/Loss": 1.9924516677856445, "Pretrain/Loss (Raw)": 2.103541374206543, "Pretrain/Step": 13016, "Pretrain/Step Time": 8.480868274345994} +{"Pretrain/Learning Rate": 1.2094161719432245e-05, "Pretrain/Loss": 1.9911384582519531, "Pretrain/Loss (Raw)": 1.9827780723571777, "Pretrain/Step": 13017, "Pretrain/Step Time": 8.475693728774786} +{"Pretrain/Learning Rate": 1.2090526142160243e-05, "Pretrain/Loss": 1.9917974472045898, "Pretrain/Loss (Raw)": 2.077028512954712, "Pretrain/Step": 13018, "Pretrain/Step Time": 8.476907288655639} +{"Pretrain/Learning Rate": 1.2086890937123812e-05, "Pretrain/Loss": 1.9960366487503052, "Pretrain/Loss (Raw)": 2.4312429428100586, "Pretrain/Step": 13019, "Pretrain/Step Time": 8.47481000609696} +{"Pretrain/Learning Rate": 1.208325610442779e-05, "Pretrain/Loss": 1.9974966049194336, "Pretrain/Loss (Raw)": 2.075939178466797, "Pretrain/Step": 13020, "Pretrain/Step Time": 8.479365102946758} +{"Pretrain/Learning Rate": 1.2079621644176958e-05, "Pretrain/Loss": 1.9980168342590332, "Pretrain/Loss (Raw)": 1.9845446348190308, "Pretrain/Step": 13021, "Pretrain/Step Time": 8.477306617423892} +{"Pretrain/Learning Rate": 1.207598755647614e-05, "Pretrain/Loss": 1.9986696243286133, "Pretrain/Loss (Raw)": 1.9890645742416382, "Pretrain/Step": 13022, "Pretrain/Step Time": 8.473479505628347} +{"Pretrain/Learning Rate": 1.2072353841430108e-05, "Pretrain/Loss": 1.998215675354004, "Pretrain/Loss (Raw)": 1.9579155445098877, "Pretrain/Step": 13023, "Pretrain/Step Time": 8.476545194163918} +{"Pretrain/Learning Rate": 1.2068720499143632e-05, "Pretrain/Loss": 1.9991096258163452, "Pretrain/Loss (Raw)": 2.0405077934265137, "Pretrain/Step": 13024, "Pretrain/Step Time": 8.478580806404352} +{"Pretrain/Learning Rate": 1.2065087529721492e-05, "Pretrain/Loss": 1.9995152950286865, "Pretrain/Loss (Raw)": 1.9620120525360107, "Pretrain/Step": 13025, "Pretrain/Step Time": 8.477850176393986} +{"Pretrain/Learning Rate": 1.2061454933268427e-05, "Pretrain/Loss": 1.9984111785888672, "Pretrain/Loss (Raw)": 1.8995282649993896, "Pretrain/Step": 13026, "Pretrain/Step Time": 8.476706068962812} +{"Pretrain/Learning Rate": 1.2057822709889194e-05, "Pretrain/Loss": 2.000533103942871, "Pretrain/Loss (Raw)": 2.0352044105529785, "Pretrain/Step": 13027, "Pretrain/Step Time": 8.474700694903731} +{"Pretrain/Learning Rate": 1.2054190859688524e-05, "Pretrain/Loss": 2.00087833404541, "Pretrain/Loss (Raw)": 1.989669919013977, "Pretrain/Step": 13028, "Pretrain/Step Time": 8.47650902159512} +{"Pretrain/Learning Rate": 1.2050559382771123e-05, "Pretrain/Loss": 2.0002973079681396, "Pretrain/Loss (Raw)": 1.9266608953475952, "Pretrain/Step": 13029, "Pretrain/Step Time": 8.473542094230652} +{"Pretrain/Learning Rate": 1.204692827924172e-05, "Pretrain/Loss": 2.0011513233184814, "Pretrain/Loss (Raw)": 1.948653221130371, "Pretrain/Step": 13030, "Pretrain/Step Time": 8.474491080269217} +{"Pretrain/Learning Rate": 1.2043297549205005e-05, "Pretrain/Loss": 2.0014944076538086, "Pretrain/Loss (Raw)": 1.9766323566436768, "Pretrain/Step": 13031, "Pretrain/Step Time": 8.474624877795577} +{"Pretrain/Learning Rate": 1.2039667192765677e-05, "Pretrain/Loss": 2.0026180744171143, "Pretrain/Loss (Raw)": 2.0551345348358154, "Pretrain/Step": 13032, "Pretrain/Step Time": 8.473829429596663} +{"Pretrain/Learning Rate": 1.2036037210028408e-05, "Pretrain/Loss": 2.005451202392578, "Pretrain/Loss (Raw)": 1.9800591468811035, "Pretrain/Step": 13033, "Pretrain/Step Time": 8.472736567258835} +{"Pretrain/Learning Rate": 1.2032407601097862e-05, "Pretrain/Loss": 2.0051331520080566, "Pretrain/Loss (Raw)": 2.051692247390747, "Pretrain/Step": 13034, "Pretrain/Step Time": 8.467053322121501} +{"Pretrain/Learning Rate": 1.2028778366078708e-05, "Pretrain/Loss": 2.0049099922180176, "Pretrain/Loss (Raw)": 1.9429179430007935, "Pretrain/Step": 13035, "Pretrain/Step Time": 8.469478759914637} +{"Pretrain/Learning Rate": 1.2025149505075575e-05, "Pretrain/Loss": 2.0048837661743164, "Pretrain/Loss (Raw)": 2.0365099906921387, "Pretrain/Step": 13036, "Pretrain/Step Time": 8.471609042957425} +{"Pretrain/Learning Rate": 1.2021521018193122e-05, "Pretrain/Loss": 2.0034193992614746, "Pretrain/Loss (Raw)": 1.859032154083252, "Pretrain/Step": 13037, "Pretrain/Step Time": 8.471736328676343} +{"Pretrain/Learning Rate": 1.2017892905535958e-05, "Pretrain/Loss": 2.004805088043213, "Pretrain/Loss (Raw)": 2.3036255836486816, "Pretrain/Step": 13038, "Pretrain/Step Time": 8.471304150298238} +{"Pretrain/Learning Rate": 1.201426516720869e-05, "Pretrain/Loss": 2.004009962081909, "Pretrain/Loss (Raw)": 1.8845914602279663, "Pretrain/Step": 13039, "Pretrain/Step Time": 8.46957477927208} +{"Pretrain/Learning Rate": 1.2010637803315947e-05, "Pretrain/Loss": 2.0013232231140137, "Pretrain/Loss (Raw)": 1.6885437965393066, "Pretrain/Step": 13040, "Pretrain/Step Time": 8.469173200428486} +{"Pretrain/Learning Rate": 1.2007010813962292e-05, "Pretrain/Loss": 2.002474546432495, "Pretrain/Loss (Raw)": 2.0947113037109375, "Pretrain/Step": 13041, "Pretrain/Step Time": 8.468526031821966} +{"Pretrain/Learning Rate": 1.200338419925233e-05, "Pretrain/Loss": 2.0001533031463623, "Pretrain/Loss (Raw)": 1.7582248449325562, "Pretrain/Step": 13042, "Pretrain/Step Time": 8.47119359485805} +{"Pretrain/Learning Rate": 1.1999757959290626e-05, "Pretrain/Loss": 2.0006370544433594, "Pretrain/Loss (Raw)": 1.9298381805419922, "Pretrain/Step": 13043, "Pretrain/Step Time": 8.47383789345622} +{"Pretrain/Learning Rate": 1.1996132094181722e-05, "Pretrain/Loss": 2.000734329223633, "Pretrain/Loss (Raw)": 1.9757661819458008, "Pretrain/Step": 13044, "Pretrain/Step Time": 8.473235601559281} +{"Pretrain/Learning Rate": 1.1992506604030196e-05, "Pretrain/Loss": 2.001762628555298, "Pretrain/Loss (Raw)": 2.1956207752227783, "Pretrain/Step": 13045, "Pretrain/Step Time": 8.47225870192051} +{"Pretrain/Learning Rate": 1.198888148894056e-05, "Pretrain/Loss": 1.9999804496765137, "Pretrain/Loss (Raw)": 1.93101966381073, "Pretrain/Step": 13046, "Pretrain/Step Time": 8.466668443754315} +{"Pretrain/Learning Rate": 1.1985256749017366e-05, "Pretrain/Loss": 2.002100706100464, "Pretrain/Loss (Raw)": 1.9503474235534668, "Pretrain/Step": 13047, "Pretrain/Step Time": 8.469635671004653} +{"Pretrain/Learning Rate": 1.1981632384365116e-05, "Pretrain/Loss": 2.0002617835998535, "Pretrain/Loss (Raw)": 1.9099793434143066, "Pretrain/Step": 13048, "Pretrain/Step Time": 8.466051502153277} +{"Pretrain/Learning Rate": 1.1978008395088311e-05, "Pretrain/Loss": 1.9982450008392334, "Pretrain/Loss (Raw)": 1.8129011392593384, "Pretrain/Step": 13049, "Pretrain/Step Time": 8.470118284225464} +{"Pretrain/Learning Rate": 1.1974384781291464e-05, "Pretrain/Loss": 1.9978618621826172, "Pretrain/Loss (Raw)": 1.8607896566390991, "Pretrain/Step": 13050, "Pretrain/Step Time": 8.468624183908105} +{"Pretrain/Learning Rate": 1.197076154307904e-05, "Pretrain/Loss": 1.9947713613510132, "Pretrain/Loss (Raw)": 1.8297152519226074, "Pretrain/Step": 13051, "Pretrain/Step Time": 8.468283021822572} +{"Pretrain/Learning Rate": 1.1967138680555532e-05, "Pretrain/Loss": 1.9914186000823975, "Pretrain/Loss (Raw)": 1.7391637563705444, "Pretrain/Step": 13052, "Pretrain/Step Time": 8.467678554356098} +{"Pretrain/Learning Rate": 1.196351619382538e-05, "Pretrain/Loss": 1.9916682243347168, "Pretrain/Loss (Raw)": 2.0186238288879395, "Pretrain/Step": 13053, "Pretrain/Step Time": 8.467060681432486} +{"Pretrain/Learning Rate": 1.195989408299306e-05, "Pretrain/Loss": 1.991274356842041, "Pretrain/Loss (Raw)": 1.908429741859436, "Pretrain/Step": 13054, "Pretrain/Step Time": 8.473188495263457} +{"Pretrain/Learning Rate": 1.1956272348163e-05, "Pretrain/Loss": 1.9903500080108643, "Pretrain/Loss (Raw)": 1.7778637409210205, "Pretrain/Step": 13055, "Pretrain/Step Time": 8.48098168335855} +{"Pretrain/Learning Rate": 1.1952650989439623e-05, "Pretrain/Loss": 1.9872889518737793, "Pretrain/Loss (Raw)": 1.6883125305175781, "Pretrain/Step": 13056, "Pretrain/Step Time": 8.481091195717454} +{"Pretrain/Learning Rate": 1.1949030006927366e-05, "Pretrain/Loss": 1.9870216846466064, "Pretrain/Loss (Raw)": 2.00056529045105, "Pretrain/Step": 13057, "Pretrain/Step Time": 8.48667542077601} +{"Pretrain/Learning Rate": 1.1945409400730622e-05, "Pretrain/Loss": 1.988826870918274, "Pretrain/Loss (Raw)": 2.1479992866516113, "Pretrain/Step": 13058, "Pretrain/Step Time": 8.484869681298733} +{"Pretrain/Learning Rate": 1.1941789170953802e-05, "Pretrain/Loss": 1.9887827634811401, "Pretrain/Loss (Raw)": 1.8860504627227783, "Pretrain/Step": 13059, "Pretrain/Step Time": 8.481687372550368} +{"Pretrain/Learning Rate": 1.1938169317701286e-05, "Pretrain/Loss": 1.9876163005828857, "Pretrain/Loss (Raw)": 1.875688076019287, "Pretrain/Step": 13060, "Pretrain/Step Time": 8.485651846975088} +{"Pretrain/Learning Rate": 1.193454984107745e-05, "Pretrain/Loss": 1.9881671667099, "Pretrain/Loss (Raw)": 2.0442917346954346, "Pretrain/Step": 13061, "Pretrain/Step Time": 8.487922206521034} +{"Pretrain/Learning Rate": 1.1930930741186658e-05, "Pretrain/Loss": 1.9890638589859009, "Pretrain/Loss (Raw)": 1.9200868606567383, "Pretrain/Step": 13062, "Pretrain/Step Time": 8.488723505288363} +{"Pretrain/Learning Rate": 1.1927312018133256e-05, "Pretrain/Loss": 1.9855098724365234, "Pretrain/Loss (Raw)": 1.8858728408813477, "Pretrain/Step": 13063, "Pretrain/Step Time": 8.488596867769957} +{"Pretrain/Learning Rate": 1.1923693672021605e-05, "Pretrain/Loss": 1.9838563203811646, "Pretrain/Loss (Raw)": 2.0002779960632324, "Pretrain/Step": 13064, "Pretrain/Step Time": 8.485962599515915} +{"Pretrain/Learning Rate": 1.192007570295602e-05, "Pretrain/Loss": 1.9835000038146973, "Pretrain/Loss (Raw)": 2.221156358718872, "Pretrain/Step": 13065, "Pretrain/Step Time": 8.490032993257046} +{"Pretrain/Learning Rate": 1.1916458111040843e-05, "Pretrain/Loss": 1.9881103038787842, "Pretrain/Loss (Raw)": 2.017103910446167, "Pretrain/Step": 13066, "Pretrain/Step Time": 8.493289172649384} +{"Pretrain/Learning Rate": 1.191284089638037e-05, "Pretrain/Loss": 1.9908279180526733, "Pretrain/Loss (Raw)": 2.0933167934417725, "Pretrain/Step": 13067, "Pretrain/Step Time": 8.489542182534933} +{"Pretrain/Learning Rate": 1.1909224059078896e-05, "Pretrain/Loss": 1.9898250102996826, "Pretrain/Loss (Raw)": 1.8913276195526123, "Pretrain/Step": 13068, "Pretrain/Step Time": 8.490548975765705} +{"Pretrain/Learning Rate": 1.1905607599240725e-05, "Pretrain/Loss": 1.992472529411316, "Pretrain/Loss (Raw)": 2.008873701095581, "Pretrain/Step": 13069, "Pretrain/Step Time": 8.489943899214268} +{"Pretrain/Learning Rate": 1.1901991516970121e-05, "Pretrain/Loss": 1.9932457208633423, "Pretrain/Loss (Raw)": 2.023333787918091, "Pretrain/Step": 13070, "Pretrain/Step Time": 8.489267161116004} +{"Pretrain/Learning Rate": 1.1898375812371367e-05, "Pretrain/Loss": 1.9956032037734985, "Pretrain/Loss (Raw)": 2.4163873195648193, "Pretrain/Step": 13071, "Pretrain/Step Time": 8.497930750250816} +{"Pretrain/Learning Rate": 1.1894760485548712e-05, "Pretrain/Loss": 1.9961283206939697, "Pretrain/Loss (Raw)": 2.24688720703125, "Pretrain/Step": 13072, "Pretrain/Step Time": 8.497687483206391} +{"Pretrain/Learning Rate": 1.1891145536606387e-05, "Pretrain/Loss": 1.996188998222351, "Pretrain/Loss (Raw)": 1.8649414777755737, "Pretrain/Step": 13073, "Pretrain/Step Time": 8.495968468487263} +{"Pretrain/Learning Rate": 1.1887530965648652e-05, "Pretrain/Loss": 1.994219422340393, "Pretrain/Loss (Raw)": 1.613566517829895, "Pretrain/Step": 13074, "Pretrain/Step Time": 8.503801329061389} +{"Pretrain/Learning Rate": 1.1883916772779707e-05, "Pretrain/Loss": 1.9951781034469604, "Pretrain/Loss (Raw)": 1.8909887075424194, "Pretrain/Step": 13075, "Pretrain/Step Time": 8.499632060527802} +{"Pretrain/Learning Rate": 1.1880302958103784e-05, "Pretrain/Loss": 1.9963481426239014, "Pretrain/Loss (Raw)": 2.153883218765259, "Pretrain/Step": 13076, "Pretrain/Step Time": 8.499274533241987} +{"Pretrain/Learning Rate": 1.187668952172508e-05, "Pretrain/Loss": 1.9929122924804688, "Pretrain/Loss (Raw)": 1.624943733215332, "Pretrain/Step": 13077, "Pretrain/Step Time": 8.507430512458086} +{"Pretrain/Learning Rate": 1.1873076463747768e-05, "Pretrain/Loss": 1.9930232763290405, "Pretrain/Loss (Raw)": 1.8779796361923218, "Pretrain/Step": 13078, "Pretrain/Step Time": 8.50147795677185} +{"Pretrain/Learning Rate": 1.1869463784276055e-05, "Pretrain/Loss": 1.9959118366241455, "Pretrain/Loss (Raw)": 2.307952404022217, "Pretrain/Step": 13079, "Pretrain/Step Time": 8.501458939164877} +{"Pretrain/Learning Rate": 1.1865851483414087e-05, "Pretrain/Loss": 1.9949768781661987, "Pretrain/Loss (Raw)": 2.0628750324249268, "Pretrain/Step": 13080, "Pretrain/Step Time": 8.500057190656662} +{"Pretrain/Learning Rate": 1.1862239561266042e-05, "Pretrain/Loss": 1.9906926155090332, "Pretrain/Loss (Raw)": 1.8813164234161377, "Pretrain/Step": 13081, "Pretrain/Step Time": 8.507839906960726} +{"Pretrain/Learning Rate": 1.1858628017936058e-05, "Pretrain/Loss": 1.9900332689285278, "Pretrain/Loss (Raw)": 2.0257723331451416, "Pretrain/Step": 13082, "Pretrain/Step Time": 8.510580532252789} +{"Pretrain/Learning Rate": 1.1855016853528261e-05, "Pretrain/Loss": 1.9911638498306274, "Pretrain/Loss (Raw)": 2.038891077041626, "Pretrain/Step": 13083, "Pretrain/Step Time": 8.511858131736517} +{"Pretrain/Learning Rate": 1.1851406068146795e-05, "Pretrain/Loss": 1.9914710521697998, "Pretrain/Loss (Raw)": 2.1912519931793213, "Pretrain/Step": 13084, "Pretrain/Step Time": 8.499020408838987} +{"Pretrain/Learning Rate": 1.1847795661895758e-05, "Pretrain/Loss": 1.989743947982788, "Pretrain/Loss (Raw)": 1.9643234014511108, "Pretrain/Step": 13085, "Pretrain/Step Time": 8.503407496958971} +{"Pretrain/Learning Rate": 1.1844185634879271e-05, "Pretrain/Loss": 1.991465449333191, "Pretrain/Loss (Raw)": 2.0963432788848877, "Pretrain/Step": 13086, "Pretrain/Step Time": 8.498226469382644} +{"Pretrain/Learning Rate": 1.1840575987201416e-05, "Pretrain/Loss": 1.9907495975494385, "Pretrain/Loss (Raw)": 1.9675911664962769, "Pretrain/Step": 13087, "Pretrain/Step Time": 8.499846506863832} +{"Pretrain/Learning Rate": 1.1836966718966266e-05, "Pretrain/Loss": 1.990468144416809, "Pretrain/Loss (Raw)": 2.0835158824920654, "Pretrain/Step": 13088, "Pretrain/Step Time": 8.504057332873344} +{"Pretrain/Learning Rate": 1.183335783027791e-05, "Pretrain/Loss": 1.9909813404083252, "Pretrain/Loss (Raw)": 2.0968782901763916, "Pretrain/Step": 13089, "Pretrain/Step Time": 8.504099214449525} +{"Pretrain/Learning Rate": 1.1829749321240391e-05, "Pretrain/Loss": 1.991153597831726, "Pretrain/Loss (Raw)": 1.8047564029693604, "Pretrain/Step": 13090, "Pretrain/Step Time": 8.500207286328077} +{"Pretrain/Learning Rate": 1.1826141191957777e-05, "Pretrain/Loss": 1.9922043085098267, "Pretrain/Loss (Raw)": 2.0335135459899902, "Pretrain/Step": 13091, "Pretrain/Step Time": 8.501539861783385} +{"Pretrain/Learning Rate": 1.1822533442534092e-05, "Pretrain/Loss": 1.9943660497665405, "Pretrain/Loss (Raw)": 2.251852512359619, "Pretrain/Step": 13092, "Pretrain/Step Time": 8.505084540694952} +{"Pretrain/Learning Rate": 1.1818926073073359e-05, "Pretrain/Loss": 1.9934923648834229, "Pretrain/Loss (Raw)": 1.9937931299209595, "Pretrain/Step": 13093, "Pretrain/Step Time": 8.5012834277004} +{"Pretrain/Learning Rate": 1.1815319083679607e-05, "Pretrain/Loss": 1.9955551624298096, "Pretrain/Loss (Raw)": 2.187093496322632, "Pretrain/Step": 13094, "Pretrain/Step Time": 8.497828813269734} +{"Pretrain/Learning Rate": 1.1811712474456827e-05, "Pretrain/Loss": 1.9982109069824219, "Pretrain/Loss (Raw)": 2.2540712356567383, "Pretrain/Step": 13095, "Pretrain/Step Time": 8.498754318803549} +{"Pretrain/Learning Rate": 1.180810624550903e-05, "Pretrain/Loss": 1.995024561882019, "Pretrain/Loss (Raw)": 1.7789944410324097, "Pretrain/Step": 13096, "Pretrain/Step Time": 8.494357079267502} +{"Pretrain/Learning Rate": 1.1804500396940188e-05, "Pretrain/Loss": 1.9962804317474365, "Pretrain/Loss (Raw)": 2.261228561401367, "Pretrain/Step": 13097, "Pretrain/Step Time": 8.491763308644295} +{"Pretrain/Learning Rate": 1.1800894928854268e-05, "Pretrain/Loss": 1.9977809190750122, "Pretrain/Loss (Raw)": 2.1569581031799316, "Pretrain/Step": 13098, "Pretrain/Step Time": 8.498005529865623} +{"Pretrain/Learning Rate": 1.1797289841355246e-05, "Pretrain/Loss": 1.9992846250534058, "Pretrain/Loss (Raw)": 1.877184271812439, "Pretrain/Step": 13099, "Pretrain/Step Time": 8.496898652985692} +{"Pretrain/Learning Rate": 1.1793685134547056e-05, "Pretrain/Loss": 2.0007712841033936, "Pretrain/Loss (Raw)": 2.0659945011138916, "Pretrain/Step": 13100, "Pretrain/Step Time": 8.492896614596248} +{"Pretrain/Learning Rate": 1.1790080808533651e-05, "Pretrain/Loss": 2.002722978591919, "Pretrain/Loss (Raw)": 2.206338882446289, "Pretrain/Step": 13101, "Pretrain/Step Time": 8.490131856873631} +{"Pretrain/Learning Rate": 1.1786476863418958e-05, "Pretrain/Loss": 1.9982163906097412, "Pretrain/Loss (Raw)": 1.411010980606079, "Pretrain/Step": 13102, "Pretrain/Step Time": 8.492920991033316} +{"Pretrain/Learning Rate": 1.178287329930688e-05, "Pretrain/Loss": 1.995392084121704, "Pretrain/Loss (Raw)": 1.6596301794052124, "Pretrain/Step": 13103, "Pretrain/Step Time": 8.491580540314317} +{"Pretrain/Learning Rate": 1.177927011630134e-05, "Pretrain/Loss": 1.9967585802078247, "Pretrain/Loss (Raw)": 2.1207802295684814, "Pretrain/Step": 13104, "Pretrain/Step Time": 8.497149160131812} +{"Pretrain/Learning Rate": 1.1775667314506216e-05, "Pretrain/Loss": 1.9950611591339111, "Pretrain/Loss (Raw)": 1.969670295715332, "Pretrain/Step": 13105, "Pretrain/Step Time": 8.492386808618903} +{"Pretrain/Learning Rate": 1.1772064894025414e-05, "Pretrain/Loss": 1.993412971496582, "Pretrain/Loss (Raw)": 1.7698713541030884, "Pretrain/Step": 13106, "Pretrain/Step Time": 8.492794254794717} +{"Pretrain/Learning Rate": 1.1768462854962797e-05, "Pretrain/Loss": 1.993844985961914, "Pretrain/Loss (Raw)": 1.9805094003677368, "Pretrain/Step": 13107, "Pretrain/Step Time": 8.495733303949237} +{"Pretrain/Learning Rate": 1.1764861197422214e-05, "Pretrain/Loss": 1.9929839372634888, "Pretrain/Loss (Raw)": 1.8295578956604004, "Pretrain/Step": 13108, "Pretrain/Step Time": 8.491383247077465} +{"Pretrain/Learning Rate": 1.176125992150754e-05, "Pretrain/Loss": 1.9921271800994873, "Pretrain/Loss (Raw)": 1.8602221012115479, "Pretrain/Step": 13109, "Pretrain/Step Time": 8.487765312194824} +{"Pretrain/Learning Rate": 1.175765902732259e-05, "Pretrain/Loss": 1.9951062202453613, "Pretrain/Loss (Raw)": 2.1578352451324463, "Pretrain/Step": 13110, "Pretrain/Step Time": 8.486947946250439} +{"Pretrain/Learning Rate": 1.1754058514971219e-05, "Pretrain/Loss": 1.9952244758605957, "Pretrain/Loss (Raw)": 1.8841301202774048, "Pretrain/Step": 13111, "Pretrain/Step Time": 8.489233998581767} +{"Pretrain/Learning Rate": 1.1750458384557234e-05, "Pretrain/Loss": 1.9950066804885864, "Pretrain/Loss (Raw)": 2.0292229652404785, "Pretrain/Step": 13112, "Pretrain/Step Time": 8.486208233982325} +{"Pretrain/Learning Rate": 1.174685863618443e-05, "Pretrain/Loss": 1.992948055267334, "Pretrain/Loss (Raw)": 2.0561890602111816, "Pretrain/Step": 13113, "Pretrain/Step Time": 8.488899420946836} +{"Pretrain/Learning Rate": 1.1743259269956621e-05, "Pretrain/Loss": 1.9925684928894043, "Pretrain/Loss (Raw)": 1.7067034244537354, "Pretrain/Step": 13114, "Pretrain/Step Time": 8.492539850994945} +{"Pretrain/Learning Rate": 1.173966028597758e-05, "Pretrain/Loss": 1.988617181777954, "Pretrain/Loss (Raw)": 1.7004832029342651, "Pretrain/Step": 13115, "Pretrain/Step Time": 8.490245010703802} +{"Pretrain/Learning Rate": 1.1736061684351096e-05, "Pretrain/Loss": 1.986911654472351, "Pretrain/Loss (Raw)": 1.9865514039993286, "Pretrain/Step": 13116, "Pretrain/Step Time": 8.49004815891385} +{"Pretrain/Learning Rate": 1.1732463465180924e-05, "Pretrain/Loss": 1.9857022762298584, "Pretrain/Loss (Raw)": 1.8427889347076416, "Pretrain/Step": 13117, "Pretrain/Step Time": 8.49173192679882} +{"Pretrain/Learning Rate": 1.1728865628570804e-05, "Pretrain/Loss": 1.9844132661819458, "Pretrain/Loss (Raw)": 1.8841609954833984, "Pretrain/Step": 13118, "Pretrain/Step Time": 8.49010531231761} +{"Pretrain/Learning Rate": 1.1725268174624496e-05, "Pretrain/Loss": 1.9864548444747925, "Pretrain/Loss (Raw)": 2.4337778091430664, "Pretrain/Step": 13119, "Pretrain/Step Time": 8.490770496428013} +{"Pretrain/Learning Rate": 1.1721671103445714e-05, "Pretrain/Loss": 1.987502098083496, "Pretrain/Loss (Raw)": 1.9451580047607422, "Pretrain/Step": 13120, "Pretrain/Step Time": 8.48903251066804} +{"Pretrain/Learning Rate": 1.1718074415138194e-05, "Pretrain/Loss": 1.9856200218200684, "Pretrain/Loss (Raw)": 1.9352741241455078, "Pretrain/Step": 13121, "Pretrain/Step Time": 8.488232286646962} +{"Pretrain/Learning Rate": 1.1714478109805627e-05, "Pretrain/Loss": 1.9854904413223267, "Pretrain/Loss (Raw)": 1.9593532085418701, "Pretrain/Step": 13122, "Pretrain/Step Time": 8.489735970273614} +{"Pretrain/Learning Rate": 1.1710882187551725e-05, "Pretrain/Loss": 1.9811928272247314, "Pretrain/Loss (Raw)": 1.8622227907180786, "Pretrain/Step": 13123, "Pretrain/Step Time": 8.492514358833432} +{"Pretrain/Learning Rate": 1.170728664848017e-05, "Pretrain/Loss": 1.9812142848968506, "Pretrain/Loss (Raw)": 2.036252021789551, "Pretrain/Step": 13124, "Pretrain/Step Time": 8.490334859117866} +{"Pretrain/Learning Rate": 1.1703691492694622e-05, "Pretrain/Loss": 1.9805243015289307, "Pretrain/Loss (Raw)": 2.0430257320404053, "Pretrain/Step": 13125, "Pretrain/Step Time": 8.487193517386913} +{"Pretrain/Learning Rate": 1.1700096720298767e-05, "Pretrain/Loss": 1.9809412956237793, "Pretrain/Loss (Raw)": 1.9206181764602661, "Pretrain/Step": 13126, "Pretrain/Step Time": 8.485160691663623} +{"Pretrain/Learning Rate": 1.169650233139624e-05, "Pretrain/Loss": 1.9797091484069824, "Pretrain/Loss (Raw)": 1.9356900453567505, "Pretrain/Step": 13127, "Pretrain/Step Time": 8.486083270981908} +{"Pretrain/Learning Rate": 1.1692908326090696e-05, "Pretrain/Loss": 1.9806088209152222, "Pretrain/Loss (Raw)": 2.0245890617370605, "Pretrain/Step": 13128, "Pretrain/Step Time": 8.487432828173041} +{"Pretrain/Learning Rate": 1.1689314704485759e-05, "Pretrain/Loss": 1.979561448097229, "Pretrain/Loss (Raw)": 1.9361459016799927, "Pretrain/Step": 13129, "Pretrain/Step Time": 8.486348997801542} +{"Pretrain/Learning Rate": 1.168572146668504e-05, "Pretrain/Loss": 1.9762283563613892, "Pretrain/Loss (Raw)": 2.0035476684570312, "Pretrain/Step": 13130, "Pretrain/Step Time": 8.495103567838669} +{"Pretrain/Learning Rate": 1.1682128612792167e-05, "Pretrain/Loss": 1.9772462844848633, "Pretrain/Loss (Raw)": 2.1380155086517334, "Pretrain/Step": 13131, "Pretrain/Step Time": 8.488382728770375} +{"Pretrain/Learning Rate": 1.167853614291072e-05, "Pretrain/Loss": 1.9753504991531372, "Pretrain/Loss (Raw)": 1.9251960515975952, "Pretrain/Step": 13132, "Pretrain/Step Time": 8.487906884402037} +{"Pretrain/Learning Rate": 1.16749440571443e-05, "Pretrain/Loss": 1.9746220111846924, "Pretrain/Loss (Raw)": 1.9939085245132446, "Pretrain/Step": 13133, "Pretrain/Step Time": 8.490995611995459} +{"Pretrain/Learning Rate": 1.1671352355596474e-05, "Pretrain/Loss": 1.9726529121398926, "Pretrain/Loss (Raw)": 1.7746375799179077, "Pretrain/Step": 13134, "Pretrain/Step Time": 8.487907344475389} +{"Pretrain/Learning Rate": 1.1667761038370794e-05, "Pretrain/Loss": 1.9712061882019043, "Pretrain/Loss (Raw)": 1.8185611963272095, "Pretrain/Step": 13135, "Pretrain/Step Time": 8.490733316168189} +{"Pretrain/Learning Rate": 1.166417010557084e-05, "Pretrain/Loss": 1.9715535640716553, "Pretrain/Loss (Raw)": 2.036530017852783, "Pretrain/Step": 13136, "Pretrain/Step Time": 8.492672886699438} +{"Pretrain/Learning Rate": 1.1660579557300131e-05, "Pretrain/Loss": 1.97544264793396, "Pretrain/Loss (Raw)": 2.0924477577209473, "Pretrain/Step": 13137, "Pretrain/Step Time": 8.486716387793422} +{"Pretrain/Learning Rate": 1.1656989393662213e-05, "Pretrain/Loss": 1.9762272834777832, "Pretrain/Loss (Raw)": 2.0359630584716797, "Pretrain/Step": 13138, "Pretrain/Step Time": 8.49046122841537} +{"Pretrain/Learning Rate": 1.1653399614760602e-05, "Pretrain/Loss": 1.9755682945251465, "Pretrain/Loss (Raw)": 1.9982736110687256, "Pretrain/Step": 13139, "Pretrain/Step Time": 8.49307450465858} +{"Pretrain/Learning Rate": 1.1649810220698792e-05, "Pretrain/Loss": 1.9772155284881592, "Pretrain/Loss (Raw)": 2.0684151649475098, "Pretrain/Step": 13140, "Pretrain/Step Time": 8.490623218938708} +{"Pretrain/Learning Rate": 1.1646221211580305e-05, "Pretrain/Loss": 1.9767563343048096, "Pretrain/Loss (Raw)": 1.8240729570388794, "Pretrain/Step": 13141, "Pretrain/Step Time": 8.49143772572279} +{"Pretrain/Learning Rate": 1.1642632587508607e-05, "Pretrain/Loss": 1.9794615507125854, "Pretrain/Loss (Raw)": 2.045356035232544, "Pretrain/Step": 13142, "Pretrain/Step Time": 8.488006064668298} +{"Pretrain/Learning Rate": 1.1639044348587189e-05, "Pretrain/Loss": 1.9800416231155396, "Pretrain/Loss (Raw)": 1.9506357908248901, "Pretrain/Step": 13143, "Pretrain/Step Time": 8.490333426743746} +{"Pretrain/Learning Rate": 1.1635456494919508e-05, "Pretrain/Loss": 1.978897213935852, "Pretrain/Loss (Raw)": 1.9570508003234863, "Pretrain/Step": 13144, "Pretrain/Step Time": 8.489565957337618} +{"Pretrain/Learning Rate": 1.1631869026609018e-05, "Pretrain/Loss": 1.9788565635681152, "Pretrain/Loss (Raw)": 1.9775928258895874, "Pretrain/Step": 13145, "Pretrain/Step Time": 8.488736402243376} +{"Pretrain/Learning Rate": 1.1628281943759161e-05, "Pretrain/Loss": 1.9777131080627441, "Pretrain/Loss (Raw)": 1.9306511878967285, "Pretrain/Step": 13146, "Pretrain/Step Time": 8.487251931801438} +{"Pretrain/Learning Rate": 1.162469524647336e-05, "Pretrain/Loss": 1.9752748012542725, "Pretrain/Loss (Raw)": 2.1191301345825195, "Pretrain/Step": 13147, "Pretrain/Step Time": 8.483988845720887} +{"Pretrain/Learning Rate": 1.1621108934855051e-05, "Pretrain/Loss": 1.9747226238250732, "Pretrain/Loss (Raw)": 2.005263090133667, "Pretrain/Step": 13148, "Pretrain/Step Time": 8.481872580945492} +{"Pretrain/Learning Rate": 1.1617523009007624e-05, "Pretrain/Loss": 1.974348545074463, "Pretrain/Loss (Raw)": 1.9366682767868042, "Pretrain/Step": 13149, "Pretrain/Step Time": 8.482114540413022} +{"Pretrain/Learning Rate": 1.1613937469034496e-05, "Pretrain/Loss": 1.9739958047866821, "Pretrain/Loss (Raw)": 1.9439144134521484, "Pretrain/Step": 13150, "Pretrain/Step Time": 8.485719576478004} +{"Pretrain/Learning Rate": 1.1610352315039046e-05, "Pretrain/Loss": 1.974449872970581, "Pretrain/Loss (Raw)": 2.016028881072998, "Pretrain/Step": 13151, "Pretrain/Step Time": 8.481929883360863} +{"Pretrain/Learning Rate": 1.1606767547124639e-05, "Pretrain/Loss": 1.9751300811767578, "Pretrain/Loss (Raw)": 2.1275856494903564, "Pretrain/Step": 13152, "Pretrain/Step Time": 8.480222998186946} +{"Pretrain/Learning Rate": 1.1603183165394656e-05, "Pretrain/Loss": 1.975254774093628, "Pretrain/Loss (Raw)": 1.9779776334762573, "Pretrain/Step": 13153, "Pretrain/Step Time": 8.483515717089176} +{"Pretrain/Learning Rate": 1.1599599169952435e-05, "Pretrain/Loss": 1.9760751724243164, "Pretrain/Loss (Raw)": 2.004530906677246, "Pretrain/Step": 13154, "Pretrain/Step Time": 8.48052191734314} +{"Pretrain/Learning Rate": 1.1596015560901335e-05, "Pretrain/Loss": 1.9756698608398438, "Pretrain/Loss (Raw)": 1.9833252429962158, "Pretrain/Step": 13155, "Pretrain/Step Time": 8.480631535872817} +{"Pretrain/Learning Rate": 1.1592432338344675e-05, "Pretrain/Loss": 1.9756433963775635, "Pretrain/Loss (Raw)": 1.9862796068191528, "Pretrain/Step": 13156, "Pretrain/Step Time": 8.477581629529595} +{"Pretrain/Learning Rate": 1.1588849502385769e-05, "Pretrain/Loss": 1.976219892501831, "Pretrain/Loss (Raw)": 2.000455141067505, "Pretrain/Step": 13157, "Pretrain/Step Time": 8.4816779140383} +{"Pretrain/Learning Rate": 1.158526705312794e-05, "Pretrain/Loss": 1.9748542308807373, "Pretrain/Loss (Raw)": 1.7738486528396606, "Pretrain/Step": 13158, "Pretrain/Step Time": 8.482028096914291} +{"Pretrain/Learning Rate": 1.158168499067447e-05, "Pretrain/Loss": 1.976206660270691, "Pretrain/Loss (Raw)": 2.1497435569763184, "Pretrain/Step": 13159, "Pretrain/Step Time": 8.478817148134112} +{"Pretrain/Learning Rate": 1.1578103315128666e-05, "Pretrain/Loss": 1.9753870964050293, "Pretrain/Loss (Raw)": 1.9502278566360474, "Pretrain/Step": 13160, "Pretrain/Step Time": 8.476576736196876} +{"Pretrain/Learning Rate": 1.157452202659379e-05, "Pretrain/Loss": 1.9767986536026, "Pretrain/Loss (Raw)": 2.160747766494751, "Pretrain/Step": 13161, "Pretrain/Step Time": 8.478608151897788} +{"Pretrain/Learning Rate": 1.1570941125173096e-05, "Pretrain/Loss": 1.9754177331924438, "Pretrain/Loss (Raw)": 1.8749260902404785, "Pretrain/Step": 13162, "Pretrain/Step Time": 8.478675095364451} +{"Pretrain/Learning Rate": 1.1567360610969857e-05, "Pretrain/Loss": 1.9741722345352173, "Pretrain/Loss (Raw)": 1.7834913730621338, "Pretrain/Step": 13163, "Pretrain/Step Time": 8.475906433537602} +{"Pretrain/Learning Rate": 1.15637804840873e-05, "Pretrain/Loss": 1.9771575927734375, "Pretrain/Loss (Raw)": 2.41863751411438, "Pretrain/Step": 13164, "Pretrain/Step Time": 8.474173778668046} +{"Pretrain/Learning Rate": 1.1560200744628666e-05, "Pretrain/Loss": 1.9780701398849487, "Pretrain/Loss (Raw)": 1.9758321046829224, "Pretrain/Step": 13165, "Pretrain/Step Time": 8.474912505596876} +{"Pretrain/Learning Rate": 1.155662139269717e-05, "Pretrain/Loss": 1.9752249717712402, "Pretrain/Loss (Raw)": 1.9394519329071045, "Pretrain/Step": 13166, "Pretrain/Step Time": 8.47468813881278} +{"Pretrain/Learning Rate": 1.1553042428396011e-05, "Pretrain/Loss": 1.9766008853912354, "Pretrain/Loss (Raw)": 2.0607080459594727, "Pretrain/Step": 13167, "Pretrain/Step Time": 8.476147403940558} +{"Pretrain/Learning Rate": 1.1549463851828405e-05, "Pretrain/Loss": 1.978860855102539, "Pretrain/Loss (Raw)": 1.9778239727020264, "Pretrain/Step": 13168, "Pretrain/Step Time": 8.480332154780626} +{"Pretrain/Learning Rate": 1.1545885663097513e-05, "Pretrain/Loss": 1.9756537675857544, "Pretrain/Loss (Raw)": 1.6842058897018433, "Pretrain/Step": 13169, "Pretrain/Step Time": 8.482297770678997} +{"Pretrain/Learning Rate": 1.1542307862306537e-05, "Pretrain/Loss": 1.978367567062378, "Pretrain/Loss (Raw)": 2.1055896282196045, "Pretrain/Step": 13170, "Pretrain/Step Time": 8.480992322787642} +{"Pretrain/Learning Rate": 1.1538730449558624e-05, "Pretrain/Loss": 1.9776861667633057, "Pretrain/Loss (Raw)": 1.842608094215393, "Pretrain/Step": 13171, "Pretrain/Step Time": 8.475658304989338} +{"Pretrain/Learning Rate": 1.1535153424956922e-05, "Pretrain/Loss": 1.9765410423278809, "Pretrain/Loss (Raw)": 1.829189658164978, "Pretrain/Step": 13172, "Pretrain/Step Time": 8.475055418908596} +{"Pretrain/Learning Rate": 1.1531576788604583e-05, "Pretrain/Loss": 1.974778413772583, "Pretrain/Loss (Raw)": 1.9700112342834473, "Pretrain/Step": 13173, "Pretrain/Step Time": 8.472412617877126} +{"Pretrain/Learning Rate": 1.1528000540604727e-05, "Pretrain/Loss": 1.9748992919921875, "Pretrain/Loss (Raw)": 1.9464917182922363, "Pretrain/Step": 13174, "Pretrain/Step Time": 8.473136004060507} +{"Pretrain/Learning Rate": 1.1524424681060489e-05, "Pretrain/Loss": 1.9752583503723145, "Pretrain/Loss (Raw)": 1.9963041543960571, "Pretrain/Step": 13175, "Pretrain/Step Time": 8.472104646265507} +{"Pretrain/Learning Rate": 1.1520849210074966e-05, "Pretrain/Loss": 1.9764106273651123, "Pretrain/Loss (Raw)": 2.057471990585327, "Pretrain/Step": 13176, "Pretrain/Step Time": 8.473536929115653} +{"Pretrain/Learning Rate": 1.151727412775124e-05, "Pretrain/Loss": 1.978676676750183, "Pretrain/Loss (Raw)": 2.10296368598938, "Pretrain/Step": 13177, "Pretrain/Step Time": 8.467829020693898} +{"Pretrain/Learning Rate": 1.1513699434192425e-05, "Pretrain/Loss": 1.979874610900879, "Pretrain/Loss (Raw)": 2.0141072273254395, "Pretrain/Step": 13178, "Pretrain/Step Time": 8.469324385747313} +{"Pretrain/Learning Rate": 1.1510125129501565e-05, "Pretrain/Loss": 1.9813255071640015, "Pretrain/Loss (Raw)": 2.0154342651367188, "Pretrain/Step": 13179, "Pretrain/Step Time": 8.466557838022709} +{"Pretrain/Learning Rate": 1.150655121378175e-05, "Pretrain/Loss": 1.9851398468017578, "Pretrain/Loss (Raw)": 2.2273929119110107, "Pretrain/Step": 13180, "Pretrain/Step Time": 8.469712359830737} +{"Pretrain/Learning Rate": 1.1502977687136016e-05, "Pretrain/Loss": 1.986301302909851, "Pretrain/Loss (Raw)": 2.16729736328125, "Pretrain/Step": 13181, "Pretrain/Step Time": 8.464625542983413} +{"Pretrain/Learning Rate": 1.1499404549667397e-05, "Pretrain/Loss": 1.9871517419815063, "Pretrain/Loss (Raw)": 2.017291784286499, "Pretrain/Step": 13182, "Pretrain/Step Time": 8.457920083776116} +{"Pretrain/Learning Rate": 1.149583180147894e-05, "Pretrain/Loss": 1.9934422969818115, "Pretrain/Loss (Raw)": 2.5830609798431396, "Pretrain/Step": 13183, "Pretrain/Step Time": 8.456746270880103} +{"Pretrain/Learning Rate": 1.1492259442673645e-05, "Pretrain/Loss": 1.995023488998413, "Pretrain/Loss (Raw)": 1.8907053470611572, "Pretrain/Step": 13184, "Pretrain/Step Time": 8.456554932519794} +{"Pretrain/Learning Rate": 1.1488687473354537e-05, "Pretrain/Loss": 1.9962501525878906, "Pretrain/Loss (Raw)": 2.1575684547424316, "Pretrain/Step": 13185, "Pretrain/Step Time": 8.451554546132684} +{"Pretrain/Learning Rate": 1.1485115893624588e-05, "Pretrain/Loss": 1.9956786632537842, "Pretrain/Loss (Raw)": 2.074845552444458, "Pretrain/Step": 13186, "Pretrain/Step Time": 8.454823680222034} +{"Pretrain/Learning Rate": 1.1481544703586805e-05, "Pretrain/Loss": 1.9963572025299072, "Pretrain/Loss (Raw)": 1.9729138612747192, "Pretrain/Step": 13187, "Pretrain/Step Time": 8.46230798214674} +{"Pretrain/Learning Rate": 1.1477973903344152e-05, "Pretrain/Loss": 1.9980792999267578, "Pretrain/Loss (Raw)": 2.096099853515625, "Pretrain/Step": 13188, "Pretrain/Step Time": 8.459212217479944} +{"Pretrain/Learning Rate": 1.147440349299958e-05, "Pretrain/Loss": 1.9980272054672241, "Pretrain/Loss (Raw)": 2.0376274585723877, "Pretrain/Step": 13189, "Pretrain/Step Time": 8.455845041200519} +{"Pretrain/Learning Rate": 1.1470833472656056e-05, "Pretrain/Loss": 1.998306155204773, "Pretrain/Loss (Raw)": 1.9558026790618896, "Pretrain/Step": 13190, "Pretrain/Step Time": 8.457073481753469} +{"Pretrain/Learning Rate": 1.1467263842416504e-05, "Pretrain/Loss": 2.0002410411834717, "Pretrain/Loss (Raw)": 2.133535146713257, "Pretrain/Step": 13191, "Pretrain/Step Time": 8.453326731920242} +{"Pretrain/Learning Rate": 1.1463694602383867e-05, "Pretrain/Loss": 2.0008749961853027, "Pretrain/Loss (Raw)": 2.0814013481140137, "Pretrain/Step": 13192, "Pretrain/Step Time": 8.454248283058405} +{"Pretrain/Learning Rate": 1.1460125752661055e-05, "Pretrain/Loss": 1.9988187551498413, "Pretrain/Loss (Raw)": 1.9579863548278809, "Pretrain/Step": 13193, "Pretrain/Step Time": 8.451934739947319} +{"Pretrain/Learning Rate": 1.1456557293350961e-05, "Pretrain/Loss": 1.9986960887908936, "Pretrain/Loss (Raw)": 2.0013909339904785, "Pretrain/Step": 13194, "Pretrain/Step Time": 8.441034791991115} +{"Pretrain/Learning Rate": 1.1452989224556502e-05, "Pretrain/Loss": 1.9979212284088135, "Pretrain/Loss (Raw)": 1.9941329956054688, "Pretrain/Step": 13195, "Pretrain/Step Time": 8.44586114026606} +{"Pretrain/Learning Rate": 1.1449421546380537e-05, "Pretrain/Loss": 1.998382329940796, "Pretrain/Loss (Raw)": 1.9503490924835205, "Pretrain/Step": 13196, "Pretrain/Step Time": 8.441739924252033} +{"Pretrain/Learning Rate": 1.1445854258925958e-05, "Pretrain/Loss": 1.999281406402588, "Pretrain/Loss (Raw)": 2.123967409133911, "Pretrain/Step": 13197, "Pretrain/Step Time": 8.439131481572986} +{"Pretrain/Learning Rate": 1.1442287362295617e-05, "Pretrain/Loss": 1.998947262763977, "Pretrain/Loss (Raw)": 1.9805576801300049, "Pretrain/Step": 13198, "Pretrain/Step Time": 8.438077326864004} +{"Pretrain/Learning Rate": 1.1438720856592352e-05, "Pretrain/Loss": 1.9944367408752441, "Pretrain/Loss (Raw)": 1.839046597480774, "Pretrain/Step": 13199, "Pretrain/Step Time": 8.43755055591464} +{"Pretrain/Learning Rate": 1.1435154741919024e-05, "Pretrain/Loss": 1.9926815032958984, "Pretrain/Loss (Raw)": 2.0222127437591553, "Pretrain/Step": 13200, "Pretrain/Step Time": 8.436884047463536} +{"Pretrain/Learning Rate": 1.1431589018378434e-05, "Pretrain/Loss": 1.9936885833740234, "Pretrain/Loss (Raw)": 1.9938377141952515, "Pretrain/Step": 13201, "Pretrain/Step Time": 8.43869530968368} +{"Pretrain/Learning Rate": 1.1428023686073419e-05, "Pretrain/Loss": 1.9973303079605103, "Pretrain/Loss (Raw)": 2.079698324203491, "Pretrain/Step": 13202, "Pretrain/Step Time": 8.438284700736403} +{"Pretrain/Learning Rate": 1.1424458745106775e-05, "Pretrain/Loss": 1.997543454170227, "Pretrain/Loss (Raw)": 1.9182868003845215, "Pretrain/Step": 13203, "Pretrain/Step Time": 8.444617059081793} +{"Pretrain/Learning Rate": 1.1420894195581283e-05, "Pretrain/Loss": 1.9970804452896118, "Pretrain/Loss (Raw)": 2.0946078300476074, "Pretrain/Step": 13204, "Pretrain/Step Time": 8.44544392079115} +{"Pretrain/Learning Rate": 1.141733003759974e-05, "Pretrain/Loss": 2.0004873275756836, "Pretrain/Loss (Raw)": 2.061009168624878, "Pretrain/Step": 13205, "Pretrain/Step Time": 8.437335638329387} +{"Pretrain/Learning Rate": 1.1413766271264906e-05, "Pretrain/Loss": 2.001368284225464, "Pretrain/Loss (Raw)": 1.9907605648040771, "Pretrain/Step": 13206, "Pretrain/Step Time": 8.437093790620565} +{"Pretrain/Learning Rate": 1.141020289667955e-05, "Pretrain/Loss": 1.9993152618408203, "Pretrain/Loss (Raw)": 2.0451700687408447, "Pretrain/Step": 13207, "Pretrain/Step Time": 8.437954496592283} +{"Pretrain/Learning Rate": 1.1406639913946416e-05, "Pretrain/Loss": 1.9981945753097534, "Pretrain/Loss (Raw)": 1.9194190502166748, "Pretrain/Step": 13208, "Pretrain/Step Time": 8.438323413953185} +{"Pretrain/Learning Rate": 1.1403077323168226e-05, "Pretrain/Loss": 1.9979978799819946, "Pretrain/Loss (Raw)": 1.8561527729034424, "Pretrain/Step": 13209, "Pretrain/Step Time": 8.432297574356198} +{"Pretrain/Learning Rate": 1.1399515124447726e-05, "Pretrain/Loss": 1.9992481470108032, "Pretrain/Loss (Raw)": 2.1858022212982178, "Pretrain/Step": 13210, "Pretrain/Step Time": 8.424288423731923} +{"Pretrain/Learning Rate": 1.1395953317887612e-05, "Pretrain/Loss": 1.99995756149292, "Pretrain/Loss (Raw)": 2.1297059059143066, "Pretrain/Step": 13211, "Pretrain/Step Time": 8.425999607890844} +{"Pretrain/Learning Rate": 1.1392391903590603e-05, "Pretrain/Loss": 1.9968239068984985, "Pretrain/Loss (Raw)": 1.7901370525360107, "Pretrain/Step": 13212, "Pretrain/Step Time": 8.427727559581399} +{"Pretrain/Learning Rate": 1.1388830881659379e-05, "Pretrain/Loss": 1.997084140777588, "Pretrain/Loss (Raw)": 1.9976328611373901, "Pretrain/Step": 13213, "Pretrain/Step Time": 8.42357617802918} +{"Pretrain/Learning Rate": 1.1385270252196612e-05, "Pretrain/Loss": 1.995786190032959, "Pretrain/Loss (Raw)": 1.9302072525024414, "Pretrain/Step": 13214, "Pretrain/Step Time": 8.42740297690034} +{"Pretrain/Learning Rate": 1.1381710015304988e-05, "Pretrain/Loss": 1.9954948425292969, "Pretrain/Loss (Raw)": 1.9302910566329956, "Pretrain/Step": 13215, "Pretrain/Step Time": 8.423946751281619} +{"Pretrain/Learning Rate": 1.1378150171087149e-05, "Pretrain/Loss": 1.9935139417648315, "Pretrain/Loss (Raw)": 1.829959511756897, "Pretrain/Step": 13216, "Pretrain/Step Time": 8.42020620405674} +{"Pretrain/Learning Rate": 1.1374590719645754e-05, "Pretrain/Loss": 1.9935458898544312, "Pretrain/Loss (Raw)": 2.100968837738037, "Pretrain/Step": 13217, "Pretrain/Step Time": 8.419713178649545} +{"Pretrain/Learning Rate": 1.1371031661083432e-05, "Pretrain/Loss": 1.9953436851501465, "Pretrain/Loss (Raw)": 2.034867286682129, "Pretrain/Step": 13218, "Pretrain/Step Time": 8.42438705638051} +{"Pretrain/Learning Rate": 1.1367472995502792e-05, "Pretrain/Loss": 1.9949486255645752, "Pretrain/Loss (Raw)": 1.9829539060592651, "Pretrain/Step": 13219, "Pretrain/Step Time": 8.427234845235944} +{"Pretrain/Learning Rate": 1.1363914723006471e-05, "Pretrain/Loss": 1.9921036958694458, "Pretrain/Loss (Raw)": 1.887702226638794, "Pretrain/Step": 13220, "Pretrain/Step Time": 8.422386912629008} +{"Pretrain/Learning Rate": 1.1360356843697045e-05, "Pretrain/Loss": 1.9916166067123413, "Pretrain/Loss (Raw)": 1.931445598602295, "Pretrain/Step": 13221, "Pretrain/Step Time": 8.426009640097618} +{"Pretrain/Learning Rate": 1.1356799357677123e-05, "Pretrain/Loss": 1.9919315576553345, "Pretrain/Loss (Raw)": 2.227391004562378, "Pretrain/Step": 13222, "Pretrain/Step Time": 8.424618439748883} +{"Pretrain/Learning Rate": 1.1353242265049274e-05, "Pretrain/Loss": 1.9892489910125732, "Pretrain/Loss (Raw)": 1.9107040166854858, "Pretrain/Step": 13223, "Pretrain/Step Time": 8.422461109235883} +{"Pretrain/Learning Rate": 1.1349685565916054e-05, "Pretrain/Loss": 1.991877794265747, "Pretrain/Loss (Raw)": 2.1154913902282715, "Pretrain/Step": 13224, "Pretrain/Step Time": 8.424580546095967} +{"Pretrain/Learning Rate": 1.134612926038004e-05, "Pretrain/Loss": 1.9911144971847534, "Pretrain/Loss (Raw)": 2.163534164428711, "Pretrain/Step": 13225, "Pretrain/Step Time": 8.42716140858829} +{"Pretrain/Learning Rate": 1.1342573348543751e-05, "Pretrain/Loss": 1.9893072843551636, "Pretrain/Loss (Raw)": 1.9256243705749512, "Pretrain/Step": 13226, "Pretrain/Step Time": 8.419150086119771} +{"Pretrain/Learning Rate": 1.1339017830509743e-05, "Pretrain/Loss": 1.9898943901062012, "Pretrain/Loss (Raw)": 1.952354073524475, "Pretrain/Step": 13227, "Pretrain/Step Time": 8.420886410400271} +{"Pretrain/Learning Rate": 1.1335462706380524e-05, "Pretrain/Loss": 1.989995002746582, "Pretrain/Loss (Raw)": 2.0788731575012207, "Pretrain/Step": 13228, "Pretrain/Step Time": 8.422038342803717} +{"Pretrain/Learning Rate": 1.1331907976258604e-05, "Pretrain/Loss": 1.990229606628418, "Pretrain/Loss (Raw)": 2.236362934112549, "Pretrain/Step": 13229, "Pretrain/Step Time": 8.423976646736264} +{"Pretrain/Learning Rate": 1.1328353640246487e-05, "Pretrain/Loss": 1.9976856708526611, "Pretrain/Loss (Raw)": 2.365359306335449, "Pretrain/Step": 13230, "Pretrain/Step Time": 8.415592128410935} +{"Pretrain/Learning Rate": 1.1324799698446639e-05, "Pretrain/Loss": 2.001864194869995, "Pretrain/Loss (Raw)": 2.1944990158081055, "Pretrain/Step": 13231, "Pretrain/Step Time": 8.419150404632092} +{"Pretrain/Learning Rate": 1.1321246150961565e-05, "Pretrain/Loss": 2.00087308883667, "Pretrain/Loss (Raw)": 1.9938989877700806, "Pretrain/Step": 13232, "Pretrain/Step Time": 8.41800457984209} +{"Pretrain/Learning Rate": 1.1317692997893706e-05, "Pretrain/Loss": 2.001377820968628, "Pretrain/Loss (Raw)": 2.0342979431152344, "Pretrain/Step": 13233, "Pretrain/Step Time": 8.421262433752418} +{"Pretrain/Learning Rate": 1.131414023934553e-05, "Pretrain/Loss": 2.0028507709503174, "Pretrain/Loss (Raw)": 1.9584029912948608, "Pretrain/Step": 13234, "Pretrain/Step Time": 8.4210662599653} +{"Pretrain/Learning Rate": 1.1310587875419477e-05, "Pretrain/Loss": 2.001802682876587, "Pretrain/Loss (Raw)": 1.8463574647903442, "Pretrain/Step": 13235, "Pretrain/Step Time": 8.425850983709097} +{"Pretrain/Learning Rate": 1.1307035906217961e-05, "Pretrain/Loss": 2.0033254623413086, "Pretrain/Loss (Raw)": 2.024468183517456, "Pretrain/Step": 13236, "Pretrain/Step Time": 8.426172276958823} +{"Pretrain/Learning Rate": 1.130348433184342e-05, "Pretrain/Loss": 2.0025088787078857, "Pretrain/Loss (Raw)": 1.7557141780853271, "Pretrain/Step": 13237, "Pretrain/Step Time": 8.428970482200384} +{"Pretrain/Learning Rate": 1.1299933152398243e-05, "Pretrain/Loss": 2.0019302368164062, "Pretrain/Loss (Raw)": 2.08374285697937, "Pretrain/Step": 13238, "Pretrain/Step Time": 8.43008717149496} +{"Pretrain/Learning Rate": 1.1296382367984844e-05, "Pretrain/Loss": 2.0029821395874023, "Pretrain/Loss (Raw)": 2.0187714099884033, "Pretrain/Step": 13239, "Pretrain/Step Time": 8.427380559965968} +{"Pretrain/Learning Rate": 1.1292831978705604e-05, "Pretrain/Loss": 2.0034983158111572, "Pretrain/Loss (Raw)": 2.0953190326690674, "Pretrain/Step": 13240, "Pretrain/Step Time": 8.428928554058075} +{"Pretrain/Learning Rate": 1.1289281984662877e-05, "Pretrain/Loss": 2.0015830993652344, "Pretrain/Loss (Raw)": 1.8110477924346924, "Pretrain/Step": 13241, "Pretrain/Step Time": 8.427963331341743} +{"Pretrain/Learning Rate": 1.128573238595905e-05, "Pretrain/Loss": 2.0026512145996094, "Pretrain/Loss (Raw)": 1.8434221744537354, "Pretrain/Step": 13242, "Pretrain/Step Time": 8.423821050673723} +{"Pretrain/Learning Rate": 1.1282183182696454e-05, "Pretrain/Loss": 2.0049455165863037, "Pretrain/Loss (Raw)": 1.9941601753234863, "Pretrain/Step": 13243, "Pretrain/Step Time": 8.422432215884328} +{"Pretrain/Learning Rate": 1.1278634374977442e-05, "Pretrain/Loss": 2.006716251373291, "Pretrain/Loss (Raw)": 2.2132043838500977, "Pretrain/Step": 13244, "Pretrain/Step Time": 8.429187461733818} +{"Pretrain/Learning Rate": 1.1275085962904336e-05, "Pretrain/Loss": 2.009028434753418, "Pretrain/Loss (Raw)": 2.1387126445770264, "Pretrain/Step": 13245, "Pretrain/Step Time": 8.427213072776794} +{"Pretrain/Learning Rate": 1.127153794657944e-05, "Pretrain/Loss": 2.0093274116516113, "Pretrain/Loss (Raw)": 1.9224438667297363, "Pretrain/Step": 13246, "Pretrain/Step Time": 8.424984604120255} +{"Pretrain/Learning Rate": 1.126799032610508e-05, "Pretrain/Loss": 2.005845785140991, "Pretrain/Loss (Raw)": 1.9881260395050049, "Pretrain/Step": 13247, "Pretrain/Step Time": 8.425347222015262} +{"Pretrain/Learning Rate": 1.126444310158353e-05, "Pretrain/Loss": 2.0052545070648193, "Pretrain/Loss (Raw)": 1.869493842124939, "Pretrain/Step": 13248, "Pretrain/Step Time": 8.424623522907495} +{"Pretrain/Learning Rate": 1.1260896273117088e-05, "Pretrain/Loss": 2.006957530975342, "Pretrain/Loss (Raw)": 2.153250217437744, "Pretrain/Step": 13249, "Pretrain/Step Time": 8.430650267750025} +{"Pretrain/Learning Rate": 1.125734984080801e-05, "Pretrain/Loss": 2.0073115825653076, "Pretrain/Loss (Raw)": 2.0046703815460205, "Pretrain/Step": 13250, "Pretrain/Step Time": 8.429617341607809} +{"Pretrain/Learning Rate": 1.1253803804758567e-05, "Pretrain/Loss": 2.0057215690612793, "Pretrain/Loss (Raw)": 1.6586827039718628, "Pretrain/Step": 13251, "Pretrain/Step Time": 8.431925861164927} +{"Pretrain/Learning Rate": 1.1250258165071004e-05, "Pretrain/Loss": 2.0048837661743164, "Pretrain/Loss (Raw)": 1.9290425777435303, "Pretrain/Step": 13252, "Pretrain/Step Time": 8.436678474768996} +{"Pretrain/Learning Rate": 1.124671292184754e-05, "Pretrain/Loss": 2.005174398422241, "Pretrain/Loss (Raw)": 2.080223798751831, "Pretrain/Step": 13253, "Pretrain/Step Time": 8.433992344886065} +{"Pretrain/Learning Rate": 1.1243168075190427e-05, "Pretrain/Loss": 2.0065507888793945, "Pretrain/Loss (Raw)": 2.0968005657196045, "Pretrain/Step": 13254, "Pretrain/Step Time": 8.438619367778301} +{"Pretrain/Learning Rate": 1.1239623625201853e-05, "Pretrain/Loss": 2.0079703330993652, "Pretrain/Loss (Raw)": 2.11738920211792, "Pretrain/Step": 13255, "Pretrain/Step Time": 8.43873848952353} +{"Pretrain/Learning Rate": 1.1236079571984043e-05, "Pretrain/Loss": 2.0087201595306396, "Pretrain/Loss (Raw)": 2.1205577850341797, "Pretrain/Step": 13256, "Pretrain/Step Time": 8.43667851947248} +{"Pretrain/Learning Rate": 1.1232535915639176e-05, "Pretrain/Loss": 2.0093908309936523, "Pretrain/Loss (Raw)": 2.0220048427581787, "Pretrain/Step": 13257, "Pretrain/Step Time": 8.437587594613433} +{"Pretrain/Learning Rate": 1.1228992656269418e-05, "Pretrain/Loss": 2.009493827819824, "Pretrain/Loss (Raw)": 2.016698122024536, "Pretrain/Step": 13258, "Pretrain/Step Time": 8.428869124501944} +{"Pretrain/Learning Rate": 1.1225449793976962e-05, "Pretrain/Loss": 2.0082015991210938, "Pretrain/Loss (Raw)": 1.972619891166687, "Pretrain/Step": 13259, "Pretrain/Step Time": 8.427222922444344} +{"Pretrain/Learning Rate": 1.1221907328863938e-05, "Pretrain/Loss": 2.0092294216156006, "Pretrain/Loss (Raw)": 2.056777238845825, "Pretrain/Step": 13260, "Pretrain/Step Time": 8.431804398074746} +{"Pretrain/Learning Rate": 1.1218365261032512e-05, "Pretrain/Loss": 2.0076653957366943, "Pretrain/Loss (Raw)": 1.7937133312225342, "Pretrain/Step": 13261, "Pretrain/Step Time": 8.4308713786304} +{"Pretrain/Learning Rate": 1.1214823590584811e-05, "Pretrain/Loss": 2.0106687545776367, "Pretrain/Loss (Raw)": 2.1590514183044434, "Pretrain/Step": 13262, "Pretrain/Step Time": 8.433471120893955} +{"Pretrain/Learning Rate": 1.1211282317622942e-05, "Pretrain/Loss": 2.0115981101989746, "Pretrain/Loss (Raw)": 1.9375046491622925, "Pretrain/Step": 13263, "Pretrain/Step Time": 8.42333510890603} +{"Pretrain/Learning Rate": 1.120774144224904e-05, "Pretrain/Loss": 2.00968337059021, "Pretrain/Loss (Raw)": 1.7914843559265137, "Pretrain/Step": 13264, "Pretrain/Step Time": 8.423491850495338} +{"Pretrain/Learning Rate": 1.120420096456518e-05, "Pretrain/Loss": 2.0070948600769043, "Pretrain/Loss (Raw)": 1.761098027229309, "Pretrain/Step": 13265, "Pretrain/Step Time": 8.424733428284526} +{"Pretrain/Learning Rate": 1.1200660884673467e-05, "Pretrain/Loss": 2.006770610809326, "Pretrain/Loss (Raw)": 1.9944900274276733, "Pretrain/Step": 13266, "Pretrain/Step Time": 8.424382140859962} +{"Pretrain/Learning Rate": 1.1197121202675969e-05, "Pretrain/Loss": 2.0060513019561768, "Pretrain/Loss (Raw)": 1.9061590433120728, "Pretrain/Step": 13267, "Pretrain/Step Time": 8.427891340106726} +{"Pretrain/Learning Rate": 1.1193581918674745e-05, "Pretrain/Loss": 2.007974624633789, "Pretrain/Loss (Raw)": 2.314603567123413, "Pretrain/Step": 13268, "Pretrain/Step Time": 8.428910341113806} +{"Pretrain/Learning Rate": 1.119004303277186e-05, "Pretrain/Loss": 2.0093555450439453, "Pretrain/Loss (Raw)": 2.000870943069458, "Pretrain/Step": 13269, "Pretrain/Step Time": 8.427725283429027} +{"Pretrain/Learning Rate": 1.118650454506934e-05, "Pretrain/Loss": 2.008466958999634, "Pretrain/Loss (Raw)": 1.9315842390060425, "Pretrain/Step": 13270, "Pretrain/Step Time": 8.426772680133581} +{"Pretrain/Learning Rate": 1.1182966455669233e-05, "Pretrain/Loss": 2.0097784996032715, "Pretrain/Loss (Raw)": 2.11849308013916, "Pretrain/Step": 13271, "Pretrain/Step Time": 8.425074703991413} +{"Pretrain/Learning Rate": 1.117942876467355e-05, "Pretrain/Loss": 2.0114760398864746, "Pretrain/Loss (Raw)": 2.174386739730835, "Pretrain/Step": 13272, "Pretrain/Step Time": 8.423271257430315} +{"Pretrain/Learning Rate": 1.1175891472184283e-05, "Pretrain/Loss": 2.011129379272461, "Pretrain/Loss (Raw)": 1.9331868886947632, "Pretrain/Step": 13273, "Pretrain/Step Time": 8.421800430864096} +{"Pretrain/Learning Rate": 1.1172354578303451e-05, "Pretrain/Loss": 2.0106794834136963, "Pretrain/Loss (Raw)": 1.8730677366256714, "Pretrain/Step": 13274, "Pretrain/Step Time": 8.420958746224642} +{"Pretrain/Learning Rate": 1.1168818083133017e-05, "Pretrain/Loss": 2.008903980255127, "Pretrain/Loss (Raw)": 1.8918428421020508, "Pretrain/Step": 13275, "Pretrain/Step Time": 8.425703760236502} +{"Pretrain/Learning Rate": 1.1165281986774975e-05, "Pretrain/Loss": 2.0092434883117676, "Pretrain/Loss (Raw)": 2.0487678050994873, "Pretrain/Step": 13276, "Pretrain/Step Time": 8.423983754590154} +{"Pretrain/Learning Rate": 1.116174628933127e-05, "Pretrain/Loss": 2.009819507598877, "Pretrain/Loss (Raw)": 2.0103728771209717, "Pretrain/Step": 13277, "Pretrain/Step Time": 8.425979174673557} +{"Pretrain/Learning Rate": 1.115821099090385e-05, "Pretrain/Loss": 2.0102052688598633, "Pretrain/Loss (Raw)": 1.9932750463485718, "Pretrain/Step": 13278, "Pretrain/Step Time": 8.42678621225059} +{"Pretrain/Learning Rate": 1.1154676091594664e-05, "Pretrain/Loss": 2.0132064819335938, "Pretrain/Loss (Raw)": 2.4002020359039307, "Pretrain/Step": 13279, "Pretrain/Step Time": 8.424658151343465} +{"Pretrain/Learning Rate": 1.1151141591505626e-05, "Pretrain/Loss": 2.011749267578125, "Pretrain/Loss (Raw)": 1.9410889148712158, "Pretrain/Step": 13280, "Pretrain/Step Time": 8.429331926628947} +{"Pretrain/Learning Rate": 1.1147607490738666e-05, "Pretrain/Loss": 2.011383533477783, "Pretrain/Loss (Raw)": 1.9311470985412598, "Pretrain/Step": 13281, "Pretrain/Step Time": 8.42754859663546} +{"Pretrain/Learning Rate": 1.1144073789395679e-05, "Pretrain/Loss": 2.010850667953491, "Pretrain/Loss (Raw)": 1.9363256692886353, "Pretrain/Step": 13282, "Pretrain/Step Time": 8.436345595866442} +{"Pretrain/Learning Rate": 1.1140540487578547e-05, "Pretrain/Loss": 2.010648250579834, "Pretrain/Loss (Raw)": 1.9574135541915894, "Pretrain/Step": 13283, "Pretrain/Step Time": 8.434192230924964} +{"Pretrain/Learning Rate": 1.1137007585389167e-05, "Pretrain/Loss": 2.0095229148864746, "Pretrain/Loss (Raw)": 1.8422473669052124, "Pretrain/Step": 13284, "Pretrain/Step Time": 8.438768038526177} +{"Pretrain/Learning Rate": 1.1133475082929392e-05, "Pretrain/Loss": 2.0064985752105713, "Pretrain/Loss (Raw)": 1.613329529762268, "Pretrain/Step": 13285, "Pretrain/Step Time": 8.438000194728374} +{"Pretrain/Learning Rate": 1.11299429803011e-05, "Pretrain/Loss": 2.0061750411987305, "Pretrain/Loss (Raw)": 1.7324531078338623, "Pretrain/Step": 13286, "Pretrain/Step Time": 8.440636470913887} +{"Pretrain/Learning Rate": 1.1126411277606122e-05, "Pretrain/Loss": 2.0034749507904053, "Pretrain/Loss (Raw)": 1.8041077852249146, "Pretrain/Step": 13287, "Pretrain/Step Time": 8.442646324634552} +{"Pretrain/Learning Rate": 1.1122879974946285e-05, "Pretrain/Loss": 2.0009605884552, "Pretrain/Loss (Raw)": 1.6283930540084839, "Pretrain/Step": 13288, "Pretrain/Step Time": 8.443383980542421} +{"Pretrain/Learning Rate": 1.1119349072423432e-05, "Pretrain/Loss": 1.9999948740005493, "Pretrain/Loss (Raw)": 2.0371437072753906, "Pretrain/Step": 13289, "Pretrain/Step Time": 8.439071901142597} +{"Pretrain/Learning Rate": 1.1115818570139353e-05, "Pretrain/Loss": 2.0022621154785156, "Pretrain/Loss (Raw)": 2.1651432514190674, "Pretrain/Step": 13290, "Pretrain/Step Time": 8.439119409769773} +{"Pretrain/Learning Rate": 1.1112288468195867e-05, "Pretrain/Loss": 2.0036020278930664, "Pretrain/Loss (Raw)": 1.954983115196228, "Pretrain/Step": 13291, "Pretrain/Step Time": 8.441763715818524} +{"Pretrain/Learning Rate": 1.1108758766694755e-05, "Pretrain/Loss": 1.9999154806137085, "Pretrain/Loss (Raw)": 1.946755051612854, "Pretrain/Step": 13292, "Pretrain/Step Time": 8.442465839907527} +{"Pretrain/Learning Rate": 1.1105229465737779e-05, "Pretrain/Loss": 2.000765323638916, "Pretrain/Loss (Raw)": 2.084630250930786, "Pretrain/Step": 13293, "Pretrain/Step Time": 8.439108988270164} +{"Pretrain/Learning Rate": 1.1101700565426726e-05, "Pretrain/Loss": 2.001014232635498, "Pretrain/Loss (Raw)": 1.9713330268859863, "Pretrain/Step": 13294, "Pretrain/Step Time": 8.442297328263521} +{"Pretrain/Learning Rate": 1.109817206586333e-05, "Pretrain/Loss": 1.9988136291503906, "Pretrain/Loss (Raw)": 1.778996229171753, "Pretrain/Step": 13295, "Pretrain/Step Time": 8.437358845025301} +{"Pretrain/Learning Rate": 1.1094643967149354e-05, "Pretrain/Loss": 1.9993934631347656, "Pretrain/Loss (Raw)": 2.0520315170288086, "Pretrain/Step": 13296, "Pretrain/Step Time": 8.43431931361556} +{"Pretrain/Learning Rate": 1.1091116269386515e-05, "Pretrain/Loss": 2.0011532306671143, "Pretrain/Loss (Raw)": 1.9094722270965576, "Pretrain/Step": 13297, "Pretrain/Step Time": 8.438914628699422} +{"Pretrain/Learning Rate": 1.1087588972676525e-05, "Pretrain/Loss": 2.0000836849212646, "Pretrain/Loss (Raw)": 1.9686874151229858, "Pretrain/Step": 13298, "Pretrain/Step Time": 8.434029500931501} +{"Pretrain/Learning Rate": 1.1084062077121107e-05, "Pretrain/Loss": 2.000298023223877, "Pretrain/Loss (Raw)": 1.870050311088562, "Pretrain/Step": 13299, "Pretrain/Step Time": 8.441266492009163} +{"Pretrain/Learning Rate": 1.1080535582821938e-05, "Pretrain/Loss": 2.002699375152588, "Pretrain/Loss (Raw)": 2.1365623474121094, "Pretrain/Step": 13300, "Pretrain/Step Time": 8.444043504074216} +{"Pretrain/Learning Rate": 1.1077009489880726e-05, "Pretrain/Loss": 2.0024256706237793, "Pretrain/Loss (Raw)": 1.9349700212478638, "Pretrain/Step": 13301, "Pretrain/Step Time": 8.442476594820619} +{"Pretrain/Learning Rate": 1.107348379839913e-05, "Pretrain/Loss": 2.003330707550049, "Pretrain/Loss (Raw)": 2.0623412132263184, "Pretrain/Step": 13302, "Pretrain/Step Time": 8.446216573938727} +{"Pretrain/Learning Rate": 1.10699585084788e-05, "Pretrain/Loss": 2.001340389251709, "Pretrain/Loss (Raw)": 1.74150812625885, "Pretrain/Step": 13303, "Pretrain/Step Time": 8.44461864605546} +{"Pretrain/Learning Rate": 1.1066433620221405e-05, "Pretrain/Loss": 2.001594305038452, "Pretrain/Loss (Raw)": 2.090010643005371, "Pretrain/Step": 13304, "Pretrain/Step Time": 8.448995240032673} +{"Pretrain/Learning Rate": 1.1062909133728566e-05, "Pretrain/Loss": 2.0004138946533203, "Pretrain/Loss (Raw)": 1.9518486261367798, "Pretrain/Step": 13305, "Pretrain/Step Time": 8.447586180642247} +{"Pretrain/Learning Rate": 1.1059385049101928e-05, "Pretrain/Loss": 1.999545931816101, "Pretrain/Loss (Raw)": 1.9030308723449707, "Pretrain/Step": 13306, "Pretrain/Step Time": 8.44711697474122} +{"Pretrain/Learning Rate": 1.1055861366443092e-05, "Pretrain/Loss": 1.9984850883483887, "Pretrain/Loss (Raw)": 1.8796374797821045, "Pretrain/Step": 13307, "Pretrain/Step Time": 8.446688253432512} +{"Pretrain/Learning Rate": 1.1052338085853655e-05, "Pretrain/Loss": 1.9980720281600952, "Pretrain/Loss (Raw)": 2.1745147705078125, "Pretrain/Step": 13308, "Pretrain/Step Time": 8.446783445775509} +{"Pretrain/Learning Rate": 1.1048815207435226e-05, "Pretrain/Loss": 1.9950618743896484, "Pretrain/Loss (Raw)": 1.7819998264312744, "Pretrain/Step": 13309, "Pretrain/Step Time": 8.451353600248694} +{"Pretrain/Learning Rate": 1.1045292731289367e-05, "Pretrain/Loss": 1.9927709102630615, "Pretrain/Loss (Raw)": 1.724074125289917, "Pretrain/Step": 13310, "Pretrain/Step Time": 8.452971993014216} +{"Pretrain/Learning Rate": 1.1041770657517663e-05, "Pretrain/Loss": 1.9891283512115479, "Pretrain/Loss (Raw)": 2.1167807579040527, "Pretrain/Step": 13311, "Pretrain/Step Time": 8.445838704705238} +{"Pretrain/Learning Rate": 1.1038248986221664e-05, "Pretrain/Loss": 1.9916247129440308, "Pretrain/Loss (Raw)": 2.210245370864868, "Pretrain/Step": 13312, "Pretrain/Step Time": 8.447072271257639} +{"Pretrain/Learning Rate": 1.1034727717502912e-05, "Pretrain/Loss": 1.9900054931640625, "Pretrain/Loss (Raw)": 1.9502925872802734, "Pretrain/Step": 13313, "Pretrain/Step Time": 8.447748444974422} +{"Pretrain/Learning Rate": 1.1031206851462942e-05, "Pretrain/Loss": 1.989095687866211, "Pretrain/Loss (Raw)": 1.9584274291992188, "Pretrain/Step": 13314, "Pretrain/Step Time": 8.444058384746313} +{"Pretrain/Learning Rate": 1.1027686388203265e-05, "Pretrain/Loss": 1.9877134561538696, "Pretrain/Loss (Raw)": 1.7959622144699097, "Pretrain/Step": 13315, "Pretrain/Step Time": 8.44331987760961} +{"Pretrain/Learning Rate": 1.1024166327825409e-05, "Pretrain/Loss": 1.9889470338821411, "Pretrain/Loss (Raw)": 2.2540040016174316, "Pretrain/Step": 13316, "Pretrain/Step Time": 8.444668902084231} +{"Pretrain/Learning Rate": 1.1020646670430857e-05, "Pretrain/Loss": 1.9866561889648438, "Pretrain/Loss (Raw)": 1.7444028854370117, "Pretrain/Step": 13317, "Pretrain/Step Time": 8.441145533695817} +{"Pretrain/Learning Rate": 1.1017127416121112e-05, "Pretrain/Loss": 1.9879010915756226, "Pretrain/Loss (Raw)": 2.1151485443115234, "Pretrain/Step": 13318, "Pretrain/Step Time": 8.441170610487461} +{"Pretrain/Learning Rate": 1.1013608564997633e-05, "Pretrain/Loss": 1.9864201545715332, "Pretrain/Loss (Raw)": 1.9439640045166016, "Pretrain/Step": 13319, "Pretrain/Step Time": 8.442555544897914} +{"Pretrain/Learning Rate": 1.10100901171619e-05, "Pretrain/Loss": 1.9868744611740112, "Pretrain/Loss (Raw)": 2.1395609378814697, "Pretrain/Step": 13320, "Pretrain/Step Time": 8.440724173560739} +{"Pretrain/Learning Rate": 1.1006572072715355e-05, "Pretrain/Loss": 1.986112117767334, "Pretrain/Loss (Raw)": 1.8604028224945068, "Pretrain/Step": 13321, "Pretrain/Step Time": 8.442554721608758} +{"Pretrain/Learning Rate": 1.1003054431759433e-05, "Pretrain/Loss": 1.9866875410079956, "Pretrain/Loss (Raw)": 2.0750577449798584, "Pretrain/Step": 13322, "Pretrain/Step Time": 8.445457927882671} +{"Pretrain/Learning Rate": 1.0999537194395576e-05, "Pretrain/Loss": 1.9871060848236084, "Pretrain/Loss (Raw)": 2.0476911067962646, "Pretrain/Step": 13323, "Pretrain/Step Time": 8.441719403490424} +{"Pretrain/Learning Rate": 1.0996020360725185e-05, "Pretrain/Loss": 1.9875595569610596, "Pretrain/Loss (Raw)": 2.0083954334259033, "Pretrain/Step": 13324, "Pretrain/Step Time": 8.445125073194504} +{"Pretrain/Learning Rate": 1.0992503930849685e-05, "Pretrain/Loss": 1.9851317405700684, "Pretrain/Loss (Raw)": 1.8132094144821167, "Pretrain/Step": 13325, "Pretrain/Step Time": 8.442997505888343} +{"Pretrain/Learning Rate": 1.098898790487046e-05, "Pretrain/Loss": 1.9862223863601685, "Pretrain/Loss (Raw)": 2.1201608180999756, "Pretrain/Step": 13326, "Pretrain/Step Time": 8.449781889095902} +{"Pretrain/Learning Rate": 1.098547228288888e-05, "Pretrain/Loss": 1.9877512454986572, "Pretrain/Loss (Raw)": 2.0347516536712646, "Pretrain/Step": 13327, "Pretrain/Step Time": 8.44774291664362} +{"Pretrain/Learning Rate": 1.0981957065006338e-05, "Pretrain/Loss": 1.9880321025848389, "Pretrain/Loss (Raw)": 2.058171033859253, "Pretrain/Step": 13328, "Pretrain/Step Time": 8.446934750303626} +{"Pretrain/Learning Rate": 1.0978442251324172e-05, "Pretrain/Loss": 1.9877666234970093, "Pretrain/Loss (Raw)": 1.9598336219787598, "Pretrain/Step": 13329, "Pretrain/Step Time": 8.44841624982655} +{"Pretrain/Learning Rate": 1.0974927841943749e-05, "Pretrain/Loss": 1.9853863716125488, "Pretrain/Loss (Raw)": 1.7750437259674072, "Pretrain/Step": 13330, "Pretrain/Step Time": 8.445647533982992} +{"Pretrain/Learning Rate": 1.0971413836966396e-05, "Pretrain/Loss": 1.9856538772583008, "Pretrain/Loss (Raw)": 1.9525114297866821, "Pretrain/Step": 13331, "Pretrain/Step Time": 8.445314690470695} +{"Pretrain/Learning Rate": 1.0967900236493426e-05, "Pretrain/Loss": 1.984823226928711, "Pretrain/Loss (Raw)": 1.9882975816726685, "Pretrain/Step": 13332, "Pretrain/Step Time": 8.448721481487155} +{"Pretrain/Learning Rate": 1.0964387040626167e-05, "Pretrain/Loss": 1.9846065044403076, "Pretrain/Loss (Raw)": 2.0332679748535156, "Pretrain/Step": 13333, "Pretrain/Step Time": 8.44848289899528} +{"Pretrain/Learning Rate": 1.0960874249465908e-05, "Pretrain/Loss": 1.9858717918395996, "Pretrain/Loss (Raw)": 2.152695417404175, "Pretrain/Step": 13334, "Pretrain/Step Time": 8.449141694232821} +{"Pretrain/Learning Rate": 1.0957361863113949e-05, "Pretrain/Loss": 1.9846676588058472, "Pretrain/Loss (Raw)": 1.891048789024353, "Pretrain/Step": 13335, "Pretrain/Step Time": 8.449636552482843} +{"Pretrain/Learning Rate": 1.0953849881671562e-05, "Pretrain/Loss": 1.9848599433898926, "Pretrain/Loss (Raw)": 1.9440410137176514, "Pretrain/Step": 13336, "Pretrain/Step Time": 8.453586956486106} +{"Pretrain/Learning Rate": 1.0950338305240005e-05, "Pretrain/Loss": 1.9872069358825684, "Pretrain/Loss (Raw)": 2.156553030014038, "Pretrain/Step": 13337, "Pretrain/Step Time": 8.458524987101555} +{"Pretrain/Learning Rate": 1.0946827133920546e-05, "Pretrain/Loss": 1.9869788885116577, "Pretrain/Loss (Raw)": 2.1566219329833984, "Pretrain/Step": 13338, "Pretrain/Step Time": 8.457822507247329} +{"Pretrain/Learning Rate": 1.094331636781441e-05, "Pretrain/Loss": 1.9849578142166138, "Pretrain/Loss (Raw)": 1.8710048198699951, "Pretrain/Step": 13339, "Pretrain/Step Time": 8.457317152991891} +{"Pretrain/Learning Rate": 1.0939806007022846e-05, "Pretrain/Loss": 1.9866795539855957, "Pretrain/Loss (Raw)": 2.010545015335083, "Pretrain/Step": 13340, "Pretrain/Step Time": 8.456354063004255} +{"Pretrain/Learning Rate": 1.0936296051647066e-05, "Pretrain/Loss": 1.9893302917480469, "Pretrain/Loss (Raw)": 2.336907386779785, "Pretrain/Step": 13341, "Pretrain/Step Time": 8.456612829118967} +{"Pretrain/Learning Rate": 1.0932786501788264e-05, "Pretrain/Loss": 1.990790843963623, "Pretrain/Loss (Raw)": 2.117144823074341, "Pretrain/Step": 13342, "Pretrain/Step Time": 8.458926852792501} +{"Pretrain/Learning Rate": 1.0929277357547656e-05, "Pretrain/Loss": 1.9916749000549316, "Pretrain/Loss (Raw)": 2.04347562789917, "Pretrain/Step": 13343, "Pretrain/Step Time": 8.460798684507608} +{"Pretrain/Learning Rate": 1.0925768619026408e-05, "Pretrain/Loss": 1.9934964179992676, "Pretrain/Loss (Raw)": 2.063121795654297, "Pretrain/Step": 13344, "Pretrain/Step Time": 8.463736291974783} +{"Pretrain/Learning Rate": 1.0922260286325708e-05, "Pretrain/Loss": 1.991988182067871, "Pretrain/Loss (Raw)": 1.9078868627548218, "Pretrain/Step": 13345, "Pretrain/Step Time": 8.461841510608792} +{"Pretrain/Learning Rate": 1.091875235954671e-05, "Pretrain/Loss": 1.9905993938446045, "Pretrain/Loss (Raw)": 1.857102870941162, "Pretrain/Step": 13346, "Pretrain/Step Time": 8.463537391275167} +{"Pretrain/Learning Rate": 1.091524483879055e-05, "Pretrain/Loss": 1.9896389245986938, "Pretrain/Loss (Raw)": 1.8600188493728638, "Pretrain/Step": 13347, "Pretrain/Step Time": 8.458379095420241} +{"Pretrain/Learning Rate": 1.0911737724158388e-05, "Pretrain/Loss": 1.9910862445831299, "Pretrain/Loss (Raw)": 2.0729591846466064, "Pretrain/Step": 13348, "Pretrain/Step Time": 8.461607720702887} +{"Pretrain/Learning Rate": 1.0908231015751328e-05, "Pretrain/Loss": 1.9910862445831299, "Pretrain/Loss (Raw)": 1.9314491748809814, "Pretrain/Step": 13349, "Pretrain/Step Time": 8.460625670850277} +{"Pretrain/Learning Rate": 1.0904724713670498e-05, "Pretrain/Loss": 1.989461898803711, "Pretrain/Loss (Raw)": 2.0194733142852783, "Pretrain/Step": 13350, "Pretrain/Step Time": 8.464917972683907} +{"Pretrain/Learning Rate": 1.0901218818016998e-05, "Pretrain/Loss": 1.9898107051849365, "Pretrain/Loss (Raw)": 1.9553477764129639, "Pretrain/Step": 13351, "Pretrain/Step Time": 8.464465783908963} +{"Pretrain/Learning Rate": 1.0897713328891904e-05, "Pretrain/Loss": 1.9883980751037598, "Pretrain/Loss (Raw)": 1.934677004814148, "Pretrain/Step": 13352, "Pretrain/Step Time": 8.46980993449688} +{"Pretrain/Learning Rate": 1.0894208246396313e-05, "Pretrain/Loss": 1.9879353046417236, "Pretrain/Loss (Raw)": 2.1042914390563965, "Pretrain/Step": 13353, "Pretrain/Step Time": 8.466324720531702} +{"Pretrain/Learning Rate": 1.0890703570631276e-05, "Pretrain/Loss": 1.988857626914978, "Pretrain/Loss (Raw)": 2.0436906814575195, "Pretrain/Step": 13354, "Pretrain/Step Time": 8.470400048419833} +{"Pretrain/Learning Rate": 1.0887199301697862e-05, "Pretrain/Loss": 1.9873461723327637, "Pretrain/Loss (Raw)": 1.7588789463043213, "Pretrain/Step": 13355, "Pretrain/Step Time": 8.472391339018941} +{"Pretrain/Learning Rate": 1.0883695439697105e-05, "Pretrain/Loss": 1.9857664108276367, "Pretrain/Loss (Raw)": 1.8766791820526123, "Pretrain/Step": 13356, "Pretrain/Step Time": 8.47281057573855} +{"Pretrain/Learning Rate": 1.0880191984730035e-05, "Pretrain/Loss": 1.9840061664581299, "Pretrain/Loss (Raw)": 2.0110483169555664, "Pretrain/Step": 13357, "Pretrain/Step Time": 8.471513187512755} +{"Pretrain/Learning Rate": 1.0876688936897684e-05, "Pretrain/Loss": 1.981773853302002, "Pretrain/Loss (Raw)": 2.0796279907226562, "Pretrain/Step": 13358, "Pretrain/Step Time": 8.472155751660466} +{"Pretrain/Learning Rate": 1.0873186296301039e-05, "Pretrain/Loss": 1.9810086488723755, "Pretrain/Loss (Raw)": 2.0965514183044434, "Pretrain/Step": 13359, "Pretrain/Step Time": 8.472562862560153} +{"Pretrain/Learning Rate": 1.0869684063041118e-05, "Pretrain/Loss": 1.981403112411499, "Pretrain/Loss (Raw)": 2.044400930404663, "Pretrain/Step": 13360, "Pretrain/Step Time": 8.473924105986953} +{"Pretrain/Learning Rate": 1.0866182237218897e-05, "Pretrain/Loss": 1.9812519550323486, "Pretrain/Loss (Raw)": 2.0149316787719727, "Pretrain/Step": 13361, "Pretrain/Step Time": 8.476202111691236} +{"Pretrain/Learning Rate": 1.0862680818935339e-05, "Pretrain/Loss": 1.9827834367752075, "Pretrain/Loss (Raw)": 2.1544253826141357, "Pretrain/Step": 13362, "Pretrain/Step Time": 8.476258458569646} +{"Pretrain/Learning Rate": 1.085917980829142e-05, "Pretrain/Loss": 1.983788251876831, "Pretrain/Loss (Raw)": 1.9749739170074463, "Pretrain/Step": 13363, "Pretrain/Step Time": 8.473662935197353} +{"Pretrain/Learning Rate": 1.0855679205388076e-05, "Pretrain/Loss": 1.9827237129211426, "Pretrain/Loss (Raw)": 1.8882341384887695, "Pretrain/Step": 13364, "Pretrain/Step Time": 8.474259136244655} +{"Pretrain/Learning Rate": 1.085217901032626e-05, "Pretrain/Loss": 1.9849495887756348, "Pretrain/Loss (Raw)": 2.0406057834625244, "Pretrain/Step": 13365, "Pretrain/Step Time": 8.47164597734809} +{"Pretrain/Learning Rate": 1.0848679223206887e-05, "Pretrain/Loss": 1.9835665225982666, "Pretrain/Loss (Raw)": 1.9067058563232422, "Pretrain/Step": 13366, "Pretrain/Step Time": 8.472194964066148} +{"Pretrain/Learning Rate": 1.0845179844130865e-05, "Pretrain/Loss": 1.9828153848648071, "Pretrain/Loss (Raw)": 1.9226330518722534, "Pretrain/Step": 13367, "Pretrain/Step Time": 8.476242125034332} +{"Pretrain/Learning Rate": 1.0841680873199111e-05, "Pretrain/Loss": 1.9805717468261719, "Pretrain/Loss (Raw)": 1.8081345558166504, "Pretrain/Step": 13368, "Pretrain/Step Time": 8.477426143363118} +{"Pretrain/Learning Rate": 1.0838182310512502e-05, "Pretrain/Loss": 1.9826627969741821, "Pretrain/Loss (Raw)": 2.0786986351013184, "Pretrain/Step": 13369, "Pretrain/Step Time": 8.475572254508734} +{"Pretrain/Learning Rate": 1.083468415617193e-05, "Pretrain/Loss": 1.9839222431182861, "Pretrain/Loss (Raw)": 2.004631280899048, "Pretrain/Step": 13370, "Pretrain/Step Time": 8.477624068036675} +{"Pretrain/Learning Rate": 1.0831186410278254e-05, "Pretrain/Loss": 1.984208106994629, "Pretrain/Loss (Raw)": 2.030750274658203, "Pretrain/Step": 13371, "Pretrain/Step Time": 8.477313809096813} +{"Pretrain/Learning Rate": 1.082768907293232e-05, "Pretrain/Loss": 1.982923984527588, "Pretrain/Loss (Raw)": 2.048835515975952, "Pretrain/Step": 13372, "Pretrain/Step Time": 8.472818471491337} +{"Pretrain/Learning Rate": 1.082419214423499e-05, "Pretrain/Loss": 1.9822739362716675, "Pretrain/Loss (Raw)": 2.0555055141448975, "Pretrain/Step": 13373, "Pretrain/Step Time": 8.472504520788789} +{"Pretrain/Learning Rate": 1.0820695624287078e-05, "Pretrain/Loss": 1.98116135597229, "Pretrain/Loss (Raw)": 1.7800415754318237, "Pretrain/Step": 13374, "Pretrain/Step Time": 8.470591379329562} +{"Pretrain/Learning Rate": 1.0817199513189422e-05, "Pretrain/Loss": 1.9816679954528809, "Pretrain/Loss (Raw)": 2.052978992462158, "Pretrain/Step": 13375, "Pretrain/Step Time": 8.470945715904236} +{"Pretrain/Learning Rate": 1.0813703811042818e-05, "Pretrain/Loss": 1.9816381931304932, "Pretrain/Loss (Raw)": 1.8656648397445679, "Pretrain/Step": 13376, "Pretrain/Step Time": 8.47441409341991} +{"Pretrain/Learning Rate": 1.0810208517948056e-05, "Pretrain/Loss": 1.9817134141921997, "Pretrain/Loss (Raw)": 2.162889242172241, "Pretrain/Step": 13377, "Pretrain/Step Time": 8.47012696415186} +{"Pretrain/Learning Rate": 1.0806713634005936e-05, "Pretrain/Loss": 1.9801931381225586, "Pretrain/Loss (Raw)": 1.810081124305725, "Pretrain/Step": 13378, "Pretrain/Step Time": 8.47150268778205} +{"Pretrain/Learning Rate": 1.0803219159317216e-05, "Pretrain/Loss": 1.9834063053131104, "Pretrain/Loss (Raw)": 2.06997013092041, "Pretrain/Step": 13379, "Pretrain/Step Time": 8.46791766397655} +{"Pretrain/Learning Rate": 1.079972509398267e-05, "Pretrain/Loss": 1.9840459823608398, "Pretrain/Loss (Raw)": 2.010915756225586, "Pretrain/Step": 13380, "Pretrain/Step Time": 8.4653428979218} +{"Pretrain/Learning Rate": 1.0796231438103042e-05, "Pretrain/Loss": 1.983981728553772, "Pretrain/Loss (Raw)": 2.071993112564087, "Pretrain/Step": 13381, "Pretrain/Step Time": 8.472791405394673} +{"Pretrain/Learning Rate": 1.0792738191779055e-05, "Pretrain/Loss": 1.9831774234771729, "Pretrain/Loss (Raw)": 1.993857979774475, "Pretrain/Step": 13382, "Pretrain/Step Time": 8.469450753182173} +{"Pretrain/Learning Rate": 1.078924535511146e-05, "Pretrain/Loss": 1.9821332693099976, "Pretrain/Loss (Raw)": 1.9837239980697632, "Pretrain/Step": 13383, "Pretrain/Step Time": 8.471302626654506} +{"Pretrain/Learning Rate": 1.0785752928200948e-05, "Pretrain/Loss": 1.9797980785369873, "Pretrain/Loss (Raw)": 1.8216500282287598, "Pretrain/Step": 13384, "Pretrain/Step Time": 8.471177205443382} +{"Pretrain/Learning Rate": 1.0782260911148238e-05, "Pretrain/Loss": 1.9800233840942383, "Pretrain/Loss (Raw)": 2.050855875015259, "Pretrain/Step": 13385, "Pretrain/Step Time": 8.473718469962478} +{"Pretrain/Learning Rate": 1.0778769304054e-05, "Pretrain/Loss": 1.979385256767273, "Pretrain/Loss (Raw)": 1.9350166320800781, "Pretrain/Step": 13386, "Pretrain/Step Time": 8.475320685654879} +{"Pretrain/Learning Rate": 1.0775278107018938e-05, "Pretrain/Loss": 1.9799058437347412, "Pretrain/Loss (Raw)": 2.0392568111419678, "Pretrain/Step": 13387, "Pretrain/Step Time": 8.481402222067118} +{"Pretrain/Learning Rate": 1.07717873201437e-05, "Pretrain/Loss": 1.9790154695510864, "Pretrain/Loss (Raw)": 1.942810297012329, "Pretrain/Step": 13388, "Pretrain/Step Time": 8.474831407889724} +{"Pretrain/Learning Rate": 1.0768296943528939e-05, "Pretrain/Loss": 1.979357361793518, "Pretrain/Loss (Raw)": 1.837470293045044, "Pretrain/Step": 13389, "Pretrain/Step Time": 8.477929024025798} +{"Pretrain/Learning Rate": 1.0764806977275307e-05, "Pretrain/Loss": 1.9778544902801514, "Pretrain/Loss (Raw)": 1.9666811227798462, "Pretrain/Step": 13390, "Pretrain/Step Time": 8.475565422326326} +{"Pretrain/Learning Rate": 1.0761317421483426e-05, "Pretrain/Loss": 1.9769608974456787, "Pretrain/Loss (Raw)": 1.8231267929077148, "Pretrain/Step": 13391, "Pretrain/Step Time": 8.476164707913995} +{"Pretrain/Learning Rate": 1.0757828276253928e-05, "Pretrain/Loss": 1.9780676364898682, "Pretrain/Loss (Raw)": 1.9331541061401367, "Pretrain/Step": 13392, "Pretrain/Step Time": 8.478147828951478} +{"Pretrain/Learning Rate": 1.075433954168741e-05, "Pretrain/Loss": 1.9807850122451782, "Pretrain/Loss (Raw)": 2.1089134216308594, "Pretrain/Step": 13393, "Pretrain/Step Time": 8.475616736337543} +{"Pretrain/Learning Rate": 1.0750851217884462e-05, "Pretrain/Loss": 1.9806580543518066, "Pretrain/Loss (Raw)": 1.978245496749878, "Pretrain/Step": 13394, "Pretrain/Step Time": 8.475150801241398} +{"Pretrain/Learning Rate": 1.074736330494568e-05, "Pretrain/Loss": 1.9802742004394531, "Pretrain/Loss (Raw)": 1.8570163249969482, "Pretrain/Step": 13395, "Pretrain/Step Time": 8.470355102792382} +{"Pretrain/Learning Rate": 1.074387580297162e-05, "Pretrain/Loss": 1.976106882095337, "Pretrain/Loss (Raw)": 1.7811888456344604, "Pretrain/Step": 13396, "Pretrain/Step Time": 8.475146690383554} +{"Pretrain/Learning Rate": 1.0740388712062874e-05, "Pretrain/Loss": 1.976191520690918, "Pretrain/Loss (Raw)": 2.0117111206054688, "Pretrain/Step": 13397, "Pretrain/Step Time": 8.473115019500256} +{"Pretrain/Learning Rate": 1.0736902032319946e-05, "Pretrain/Loss": 1.9762680530548096, "Pretrain/Loss (Raw)": 1.9413774013519287, "Pretrain/Step": 13398, "Pretrain/Step Time": 8.475589672103524} +{"Pretrain/Learning Rate": 1.0733415763843403e-05, "Pretrain/Loss": 1.9763355255126953, "Pretrain/Loss (Raw)": 2.1271159648895264, "Pretrain/Step": 13399, "Pretrain/Step Time": 8.476079948246479} +{"Pretrain/Learning Rate": 1.0729929906733757e-05, "Pretrain/Loss": 1.976224660873413, "Pretrain/Loss (Raw)": 2.160200595855713, "Pretrain/Step": 13400, "Pretrain/Step Time": 8.476526813581586} +{"Pretrain/Learning Rate": 1.0726444461091517e-05, "Pretrain/Loss": 1.9773457050323486, "Pretrain/Loss (Raw)": 2.0766842365264893, "Pretrain/Step": 13401, "Pretrain/Step Time": 8.476673364639282} +{"Pretrain/Learning Rate": 1.0722959427017196e-05, "Pretrain/Loss": 1.9793033599853516, "Pretrain/Loss (Raw)": 2.123647928237915, "Pretrain/Step": 13402, "Pretrain/Step Time": 8.478104073554277} +{"Pretrain/Learning Rate": 1.0719474804611266e-05, "Pretrain/Loss": 1.9816807508468628, "Pretrain/Loss (Raw)": 2.196150779724121, "Pretrain/Step": 13403, "Pretrain/Step Time": 8.476746311411262} +{"Pretrain/Learning Rate": 1.071599059397422e-05, "Pretrain/Loss": 1.9807500839233398, "Pretrain/Loss (Raw)": 1.9296454191207886, "Pretrain/Step": 13404, "Pretrain/Step Time": 8.47578575834632} +{"Pretrain/Learning Rate": 1.071250679520652e-05, "Pretrain/Loss": 1.9801039695739746, "Pretrain/Loss (Raw)": 1.9276756048202515, "Pretrain/Step": 13405, "Pretrain/Step Time": 8.47392031736672} +{"Pretrain/Learning Rate": 1.0709023408408602e-05, "Pretrain/Loss": 1.9809900522232056, "Pretrain/Loss (Raw)": 2.1066832542419434, "Pretrain/Step": 13406, "Pretrain/Step Time": 8.474770521745086} +{"Pretrain/Learning Rate": 1.070554043368093e-05, "Pretrain/Loss": 1.9756927490234375, "Pretrain/Loss (Raw)": 1.722141981124878, "Pretrain/Step": 13407, "Pretrain/Step Time": 8.479591589421034} +{"Pretrain/Learning Rate": 1.0702057871123914e-05, "Pretrain/Loss": 1.9755377769470215, "Pretrain/Loss (Raw)": 1.921254277229309, "Pretrain/Step": 13408, "Pretrain/Step Time": 8.474135803058743} +{"Pretrain/Learning Rate": 1.0698575720837989e-05, "Pretrain/Loss": 1.9757856130599976, "Pretrain/Loss (Raw)": 1.962872862815857, "Pretrain/Step": 13409, "Pretrain/Step Time": 8.477164324373007} +{"Pretrain/Learning Rate": 1.0695093982923552e-05, "Pretrain/Loss": 1.9774055480957031, "Pretrain/Loss (Raw)": 2.143673896789551, "Pretrain/Step": 13410, "Pretrain/Step Time": 8.473002722486854} +{"Pretrain/Learning Rate": 1.0691612657480984e-05, "Pretrain/Loss": 1.977205514907837, "Pretrain/Loss (Raw)": 1.9318153858184814, "Pretrain/Step": 13411, "Pretrain/Step Time": 8.47017445974052} +{"Pretrain/Learning Rate": 1.0688131744610689e-05, "Pretrain/Loss": 1.9779090881347656, "Pretrain/Loss (Raw)": 1.9323073625564575, "Pretrain/Step": 13412, "Pretrain/Step Time": 8.47268815152347} +{"Pretrain/Learning Rate": 1.0684651244413016e-05, "Pretrain/Loss": 1.9799336194992065, "Pretrain/Loss (Raw)": 1.8724730014801025, "Pretrain/Step": 13413, "Pretrain/Step Time": 8.473929220810533} +{"Pretrain/Learning Rate": 1.0681171156988342e-05, "Pretrain/Loss": 1.9828765392303467, "Pretrain/Loss (Raw)": 2.1091408729553223, "Pretrain/Step": 13414, "Pretrain/Step Time": 8.473228886723518} +{"Pretrain/Learning Rate": 1.0677691482437005e-05, "Pretrain/Loss": 1.9844021797180176, "Pretrain/Loss (Raw)": 1.9993904829025269, "Pretrain/Step": 13415, "Pretrain/Step Time": 8.473755633458495} +{"Pretrain/Learning Rate": 1.0674212220859328e-05, "Pretrain/Loss": 1.9877784252166748, "Pretrain/Loss (Raw)": 2.060549020767212, "Pretrain/Step": 13416, "Pretrain/Step Time": 8.474872218444943} +{"Pretrain/Learning Rate": 1.0670733372355651e-05, "Pretrain/Loss": 1.988058090209961, "Pretrain/Loss (Raw)": 2.0729329586029053, "Pretrain/Step": 13417, "Pretrain/Step Time": 8.472556121647358} +{"Pretrain/Learning Rate": 1.0667254937026267e-05, "Pretrain/Loss": 1.9868907928466797, "Pretrain/Loss (Raw)": 2.0157456398010254, "Pretrain/Step": 13418, "Pretrain/Step Time": 8.480634186416864} +{"Pretrain/Learning Rate": 1.066377691497149e-05, "Pretrain/Loss": 1.989081621170044, "Pretrain/Loss (Raw)": 2.23539400100708, "Pretrain/Step": 13419, "Pretrain/Step Time": 8.477287292480469} +{"Pretrain/Learning Rate": 1.0660299306291602e-05, "Pretrain/Loss": 1.9889910221099854, "Pretrain/Loss (Raw)": 1.9351696968078613, "Pretrain/Step": 13420, "Pretrain/Step Time": 8.47760184854269} +{"Pretrain/Learning Rate": 1.0656822111086865e-05, "Pretrain/Loss": 1.9880952835083008, "Pretrain/Loss (Raw)": 1.9699691534042358, "Pretrain/Step": 13421, "Pretrain/Step Time": 8.476854415610433} +{"Pretrain/Learning Rate": 1.065334532945756e-05, "Pretrain/Loss": 1.9872016906738281, "Pretrain/Loss (Raw)": 1.8569533824920654, "Pretrain/Step": 13422, "Pretrain/Step Time": 8.47495710849762} +{"Pretrain/Learning Rate": 1.064986896150392e-05, "Pretrain/Loss": 1.9926097393035889, "Pretrain/Loss (Raw)": 2.4712350368499756, "Pretrain/Step": 13423, "Pretrain/Step Time": 8.475927082821727} +{"Pretrain/Learning Rate": 1.0646393007326199e-05, "Pretrain/Loss": 1.990870475769043, "Pretrain/Loss (Raw)": 1.8294084072113037, "Pretrain/Step": 13424, "Pretrain/Step Time": 8.475849026814103} +{"Pretrain/Learning Rate": 1.0642917467024622e-05, "Pretrain/Loss": 1.9904345273971558, "Pretrain/Loss (Raw)": 1.8536559343338013, "Pretrain/Step": 13425, "Pretrain/Step Time": 8.475850217044353} +{"Pretrain/Learning Rate": 1.0639442340699384e-05, "Pretrain/Loss": 1.9886797666549683, "Pretrain/Loss (Raw)": 1.7440857887268066, "Pretrain/Step": 13426, "Pretrain/Step Time": 8.480836661532521} +{"Pretrain/Learning Rate": 1.0635967628450716e-05, "Pretrain/Loss": 1.9904839992523193, "Pretrain/Loss (Raw)": 2.100996494293213, "Pretrain/Step": 13427, "Pretrain/Step Time": 8.472804198041558} +{"Pretrain/Learning Rate": 1.0632493330378785e-05, "Pretrain/Loss": 1.9880205392837524, "Pretrain/Loss (Raw)": 1.8212318420410156, "Pretrain/Step": 13428, "Pretrain/Step Time": 8.470512432977557} +{"Pretrain/Learning Rate": 1.0629019446583788e-05, "Pretrain/Loss": 1.988844633102417, "Pretrain/Loss (Raw)": 2.040468454360962, "Pretrain/Step": 13429, "Pretrain/Step Time": 8.475242743268609} +{"Pretrain/Learning Rate": 1.0625545977165885e-05, "Pretrain/Loss": 1.9871629476547241, "Pretrain/Loss (Raw)": 1.8470778465270996, "Pretrain/Step": 13430, "Pretrain/Step Time": 8.472950037568808} +{"Pretrain/Learning Rate": 1.062207292222522e-05, "Pretrain/Loss": 1.9900662899017334, "Pretrain/Loss (Raw)": 2.1131441593170166, "Pretrain/Step": 13431, "Pretrain/Step Time": 8.47590945661068} +{"Pretrain/Learning Rate": 1.061860028186196e-05, "Pretrain/Loss": 1.9893169403076172, "Pretrain/Loss (Raw)": 1.994075894355774, "Pretrain/Step": 13432, "Pretrain/Step Time": 8.473242577165365} +{"Pretrain/Learning Rate": 1.061512805617621e-05, "Pretrain/Loss": 1.9896756410598755, "Pretrain/Loss (Raw)": 1.9977667331695557, "Pretrain/Step": 13433, "Pretrain/Step Time": 8.47398118302226} +{"Pretrain/Learning Rate": 1.0611656245268112e-05, "Pretrain/Loss": 1.9900448322296143, "Pretrain/Loss (Raw)": 1.9502893686294556, "Pretrain/Step": 13434, "Pretrain/Step Time": 8.47605355642736} +{"Pretrain/Learning Rate": 1.0608184849237763e-05, "Pretrain/Loss": 1.991368293762207, "Pretrain/Loss (Raw)": 2.049032211303711, "Pretrain/Step": 13435, "Pretrain/Step Time": 8.477092683315277} +{"Pretrain/Learning Rate": 1.0604713868185251e-05, "Pretrain/Loss": 1.9903154373168945, "Pretrain/Loss (Raw)": 2.0397558212280273, "Pretrain/Step": 13436, "Pretrain/Step Time": 8.47642271593213} +{"Pretrain/Learning Rate": 1.0601243302210673e-05, "Pretrain/Loss": 1.9915310144424438, "Pretrain/Loss (Raw)": 1.9375972747802734, "Pretrain/Step": 13437, "Pretrain/Step Time": 8.473382217809558} +{"Pretrain/Learning Rate": 1.0597773151414087e-05, "Pretrain/Loss": 1.994027018547058, "Pretrain/Loss (Raw)": 2.0435659885406494, "Pretrain/Step": 13438, "Pretrain/Step Time": 8.46886983141303} +{"Pretrain/Learning Rate": 1.0594303415895565e-05, "Pretrain/Loss": 1.996017336845398, "Pretrain/Loss (Raw)": 2.3715462684631348, "Pretrain/Step": 13439, "Pretrain/Step Time": 8.474246423691511} +{"Pretrain/Learning Rate": 1.059083409575515e-05, "Pretrain/Loss": 1.9938867092132568, "Pretrain/Loss (Raw)": 1.9375180006027222, "Pretrain/Step": 13440, "Pretrain/Step Time": 8.470119090750813} +{"Pretrain/Learning Rate": 1.0587365191092868e-05, "Pretrain/Loss": 1.9945770502090454, "Pretrain/Loss (Raw)": 2.0386483669281006, "Pretrain/Step": 13441, "Pretrain/Step Time": 8.472196081653237} +{"Pretrain/Learning Rate": 1.0583896702008761e-05, "Pretrain/Loss": 1.996260404586792, "Pretrain/Loss (Raw)": 2.173901081085205, "Pretrain/Step": 13442, "Pretrain/Step Time": 8.474771181121469} +{"Pretrain/Learning Rate": 1.0580428628602818e-05, "Pretrain/Loss": 1.9979259967803955, "Pretrain/Loss (Raw)": 2.009158134460449, "Pretrain/Step": 13443, "Pretrain/Step Time": 8.46908114850521} +{"Pretrain/Learning Rate": 1.0576960970975061e-05, "Pretrain/Loss": 1.9943816661834717, "Pretrain/Loss (Raw)": 1.800335168838501, "Pretrain/Step": 13444, "Pretrain/Step Time": 8.466045934706926} +{"Pretrain/Learning Rate": 1.0573493729225468e-05, "Pretrain/Loss": 1.9964735507965088, "Pretrain/Loss (Raw)": 2.012178897857666, "Pretrain/Step": 13445, "Pretrain/Step Time": 8.468535229563713} +{"Pretrain/Learning Rate": 1.0570026903454e-05, "Pretrain/Loss": 1.9942553043365479, "Pretrain/Loss (Raw)": 1.8311874866485596, "Pretrain/Step": 13446, "Pretrain/Step Time": 8.471406506374478} +{"Pretrain/Learning Rate": 1.0566560493760647e-05, "Pretrain/Loss": 1.9957692623138428, "Pretrain/Loss (Raw)": 2.1377570629119873, "Pretrain/Step": 13447, "Pretrain/Step Time": 8.471455734223127} +{"Pretrain/Learning Rate": 1.0563094500245335e-05, "Pretrain/Loss": 1.9931992292404175, "Pretrain/Loss (Raw)": 1.810611605644226, "Pretrain/Step": 13448, "Pretrain/Step Time": 8.475917747244239} +{"Pretrain/Learning Rate": 1.0559628923008028e-05, "Pretrain/Loss": 1.995664119720459, "Pretrain/Loss (Raw)": 2.1758930683135986, "Pretrain/Step": 13449, "Pretrain/Step Time": 8.475954350084066} +{"Pretrain/Learning Rate": 1.0556163762148638e-05, "Pretrain/Loss": 1.9946025609970093, "Pretrain/Loss (Raw)": 1.939186692237854, "Pretrain/Step": 13450, "Pretrain/Step Time": 8.47706563770771} +{"Pretrain/Learning Rate": 1.0552699017767079e-05, "Pretrain/Loss": 1.9949431419372559, "Pretrain/Loss (Raw)": 2.0912883281707764, "Pretrain/Step": 13451, "Pretrain/Step Time": 8.477804752066731} +{"Pretrain/Learning Rate": 1.0549234689963264e-05, "Pretrain/Loss": 1.9949653148651123, "Pretrain/Loss (Raw)": 2.0112223625183105, "Pretrain/Step": 13452, "Pretrain/Step Time": 8.476418452337384} +{"Pretrain/Learning Rate": 1.0545770778837072e-05, "Pretrain/Loss": 1.9961010217666626, "Pretrain/Loss (Raw)": 1.9585886001586914, "Pretrain/Step": 13453, "Pretrain/Step Time": 8.478754764422774} +{"Pretrain/Learning Rate": 1.0542307284488399e-05, "Pretrain/Loss": 1.9957014322280884, "Pretrain/Loss (Raw)": 2.06900954246521, "Pretrain/Step": 13454, "Pretrain/Step Time": 8.471352439373732} +{"Pretrain/Learning Rate": 1.0538844207017095e-05, "Pretrain/Loss": 1.9966580867767334, "Pretrain/Loss (Raw)": 2.157209873199463, "Pretrain/Step": 13455, "Pretrain/Step Time": 8.468565320596099} +{"Pretrain/Learning Rate": 1.0535381546523032e-05, "Pretrain/Loss": 1.996239423751831, "Pretrain/Loss (Raw)": 2.00458025932312, "Pretrain/Step": 13456, "Pretrain/Step Time": 8.473027070984244} +{"Pretrain/Learning Rate": 1.0531919303106048e-05, "Pretrain/Loss": 1.9959919452667236, "Pretrain/Loss (Raw)": 1.9281491041183472, "Pretrain/Step": 13457, "Pretrain/Step Time": 8.471940968185663} +{"Pretrain/Learning Rate": 1.0528457476865958e-05, "Pretrain/Loss": 1.9968340396881104, "Pretrain/Loss (Raw)": 1.8828258514404297, "Pretrain/Step": 13458, "Pretrain/Step Time": 8.470764853060246} +{"Pretrain/Learning Rate": 1.0524996067902607e-05, "Pretrain/Loss": 1.9952635765075684, "Pretrain/Loss (Raw)": 1.751510500907898, "Pretrain/Step": 13459, "Pretrain/Step Time": 8.467126512899995} +{"Pretrain/Learning Rate": 1.0521535076315781e-05, "Pretrain/Loss": 1.995593547821045, "Pretrain/Loss (Raw)": 2.030521869659424, "Pretrain/Step": 13460, "Pretrain/Step Time": 8.468674635514617} +{"Pretrain/Learning Rate": 1.0518074502205291e-05, "Pretrain/Loss": 1.994612455368042, "Pretrain/Loss (Raw)": 1.907703161239624, "Pretrain/Step": 13461, "Pretrain/Step Time": 8.46525657363236} +{"Pretrain/Learning Rate": 1.0514614345670914e-05, "Pretrain/Loss": 1.993271827697754, "Pretrain/Loss (Raw)": 1.9810764789581299, "Pretrain/Step": 13462, "Pretrain/Step Time": 8.465146275237203} +{"Pretrain/Learning Rate": 1.0511154606812416e-05, "Pretrain/Loss": 1.9939059019088745, "Pretrain/Loss (Raw)": 1.9722131490707397, "Pretrain/Step": 13463, "Pretrain/Step Time": 8.469494258984923} +{"Pretrain/Learning Rate": 1.0507695285729566e-05, "Pretrain/Loss": 1.9913544654846191, "Pretrain/Loss (Raw)": 1.6174616813659668, "Pretrain/Step": 13464, "Pretrain/Step Time": 8.467477859929204} +{"Pretrain/Learning Rate": 1.0504236382522099e-05, "Pretrain/Loss": 1.9901840686798096, "Pretrain/Loss (Raw)": 2.0067389011383057, "Pretrain/Step": 13465, "Pretrain/Step Time": 8.46079364977777} +{"Pretrain/Learning Rate": 1.0500777897289765e-05, "Pretrain/Loss": 1.9898006916046143, "Pretrain/Loss (Raw)": 2.1075429916381836, "Pretrain/Step": 13466, "Pretrain/Step Time": 8.463306780904531} +{"Pretrain/Learning Rate": 1.0497319830132279e-05, "Pretrain/Loss": 1.9894328117370605, "Pretrain/Loss (Raw)": 1.8239262104034424, "Pretrain/Step": 13467, "Pretrain/Step Time": 8.464032450690866} +{"Pretrain/Learning Rate": 1.0493862181149342e-05, "Pretrain/Loss": 1.9882638454437256, "Pretrain/Loss (Raw)": 1.8609228134155273, "Pretrain/Step": 13468, "Pretrain/Step Time": 8.467045305296779} +{"Pretrain/Learning Rate": 1.0490404950440674e-05, "Pretrain/Loss": 1.9866764545440674, "Pretrain/Loss (Raw)": 2.1337156295776367, "Pretrain/Step": 13469, "Pretrain/Step Time": 8.466482317075133} +{"Pretrain/Learning Rate": 1.048694813810594e-05, "Pretrain/Loss": 1.986007571220398, "Pretrain/Loss (Raw)": 2.031514883041382, "Pretrain/Step": 13470, "Pretrain/Step Time": 8.464108588173985} +{"Pretrain/Learning Rate": 1.0483491744244836e-05, "Pretrain/Loss": 1.9850590229034424, "Pretrain/Loss (Raw)": 1.922067403793335, "Pretrain/Step": 13471, "Pretrain/Step Time": 8.460463905707002} +{"Pretrain/Learning Rate": 1.0480035768957013e-05, "Pretrain/Loss": 1.984708547592163, "Pretrain/Loss (Raw)": 2.0182607173919678, "Pretrain/Step": 13472, "Pretrain/Step Time": 8.457577768713236} +{"Pretrain/Learning Rate": 1.0476580212342113e-05, "Pretrain/Loss": 1.9854161739349365, "Pretrain/Loss (Raw)": 1.9984729290008545, "Pretrain/Step": 13473, "Pretrain/Step Time": 8.460183758288622} +{"Pretrain/Learning Rate": 1.0473125074499795e-05, "Pretrain/Loss": 1.9865906238555908, "Pretrain/Loss (Raw)": 2.0074269771575928, "Pretrain/Step": 13474, "Pretrain/Step Time": 8.45351698435843} +{"Pretrain/Learning Rate": 1.0469670355529664e-05, "Pretrain/Loss": 1.9883010387420654, "Pretrain/Loss (Raw)": 2.078951835632324, "Pretrain/Step": 13475, "Pretrain/Step Time": 8.45502963848412} +{"Pretrain/Learning Rate": 1.0466216055531355e-05, "Pretrain/Loss": 1.9871716499328613, "Pretrain/Loss (Raw)": 1.9284085035324097, "Pretrain/Step": 13476, "Pretrain/Step Time": 8.455024119466543} +{"Pretrain/Learning Rate": 1.0462762174604462e-05, "Pretrain/Loss": 1.9880270957946777, "Pretrain/Loss (Raw)": 2.0409345626831055, "Pretrain/Step": 13477, "Pretrain/Step Time": 8.452449781820178} +{"Pretrain/Learning Rate": 1.0459308712848561e-05, "Pretrain/Loss": 1.991296648979187, "Pretrain/Loss (Raw)": 2.437969446182251, "Pretrain/Step": 13478, "Pretrain/Step Time": 8.448132256045938} +{"Pretrain/Learning Rate": 1.0455855670363255e-05, "Pretrain/Loss": 1.989603877067566, "Pretrain/Loss (Raw)": 1.7386806011199951, "Pretrain/Step": 13479, "Pretrain/Step Time": 8.454984478652477} +{"Pretrain/Learning Rate": 1.0452403047248089e-05, "Pretrain/Loss": 1.9926204681396484, "Pretrain/Loss (Raw)": 2.320782423019409, "Pretrain/Step": 13480, "Pretrain/Step Time": 8.447496669366956} +{"Pretrain/Learning Rate": 1.044895084360264e-05, "Pretrain/Loss": 1.9915003776550293, "Pretrain/Loss (Raw)": 1.9609428644180298, "Pretrain/Step": 13481, "Pretrain/Step Time": 8.456192798912525} +{"Pretrain/Learning Rate": 1.044549905952642e-05, "Pretrain/Loss": 1.9878445863723755, "Pretrain/Loss (Raw)": 1.5757386684417725, "Pretrain/Step": 13482, "Pretrain/Step Time": 8.451001439243555} +{"Pretrain/Learning Rate": 1.0442047695118984e-05, "Pretrain/Loss": 1.9895634651184082, "Pretrain/Loss (Raw)": 1.9789063930511475, "Pretrain/Step": 13483, "Pretrain/Step Time": 8.44741590693593} +{"Pretrain/Learning Rate": 1.043859675047984e-05, "Pretrain/Loss": 1.9908262491226196, "Pretrain/Loss (Raw)": 2.0383224487304688, "Pretrain/Step": 13484, "Pretrain/Step Time": 8.44620163179934} +{"Pretrain/Learning Rate": 1.0435146225708483e-05, "Pretrain/Loss": 1.9911179542541504, "Pretrain/Loss (Raw)": 2.048367738723755, "Pretrain/Step": 13485, "Pretrain/Step Time": 8.447296470403671} +{"Pretrain/Learning Rate": 1.0431696120904427e-05, "Pretrain/Loss": 1.9892011880874634, "Pretrain/Loss (Raw)": 1.8342784643173218, "Pretrain/Step": 13486, "Pretrain/Step Time": 8.451898844912648} +{"Pretrain/Learning Rate": 1.0428246436167136e-05, "Pretrain/Loss": 1.9874202013015747, "Pretrain/Loss (Raw)": 1.8685907125473022, "Pretrain/Step": 13487, "Pretrain/Step Time": 8.448703998699784} +{"Pretrain/Learning Rate": 1.0424797171596092e-05, "Pretrain/Loss": 1.9880692958831787, "Pretrain/Loss (Raw)": 2.1274735927581787, "Pretrain/Step": 13488, "Pretrain/Step Time": 8.444326058030128} +{"Pretrain/Learning Rate": 1.0421348327290747e-05, "Pretrain/Loss": 1.9872260093688965, "Pretrain/Loss (Raw)": 1.9070062637329102, "Pretrain/Step": 13489, "Pretrain/Step Time": 8.437150616198778} +{"Pretrain/Learning Rate": 1.041789990335054e-05, "Pretrain/Loss": 1.9881503582000732, "Pretrain/Loss (Raw)": 2.272736072540283, "Pretrain/Step": 13490, "Pretrain/Step Time": 8.441864747554064} +{"Pretrain/Learning Rate": 1.0414451899874916e-05, "Pretrain/Loss": 1.9884097576141357, "Pretrain/Loss (Raw)": 2.0081889629364014, "Pretrain/Step": 13491, "Pretrain/Step Time": 8.437602944672108} +{"Pretrain/Learning Rate": 1.0411004316963283e-05, "Pretrain/Loss": 1.9904217720031738, "Pretrain/Loss (Raw)": 2.1457650661468506, "Pretrain/Step": 13492, "Pretrain/Step Time": 8.438410378992558} +{"Pretrain/Learning Rate": 1.0407557154715061e-05, "Pretrain/Loss": 1.9890546798706055, "Pretrain/Loss (Raw)": 1.8656151294708252, "Pretrain/Step": 13493, "Pretrain/Step Time": 8.44156863167882} +{"Pretrain/Learning Rate": 1.0404110413229645e-05, "Pretrain/Loss": 1.9884588718414307, "Pretrain/Loss (Raw)": 1.8304364681243896, "Pretrain/Step": 13494, "Pretrain/Step Time": 8.441087996587157} +{"Pretrain/Learning Rate": 1.0400664092606405e-05, "Pretrain/Loss": 1.9899753332138062, "Pretrain/Loss (Raw)": 2.1167519092559814, "Pretrain/Step": 13495, "Pretrain/Step Time": 8.439169760793447} +{"Pretrain/Learning Rate": 1.0397218192944736e-05, "Pretrain/Loss": 1.9915564060211182, "Pretrain/Loss (Raw)": 2.0104997158050537, "Pretrain/Step": 13496, "Pretrain/Step Time": 8.438917100429535} +{"Pretrain/Learning Rate": 1.0393772714343971e-05, "Pretrain/Loss": 1.991369605064392, "Pretrain/Loss (Raw)": 2.0547983646392822, "Pretrain/Step": 13497, "Pretrain/Step Time": 8.439651135355234} +{"Pretrain/Learning Rate": 1.0390327656903487e-05, "Pretrain/Loss": 1.9915318489074707, "Pretrain/Loss (Raw)": 2.0253989696502686, "Pretrain/Step": 13498, "Pretrain/Step Time": 8.440301885828376} +{"Pretrain/Learning Rate": 1.0386883020722604e-05, "Pretrain/Loss": 1.9910892248153687, "Pretrain/Loss (Raw)": 1.9740959405899048, "Pretrain/Step": 13499, "Pretrain/Step Time": 8.441377505660057} +{"Pretrain/Learning Rate": 1.038343880590064e-05, "Pretrain/Loss": 1.9895857572555542, "Pretrain/Loss (Raw)": 1.8563872575759888, "Pretrain/Step": 13500, "Pretrain/Step Time": 8.439354518428445} +{"Pretrain/Learning Rate": 1.0379995012536923e-05, "Pretrain/Loss": 1.9885210990905762, "Pretrain/Loss (Raw)": 1.9192343950271606, "Pretrain/Step": 13501, "Pretrain/Step Time": 8.438630679622293} +{"Pretrain/Learning Rate": 1.0376551640730733e-05, "Pretrain/Loss": 1.9904216527938843, "Pretrain/Loss (Raw)": 2.0233166217803955, "Pretrain/Step": 13502, "Pretrain/Step Time": 8.439038172364235} +{"Pretrain/Learning Rate": 1.0373108690581377e-05, "Pretrain/Loss": 1.9890868663787842, "Pretrain/Loss (Raw)": 1.8821191787719727, "Pretrain/Step": 13503, "Pretrain/Step Time": 8.43307933025062} +{"Pretrain/Learning Rate": 1.036966616218812e-05, "Pretrain/Loss": 1.9895365238189697, "Pretrain/Loss (Raw)": 1.9232062101364136, "Pretrain/Step": 13504, "Pretrain/Step Time": 8.431208405643702} +{"Pretrain/Learning Rate": 1.0366224055650217e-05, "Pretrain/Loss": 1.9891221523284912, "Pretrain/Loss (Raw)": 2.109856605529785, "Pretrain/Step": 13505, "Pretrain/Step Time": 8.430822586640716} +{"Pretrain/Learning Rate": 1.0362782371066937e-05, "Pretrain/Loss": 1.9891457557678223, "Pretrain/Loss (Raw)": 1.8131030797958374, "Pretrain/Step": 13506, "Pretrain/Step Time": 8.434690503403544} +{"Pretrain/Learning Rate": 1.0359341108537499e-05, "Pretrain/Loss": 1.9882742166519165, "Pretrain/Loss (Raw)": 1.9584226608276367, "Pretrain/Step": 13507, "Pretrain/Step Time": 8.431781297549605} +{"Pretrain/Learning Rate": 1.0355900268161148e-05, "Pretrain/Loss": 1.9883286952972412, "Pretrain/Loss (Raw)": 2.017873764038086, "Pretrain/Step": 13508, "Pretrain/Step Time": 8.431889841333032} +{"Pretrain/Learning Rate": 1.0352459850037091e-05, "Pretrain/Loss": 1.9871280193328857, "Pretrain/Loss (Raw)": 1.9183269739151, "Pretrain/Step": 13509, "Pretrain/Step Time": 8.426524734124541} +{"Pretrain/Learning Rate": 1.0349019854264519e-05, "Pretrain/Loss": 1.9881935119628906, "Pretrain/Loss (Raw)": 2.1302273273468018, "Pretrain/Step": 13510, "Pretrain/Step Time": 8.424379138275981} +{"Pretrain/Learning Rate": 1.0345580280942638e-05, "Pretrain/Loss": 1.9882649183273315, "Pretrain/Loss (Raw)": 1.9928784370422363, "Pretrain/Step": 13511, "Pretrain/Step Time": 8.426883146166801} +{"Pretrain/Learning Rate": 1.034214113017061e-05, "Pretrain/Loss": 1.9876399040222168, "Pretrain/Loss (Raw)": 1.7416311502456665, "Pretrain/Step": 13512, "Pretrain/Step Time": 8.427791429683566} +{"Pretrain/Learning Rate": 1.0338702402047621e-05, "Pretrain/Loss": 1.9891663789749146, "Pretrain/Loss (Raw)": 2.2462527751922607, "Pretrain/Step": 13513, "Pretrain/Step Time": 8.426501102745533} +{"Pretrain/Learning Rate": 1.0335264096672811e-05, "Pretrain/Loss": 1.9894819259643555, "Pretrain/Loss (Raw)": 1.97540283203125, "Pretrain/Step": 13514, "Pretrain/Step Time": 8.425140745937824} +{"Pretrain/Learning Rate": 1.0331826214145316e-05, "Pretrain/Loss": 1.988450288772583, "Pretrain/Loss (Raw)": 1.9072184562683105, "Pretrain/Step": 13515, "Pretrain/Step Time": 8.42241045087576} +{"Pretrain/Learning Rate": 1.0328388754564278e-05, "Pretrain/Loss": 1.9904338121414185, "Pretrain/Loss (Raw)": 2.1966817378997803, "Pretrain/Step": 13516, "Pretrain/Step Time": 8.425907779484987} +{"Pretrain/Learning Rate": 1.0324951718028799e-05, "Pretrain/Loss": 1.9917439222335815, "Pretrain/Loss (Raw)": 2.0051636695861816, "Pretrain/Step": 13517, "Pretrain/Step Time": 8.42166880518198} +{"Pretrain/Learning Rate": 1.0321515104638002e-05, "Pretrain/Loss": 1.9909090995788574, "Pretrain/Loss (Raw)": 1.8598406314849854, "Pretrain/Step": 13518, "Pretrain/Step Time": 8.424386523663998} +{"Pretrain/Learning Rate": 1.0318078914490958e-05, "Pretrain/Loss": 1.9915084838867188, "Pretrain/Loss (Raw)": 1.8998509645462036, "Pretrain/Step": 13519, "Pretrain/Step Time": 8.423841789364815} +{"Pretrain/Learning Rate": 1.031464314768677e-05, "Pretrain/Loss": 1.9914190769195557, "Pretrain/Loss (Raw)": 1.9216828346252441, "Pretrain/Step": 13520, "Pretrain/Step Time": 8.420550232753158} +{"Pretrain/Learning Rate": 1.0311207804324494e-05, "Pretrain/Loss": 1.991253137588501, "Pretrain/Loss (Raw)": 2.0876951217651367, "Pretrain/Step": 13521, "Pretrain/Step Time": 8.421244718134403} +{"Pretrain/Learning Rate": 1.0307772884503176e-05, "Pretrain/Loss": 1.9907596111297607, "Pretrain/Loss (Raw)": 1.915065050125122, "Pretrain/Step": 13522, "Pretrain/Step Time": 8.423474790528417} +{"Pretrain/Learning Rate": 1.030433838832188e-05, "Pretrain/Loss": 1.991018533706665, "Pretrain/Loss (Raw)": 1.8901780843734741, "Pretrain/Step": 13523, "Pretrain/Step Time": 8.42788440361619} +{"Pretrain/Learning Rate": 1.0300904315879614e-05, "Pretrain/Loss": 1.9929207563400269, "Pretrain/Loss (Raw)": 2.024660348892212, "Pretrain/Step": 13524, "Pretrain/Step Time": 8.424451898783445} +{"Pretrain/Learning Rate": 1.0297470667275424e-05, "Pretrain/Loss": 1.9934728145599365, "Pretrain/Loss (Raw)": 2.0823733806610107, "Pretrain/Step": 13525, "Pretrain/Step Time": 8.426187178120017} +{"Pretrain/Learning Rate": 1.0294037442608301e-05, "Pretrain/Loss": 1.993377923965454, "Pretrain/Loss (Raw)": 1.9292224645614624, "Pretrain/Step": 13526, "Pretrain/Step Time": 8.430268885567784} +{"Pretrain/Learning Rate": 1.029060464197723e-05, "Pretrain/Loss": 1.993439793586731, "Pretrain/Loss (Raw)": 2.135044574737549, "Pretrain/Step": 13527, "Pretrain/Step Time": 8.430174302309752} +{"Pretrain/Learning Rate": 1.0287172265481216e-05, "Pretrain/Loss": 1.995557188987732, "Pretrain/Loss (Raw)": 2.431225061416626, "Pretrain/Step": 13528, "Pretrain/Step Time": 8.429542874917388} +{"Pretrain/Learning Rate": 1.0283740313219208e-05, "Pretrain/Loss": 1.9948667287826538, "Pretrain/Loss (Raw)": 1.988315463066101, "Pretrain/Step": 13529, "Pretrain/Step Time": 8.433980207890272} +{"Pretrain/Learning Rate": 1.0280308785290182e-05, "Pretrain/Loss": 1.993457555770874, "Pretrain/Loss (Raw)": 1.9432638883590698, "Pretrain/Step": 13530, "Pretrain/Step Time": 8.434703094884753} +{"Pretrain/Learning Rate": 1.0276877681793079e-05, "Pretrain/Loss": 1.9949374198913574, "Pretrain/Loss (Raw)": 2.3855669498443604, "Pretrain/Step": 13531, "Pretrain/Step Time": 8.432918021455407} +{"Pretrain/Learning Rate": 1.0273447002826816e-05, "Pretrain/Loss": 1.996135950088501, "Pretrain/Loss (Raw)": 2.0830557346343994, "Pretrain/Step": 13532, "Pretrain/Step Time": 8.435274051502347} +{"Pretrain/Learning Rate": 1.0270016748490337e-05, "Pretrain/Loss": 1.9960546493530273, "Pretrain/Loss (Raw)": 1.9172592163085938, "Pretrain/Step": 13533, "Pretrain/Step Time": 8.438179817050695} +{"Pretrain/Learning Rate": 1.0266586918882535e-05, "Pretrain/Loss": 1.9940457344055176, "Pretrain/Loss (Raw)": 1.8495599031448364, "Pretrain/Step": 13534, "Pretrain/Step Time": 8.431711612269282} +{"Pretrain/Learning Rate": 1.0263157514102317e-05, "Pretrain/Loss": 1.996644377708435, "Pretrain/Loss (Raw)": 2.0547661781311035, "Pretrain/Step": 13535, "Pretrain/Step Time": 8.426106141880155} +{"Pretrain/Learning Rate": 1.0259728534248567e-05, "Pretrain/Loss": 1.9957443475723267, "Pretrain/Loss (Raw)": 1.806046962738037, "Pretrain/Step": 13536, "Pretrain/Step Time": 8.429244196042418} +{"Pretrain/Learning Rate": 1.0256299979420142e-05, "Pretrain/Loss": 1.9966397285461426, "Pretrain/Loss (Raw)": 2.0774872303009033, "Pretrain/Step": 13537, "Pretrain/Step Time": 8.428728513419628} +{"Pretrain/Learning Rate": 1.0252871849715926e-05, "Pretrain/Loss": 1.9974102973937988, "Pretrain/Loss (Raw)": 2.242309331893921, "Pretrain/Step": 13538, "Pretrain/Step Time": 8.42607093974948} +{"Pretrain/Learning Rate": 1.0249444145234743e-05, "Pretrain/Loss": 1.996476650238037, "Pretrain/Loss (Raw)": 1.812320351600647, "Pretrain/Step": 13539, "Pretrain/Step Time": 8.429967012256384} +{"Pretrain/Learning Rate": 1.0246016866075448e-05, "Pretrain/Loss": 1.997429609298706, "Pretrain/Loss (Raw)": 2.0542712211608887, "Pretrain/Step": 13540, "Pretrain/Step Time": 8.423530185595155} +{"Pretrain/Learning Rate": 1.0242590012336855e-05, "Pretrain/Loss": 1.9986748695373535, "Pretrain/Loss (Raw)": 2.0318546295166016, "Pretrain/Step": 13541, "Pretrain/Step Time": 8.420997126027942} +{"Pretrain/Learning Rate": 1.023916358411777e-05, "Pretrain/Loss": 1.9981458187103271, "Pretrain/Loss (Raw)": 2.041443109512329, "Pretrain/Step": 13542, "Pretrain/Step Time": 8.423858437687159} +{"Pretrain/Learning Rate": 1.0235737581517004e-05, "Pretrain/Loss": 1.9988069534301758, "Pretrain/Loss (Raw)": 2.084009885787964, "Pretrain/Step": 13543, "Pretrain/Step Time": 8.422427356243134} +{"Pretrain/Learning Rate": 1.0232312004633326e-05, "Pretrain/Loss": 1.9991133213043213, "Pretrain/Loss (Raw)": 2.0997745990753174, "Pretrain/Step": 13544, "Pretrain/Step Time": 8.425789806991816} +{"Pretrain/Learning Rate": 1.0228886853565534e-05, "Pretrain/Loss": 1.9981938600540161, "Pretrain/Loss (Raw)": 1.9552408456802368, "Pretrain/Step": 13545, "Pretrain/Step Time": 8.428814908489585} +{"Pretrain/Learning Rate": 1.0225462128412375e-05, "Pretrain/Loss": 1.9977898597717285, "Pretrain/Loss (Raw)": 1.9640156030654907, "Pretrain/Step": 13546, "Pretrain/Step Time": 8.42413629218936} +{"Pretrain/Learning Rate": 1.022203782927259e-05, "Pretrain/Loss": 1.9963022470474243, "Pretrain/Loss (Raw)": 2.044992446899414, "Pretrain/Step": 13547, "Pretrain/Step Time": 8.424510445445776} +{"Pretrain/Learning Rate": 1.0218613956244935e-05, "Pretrain/Loss": 1.9967973232269287, "Pretrain/Loss (Raw)": 1.9985346794128418, "Pretrain/Step": 13548, "Pretrain/Step Time": 8.42193616554141} +{"Pretrain/Learning Rate": 1.0215190509428118e-05, "Pretrain/Loss": 1.9955062866210938, "Pretrain/Loss (Raw)": 1.8047127723693848, "Pretrain/Step": 13549, "Pretrain/Step Time": 8.426411909982562} +{"Pretrain/Learning Rate": 1.021176748892087e-05, "Pretrain/Loss": 1.9933712482452393, "Pretrain/Loss (Raw)": 1.5836704969406128, "Pretrain/Step": 13550, "Pretrain/Step Time": 8.42736966535449} +{"Pretrain/Learning Rate": 1.0208344894821884e-05, "Pretrain/Loss": 1.989815592765808, "Pretrain/Loss (Raw)": 2.0161073207855225, "Pretrain/Step": 13551, "Pretrain/Step Time": 8.427809474989772} +{"Pretrain/Learning Rate": 1.0204922727229832e-05, "Pretrain/Loss": 1.9879069328308105, "Pretrain/Loss (Raw)": 1.58510422706604, "Pretrain/Step": 13552, "Pretrain/Step Time": 8.425058420747519} +{"Pretrain/Learning Rate": 1.0201500986243414e-05, "Pretrain/Loss": 1.987656831741333, "Pretrain/Loss (Raw)": 1.8216477632522583, "Pretrain/Step": 13553, "Pretrain/Step Time": 8.42285523377359} +{"Pretrain/Learning Rate": 1.0198079671961275e-05, "Pretrain/Loss": 1.9915772676467896, "Pretrain/Loss (Raw)": 2.245910406112671, "Pretrain/Step": 13554, "Pretrain/Step Time": 8.419942120090127} +{"Pretrain/Learning Rate": 1.019465878448208e-05, "Pretrain/Loss": 1.9898459911346436, "Pretrain/Loss (Raw)": 1.8793872594833374, "Pretrain/Step": 13555, "Pretrain/Step Time": 8.426199523732066} +{"Pretrain/Learning Rate": 1.0191238323904464e-05, "Pretrain/Loss": 1.9911314249038696, "Pretrain/Loss (Raw)": 1.9857707023620605, "Pretrain/Step": 13556, "Pretrain/Step Time": 8.424634717404842} +{"Pretrain/Learning Rate": 1.0187818290327041e-05, "Pretrain/Loss": 1.9917469024658203, "Pretrain/Loss (Raw)": 2.119245767593384, "Pretrain/Step": 13557, "Pretrain/Step Time": 8.421190671622753} +{"Pretrain/Learning Rate": 1.0184398683848448e-05, "Pretrain/Loss": 1.9925518035888672, "Pretrain/Loss (Raw)": 1.9501107931137085, "Pretrain/Step": 13558, "Pretrain/Step Time": 8.424251399934292} +{"Pretrain/Learning Rate": 1.0180979504567261e-05, "Pretrain/Loss": 1.990839958190918, "Pretrain/Loss (Raw)": 1.894029140472412, "Pretrain/Step": 13559, "Pretrain/Step Time": 8.420607233420014} +{"Pretrain/Learning Rate": 1.0177560752582097e-05, "Pretrain/Loss": 1.988700270652771, "Pretrain/Loss (Raw)": 1.7201882600784302, "Pretrain/Step": 13560, "Pretrain/Step Time": 8.418748192489147} +{"Pretrain/Learning Rate": 1.0174142427991514e-05, "Pretrain/Loss": 1.98695969581604, "Pretrain/Loss (Raw)": 1.7749820947647095, "Pretrain/Step": 13561, "Pretrain/Step Time": 8.425077598541975} +{"Pretrain/Learning Rate": 1.017072453089408e-05, "Pretrain/Loss": 1.9882946014404297, "Pretrain/Loss (Raw)": 2.121145486831665, "Pretrain/Step": 13562, "Pretrain/Step Time": 8.422566793859005} +{"Pretrain/Learning Rate": 1.0167307061388353e-05, "Pretrain/Loss": 1.9860992431640625, "Pretrain/Loss (Raw)": 1.7680256366729736, "Pretrain/Step": 13563, "Pretrain/Step Time": 8.42778648622334} +{"Pretrain/Learning Rate": 1.0163890019572867e-05, "Pretrain/Loss": 1.9849234819412231, "Pretrain/Loss (Raw)": 1.8892686367034912, "Pretrain/Step": 13564, "Pretrain/Step Time": 8.427608668804169} +{"Pretrain/Learning Rate": 1.0160473405546166e-05, "Pretrain/Loss": 1.9859445095062256, "Pretrain/Loss (Raw)": 2.06829571723938, "Pretrain/Step": 13565, "Pretrain/Step Time": 8.428738819435239} +{"Pretrain/Learning Rate": 1.015705721940674e-05, "Pretrain/Loss": 1.984548807144165, "Pretrain/Loss (Raw)": 1.8649005889892578, "Pretrain/Step": 13566, "Pretrain/Step Time": 8.430756371468306} +{"Pretrain/Learning Rate": 1.0153641461253114e-05, "Pretrain/Loss": 1.9808852672576904, "Pretrain/Loss (Raw)": 1.9026172161102295, "Pretrain/Step": 13567, "Pretrain/Step Time": 8.430451564490795} +{"Pretrain/Learning Rate": 1.0150226131183768e-05, "Pretrain/Loss": 1.9799716472625732, "Pretrain/Loss (Raw)": 1.820582389831543, "Pretrain/Step": 13568, "Pretrain/Step Time": 8.431094596162438} +{"Pretrain/Learning Rate": 1.0146811229297173e-05, "Pretrain/Loss": 1.980704665184021, "Pretrain/Loss (Raw)": 2.1324715614318848, "Pretrain/Step": 13569, "Pretrain/Step Time": 8.429153697565198} +{"Pretrain/Learning Rate": 1.014339675569182e-05, "Pretrain/Loss": 1.9784375429153442, "Pretrain/Loss (Raw)": 1.8836983442306519, "Pretrain/Step": 13570, "Pretrain/Step Time": 8.429567588493228} +{"Pretrain/Learning Rate": 1.0139982710466134e-05, "Pretrain/Loss": 1.9779729843139648, "Pretrain/Loss (Raw)": 1.9496968984603882, "Pretrain/Step": 13571, "Pretrain/Step Time": 8.434213696047664} +{"Pretrain/Learning Rate": 1.0136569093718582e-05, "Pretrain/Loss": 1.9769694805145264, "Pretrain/Loss (Raw)": 1.671903133392334, "Pretrain/Step": 13572, "Pretrain/Step Time": 8.435478357598186} +{"Pretrain/Learning Rate": 1.013315590554758e-05, "Pretrain/Loss": 1.9769327640533447, "Pretrain/Loss (Raw)": 2.007462501525879, "Pretrain/Step": 13573, "Pretrain/Step Time": 8.436577113345265} +{"Pretrain/Learning Rate": 1.0129743146051543e-05, "Pretrain/Loss": 1.9794385433197021, "Pretrain/Loss (Raw)": 2.151939630508423, "Pretrain/Step": 13574, "Pretrain/Step Time": 8.4332963693887} +{"Pretrain/Learning Rate": 1.0126330815328886e-05, "Pretrain/Loss": 1.97769296169281, "Pretrain/Loss (Raw)": 1.9143160581588745, "Pretrain/Step": 13575, "Pretrain/Step Time": 8.431362811475992} +{"Pretrain/Learning Rate": 1.0122918913477983e-05, "Pretrain/Loss": 1.9781739711761475, "Pretrain/Loss (Raw)": 1.872182846069336, "Pretrain/Step": 13576, "Pretrain/Step Time": 8.43139124661684} +{"Pretrain/Learning Rate": 1.0119507440597236e-05, "Pretrain/Loss": 1.9773893356323242, "Pretrain/Loss (Raw)": 2.075439929962158, "Pretrain/Step": 13577, "Pretrain/Step Time": 8.429532831534743} +{"Pretrain/Learning Rate": 1.0116096396785005e-05, "Pretrain/Loss": 1.9754071235656738, "Pretrain/Loss (Raw)": 1.6854751110076904, "Pretrain/Step": 13578, "Pretrain/Step Time": 8.427032498642802} +{"Pretrain/Learning Rate": 1.011268578213963e-05, "Pretrain/Loss": 1.9756137132644653, "Pretrain/Loss (Raw)": 2.117734909057617, "Pretrain/Step": 13579, "Pretrain/Step Time": 8.42909687384963} +{"Pretrain/Learning Rate": 1.0109275596759473e-05, "Pretrain/Loss": 1.97532057762146, "Pretrain/Loss (Raw)": 1.9737136363983154, "Pretrain/Step": 13580, "Pretrain/Step Time": 8.43090920895338} +{"Pretrain/Learning Rate": 1.010586584074285e-05, "Pretrain/Loss": 1.975463628768921, "Pretrain/Loss (Raw)": 1.976876974105835, "Pretrain/Step": 13581, "Pretrain/Step Time": 8.431751554831862} +{"Pretrain/Learning Rate": 1.0102456514188096e-05, "Pretrain/Loss": 1.9733959436416626, "Pretrain/Loss (Raw)": 1.8043631315231323, "Pretrain/Step": 13582, "Pretrain/Step Time": 8.432929657399654} +{"Pretrain/Learning Rate": 1.0099047617193498e-05, "Pretrain/Loss": 1.9754143953323364, "Pretrain/Loss (Raw)": 2.4155609607696533, "Pretrain/Step": 13583, "Pretrain/Step Time": 8.43249236792326} +{"Pretrain/Learning Rate": 1.0095639149857364e-05, "Pretrain/Loss": 1.9765031337738037, "Pretrain/Loss (Raw)": 2.1439402103424072, "Pretrain/Step": 13584, "Pretrain/Step Time": 8.430256200954318} +{"Pretrain/Learning Rate": 1.0092231112277969e-05, "Pretrain/Loss": 1.9776219129562378, "Pretrain/Loss (Raw)": 2.071347236633301, "Pretrain/Step": 13585, "Pretrain/Step Time": 8.434404365718365} +{"Pretrain/Learning Rate": 1.0088823504553571e-05, "Pretrain/Loss": 1.9795129299163818, "Pretrain/Loss (Raw)": 2.1248743534088135, "Pretrain/Step": 13586, "Pretrain/Step Time": 8.434937624260783} +{"Pretrain/Learning Rate": 1.0085416326782445e-05, "Pretrain/Loss": 1.9816950559616089, "Pretrain/Loss (Raw)": 2.030827283859253, "Pretrain/Step": 13587, "Pretrain/Step Time": 8.437356397509575} +{"Pretrain/Learning Rate": 1.0082009579062818e-05, "Pretrain/Loss": 1.981818675994873, "Pretrain/Loss (Raw)": 2.0463638305664062, "Pretrain/Step": 13588, "Pretrain/Step Time": 8.4341936763376} +{"Pretrain/Learning Rate": 1.0078603261492934e-05, "Pretrain/Loss": 1.9810657501220703, "Pretrain/Loss (Raw)": 1.8113045692443848, "Pretrain/Step": 13589, "Pretrain/Step Time": 8.433467315509915} +{"Pretrain/Learning Rate": 1.0075197374171009e-05, "Pretrain/Loss": 1.982424259185791, "Pretrain/Loss (Raw)": 2.1549746990203857, "Pretrain/Step": 13590, "Pretrain/Step Time": 8.440912257879972} +{"Pretrain/Learning Rate": 1.0071791917195234e-05, "Pretrain/Loss": 1.983220100402832, "Pretrain/Loss (Raw)": 2.07407808303833, "Pretrain/Step": 13591, "Pretrain/Step Time": 8.433551378548145} +{"Pretrain/Learning Rate": 1.0068386890663828e-05, "Pretrain/Loss": 1.9838063716888428, "Pretrain/Loss (Raw)": 1.6925086975097656, "Pretrain/Step": 13592, "Pretrain/Step Time": 8.434430243447423} +{"Pretrain/Learning Rate": 1.006498229467495e-05, "Pretrain/Loss": 1.9814209938049316, "Pretrain/Loss (Raw)": 1.7013976573944092, "Pretrain/Step": 13593, "Pretrain/Step Time": 8.436801001429558} +{"Pretrain/Learning Rate": 1.0061578129326785e-05, "Pretrain/Loss": 1.9794912338256836, "Pretrain/Loss (Raw)": 1.86053466796875, "Pretrain/Step": 13594, "Pretrain/Step Time": 8.438290890306234} +{"Pretrain/Learning Rate": 1.0058174394717487e-05, "Pretrain/Loss": 1.979874610900879, "Pretrain/Loss (Raw)": 1.8730038404464722, "Pretrain/Step": 13595, "Pretrain/Step Time": 8.43977688997984} +{"Pretrain/Learning Rate": 1.0054771090945187e-05, "Pretrain/Loss": 1.9800350666046143, "Pretrain/Loss (Raw)": 1.881477952003479, "Pretrain/Step": 13596, "Pretrain/Step Time": 8.43819079361856} +{"Pretrain/Learning Rate": 1.0051368218108037e-05, "Pretrain/Loss": 1.9795269966125488, "Pretrain/Loss (Raw)": 2.068666458129883, "Pretrain/Step": 13597, "Pretrain/Step Time": 8.439923778176308} +{"Pretrain/Learning Rate": 1.0047965776304136e-05, "Pretrain/Loss": 1.9779689311981201, "Pretrain/Loss (Raw)": 1.83208429813385, "Pretrain/Step": 13598, "Pretrain/Step Time": 8.437358370050788} +{"Pretrain/Learning Rate": 1.004456376563161e-05, "Pretrain/Loss": 1.9776310920715332, "Pretrain/Loss (Raw)": 1.8788214921951294, "Pretrain/Step": 13599, "Pretrain/Step Time": 8.438364716246724} +{"Pretrain/Learning Rate": 1.0041162186188546e-05, "Pretrain/Loss": 1.9804829359054565, "Pretrain/Loss (Raw)": 2.383308172225952, "Pretrain/Step": 13600, "Pretrain/Step Time": 8.439400566741824} +{"Pretrain/Learning Rate": 1.0037761038073015e-05, "Pretrain/Loss": 1.9816086292266846, "Pretrain/Loss (Raw)": 2.142550230026245, "Pretrain/Step": 13601, "Pretrain/Step Time": 8.442507239058614} +{"Pretrain/Learning Rate": 1.0034360321383107e-05, "Pretrain/Loss": 1.9815423488616943, "Pretrain/Loss (Raw)": 1.9989451169967651, "Pretrain/Step": 13602, "Pretrain/Step Time": 8.445706969127059} +{"Pretrain/Learning Rate": 1.003096003621686e-05, "Pretrain/Loss": 1.9843140840530396, "Pretrain/Loss (Raw)": 2.4337360858917236, "Pretrain/Step": 13603, "Pretrain/Step Time": 8.450873950496316} +{"Pretrain/Learning Rate": 1.0027560182672336e-05, "Pretrain/Loss": 1.9851553440093994, "Pretrain/Loss (Raw)": 2.036092758178711, "Pretrain/Step": 13604, "Pretrain/Step Time": 8.445684475824237} +{"Pretrain/Learning Rate": 1.0024160760847559e-05, "Pretrain/Loss": 1.9834579229354858, "Pretrain/Loss (Raw)": 1.823664665222168, "Pretrain/Step": 13605, "Pretrain/Step Time": 8.448381377384067} +{"Pretrain/Learning Rate": 1.0020761770840542e-05, "Pretrain/Loss": 1.980046272277832, "Pretrain/Loss (Raw)": 2.001279830932617, "Pretrain/Step": 13606, "Pretrain/Step Time": 8.451756915077567} +{"Pretrain/Learning Rate": 1.0017363212749306e-05, "Pretrain/Loss": 1.9835991859436035, "Pretrain/Loss (Raw)": 2.193446397781372, "Pretrain/Step": 13607, "Pretrain/Step Time": 8.447007162496448} +{"Pretrain/Learning Rate": 1.0013965086671833e-05, "Pretrain/Loss": 1.9795728921890259, "Pretrain/Loss (Raw)": 1.8054304122924805, "Pretrain/Step": 13608, "Pretrain/Step Time": 8.446410495787859} +{"Pretrain/Learning Rate": 1.001056739270612e-05, "Pretrain/Loss": 1.978559136390686, "Pretrain/Loss (Raw)": 1.8311710357666016, "Pretrain/Step": 13609, "Pretrain/Step Time": 8.441349737346172} +{"Pretrain/Learning Rate": 1.000717013095013e-05, "Pretrain/Loss": 1.9826087951660156, "Pretrain/Loss (Raw)": 2.0940849781036377, "Pretrain/Step": 13610, "Pretrain/Step Time": 8.442484050989151} +{"Pretrain/Learning Rate": 1.0003773301501811e-05, "Pretrain/Loss": 1.9845714569091797, "Pretrain/Loss (Raw)": 2.230137825012207, "Pretrain/Step": 13611, "Pretrain/Step Time": 8.449016382917762} +{"Pretrain/Learning Rate": 1.0000376904459128e-05, "Pretrain/Loss": 1.9843231439590454, "Pretrain/Loss (Raw)": 2.0065345764160156, "Pretrain/Step": 13612, "Pretrain/Step Time": 8.450283918529749} +{"Pretrain/Learning Rate": 9.99698093991999e-06, "Pretrain/Loss": 1.9842126369476318, "Pretrain/Loss (Raw)": 2.0342283248901367, "Pretrain/Step": 13613, "Pretrain/Step Time": 8.44906173273921} +{"Pretrain/Learning Rate": 9.993585407982343e-06, "Pretrain/Loss": 1.9864816665649414, "Pretrain/Loss (Raw)": 2.1247050762176514, "Pretrain/Step": 13614, "Pretrain/Step Time": 8.444940211251378} +{"Pretrain/Learning Rate": 9.990190308744079e-06, "Pretrain/Loss": 1.986588954925537, "Pretrain/Loss (Raw)": 1.8823362588882446, "Pretrain/Step": 13615, "Pretrain/Step Time": 8.446366786956787} +{"Pretrain/Learning Rate": 9.986795642303087e-06, "Pretrain/Loss": 1.985541820526123, "Pretrain/Loss (Raw)": 1.9934457540512085, "Pretrain/Step": 13616, "Pretrain/Step Time": 8.445812284946442} +{"Pretrain/Learning Rate": 9.98340140875727e-06, "Pretrain/Loss": 1.9864695072174072, "Pretrain/Loss (Raw)": 2.025735378265381, "Pretrain/Step": 13617, "Pretrain/Step Time": 8.450448213145137} +{"Pretrain/Learning Rate": 9.980007608204478e-06, "Pretrain/Loss": 1.9841749668121338, "Pretrain/Loss (Raw)": 1.9790453910827637, "Pretrain/Step": 13618, "Pretrain/Step Time": 8.44785919599235} +{"Pretrain/Learning Rate": 9.976614240742588e-06, "Pretrain/Loss": 1.984440803527832, "Pretrain/Loss (Raw)": 2.042208671569824, "Pretrain/Step": 13619, "Pretrain/Step Time": 8.449956305325031} +{"Pretrain/Learning Rate": 9.973221306469433e-06, "Pretrain/Loss": 1.9847328662872314, "Pretrain/Loss (Raw)": 2.1831400394439697, "Pretrain/Step": 13620, "Pretrain/Step Time": 8.447757434099913} +{"Pretrain/Learning Rate": 9.969828805482843e-06, "Pretrain/Loss": 1.9835467338562012, "Pretrain/Loss (Raw)": 1.7137949466705322, "Pretrain/Step": 13621, "Pretrain/Step Time": 8.445728370919824} +{"Pretrain/Learning Rate": 9.96643673788065e-06, "Pretrain/Loss": 1.9853379726409912, "Pretrain/Loss (Raw)": 2.0597219467163086, "Pretrain/Step": 13622, "Pretrain/Step Time": 8.444668598473072} +{"Pretrain/Learning Rate": 9.963045103760646e-06, "Pretrain/Loss": 1.9839967489242554, "Pretrain/Loss (Raw)": 1.9450641870498657, "Pretrain/Step": 13623, "Pretrain/Step Time": 8.446982340887189} +{"Pretrain/Learning Rate": 9.959653903220648e-06, "Pretrain/Loss": 1.9831838607788086, "Pretrain/Loss (Raw)": 1.9064512252807617, "Pretrain/Step": 13624, "Pretrain/Step Time": 8.44792728498578} +{"Pretrain/Learning Rate": 9.956263136358424e-06, "Pretrain/Loss": 1.9840878248214722, "Pretrain/Loss (Raw)": 2.170518159866333, "Pretrain/Step": 13625, "Pretrain/Step Time": 8.448442528024316} +{"Pretrain/Learning Rate": 9.95287280327174e-06, "Pretrain/Loss": 1.9856370687484741, "Pretrain/Loss (Raw)": 2.2236974239349365, "Pretrain/Step": 13626, "Pretrain/Step Time": 8.4439617972821} +{"Pretrain/Learning Rate": 9.94948290405837e-06, "Pretrain/Loss": 1.9844894409179688, "Pretrain/Loss (Raw)": 1.8272029161453247, "Pretrain/Step": 13627, "Pretrain/Step Time": 8.447175145149231} +{"Pretrain/Learning Rate": 9.946093438816042e-06, "Pretrain/Loss": 1.9848953485488892, "Pretrain/Loss (Raw)": 1.9083278179168701, "Pretrain/Step": 13628, "Pretrain/Step Time": 8.448556300252676} +{"Pretrain/Learning Rate": 9.942704407642505e-06, "Pretrain/Loss": 1.9858605861663818, "Pretrain/Loss (Raw)": 2.0427935123443604, "Pretrain/Step": 13629, "Pretrain/Step Time": 8.453817589208484} +{"Pretrain/Learning Rate": 9.939315810635475e-06, "Pretrain/Loss": 1.9834996461868286, "Pretrain/Loss (Raw)": 1.7211202383041382, "Pretrain/Step": 13630, "Pretrain/Step Time": 8.45402348972857} +{"Pretrain/Learning Rate": 9.935927647892643e-06, "Pretrain/Loss": 1.9845201969146729, "Pretrain/Loss (Raw)": 2.0127532482147217, "Pretrain/Step": 13631, "Pretrain/Step Time": 8.455464197322726} +{"Pretrain/Learning Rate": 9.932539919511729e-06, "Pretrain/Loss": 1.9854317903518677, "Pretrain/Loss (Raw)": 2.039881944656372, "Pretrain/Step": 13632, "Pretrain/Step Time": 8.454745704308152} +{"Pretrain/Learning Rate": 9.929152625590397e-06, "Pretrain/Loss": 1.9861174821853638, "Pretrain/Loss (Raw)": 2.197622776031494, "Pretrain/Step": 13633, "Pretrain/Step Time": 8.458476919680834} +{"Pretrain/Learning Rate": 9.925765766226333e-06, "Pretrain/Loss": 1.98724365234375, "Pretrain/Loss (Raw)": 1.9572466611862183, "Pretrain/Step": 13634, "Pretrain/Step Time": 8.453343255445361} +{"Pretrain/Learning Rate": 9.922379341517185e-06, "Pretrain/Loss": 1.9871464967727661, "Pretrain/Loss (Raw)": 1.9460023641586304, "Pretrain/Step": 13635, "Pretrain/Step Time": 8.453626310452819} +{"Pretrain/Learning Rate": 9.91899335156059e-06, "Pretrain/Loss": 1.9875380992889404, "Pretrain/Loss (Raw)": 2.0679826736450195, "Pretrain/Step": 13636, "Pretrain/Step Time": 8.45621226914227} +{"Pretrain/Learning Rate": 9.915607796454202e-06, "Pretrain/Loss": 1.9883956909179688, "Pretrain/Loss (Raw)": 2.02809476852417, "Pretrain/Step": 13637, "Pretrain/Step Time": 8.454733872786164} +{"Pretrain/Learning Rate": 9.912222676295618e-06, "Pretrain/Loss": 1.9878160953521729, "Pretrain/Loss (Raw)": 2.056051731109619, "Pretrain/Step": 13638, "Pretrain/Step Time": 8.45708217099309} +{"Pretrain/Learning Rate": 9.908837991182468e-06, "Pretrain/Loss": 1.9858603477478027, "Pretrain/Loss (Raw)": 1.7425323724746704, "Pretrain/Step": 13639, "Pretrain/Step Time": 8.456200892105699} +{"Pretrain/Learning Rate": 9.905453741212337e-06, "Pretrain/Loss": 1.9878495931625366, "Pretrain/Loss (Raw)": 1.996259093284607, "Pretrain/Step": 13640, "Pretrain/Step Time": 8.456197144463658} +{"Pretrain/Learning Rate": 9.902069926482793e-06, "Pretrain/Loss": 1.9845417737960815, "Pretrain/Loss (Raw)": 1.822859525680542, "Pretrain/Step": 13641, "Pretrain/Step Time": 8.453612484037876} +{"Pretrain/Learning Rate": 9.898686547091432e-06, "Pretrain/Loss": 1.9838924407958984, "Pretrain/Loss (Raw)": 1.8922816514968872, "Pretrain/Step": 13642, "Pretrain/Step Time": 8.456534646451473} +{"Pretrain/Learning Rate": 9.895303603135788e-06, "Pretrain/Loss": 1.9865195751190186, "Pretrain/Loss (Raw)": 2.2435028553009033, "Pretrain/Step": 13643, "Pretrain/Step Time": 8.453667379915714} +{"Pretrain/Learning Rate": 9.891921094713427e-06, "Pretrain/Loss": 1.984609842300415, "Pretrain/Loss (Raw)": 1.9522275924682617, "Pretrain/Step": 13644, "Pretrain/Step Time": 8.451920665800571} +{"Pretrain/Learning Rate": 9.888539021921869e-06, "Pretrain/Loss": 1.9849441051483154, "Pretrain/Loss (Raw)": 2.0479562282562256, "Pretrain/Step": 13645, "Pretrain/Step Time": 8.453204629942775} +{"Pretrain/Learning Rate": 9.885157384858629e-06, "Pretrain/Loss": 1.9861207008361816, "Pretrain/Loss (Raw)": 2.0104494094848633, "Pretrain/Step": 13646, "Pretrain/Step Time": 8.45033579878509} +{"Pretrain/Learning Rate": 9.881776183621227e-06, "Pretrain/Loss": 1.9853055477142334, "Pretrain/Loss (Raw)": 1.7955131530761719, "Pretrain/Step": 13647, "Pretrain/Step Time": 8.454579010605812} +{"Pretrain/Learning Rate": 9.878395418307143e-06, "Pretrain/Loss": 1.9867162704467773, "Pretrain/Loss (Raw)": 2.102229356765747, "Pretrain/Step": 13648, "Pretrain/Step Time": 8.455383824184537} +{"Pretrain/Learning Rate": 9.875015089013883e-06, "Pretrain/Loss": 1.9875754117965698, "Pretrain/Loss (Raw)": 2.1976797580718994, "Pretrain/Step": 13649, "Pretrain/Step Time": 8.456077445298433} +{"Pretrain/Learning Rate": 9.871635195838886e-06, "Pretrain/Loss": 1.9881888628005981, "Pretrain/Loss (Raw)": 1.9935907125473022, "Pretrain/Step": 13650, "Pretrain/Step Time": 8.453031620010734} +{"Pretrain/Learning Rate": 9.86825573887963e-06, "Pretrain/Loss": 1.9888267517089844, "Pretrain/Loss (Raw)": 1.9718308448791504, "Pretrain/Step": 13651, "Pretrain/Step Time": 8.454484198242426} +{"Pretrain/Learning Rate": 9.864876718233546e-06, "Pretrain/Loss": 1.9884341955184937, "Pretrain/Loss (Raw)": 1.9744150638580322, "Pretrain/Step": 13652, "Pretrain/Step Time": 8.451705746352673} +{"Pretrain/Learning Rate": 9.86149813399808e-06, "Pretrain/Loss": 1.9892678260803223, "Pretrain/Loss (Raw)": 2.1890830993652344, "Pretrain/Step": 13653, "Pretrain/Step Time": 8.450453206896782} +{"Pretrain/Learning Rate": 9.858119986270642e-06, "Pretrain/Loss": 1.9895904064178467, "Pretrain/Loss (Raw)": 1.970503807067871, "Pretrain/Step": 13654, "Pretrain/Step Time": 8.445121554657817} +{"Pretrain/Learning Rate": 9.854742275148631e-06, "Pretrain/Loss": 1.9872751235961914, "Pretrain/Loss (Raw)": 1.838683843612671, "Pretrain/Step": 13655, "Pretrain/Step Time": 8.445845184847713} +{"Pretrain/Learning Rate": 9.85136500072946e-06, "Pretrain/Loss": 1.9840233325958252, "Pretrain/Loss (Raw)": 2.015001058578491, "Pretrain/Step": 13656, "Pretrain/Step Time": 8.446364698931575} +{"Pretrain/Learning Rate": 9.847988163110492e-06, "Pretrain/Loss": 1.98282790184021, "Pretrain/Loss (Raw)": 1.835302472114563, "Pretrain/Step": 13657, "Pretrain/Step Time": 8.442704575136304} +{"Pretrain/Learning Rate": 9.844611762389112e-06, "Pretrain/Loss": 1.981846570968628, "Pretrain/Loss (Raw)": 1.817650318145752, "Pretrain/Step": 13658, "Pretrain/Step Time": 8.441213488578796} +{"Pretrain/Learning Rate": 9.841235798662666e-06, "Pretrain/Loss": 1.9783048629760742, "Pretrain/Loss (Raw)": 1.9322376251220703, "Pretrain/Step": 13659, "Pretrain/Step Time": 8.445319222286344} +{"Pretrain/Learning Rate": 9.837860272028494e-06, "Pretrain/Loss": 1.979503870010376, "Pretrain/Loss (Raw)": 2.236513376235962, "Pretrain/Step": 13660, "Pretrain/Step Time": 8.450811807066202} +{"Pretrain/Learning Rate": 9.834485182583938e-06, "Pretrain/Loss": 1.9790223836898804, "Pretrain/Loss (Raw)": 1.8556371927261353, "Pretrain/Step": 13661, "Pretrain/Step Time": 8.445969700813293} +{"Pretrain/Learning Rate": 9.831110530426301e-06, "Pretrain/Loss": 1.9809229373931885, "Pretrain/Loss (Raw)": 2.092834949493408, "Pretrain/Step": 13662, "Pretrain/Step Time": 8.447439504787326} +{"Pretrain/Learning Rate": 9.82773631565291e-06, "Pretrain/Loss": 1.9796161651611328, "Pretrain/Loss (Raw)": 1.8875032663345337, "Pretrain/Step": 13663, "Pretrain/Step Time": 8.44753791578114} +{"Pretrain/Learning Rate": 9.824362538361048e-06, "Pretrain/Loss": 1.981541395187378, "Pretrain/Loss (Raw)": 2.0524561405181885, "Pretrain/Step": 13664, "Pretrain/Step Time": 8.449984120205045} +{"Pretrain/Learning Rate": 9.820989198647984e-06, "Pretrain/Loss": 1.979032039642334, "Pretrain/Loss (Raw)": 1.7562999725341797, "Pretrain/Step": 13665, "Pretrain/Step Time": 8.447311898693442} +{"Pretrain/Learning Rate": 9.817616296611003e-06, "Pretrain/Loss": 1.9766688346862793, "Pretrain/Loss (Raw)": 1.9398256540298462, "Pretrain/Step": 13666, "Pretrain/Step Time": 8.446140192449093} +{"Pretrain/Learning Rate": 9.814243832347347e-06, "Pretrain/Loss": 1.9788936376571655, "Pretrain/Loss (Raw)": 2.09709095954895, "Pretrain/Step": 13667, "Pretrain/Step Time": 8.455446779727936} +{"Pretrain/Learning Rate": 9.810871805954272e-06, "Pretrain/Loss": 1.979109287261963, "Pretrain/Loss (Raw)": 2.0818724632263184, "Pretrain/Step": 13668, "Pretrain/Step Time": 8.454681072384119} +{"Pretrain/Learning Rate": 9.807500217529e-06, "Pretrain/Loss": 1.9791210889816284, "Pretrain/Loss (Raw)": 2.033374547958374, "Pretrain/Step": 13669, "Pretrain/Step Time": 8.45496429130435} +{"Pretrain/Learning Rate": 9.804129067168743e-06, "Pretrain/Loss": 1.978053331375122, "Pretrain/Loss (Raw)": 1.904762625694275, "Pretrain/Step": 13670, "Pretrain/Step Time": 8.451618203893304} +{"Pretrain/Learning Rate": 9.800758354970722e-06, "Pretrain/Loss": 1.9762978553771973, "Pretrain/Loss (Raw)": 1.859302282333374, "Pretrain/Step": 13671, "Pretrain/Step Time": 8.455134004354477} +{"Pretrain/Learning Rate": 9.797388081032106e-06, "Pretrain/Loss": 1.9756919145584106, "Pretrain/Loss (Raw)": 2.022223711013794, "Pretrain/Step": 13672, "Pretrain/Step Time": 8.449794873595238} +{"Pretrain/Learning Rate": 9.794018245450098e-06, "Pretrain/Loss": 1.9765547513961792, "Pretrain/Loss (Raw)": 2.0656869411468506, "Pretrain/Step": 13673, "Pretrain/Step Time": 8.453310053795576} +{"Pretrain/Learning Rate": 9.790648848321854e-06, "Pretrain/Loss": 1.9765326976776123, "Pretrain/Loss (Raw)": 1.96119225025177, "Pretrain/Step": 13674, "Pretrain/Step Time": 8.449618354439735} +{"Pretrain/Learning Rate": 9.787279889744519e-06, "Pretrain/Loss": 1.977225661277771, "Pretrain/Loss (Raw)": 2.1336874961853027, "Pretrain/Step": 13675, "Pretrain/Step Time": 8.45358451642096} +{"Pretrain/Learning Rate": 9.783911369815255e-06, "Pretrain/Loss": 1.978266716003418, "Pretrain/Loss (Raw)": 2.131784200668335, "Pretrain/Step": 13676, "Pretrain/Step Time": 8.453086072579026} +{"Pretrain/Learning Rate": 9.780543288631173e-06, "Pretrain/Loss": 1.9807400703430176, "Pretrain/Loss (Raw)": 2.1213009357452393, "Pretrain/Step": 13677, "Pretrain/Step Time": 8.455187914893031} +{"Pretrain/Learning Rate": 9.7771756462894e-06, "Pretrain/Loss": 1.9843264818191528, "Pretrain/Loss (Raw)": 2.042732000350952, "Pretrain/Step": 13678, "Pretrain/Step Time": 8.450928289443254} +{"Pretrain/Learning Rate": 9.77380844288704e-06, "Pretrain/Loss": 1.9828205108642578, "Pretrain/Loss (Raw)": 1.823345422744751, "Pretrain/Step": 13679, "Pretrain/Step Time": 8.454690340906382} +{"Pretrain/Learning Rate": 9.770441678521166e-06, "Pretrain/Loss": 1.9836691617965698, "Pretrain/Loss (Raw)": 1.6937364339828491, "Pretrain/Step": 13680, "Pretrain/Step Time": 8.457450717687607} +{"Pretrain/Learning Rate": 9.767075353288886e-06, "Pretrain/Loss": 1.985162377357483, "Pretrain/Loss (Raw)": 2.0127789974212646, "Pretrain/Step": 13681, "Pretrain/Step Time": 8.459134940057993} +{"Pretrain/Learning Rate": 9.763709467287236e-06, "Pretrain/Loss": 1.9838143587112427, "Pretrain/Loss (Raw)": 2.073362112045288, "Pretrain/Step": 13682, "Pretrain/Step Time": 8.457900062203407} +{"Pretrain/Learning Rate": 9.760344020613291e-06, "Pretrain/Loss": 1.9827369451522827, "Pretrain/Loss (Raw)": 1.7414734363555908, "Pretrain/Step": 13683, "Pretrain/Step Time": 8.46087385341525} +{"Pretrain/Learning Rate": 9.756979013364083e-06, "Pretrain/Loss": 1.9841009378433228, "Pretrain/Loss (Raw)": 2.1603667736053467, "Pretrain/Step": 13684, "Pretrain/Step Time": 8.458893336355686} +{"Pretrain/Learning Rate": 9.753614445636633e-06, "Pretrain/Loss": 1.98106050491333, "Pretrain/Loss (Raw)": 1.730078101158142, "Pretrain/Step": 13685, "Pretrain/Step Time": 8.461060719564557} +{"Pretrain/Learning Rate": 9.75025031752797e-06, "Pretrain/Loss": 1.9816975593566895, "Pretrain/Loss (Raw)": 2.0316519737243652, "Pretrain/Step": 13686, "Pretrain/Step Time": 8.458762634545565} +{"Pretrain/Learning Rate": 9.746886629135082e-06, "Pretrain/Loss": 1.985689401626587, "Pretrain/Loss (Raw)": 2.404977798461914, "Pretrain/Step": 13687, "Pretrain/Step Time": 8.459285639226437} +{"Pretrain/Learning Rate": 9.743523380554973e-06, "Pretrain/Loss": 1.98589026927948, "Pretrain/Loss (Raw)": 1.745901107788086, "Pretrain/Step": 13688, "Pretrain/Step Time": 8.460876500234008} +{"Pretrain/Learning Rate": 9.74016057188461e-06, "Pretrain/Loss": 1.9869962930679321, "Pretrain/Loss (Raw)": 1.9165419340133667, "Pretrain/Step": 13689, "Pretrain/Step Time": 8.458020942285657} +{"Pretrain/Learning Rate": 9.736798203220954e-06, "Pretrain/Loss": 1.9878485202789307, "Pretrain/Loss (Raw)": 2.2302486896514893, "Pretrain/Step": 13690, "Pretrain/Step Time": 8.45837670378387} +{"Pretrain/Learning Rate": 9.733436274660968e-06, "Pretrain/Loss": 1.9901326894760132, "Pretrain/Loss (Raw)": 2.060391426086426, "Pretrain/Step": 13691, "Pretrain/Step Time": 8.457652302458882} +{"Pretrain/Learning Rate": 9.730074786301577e-06, "Pretrain/Loss": 1.9909816980361938, "Pretrain/Loss (Raw)": 1.9979441165924072, "Pretrain/Step": 13692, "Pretrain/Step Time": 8.456459622830153} +{"Pretrain/Learning Rate": 9.726713738239724e-06, "Pretrain/Loss": 1.9893019199371338, "Pretrain/Loss (Raw)": 1.853285312652588, "Pretrain/Step": 13693, "Pretrain/Step Time": 8.459212807938457} +{"Pretrain/Learning Rate": 9.723353130572313e-06, "Pretrain/Loss": 1.9903066158294678, "Pretrain/Loss (Raw)": 1.9934883117675781, "Pretrain/Step": 13694, "Pretrain/Step Time": 8.457692634314299} +{"Pretrain/Learning Rate": 9.719992963396238e-06, "Pretrain/Loss": 1.9905240535736084, "Pretrain/Loss (Raw)": 1.9304643869400024, "Pretrain/Step": 13695, "Pretrain/Step Time": 8.45813999697566} +{"Pretrain/Learning Rate": 9.7166332368084e-06, "Pretrain/Loss": 1.9889416694641113, "Pretrain/Loss (Raw)": 1.6180309057235718, "Pretrain/Step": 13696, "Pretrain/Step Time": 8.457525536417961} +{"Pretrain/Learning Rate": 9.71327395090566e-06, "Pretrain/Loss": 1.9890400171279907, "Pretrain/Loss (Raw)": 2.1450557708740234, "Pretrain/Step": 13697, "Pretrain/Step Time": 8.458855528384447} +{"Pretrain/Learning Rate": 9.7099151057849e-06, "Pretrain/Loss": 1.9901717901229858, "Pretrain/Loss (Raw)": 2.028568983078003, "Pretrain/Step": 13698, "Pretrain/Step Time": 8.45672595500946} +{"Pretrain/Learning Rate": 9.706556701542959e-06, "Pretrain/Loss": 1.989797830581665, "Pretrain/Loss (Raw)": 1.9018386602401733, "Pretrain/Step": 13699, "Pretrain/Step Time": 8.458769807592034} +{"Pretrain/Learning Rate": 9.703198738276665e-06, "Pretrain/Loss": 1.9923501014709473, "Pretrain/Loss (Raw)": 1.998597264289856, "Pretrain/Step": 13700, "Pretrain/Step Time": 8.458395222201943} +{"Pretrain/Learning Rate": 9.69984121608286e-06, "Pretrain/Loss": 1.993920087814331, "Pretrain/Loss (Raw)": 2.208409309387207, "Pretrain/Step": 13701, "Pretrain/Step Time": 8.456653891131282} +{"Pretrain/Learning Rate": 9.69648413505834e-06, "Pretrain/Loss": 1.9924285411834717, "Pretrain/Loss (Raw)": 1.9610035419464111, "Pretrain/Step": 13702, "Pretrain/Step Time": 8.455583920702338} +{"Pretrain/Learning Rate": 9.69312749529992e-06, "Pretrain/Loss": 1.9938896894454956, "Pretrain/Loss (Raw)": 2.101374626159668, "Pretrain/Step": 13703, "Pretrain/Step Time": 8.458409536629915} +{"Pretrain/Learning Rate": 9.68977129690438e-06, "Pretrain/Loss": 1.994267225265503, "Pretrain/Loss (Raw)": 1.9204927682876587, "Pretrain/Step": 13704, "Pretrain/Step Time": 8.455925116315484} +{"Pretrain/Learning Rate": 9.68641553996848e-06, "Pretrain/Loss": 1.9911766052246094, "Pretrain/Loss (Raw)": 1.6798346042633057, "Pretrain/Step": 13705, "Pretrain/Step Time": 8.461842896416783} +{"Pretrain/Learning Rate": 9.683060224589e-06, "Pretrain/Loss": 1.9890952110290527, "Pretrain/Loss (Raw)": 1.4190667867660522, "Pretrain/Step": 13706, "Pretrain/Step Time": 8.460879186168313} +{"Pretrain/Learning Rate": 9.679705350862675e-06, "Pretrain/Loss": 1.9880409240722656, "Pretrain/Loss (Raw)": 1.982795000076294, "Pretrain/Step": 13707, "Pretrain/Step Time": 8.460223361849785} +{"Pretrain/Learning Rate": 9.676350918886253e-06, "Pretrain/Loss": 1.9870774745941162, "Pretrain/Loss (Raw)": 1.8503828048706055, "Pretrain/Step": 13708, "Pretrain/Step Time": 8.460776237770915} +{"Pretrain/Learning Rate": 9.67299692875645e-06, "Pretrain/Loss": 1.9907739162445068, "Pretrain/Loss (Raw)": 2.4500274658203125, "Pretrain/Step": 13709, "Pretrain/Step Time": 8.456201633438468} +{"Pretrain/Learning Rate": 9.669643380569971e-06, "Pretrain/Loss": 1.9928486347198486, "Pretrain/Loss (Raw)": 2.069899320602417, "Pretrain/Step": 13710, "Pretrain/Step Time": 8.459438417106867} +{"Pretrain/Learning Rate": 9.666290274423523e-06, "Pretrain/Loss": 1.9900288581848145, "Pretrain/Loss (Raw)": 2.0546600818634033, "Pretrain/Step": 13711, "Pretrain/Step Time": 8.460041716694832} +{"Pretrain/Learning Rate": 9.662937610413775e-06, "Pretrain/Loss": 1.988333821296692, "Pretrain/Loss (Raw)": 1.926960825920105, "Pretrain/Step": 13712, "Pretrain/Step Time": 8.456539215520024} +{"Pretrain/Learning Rate": 9.65958538863742e-06, "Pretrain/Loss": 1.9883993864059448, "Pretrain/Loss (Raw)": 2.079740047454834, "Pretrain/Step": 13713, "Pretrain/Step Time": 8.455563005059958} +{"Pretrain/Learning Rate": 9.656233609191106e-06, "Pretrain/Loss": 1.9884014129638672, "Pretrain/Loss (Raw)": 2.125136375427246, "Pretrain/Step": 13714, "Pretrain/Step Time": 8.454329648986459} +{"Pretrain/Learning Rate": 9.65288227217147e-06, "Pretrain/Loss": 1.9886698722839355, "Pretrain/Loss (Raw)": 2.065185308456421, "Pretrain/Step": 13715, "Pretrain/Step Time": 8.456051014363766} +{"Pretrain/Learning Rate": 9.649531377675164e-06, "Pretrain/Loss": 1.9875624179840088, "Pretrain/Loss (Raw)": 1.9046183824539185, "Pretrain/Step": 13716, "Pretrain/Step Time": 8.454326417297125} +{"Pretrain/Learning Rate": 9.646180925798793e-06, "Pretrain/Loss": 1.9879993200302124, "Pretrain/Loss (Raw)": 1.8672212362289429, "Pretrain/Step": 13717, "Pretrain/Step Time": 8.458519320935011} +{"Pretrain/Learning Rate": 9.642830916638976e-06, "Pretrain/Loss": 1.9871481657028198, "Pretrain/Loss (Raw)": 2.0460205078125, "Pretrain/Step": 13718, "Pretrain/Step Time": 8.451349155977368} +{"Pretrain/Learning Rate": 9.639481350292296e-06, "Pretrain/Loss": 1.986404538154602, "Pretrain/Loss (Raw)": 1.978910207748413, "Pretrain/Step": 13719, "Pretrain/Step Time": 8.457612128928304} +{"Pretrain/Learning Rate": 9.636132226855352e-06, "Pretrain/Loss": 1.9891376495361328, "Pretrain/Loss (Raw)": 2.0423426628112793, "Pretrain/Step": 13720, "Pretrain/Step Time": 8.461366783827543} +{"Pretrain/Learning Rate": 9.632783546424704e-06, "Pretrain/Loss": 1.9911385774612427, "Pretrain/Loss (Raw)": 1.9575121402740479, "Pretrain/Step": 13721, "Pretrain/Step Time": 8.459170749410987} +{"Pretrain/Learning Rate": 9.629435309096899e-06, "Pretrain/Loss": 1.9935270547866821, "Pretrain/Loss (Raw)": 2.1662607192993164, "Pretrain/Step": 13722, "Pretrain/Step Time": 8.456417521461844} +{"Pretrain/Learning Rate": 9.626087514968502e-06, "Pretrain/Loss": 1.9955717325210571, "Pretrain/Loss (Raw)": 2.1347203254699707, "Pretrain/Step": 13723, "Pretrain/Step Time": 8.453365698456764} +{"Pretrain/Learning Rate": 9.622740164136027e-06, "Pretrain/Loss": 1.994518518447876, "Pretrain/Loss (Raw)": 1.7466793060302734, "Pretrain/Step": 13724, "Pretrain/Step Time": 8.456141084432602} +{"Pretrain/Learning Rate": 9.619393256696005e-06, "Pretrain/Loss": 1.9929935932159424, "Pretrain/Loss (Raw)": 1.873469352722168, "Pretrain/Step": 13725, "Pretrain/Step Time": 8.454472191631794} +{"Pretrain/Learning Rate": 9.616046792744934e-06, "Pretrain/Loss": 1.9943978786468506, "Pretrain/Loss (Raw)": 2.0118203163146973, "Pretrain/Step": 13726, "Pretrain/Step Time": 8.459809834137559} +{"Pretrain/Learning Rate": 9.612700772379304e-06, "Pretrain/Loss": 1.9963159561157227, "Pretrain/Loss (Raw)": 2.1243433952331543, "Pretrain/Step": 13727, "Pretrain/Step Time": 8.460482535883784} +{"Pretrain/Learning Rate": 9.609355195695604e-06, "Pretrain/Loss": 1.9920488595962524, "Pretrain/Loss (Raw)": 1.8371151685714722, "Pretrain/Step": 13728, "Pretrain/Step Time": 8.459679190069437} +{"Pretrain/Learning Rate": 9.606010062790293e-06, "Pretrain/Loss": 1.9887735843658447, "Pretrain/Loss (Raw)": 1.7233220338821411, "Pretrain/Step": 13729, "Pretrain/Step Time": 8.458793932572007} +{"Pretrain/Learning Rate": 9.602665373759837e-06, "Pretrain/Loss": 1.9873771667480469, "Pretrain/Loss (Raw)": 1.8202052116394043, "Pretrain/Step": 13730, "Pretrain/Step Time": 8.45570683479309} +{"Pretrain/Learning Rate": 9.59932112870067e-06, "Pretrain/Loss": 1.9841930866241455, "Pretrain/Loss (Raw)": 2.0261714458465576, "Pretrain/Step": 13731, "Pretrain/Step Time": 8.451402354985476} +{"Pretrain/Learning Rate": 9.595977327709214e-06, "Pretrain/Loss": 1.9827165603637695, "Pretrain/Loss (Raw)": 1.8470927476882935, "Pretrain/Step": 13732, "Pretrain/Step Time": 8.458527697250247} +{"Pretrain/Learning Rate": 9.59263397088191e-06, "Pretrain/Loss": 1.9810724258422852, "Pretrain/Loss (Raw)": 1.6132183074951172, "Pretrain/Step": 13733, "Pretrain/Step Time": 8.453860960900784} +{"Pretrain/Learning Rate": 9.589291058315125e-06, "Pretrain/Loss": 1.981010913848877, "Pretrain/Loss (Raw)": 1.9934196472167969, "Pretrain/Step": 13734, "Pretrain/Step Time": 8.452717676758766} +{"Pretrain/Learning Rate": 9.585948590105278e-06, "Pretrain/Loss": 1.9822139739990234, "Pretrain/Loss (Raw)": 2.3474297523498535, "Pretrain/Step": 13735, "Pretrain/Step Time": 8.456121265888214} +{"Pretrain/Learning Rate": 9.58260656634873e-06, "Pretrain/Loss": 1.9837496280670166, "Pretrain/Loss (Raw)": 2.0019822120666504, "Pretrain/Step": 13736, "Pretrain/Step Time": 8.456686833873391} +{"Pretrain/Learning Rate": 9.57926498714186e-06, "Pretrain/Loss": 1.9853143692016602, "Pretrain/Loss (Raw)": 2.0314760208129883, "Pretrain/Step": 13737, "Pretrain/Step Time": 8.45551778562367} +{"Pretrain/Learning Rate": 9.575923852581012e-06, "Pretrain/Loss": 1.9846138954162598, "Pretrain/Loss (Raw)": 2.0044238567352295, "Pretrain/Step": 13738, "Pretrain/Step Time": 8.45668501406908} +{"Pretrain/Learning Rate": 9.57258316276252e-06, "Pretrain/Loss": 1.9834659099578857, "Pretrain/Loss (Raw)": 2.0831782817840576, "Pretrain/Step": 13739, "Pretrain/Step Time": 8.451551366597414} +{"Pretrain/Learning Rate": 9.569242917782726e-06, "Pretrain/Loss": 1.9814355373382568, "Pretrain/Loss (Raw)": 1.7466707229614258, "Pretrain/Step": 13740, "Pretrain/Step Time": 8.451343432068825} +{"Pretrain/Learning Rate": 9.565903117737923e-06, "Pretrain/Loss": 1.9774143695831299, "Pretrain/Loss (Raw)": 1.5195080041885376, "Pretrain/Step": 13741, "Pretrain/Step Time": 8.453533440828323} +{"Pretrain/Learning Rate": 9.562563762724434e-06, "Pretrain/Loss": 1.9755648374557495, "Pretrain/Loss (Raw)": 1.8879674673080444, "Pretrain/Step": 13742, "Pretrain/Step Time": 8.452604474499822} +{"Pretrain/Learning Rate": 9.559224852838535e-06, "Pretrain/Loss": 1.976873517036438, "Pretrain/Loss (Raw)": 2.0498385429382324, "Pretrain/Step": 13743, "Pretrain/Step Time": 8.457199219614267} +{"Pretrain/Learning Rate": 9.555886388176497e-06, "Pretrain/Loss": 1.9780309200286865, "Pretrain/Loss (Raw)": 2.1415977478027344, "Pretrain/Step": 13744, "Pretrain/Step Time": 8.459386250004172} +{"Pretrain/Learning Rate": 9.552548368834593e-06, "Pretrain/Loss": 1.9782191514968872, "Pretrain/Loss (Raw)": 2.049823522567749, "Pretrain/Step": 13745, "Pretrain/Step Time": 8.456240398809314} +{"Pretrain/Learning Rate": 9.549210794909058e-06, "Pretrain/Loss": 1.976710319519043, "Pretrain/Loss (Raw)": 1.785926103591919, "Pretrain/Step": 13746, "Pretrain/Step Time": 8.456983691081405} +{"Pretrain/Learning Rate": 9.545873666496147e-06, "Pretrain/Loss": 1.9762858152389526, "Pretrain/Loss (Raw)": 1.9878649711608887, "Pretrain/Step": 13747, "Pretrain/Step Time": 8.454531043767929} +{"Pretrain/Learning Rate": 9.542536983692076e-06, "Pretrain/Loss": 1.9744927883148193, "Pretrain/Loss (Raw)": 1.953620433807373, "Pretrain/Step": 13748, "Pretrain/Step Time": 8.465503381565213} +{"Pretrain/Learning Rate": 9.539200746593044e-06, "Pretrain/Loss": 1.9758808612823486, "Pretrain/Loss (Raw)": 1.8914861679077148, "Pretrain/Step": 13749, "Pretrain/Step Time": 8.465744556859136} +{"Pretrain/Learning Rate": 9.535864955295269e-06, "Pretrain/Loss": 1.9749939441680908, "Pretrain/Loss (Raw)": 1.9461925029754639, "Pretrain/Step": 13750, "Pretrain/Step Time": 8.464024802669883} +{"Pretrain/Learning Rate": 9.532529609894917e-06, "Pretrain/Loss": 1.9763596057891846, "Pretrain/Loss (Raw)": 2.1198620796203613, "Pretrain/Step": 13751, "Pretrain/Step Time": 8.460479062050581} +{"Pretrain/Learning Rate": 9.529194710488179e-06, "Pretrain/Loss": 1.9776899814605713, "Pretrain/Loss (Raw)": 2.076744318008423, "Pretrain/Step": 13752, "Pretrain/Step Time": 8.463050577789545} +{"Pretrain/Learning Rate": 9.525860257171207e-06, "Pretrain/Loss": 1.9768304824829102, "Pretrain/Loss (Raw)": 2.0605053901672363, "Pretrain/Step": 13753, "Pretrain/Step Time": 8.464436097070575} +{"Pretrain/Learning Rate": 9.522526250040133e-06, "Pretrain/Loss": 1.9756497144699097, "Pretrain/Loss (Raw)": 2.0725502967834473, "Pretrain/Step": 13754, "Pretrain/Step Time": 8.466026732698083} +{"Pretrain/Learning Rate": 9.519192689191117e-06, "Pretrain/Loss": 1.9760550260543823, "Pretrain/Loss (Raw)": 1.879092812538147, "Pretrain/Step": 13755, "Pretrain/Step Time": 8.465582638978958} +{"Pretrain/Learning Rate": 9.515859574720253e-06, "Pretrain/Loss": 1.9753875732421875, "Pretrain/Loss (Raw)": 1.8228938579559326, "Pretrain/Step": 13756, "Pretrain/Step Time": 8.464601306244731} +{"Pretrain/Learning Rate": 9.512526906723676e-06, "Pretrain/Loss": 1.9757401943206787, "Pretrain/Loss (Raw)": 2.0879318714141846, "Pretrain/Step": 13757, "Pretrain/Step Time": 8.462576912716031} +{"Pretrain/Learning Rate": 9.509194685297465e-06, "Pretrain/Loss": 1.9789226055145264, "Pretrain/Loss (Raw)": 2.1284685134887695, "Pretrain/Step": 13758, "Pretrain/Step Time": 8.46566498838365} +{"Pretrain/Learning Rate": 9.505862910537697e-06, "Pretrain/Loss": 1.9797500371932983, "Pretrain/Loss (Raw)": 2.118656873703003, "Pretrain/Step": 13759, "Pretrain/Step Time": 8.467234319075942} +{"Pretrain/Learning Rate": 9.502531582540457e-06, "Pretrain/Loss": 1.978987216949463, "Pretrain/Loss (Raw)": 1.9422348737716675, "Pretrain/Step": 13760, "Pretrain/Step Time": 8.468703653663397} +{"Pretrain/Learning Rate": 9.499200701401787e-06, "Pretrain/Loss": 1.9771406650543213, "Pretrain/Loss (Raw)": 1.9612663984298706, "Pretrain/Step": 13761, "Pretrain/Step Time": 8.469914935529232} +{"Pretrain/Learning Rate": 9.495870267217746e-06, "Pretrain/Loss": 1.976209044456482, "Pretrain/Loss (Raw)": 1.8379954099655151, "Pretrain/Step": 13762, "Pretrain/Step Time": 8.470003990456462} +{"Pretrain/Learning Rate": 9.492540280084355e-06, "Pretrain/Loss": 1.9772756099700928, "Pretrain/Loss (Raw)": 2.0825307369232178, "Pretrain/Step": 13763, "Pretrain/Step Time": 8.470298299565911} +{"Pretrain/Learning Rate": 9.489210740097624e-06, "Pretrain/Loss": 1.974902868270874, "Pretrain/Loss (Raw)": 1.7642687559127808, "Pretrain/Step": 13764, "Pretrain/Step Time": 8.469639984890819} +{"Pretrain/Learning Rate": 9.485881647353576e-06, "Pretrain/Loss": 1.9754301309585571, "Pretrain/Loss (Raw)": 2.095594644546509, "Pretrain/Step": 13765, "Pretrain/Step Time": 8.472899474203587} +{"Pretrain/Learning Rate": 9.482553001948185e-06, "Pretrain/Loss": 1.974157452583313, "Pretrain/Loss (Raw)": 1.8931423425674438, "Pretrain/Step": 13766, "Pretrain/Step Time": 8.470387186855078} +{"Pretrain/Learning Rate": 9.479224803977449e-06, "Pretrain/Loss": 1.9765288829803467, "Pretrain/Loss (Raw)": 2.046067953109741, "Pretrain/Step": 13767, "Pretrain/Step Time": 8.467366512864828} +{"Pretrain/Learning Rate": 9.475897053537324e-06, "Pretrain/Loss": 1.976534366607666, "Pretrain/Loss (Raw)": 1.9969562292099, "Pretrain/Step": 13768, "Pretrain/Step Time": 8.468039756640792} +{"Pretrain/Learning Rate": 9.472569750723753e-06, "Pretrain/Loss": 1.9797818660736084, "Pretrain/Loss (Raw)": 2.2385528087615967, "Pretrain/Step": 13769, "Pretrain/Step Time": 8.469846362248063} +{"Pretrain/Learning Rate": 9.469242895632698e-06, "Pretrain/Loss": 1.9821356534957886, "Pretrain/Loss (Raw)": 2.1935529708862305, "Pretrain/Step": 13770, "Pretrain/Step Time": 8.466668652370572} +{"Pretrain/Learning Rate": 9.465916488360065e-06, "Pretrain/Loss": 1.9801558256149292, "Pretrain/Loss (Raw)": 1.9900944232940674, "Pretrain/Step": 13771, "Pretrain/Step Time": 8.466991236433387} +{"Pretrain/Learning Rate": 9.462590529001792e-06, "Pretrain/Loss": 1.9806660413742065, "Pretrain/Loss (Raw)": 2.017526388168335, "Pretrain/Step": 13772, "Pretrain/Step Time": 8.467218112200499} +{"Pretrain/Learning Rate": 9.459265017653764e-06, "Pretrain/Loss": 1.9789960384368896, "Pretrain/Loss (Raw)": 1.8342125415802002, "Pretrain/Step": 13773, "Pretrain/Step Time": 8.469013899564743} +{"Pretrain/Learning Rate": 9.455939954411867e-06, "Pretrain/Loss": 1.9796056747436523, "Pretrain/Loss (Raw)": 2.0884830951690674, "Pretrain/Step": 13774, "Pretrain/Step Time": 8.470346858724952} +{"Pretrain/Learning Rate": 9.452615339371993e-06, "Pretrain/Loss": 1.9798938035964966, "Pretrain/Loss (Raw)": 1.8323860168457031, "Pretrain/Step": 13775, "Pretrain/Step Time": 8.470249928534031} +{"Pretrain/Learning Rate": 9.449291172629985e-06, "Pretrain/Loss": 1.9786723852157593, "Pretrain/Loss (Raw)": 1.9458853006362915, "Pretrain/Step": 13776, "Pretrain/Step Time": 8.47468433342874} +{"Pretrain/Learning Rate": 9.445967454281712e-06, "Pretrain/Loss": 1.9756319522857666, "Pretrain/Loss (Raw)": 1.8085180521011353, "Pretrain/Step": 13777, "Pretrain/Step Time": 8.475270414724946} +{"Pretrain/Learning Rate": 9.442644184423002e-06, "Pretrain/Loss": 1.9784202575683594, "Pretrain/Loss (Raw)": 2.350485324859619, "Pretrain/Step": 13778, "Pretrain/Step Time": 8.477022670209408} +{"Pretrain/Learning Rate": 9.439321363149672e-06, "Pretrain/Loss": 1.9811211824417114, "Pretrain/Loss (Raw)": 2.31754207611084, "Pretrain/Step": 13779, "Pretrain/Step Time": 8.47380675189197} +{"Pretrain/Learning Rate": 9.435998990557551e-06, "Pretrain/Loss": 1.983487844467163, "Pretrain/Loss (Raw)": 2.277345895767212, "Pretrain/Step": 13780, "Pretrain/Step Time": 8.47219156473875} +{"Pretrain/Learning Rate": 9.432677066742418e-06, "Pretrain/Loss": 1.9815921783447266, "Pretrain/Loss (Raw)": 1.9464532136917114, "Pretrain/Step": 13781, "Pretrain/Step Time": 8.478221090510488} +{"Pretrain/Learning Rate": 9.429355591800074e-06, "Pretrain/Loss": 1.9818730354309082, "Pretrain/Loss (Raw)": 2.0064523220062256, "Pretrain/Step": 13782, "Pretrain/Step Time": 8.47683709859848} +{"Pretrain/Learning Rate": 9.426034565826278e-06, "Pretrain/Loss": 1.9818662405014038, "Pretrain/Loss (Raw)": 1.8378082513809204, "Pretrain/Step": 13783, "Pretrain/Step Time": 8.477267634123564} +{"Pretrain/Learning Rate": 9.422713988916806e-06, "Pretrain/Loss": 1.9814722537994385, "Pretrain/Loss (Raw)": 1.9645705223083496, "Pretrain/Step": 13784, "Pretrain/Step Time": 8.484364645555615} +{"Pretrain/Learning Rate": 9.419393861167394e-06, "Pretrain/Loss": 1.983398199081421, "Pretrain/Loss (Raw)": 2.0818209648132324, "Pretrain/Step": 13785, "Pretrain/Step Time": 8.483167614787817} +{"Pretrain/Learning Rate": 9.416074182673768e-06, "Pretrain/Loss": 1.9836089611053467, "Pretrain/Loss (Raw)": 1.8446292877197266, "Pretrain/Step": 13786, "Pretrain/Step Time": 8.485025512054563} +{"Pretrain/Learning Rate": 9.412754953531663e-06, "Pretrain/Loss": 1.9856611490249634, "Pretrain/Loss (Raw)": 2.1949126720428467, "Pretrain/Step": 13787, "Pretrain/Step Time": 8.479546001181006} +{"Pretrain/Learning Rate": 9.409436173836775e-06, "Pretrain/Loss": 1.9809088706970215, "Pretrain/Loss (Raw)": 1.628210425376892, "Pretrain/Step": 13788, "Pretrain/Step Time": 8.474549254402518} +{"Pretrain/Learning Rate": 9.406117843684812e-06, "Pretrain/Loss": 1.9833507537841797, "Pretrain/Loss (Raw)": 2.1682143211364746, "Pretrain/Step": 13789, "Pretrain/Step Time": 8.473298516124487} +{"Pretrain/Learning Rate": 9.402799963171449e-06, "Pretrain/Loss": 1.9797054529190063, "Pretrain/Loss (Raw)": 1.626233458518982, "Pretrain/Step": 13790, "Pretrain/Step Time": 8.47938323393464} +{"Pretrain/Learning Rate": 9.399482532392343e-06, "Pretrain/Loss": 1.980863332748413, "Pretrain/Loss (Raw)": 2.0357134342193604, "Pretrain/Step": 13791, "Pretrain/Step Time": 8.481282997876406} +{"Pretrain/Learning Rate": 9.39616555144317e-06, "Pretrain/Loss": 1.9803218841552734, "Pretrain/Loss (Raw)": 1.9831637144088745, "Pretrain/Step": 13792, "Pretrain/Step Time": 8.479573549702764} +{"Pretrain/Learning Rate": 9.392849020419555e-06, "Pretrain/Loss": 1.981279969215393, "Pretrain/Loss (Raw)": 1.8789279460906982, "Pretrain/Step": 13793, "Pretrain/Step Time": 8.480433003976941} +{"Pretrain/Learning Rate": 9.389532939417145e-06, "Pretrain/Loss": 1.982050895690918, "Pretrain/Loss (Raw)": 2.038491725921631, "Pretrain/Step": 13794, "Pretrain/Step Time": 8.482536409050226} +{"Pretrain/Learning Rate": 9.386217308531548e-06, "Pretrain/Loss": 1.9818452596664429, "Pretrain/Loss (Raw)": 2.070763111114502, "Pretrain/Step": 13795, "Pretrain/Step Time": 8.471393266692758} +{"Pretrain/Learning Rate": 9.38290212785836e-06, "Pretrain/Loss": 1.9815025329589844, "Pretrain/Loss (Raw)": 2.0380213260650635, "Pretrain/Step": 13796, "Pretrain/Step Time": 8.473618727177382} +{"Pretrain/Learning Rate": 9.379587397493186e-06, "Pretrain/Loss": 1.9836456775665283, "Pretrain/Loss (Raw)": 2.3076894283294678, "Pretrain/Step": 13797, "Pretrain/Step Time": 8.475571621209383} +{"Pretrain/Learning Rate": 9.376273117531593e-06, "Pretrain/Loss": 1.9794747829437256, "Pretrain/Loss (Raw)": 1.3708877563476562, "Pretrain/Step": 13798, "Pretrain/Step Time": 8.471336105838418} +{"Pretrain/Learning Rate": 9.372959288069156e-06, "Pretrain/Loss": 1.981736183166504, "Pretrain/Loss (Raw)": 2.148770332336426, "Pretrain/Step": 13799, "Pretrain/Step Time": 8.473190048709512} +{"Pretrain/Learning Rate": 9.369645909201424e-06, "Pretrain/Loss": 1.9821200370788574, "Pretrain/Loss (Raw)": 2.071350574493408, "Pretrain/Step": 13800, "Pretrain/Step Time": 8.473787574097514} +{"Pretrain/Learning Rate": 9.366332981023923e-06, "Pretrain/Loss": 1.9810532331466675, "Pretrain/Loss (Raw)": 1.9291433095932007, "Pretrain/Step": 13801, "Pretrain/Step Time": 8.473157977685332} +{"Pretrain/Learning Rate": 9.363020503632197e-06, "Pretrain/Loss": 1.981468677520752, "Pretrain/Loss (Raw)": 2.0143630504608154, "Pretrain/Step": 13802, "Pretrain/Step Time": 8.475210031494498} +{"Pretrain/Learning Rate": 9.359708477121745e-06, "Pretrain/Loss": 1.9815305471420288, "Pretrain/Loss (Raw)": 2.1416027545928955, "Pretrain/Step": 13803, "Pretrain/Step Time": 8.473336895927787} +{"Pretrain/Learning Rate": 9.356396901588083e-06, "Pretrain/Loss": 1.980248212814331, "Pretrain/Loss (Raw)": 1.9676398038864136, "Pretrain/Step": 13804, "Pretrain/Step Time": 8.475711539387703} +{"Pretrain/Learning Rate": 9.353085777126685e-06, "Pretrain/Loss": 1.9782228469848633, "Pretrain/Loss (Raw)": 1.8620638847351074, "Pretrain/Step": 13805, "Pretrain/Step Time": 8.472301188856363} +{"Pretrain/Learning Rate": 9.349775103833022e-06, "Pretrain/Loss": 1.9763507843017578, "Pretrain/Loss (Raw)": 1.8031100034713745, "Pretrain/Step": 13806, "Pretrain/Step Time": 8.471297984942794} +{"Pretrain/Learning Rate": 9.34646488180257e-06, "Pretrain/Loss": 1.9773993492126465, "Pretrain/Loss (Raw)": 1.9575629234313965, "Pretrain/Step": 13807, "Pretrain/Step Time": 8.471734926104546} +{"Pretrain/Learning Rate": 9.343155111130757e-06, "Pretrain/Loss": 1.9788352251052856, "Pretrain/Loss (Raw)": 1.8775250911712646, "Pretrain/Step": 13808, "Pretrain/Step Time": 8.472806921228766} +{"Pretrain/Learning Rate": 9.33984579191304e-06, "Pretrain/Loss": 1.9782267808914185, "Pretrain/Loss (Raw)": 1.934898853302002, "Pretrain/Step": 13809, "Pretrain/Step Time": 8.471678143367171} +{"Pretrain/Learning Rate": 9.33653692424483e-06, "Pretrain/Loss": 1.978297233581543, "Pretrain/Loss (Raw)": 2.0823919773101807, "Pretrain/Step": 13810, "Pretrain/Step Time": 8.478371208533645} +{"Pretrain/Learning Rate": 9.333228508221526e-06, "Pretrain/Loss": 1.9792754650115967, "Pretrain/Loss (Raw)": 1.8666679859161377, "Pretrain/Step": 13811, "Pretrain/Step Time": 8.470499301329255} +{"Pretrain/Learning Rate": 9.329920543938545e-06, "Pretrain/Loss": 1.9780120849609375, "Pretrain/Loss (Raw)": 1.998668909072876, "Pretrain/Step": 13812, "Pretrain/Step Time": 8.474402656778693} +{"Pretrain/Learning Rate": 9.326613031491247e-06, "Pretrain/Loss": 1.9789880514144897, "Pretrain/Loss (Raw)": 1.8550026416778564, "Pretrain/Step": 13813, "Pretrain/Step Time": 8.478954238817096} +{"Pretrain/Learning Rate": 9.323305970975021e-06, "Pretrain/Loss": 1.9807263612747192, "Pretrain/Loss (Raw)": 2.2541439533233643, "Pretrain/Step": 13814, "Pretrain/Step Time": 8.474748071283102} +{"Pretrain/Learning Rate": 9.319999362485218e-06, "Pretrain/Loss": 1.978633165359497, "Pretrain/Loss (Raw)": 2.1370599269866943, "Pretrain/Step": 13815, "Pretrain/Step Time": 8.47508841007948} +{"Pretrain/Learning Rate": 9.31669320611717e-06, "Pretrain/Loss": 1.9798517227172852, "Pretrain/Loss (Raw)": 1.901871919631958, "Pretrain/Step": 13816, "Pretrain/Step Time": 8.476845674216747} +{"Pretrain/Learning Rate": 9.313387501966225e-06, "Pretrain/Loss": 1.9793744087219238, "Pretrain/Loss (Raw)": 1.8554428815841675, "Pretrain/Step": 13817, "Pretrain/Step Time": 8.473061354830861} +{"Pretrain/Learning Rate": 9.310082250127698e-06, "Pretrain/Loss": 1.9788159132003784, "Pretrain/Loss (Raw)": 2.158770799636841, "Pretrain/Step": 13818, "Pretrain/Step Time": 8.472668658941984} +{"Pretrain/Learning Rate": 9.306777450696883e-06, "Pretrain/Loss": 1.9784916639328003, "Pretrain/Loss (Raw)": 2.0188722610473633, "Pretrain/Step": 13819, "Pretrain/Step Time": 8.473348995670676} +{"Pretrain/Learning Rate": 9.303473103769069e-06, "Pretrain/Loss": 1.9778876304626465, "Pretrain/Loss (Raw)": 1.9206303358078003, "Pretrain/Step": 13820, "Pretrain/Step Time": 8.473024709150195} +{"Pretrain/Learning Rate": 9.300169209439555e-06, "Pretrain/Loss": 1.9773797988891602, "Pretrain/Loss (Raw)": 1.788291573524475, "Pretrain/Step": 13821, "Pretrain/Step Time": 8.47143373824656} +{"Pretrain/Learning Rate": 9.296865767803593e-06, "Pretrain/Loss": 1.9768699407577515, "Pretrain/Loss (Raw)": 1.9282310009002686, "Pretrain/Step": 13822, "Pretrain/Step Time": 8.47377960383892} +{"Pretrain/Learning Rate": 9.293562778956428e-06, "Pretrain/Loss": 1.9784269332885742, "Pretrain/Loss (Raw)": 2.1297519207000732, "Pretrain/Step": 13823, "Pretrain/Step Time": 8.471162779256701} +{"Pretrain/Learning Rate": 9.290260242993316e-06, "Pretrain/Loss": 1.9810255765914917, "Pretrain/Loss (Raw)": 1.950655460357666, "Pretrain/Step": 13824, "Pretrain/Step Time": 8.470124293118715} +{"Pretrain/Learning Rate": 9.286958160009465e-06, "Pretrain/Loss": 1.9824014902114868, "Pretrain/Loss (Raw)": 2.3211705684661865, "Pretrain/Step": 13825, "Pretrain/Step Time": 8.476148437708616} +{"Pretrain/Learning Rate": 9.283656530100107e-06, "Pretrain/Loss": 1.981264591217041, "Pretrain/Loss (Raw)": 1.8830559253692627, "Pretrain/Step": 13826, "Pretrain/Step Time": 8.47746217250824} +{"Pretrain/Learning Rate": 9.280355353360436e-06, "Pretrain/Loss": 1.9818260669708252, "Pretrain/Loss (Raw)": 1.9737000465393066, "Pretrain/Step": 13827, "Pretrain/Step Time": 8.470288498327136} +{"Pretrain/Learning Rate": 9.277054629885628e-06, "Pretrain/Loss": 1.9819345474243164, "Pretrain/Loss (Raw)": 2.012483835220337, "Pretrain/Step": 13828, "Pretrain/Step Time": 8.47391602396965} +{"Pretrain/Learning Rate": 9.273754359770873e-06, "Pretrain/Loss": 1.9805070161819458, "Pretrain/Loss (Raw)": 2.025683879852295, "Pretrain/Step": 13829, "Pretrain/Step Time": 8.476661639288068} +{"Pretrain/Learning Rate": 9.270454543111318e-06, "Pretrain/Loss": 1.9822496175765991, "Pretrain/Loss (Raw)": 2.184053421020508, "Pretrain/Step": 13830, "Pretrain/Step Time": 8.479773482307792} +{"Pretrain/Learning Rate": 9.267155180002123e-06, "Pretrain/Loss": 1.9814631938934326, "Pretrain/Loss (Raw)": 2.000696897506714, "Pretrain/Step": 13831, "Pretrain/Step Time": 8.479193849489093} +{"Pretrain/Learning Rate": 9.263856270538421e-06, "Pretrain/Loss": 1.982070803642273, "Pretrain/Loss (Raw)": 1.998282551765442, "Pretrain/Step": 13832, "Pretrain/Step Time": 8.485301822423935} +{"Pretrain/Learning Rate": 9.26055781481532e-06, "Pretrain/Loss": 1.9850142002105713, "Pretrain/Loss (Raw)": 2.056586742401123, "Pretrain/Step": 13833, "Pretrain/Step Time": 8.477636393159628} +{"Pretrain/Learning Rate": 9.257259812927948e-06, "Pretrain/Loss": 1.9873573780059814, "Pretrain/Loss (Raw)": 1.719001054763794, "Pretrain/Step": 13834, "Pretrain/Step Time": 8.481085369363427} +{"Pretrain/Learning Rate": 9.253962264971383e-06, "Pretrain/Loss": 1.9869539737701416, "Pretrain/Loss (Raw)": 1.9311597347259521, "Pretrain/Step": 13835, "Pretrain/Step Time": 8.480057582259178} +{"Pretrain/Learning Rate": 9.250665171040723e-06, "Pretrain/Loss": 1.98868727684021, "Pretrain/Loss (Raw)": 2.072247266769409, "Pretrain/Step": 13836, "Pretrain/Step Time": 8.479647602885962} +{"Pretrain/Learning Rate": 9.247368531231033e-06, "Pretrain/Loss": 1.984089732170105, "Pretrain/Loss (Raw)": 1.861535906791687, "Pretrain/Step": 13837, "Pretrain/Step Time": 8.488005857914686} +{"Pretrain/Learning Rate": 9.244072345637356e-06, "Pretrain/Loss": 1.983573079109192, "Pretrain/Loss (Raw)": 2.003774642944336, "Pretrain/Step": 13838, "Pretrain/Step Time": 8.485053336247802} +{"Pretrain/Learning Rate": 9.240776614354754e-06, "Pretrain/Loss": 1.9841382503509521, "Pretrain/Loss (Raw)": 2.126990795135498, "Pretrain/Step": 13839, "Pretrain/Step Time": 8.485637409612536} +{"Pretrain/Learning Rate": 9.23748133747824e-06, "Pretrain/Loss": 1.9837785959243774, "Pretrain/Loss (Raw)": 1.88092839717865, "Pretrain/Step": 13840, "Pretrain/Step Time": 8.490697754547} +{"Pretrain/Learning Rate": 9.23418651510285e-06, "Pretrain/Loss": 1.9805808067321777, "Pretrain/Loss (Raw)": 1.6704181432724, "Pretrain/Step": 13841, "Pretrain/Step Time": 8.49110198020935} +{"Pretrain/Learning Rate": 9.230892147323578e-06, "Pretrain/Loss": 1.9802433252334595, "Pretrain/Loss (Raw)": 2.081939697265625, "Pretrain/Step": 13842, "Pretrain/Step Time": 8.49037747271359} +{"Pretrain/Learning Rate": 9.227598234235402e-06, "Pretrain/Loss": 1.979889988899231, "Pretrain/Loss (Raw)": 2.0199646949768066, "Pretrain/Step": 13843, "Pretrain/Step Time": 8.485284600406885} +{"Pretrain/Learning Rate": 9.224304775933324e-06, "Pretrain/Loss": 1.9815733432769775, "Pretrain/Loss (Raw)": 2.120079517364502, "Pretrain/Step": 13844, "Pretrain/Step Time": 8.485197989270091} +{"Pretrain/Learning Rate": 9.221011772512287e-06, "Pretrain/Loss": 1.9811499118804932, "Pretrain/Loss (Raw)": 1.8130192756652832, "Pretrain/Step": 13845, "Pretrain/Step Time": 8.484148183837533} +{"Pretrain/Learning Rate": 9.217719224067262e-06, "Pretrain/Loss": 1.9800928831100464, "Pretrain/Loss (Raw)": 1.9107221364974976, "Pretrain/Step": 13846, "Pretrain/Step Time": 8.4865200817585} +{"Pretrain/Learning Rate": 9.214427130693176e-06, "Pretrain/Loss": 1.9784852266311646, "Pretrain/Loss (Raw)": 1.7731335163116455, "Pretrain/Step": 13847, "Pretrain/Step Time": 8.484291909262538} +{"Pretrain/Learning Rate": 9.211135492484945e-06, "Pretrain/Loss": 1.9787684679031372, "Pretrain/Loss (Raw)": 2.0785977840423584, "Pretrain/Step": 13848, "Pretrain/Step Time": 8.486955599859357} +{"Pretrain/Learning Rate": 9.207844309537505e-06, "Pretrain/Loss": 1.9821830987930298, "Pretrain/Loss (Raw)": 2.3945837020874023, "Pretrain/Step": 13849, "Pretrain/Step Time": 8.48713800497353} +{"Pretrain/Learning Rate": 9.20455358194573e-06, "Pretrain/Loss": 1.978499174118042, "Pretrain/Loss (Raw)": 1.69472074508667, "Pretrain/Step": 13850, "Pretrain/Step Time": 8.489247044548392} +{"Pretrain/Learning Rate": 9.201263309804528e-06, "Pretrain/Loss": 1.9761098623275757, "Pretrain/Loss (Raw)": 1.8288923501968384, "Pretrain/Step": 13851, "Pretrain/Step Time": 8.48855865560472} +{"Pretrain/Learning Rate": 9.19797349320875e-06, "Pretrain/Loss": 1.9757368564605713, "Pretrain/Loss (Raw)": 1.6989213228225708, "Pretrain/Step": 13852, "Pretrain/Step Time": 8.487505462020636} +{"Pretrain/Learning Rate": 9.194684132253276e-06, "Pretrain/Loss": 1.9778004884719849, "Pretrain/Loss (Raw)": 2.1376209259033203, "Pretrain/Step": 13853, "Pretrain/Step Time": 8.490779919549823} +{"Pretrain/Learning Rate": 9.191395227032946e-06, "Pretrain/Loss": 1.9775725603103638, "Pretrain/Loss (Raw)": 1.9826443195343018, "Pretrain/Step": 13854, "Pretrain/Step Time": 8.485810006037354} +{"Pretrain/Learning Rate": 9.188106777642577e-06, "Pretrain/Loss": 1.9756321907043457, "Pretrain/Loss (Raw)": 1.875985026359558, "Pretrain/Step": 13855, "Pretrain/Step Time": 8.487337350845337} +{"Pretrain/Learning Rate": 9.184818784177012e-06, "Pretrain/Loss": 1.9760994911193848, "Pretrain/Loss (Raw)": 1.8969236612319946, "Pretrain/Step": 13856, "Pretrain/Step Time": 8.487785587087274} +{"Pretrain/Learning Rate": 9.181531246731043e-06, "Pretrain/Loss": 1.9762920141220093, "Pretrain/Loss (Raw)": 1.7479709386825562, "Pretrain/Step": 13857, "Pretrain/Step Time": 8.48730537854135} +{"Pretrain/Learning Rate": 9.178244165399475e-06, "Pretrain/Loss": 1.9767094850540161, "Pretrain/Loss (Raw)": 1.8736332654953003, "Pretrain/Step": 13858, "Pretrain/Step Time": 8.4899547919631} +{"Pretrain/Learning Rate": 9.174957540277082e-06, "Pretrain/Loss": 1.976690649986267, "Pretrain/Loss (Raw)": 2.0237691402435303, "Pretrain/Step": 13859, "Pretrain/Step Time": 8.488800592720509} +{"Pretrain/Learning Rate": 9.171671371458626e-06, "Pretrain/Loss": 1.9772677421569824, "Pretrain/Loss (Raw)": 1.920965552330017, "Pretrain/Step": 13860, "Pretrain/Step Time": 8.48287370428443} +{"Pretrain/Learning Rate": 9.168385659038878e-06, "Pretrain/Loss": 1.9811758995056152, "Pretrain/Loss (Raw)": 2.1134541034698486, "Pretrain/Step": 13861, "Pretrain/Step Time": 8.485447516664863} +{"Pretrain/Learning Rate": 9.165100403112556e-06, "Pretrain/Loss": 1.9803472757339478, "Pretrain/Loss (Raw)": 1.8873549699783325, "Pretrain/Step": 13862, "Pretrain/Step Time": 8.489945756271482} +{"Pretrain/Learning Rate": 9.161815603774413e-06, "Pretrain/Loss": 1.9765353202819824, "Pretrain/Loss (Raw)": 1.859511375427246, "Pretrain/Step": 13863, "Pretrain/Step Time": 8.487000569701195} +{"Pretrain/Learning Rate": 9.15853126111915e-06, "Pretrain/Loss": 1.9768528938293457, "Pretrain/Loss (Raw)": 2.042623281478882, "Pretrain/Step": 13864, "Pretrain/Step Time": 8.493463044986129} +{"Pretrain/Learning Rate": 9.155247375241462e-06, "Pretrain/Loss": 1.9768624305725098, "Pretrain/Loss (Raw)": 2.0326809883117676, "Pretrain/Step": 13865, "Pretrain/Step Time": 8.492345981299877} +{"Pretrain/Learning Rate": 9.151963946236055e-06, "Pretrain/Loss": 1.9784653186798096, "Pretrain/Loss (Raw)": 2.2095909118652344, "Pretrain/Step": 13866, "Pretrain/Step Time": 8.489057136699557} +{"Pretrain/Learning Rate": 9.148680974197588e-06, "Pretrain/Loss": 1.9775452613830566, "Pretrain/Loss (Raw)": 1.9654231071472168, "Pretrain/Step": 13867, "Pretrain/Step Time": 8.48804284632206} +{"Pretrain/Learning Rate": 9.145398459220739e-06, "Pretrain/Loss": 1.9795554876327515, "Pretrain/Loss (Raw)": 2.0039782524108887, "Pretrain/Step": 13868, "Pretrain/Step Time": 8.486660977825522} +{"Pretrain/Learning Rate": 9.142116401400147e-06, "Pretrain/Loss": 1.9820417165756226, "Pretrain/Loss (Raw)": 1.8377537727355957, "Pretrain/Step": 13869, "Pretrain/Step Time": 8.490145280957222} +{"Pretrain/Learning Rate": 9.138834800830442e-06, "Pretrain/Loss": 1.9834661483764648, "Pretrain/Loss (Raw)": 2.0702767372131348, "Pretrain/Step": 13870, "Pretrain/Step Time": 8.490358794108033} +{"Pretrain/Learning Rate": 9.135553657606264e-06, "Pretrain/Loss": 1.9842702150344849, "Pretrain/Loss (Raw)": 2.152777671813965, "Pretrain/Step": 13871, "Pretrain/Step Time": 8.486436361446977} +{"Pretrain/Learning Rate": 9.132272971822204e-06, "Pretrain/Loss": 1.9841139316558838, "Pretrain/Loss (Raw)": 2.121586799621582, "Pretrain/Step": 13872, "Pretrain/Step Time": 8.487017599865794} +{"Pretrain/Learning Rate": 9.128992743572874e-06, "Pretrain/Loss": 1.9836996793746948, "Pretrain/Loss (Raw)": 1.9967970848083496, "Pretrain/Step": 13873, "Pretrain/Step Time": 8.491135591641068} +{"Pretrain/Learning Rate": 9.125712972952849e-06, "Pretrain/Loss": 1.9827642440795898, "Pretrain/Loss (Raw)": 1.6661913394927979, "Pretrain/Step": 13874, "Pretrain/Step Time": 8.490662954747677} +{"Pretrain/Learning Rate": 9.122433660056692e-06, "Pretrain/Loss": 1.9820407629013062, "Pretrain/Loss (Raw)": 1.8952714204788208, "Pretrain/Step": 13875, "Pretrain/Step Time": 8.491319024935365} +{"Pretrain/Learning Rate": 9.119154804978978e-06, "Pretrain/Loss": 1.9833948612213135, "Pretrain/Loss (Raw)": 2.1269452571868896, "Pretrain/Step": 13876, "Pretrain/Step Time": 8.48042133077979} +{"Pretrain/Learning Rate": 9.115876407814227e-06, "Pretrain/Loss": 1.9833664894104004, "Pretrain/Loss (Raw)": 1.8878529071807861, "Pretrain/Step": 13877, "Pretrain/Step Time": 8.482249511405826} +{"Pretrain/Learning Rate": 9.112598468656993e-06, "Pretrain/Loss": 1.9843796491622925, "Pretrain/Loss (Raw)": 2.075878143310547, "Pretrain/Step": 13878, "Pretrain/Step Time": 8.483822025358677} +{"Pretrain/Learning Rate": 9.109320987601782e-06, "Pretrain/Loss": 1.98349928855896, "Pretrain/Loss (Raw)": 2.007176637649536, "Pretrain/Step": 13879, "Pretrain/Step Time": 8.488661117851734} +{"Pretrain/Learning Rate": 9.106043964743091e-06, "Pretrain/Loss": 1.9827282428741455, "Pretrain/Loss (Raw)": 1.978049397468567, "Pretrain/Step": 13880, "Pretrain/Step Time": 8.486451350152493} +{"Pretrain/Learning Rate": 9.102767400175427e-06, "Pretrain/Loss": 1.9796130657196045, "Pretrain/Loss (Raw)": 1.661756157875061, "Pretrain/Step": 13881, "Pretrain/Step Time": 8.4855049084872} +{"Pretrain/Learning Rate": 9.099491293993247e-06, "Pretrain/Loss": 1.9825334548950195, "Pretrain/Loss (Raw)": 2.4463489055633545, "Pretrain/Step": 13882, "Pretrain/Step Time": 8.481970051303506} +{"Pretrain/Learning Rate": 9.096215646291037e-06, "Pretrain/Loss": 1.9836183786392212, "Pretrain/Loss (Raw)": 2.017967939376831, "Pretrain/Step": 13883, "Pretrain/Step Time": 8.48121445439756} +{"Pretrain/Learning Rate": 9.092940457163238e-06, "Pretrain/Loss": 1.9883191585540771, "Pretrain/Loss (Raw)": 2.4245975017547607, "Pretrain/Step": 13884, "Pretrain/Step Time": 8.480899689719081} +{"Pretrain/Learning Rate": 9.089665726704277e-06, "Pretrain/Loss": 1.988471269607544, "Pretrain/Loss (Raw)": 2.107409715652466, "Pretrain/Step": 13885, "Pretrain/Step Time": 8.477902548387647} +{"Pretrain/Learning Rate": 9.086391455008597e-06, "Pretrain/Loss": 1.9874063730239868, "Pretrain/Loss (Raw)": 1.992157220840454, "Pretrain/Step": 13886, "Pretrain/Step Time": 8.477649157866836} +{"Pretrain/Learning Rate": 9.083117642170593e-06, "Pretrain/Loss": 1.9872844219207764, "Pretrain/Loss (Raw)": 2.1030399799346924, "Pretrain/Step": 13887, "Pretrain/Step Time": 8.475197138264775} +{"Pretrain/Learning Rate": 9.079844288284681e-06, "Pretrain/Loss": 1.9894769191741943, "Pretrain/Loss (Raw)": 2.222874164581299, "Pretrain/Step": 13888, "Pretrain/Step Time": 8.478901585564017} +{"Pretrain/Learning Rate": 9.076571393445235e-06, "Pretrain/Loss": 1.9893094301223755, "Pretrain/Loss (Raw)": 1.9398348331451416, "Pretrain/Step": 13889, "Pretrain/Step Time": 8.479836059734225} +{"Pretrain/Learning Rate": 9.073298957746618e-06, "Pretrain/Loss": 1.9890398979187012, "Pretrain/Loss (Raw)": 1.8034818172454834, "Pretrain/Step": 13890, "Pretrain/Step Time": 8.478323690593243} +{"Pretrain/Learning Rate": 9.070026981283206e-06, "Pretrain/Loss": 1.988046407699585, "Pretrain/Loss (Raw)": 1.9553841352462769, "Pretrain/Step": 13891, "Pretrain/Step Time": 8.48078328743577} +{"Pretrain/Learning Rate": 9.06675546414933e-06, "Pretrain/Loss": 1.9906044006347656, "Pretrain/Loss (Raw)": 2.0916831493377686, "Pretrain/Step": 13892, "Pretrain/Step Time": 8.47905040346086} +{"Pretrain/Learning Rate": 9.063484406439334e-06, "Pretrain/Loss": 1.9908909797668457, "Pretrain/Loss (Raw)": 2.13228702545166, "Pretrain/Step": 13893, "Pretrain/Step Time": 8.47744113393128} +{"Pretrain/Learning Rate": 9.060213808247533e-06, "Pretrain/Loss": 1.9934203624725342, "Pretrain/Loss (Raw)": 2.216890573501587, "Pretrain/Step": 13894, "Pretrain/Step Time": 8.48014216683805} +{"Pretrain/Learning Rate": 9.056943669668221e-06, "Pretrain/Loss": 1.9924628734588623, "Pretrain/Loss (Raw)": 1.9235116243362427, "Pretrain/Step": 13895, "Pretrain/Step Time": 8.484513230621815} +{"Pretrain/Learning Rate": 9.053673990795708e-06, "Pretrain/Loss": 1.9945107698440552, "Pretrain/Loss (Raw)": 2.259091854095459, "Pretrain/Step": 13896, "Pretrain/Step Time": 8.483554376289248} +{"Pretrain/Learning Rate": 9.050404771724252e-06, "Pretrain/Loss": 1.9939451217651367, "Pretrain/Loss (Raw)": 2.1661458015441895, "Pretrain/Step": 13897, "Pretrain/Step Time": 8.490780605003238} +{"Pretrain/Learning Rate": 9.047136012548143e-06, "Pretrain/Loss": 1.9933836460113525, "Pretrain/Loss (Raw)": 2.121687650680542, "Pretrain/Step": 13898, "Pretrain/Step Time": 8.489920809864998} +{"Pretrain/Learning Rate": 9.04386771336162e-06, "Pretrain/Loss": 1.9923534393310547, "Pretrain/Loss (Raw)": 1.858217716217041, "Pretrain/Step": 13899, "Pretrain/Step Time": 8.49003203958273} +{"Pretrain/Learning Rate": 9.040599874258916e-06, "Pretrain/Loss": 1.9926410913467407, "Pretrain/Loss (Raw)": 2.054342269897461, "Pretrain/Step": 13900, "Pretrain/Step Time": 8.488260716199875} +{"Pretrain/Learning Rate": 9.03733249533427e-06, "Pretrain/Loss": 1.9949514865875244, "Pretrain/Loss (Raw)": 2.1299474239349365, "Pretrain/Step": 13901, "Pretrain/Step Time": 8.48768094740808} +{"Pretrain/Learning Rate": 9.03406557668189e-06, "Pretrain/Loss": 1.9940991401672363, "Pretrain/Loss (Raw)": 1.9793994426727295, "Pretrain/Step": 13902, "Pretrain/Step Time": 8.485216666013002} +{"Pretrain/Learning Rate": 9.030799118395974e-06, "Pretrain/Loss": 1.9922837018966675, "Pretrain/Loss (Raw)": 1.600000262260437, "Pretrain/Step": 13903, "Pretrain/Step Time": 8.488386023789644} +{"Pretrain/Learning Rate": 9.0275331205707e-06, "Pretrain/Loss": 1.9922009706497192, "Pretrain/Loss (Raw)": 1.9352952241897583, "Pretrain/Step": 13904, "Pretrain/Step Time": 8.486424345523119} +{"Pretrain/Learning Rate": 9.024267583300256e-06, "Pretrain/Loss": 1.9928505420684814, "Pretrain/Loss (Raw)": 1.891656756401062, "Pretrain/Step": 13905, "Pretrain/Step Time": 8.486945159733295} +{"Pretrain/Learning Rate": 9.021002506678795e-06, "Pretrain/Loss": 1.9898595809936523, "Pretrain/Loss (Raw)": 1.9676517248153687, "Pretrain/Step": 13906, "Pretrain/Step Time": 8.488040992990136} +{"Pretrain/Learning Rate": 9.01773789080045e-06, "Pretrain/Loss": 1.9873456954956055, "Pretrain/Loss (Raw)": 1.9957653284072876, "Pretrain/Step": 13907, "Pretrain/Step Time": 8.486527858301997} +{"Pretrain/Learning Rate": 9.014473735759377e-06, "Pretrain/Loss": 1.9831395149230957, "Pretrain/Loss (Raw)": 1.7389479875564575, "Pretrain/Step": 13908, "Pretrain/Step Time": 8.49003197439015} +{"Pretrain/Learning Rate": 9.011210041649679e-06, "Pretrain/Loss": 1.981256365776062, "Pretrain/Loss (Raw)": 1.7054163217544556, "Pretrain/Step": 13909, "Pretrain/Step Time": 8.48497612401843} +{"Pretrain/Learning Rate": 9.007946808565473e-06, "Pretrain/Loss": 1.9801318645477295, "Pretrain/Loss (Raw)": 1.8625234365463257, "Pretrain/Step": 13910, "Pretrain/Step Time": 8.48813728056848} +{"Pretrain/Learning Rate": 9.00468403660085e-06, "Pretrain/Loss": 1.9809787273406982, "Pretrain/Loss (Raw)": 1.9461934566497803, "Pretrain/Step": 13911, "Pretrain/Step Time": 8.486990422010422} +{"Pretrain/Learning Rate": 9.001421725849875e-06, "Pretrain/Loss": 1.9811360836029053, "Pretrain/Loss (Raw)": 1.984714150428772, "Pretrain/Step": 13912, "Pretrain/Step Time": 8.48780949600041} +{"Pretrain/Learning Rate": 8.998159876406636e-06, "Pretrain/Loss": 1.9827989339828491, "Pretrain/Loss (Raw)": 2.294670581817627, "Pretrain/Step": 13913, "Pretrain/Step Time": 8.49133481644094} +{"Pretrain/Learning Rate": 8.994898488365169e-06, "Pretrain/Loss": 1.9855047464370728, "Pretrain/Loss (Raw)": 2.1909635066986084, "Pretrain/Step": 13914, "Pretrain/Step Time": 8.489775348454714} +{"Pretrain/Learning Rate": 8.99163756181953e-06, "Pretrain/Loss": 1.9832780361175537, "Pretrain/Loss (Raw)": 1.9099072217941284, "Pretrain/Step": 13915, "Pretrain/Step Time": 8.493535036221147} +{"Pretrain/Learning Rate": 8.988377096863729e-06, "Pretrain/Loss": 1.9870574474334717, "Pretrain/Loss (Raw)": 2.111966609954834, "Pretrain/Step": 13916, "Pretrain/Step Time": 8.490671323612332} +{"Pretrain/Learning Rate": 8.985117093591794e-06, "Pretrain/Loss": 1.9856951236724854, "Pretrain/Loss (Raw)": 1.9938411712646484, "Pretrain/Step": 13917, "Pretrain/Step Time": 8.490886714309454} +{"Pretrain/Learning Rate": 8.981857552097717e-06, "Pretrain/Loss": 1.988499402999878, "Pretrain/Loss (Raw)": 1.9851741790771484, "Pretrain/Step": 13918, "Pretrain/Step Time": 8.490073436871171} +{"Pretrain/Learning Rate": 8.978598472475478e-06, "Pretrain/Loss": 1.988566517829895, "Pretrain/Loss (Raw)": 2.0443172454833984, "Pretrain/Step": 13919, "Pretrain/Step Time": 8.488264290615916} +{"Pretrain/Learning Rate": 8.975339854819064e-06, "Pretrain/Loss": 1.9900139570236206, "Pretrain/Loss (Raw)": 2.1684186458587646, "Pretrain/Step": 13920, "Pretrain/Step Time": 8.486621158197522} +{"Pretrain/Learning Rate": 8.972081699222423e-06, "Pretrain/Loss": 1.9900624752044678, "Pretrain/Loss (Raw)": 1.885154128074646, "Pretrain/Step": 13921, "Pretrain/Step Time": 8.486682962626219} +{"Pretrain/Learning Rate": 8.968824005779516e-06, "Pretrain/Loss": 1.9892020225524902, "Pretrain/Loss (Raw)": 1.928356409072876, "Pretrain/Step": 13922, "Pretrain/Step Time": 8.490841917693615} +{"Pretrain/Learning Rate": 8.965566774584266e-06, "Pretrain/Loss": 1.9891812801361084, "Pretrain/Loss (Raw)": 2.0680954456329346, "Pretrain/Step": 13923, "Pretrain/Step Time": 8.490634478628635} +{"Pretrain/Learning Rate": 8.962310005730587e-06, "Pretrain/Loss": 1.9892345666885376, "Pretrain/Loss (Raw)": 2.044844150543213, "Pretrain/Step": 13924, "Pretrain/Step Time": 8.490361861884594} +{"Pretrain/Learning Rate": 8.9590536993124e-06, "Pretrain/Loss": 1.9856754541397095, "Pretrain/Loss (Raw)": 1.852117657661438, "Pretrain/Step": 13925, "Pretrain/Step Time": 8.491008454933763} +{"Pretrain/Learning Rate": 8.955797855423584e-06, "Pretrain/Loss": 1.9930675029754639, "Pretrain/Loss (Raw)": 2.317087411880493, "Pretrain/Step": 13926, "Pretrain/Step Time": 8.491799879819155} +{"Pretrain/Learning Rate": 8.952542474158035e-06, "Pretrain/Loss": 1.9902275800704956, "Pretrain/Loss (Raw)": 1.7852394580841064, "Pretrain/Step": 13927, "Pretrain/Step Time": 8.491068286821246} +{"Pretrain/Learning Rate": 8.949287555609612e-06, "Pretrain/Loss": 1.9891142845153809, "Pretrain/Loss (Raw)": 1.9288560152053833, "Pretrain/Step": 13928, "Pretrain/Step Time": 8.491096265614033} +{"Pretrain/Learning Rate": 8.946033099872158e-06, "Pretrain/Loss": 1.986758828163147, "Pretrain/Loss (Raw)": 1.627639889717102, "Pretrain/Step": 13929, "Pretrain/Step Time": 8.497261002659798} +{"Pretrain/Learning Rate": 8.942779107039531e-06, "Pretrain/Loss": 1.9866467714309692, "Pretrain/Loss (Raw)": 2.0000243186950684, "Pretrain/Step": 13930, "Pretrain/Step Time": 8.496489418670535} +{"Pretrain/Learning Rate": 8.93952557720554e-06, "Pretrain/Loss": 1.9844815731048584, "Pretrain/Loss (Raw)": 1.8644700050354004, "Pretrain/Step": 13931, "Pretrain/Step Time": 8.49509291537106} +{"Pretrain/Learning Rate": 8.936272510464017e-06, "Pretrain/Loss": 1.9842309951782227, "Pretrain/Loss (Raw)": 1.9355473518371582, "Pretrain/Step": 13932, "Pretrain/Step Time": 8.496855383738875} +{"Pretrain/Learning Rate": 8.933019906908748e-06, "Pretrain/Loss": 1.9852232933044434, "Pretrain/Loss (Raw)": 1.9890903234481812, "Pretrain/Step": 13933, "Pretrain/Step Time": 8.49537560902536} +{"Pretrain/Learning Rate": 8.929767766633519e-06, "Pretrain/Loss": 1.9871212244033813, "Pretrain/Loss (Raw)": 2.0460376739501953, "Pretrain/Step": 13934, "Pretrain/Step Time": 8.497464288026094} +{"Pretrain/Learning Rate": 8.926516089732115e-06, "Pretrain/Loss": 1.9881043434143066, "Pretrain/Loss (Raw)": 2.083409547805786, "Pretrain/Step": 13935, "Pretrain/Step Time": 8.49611902795732} +{"Pretrain/Learning Rate": 8.923264876298279e-06, "Pretrain/Loss": 1.9896498918533325, "Pretrain/Loss (Raw)": 2.0753440856933594, "Pretrain/Step": 13936, "Pretrain/Step Time": 8.493976969271898} +{"Pretrain/Learning Rate": 8.920014126425777e-06, "Pretrain/Loss": 1.9900689125061035, "Pretrain/Loss (Raw)": 1.9885371923446655, "Pretrain/Step": 13937, "Pretrain/Step Time": 8.495785867795348} +{"Pretrain/Learning Rate": 8.916763840208331e-06, "Pretrain/Loss": 1.9877556562423706, "Pretrain/Loss (Raw)": 1.7862950563430786, "Pretrain/Step": 13938, "Pretrain/Step Time": 8.494617564603686} +{"Pretrain/Learning Rate": 8.913514017739652e-06, "Pretrain/Loss": 1.9885848760604858, "Pretrain/Loss (Raw)": 1.97280752658844, "Pretrain/Step": 13939, "Pretrain/Step Time": 8.496859353035688} +{"Pretrain/Learning Rate": 8.910264659113468e-06, "Pretrain/Loss": 1.989837408065796, "Pretrain/Loss (Raw)": 2.1589815616607666, "Pretrain/Step": 13940, "Pretrain/Step Time": 8.495027991011739} +{"Pretrain/Learning Rate": 8.90701576442345e-06, "Pretrain/Loss": 1.9914281368255615, "Pretrain/Loss (Raw)": 2.058619499206543, "Pretrain/Step": 13941, "Pretrain/Step Time": 8.48985106125474} +{"Pretrain/Learning Rate": 8.903767333763293e-06, "Pretrain/Loss": 1.988885521888733, "Pretrain/Loss (Raw)": 1.928688883781433, "Pretrain/Step": 13942, "Pretrain/Step Time": 8.4916379339993} +{"Pretrain/Learning Rate": 8.900519367226661e-06, "Pretrain/Loss": 1.9850423336029053, "Pretrain/Loss (Raw)": 1.645141839981079, "Pretrain/Step": 13943, "Pretrain/Step Time": 8.493034906685352} +{"Pretrain/Learning Rate": 8.897271864907195e-06, "Pretrain/Loss": 1.9884743690490723, "Pretrain/Loss (Raw)": 2.341175079345703, "Pretrain/Step": 13944, "Pretrain/Step Time": 8.489262014627457} +{"Pretrain/Learning Rate": 8.894024826898551e-06, "Pretrain/Loss": 1.9893271923065186, "Pretrain/Loss (Raw)": 1.9645992517471313, "Pretrain/Step": 13945, "Pretrain/Step Time": 8.495475836098194} +{"Pretrain/Learning Rate": 8.89077825329434e-06, "Pretrain/Loss": 1.9894644021987915, "Pretrain/Loss (Raw)": 2.1763339042663574, "Pretrain/Step": 13946, "Pretrain/Step Time": 8.49865672364831} +{"Pretrain/Learning Rate": 8.887532144188191e-06, "Pretrain/Loss": 1.9886289834976196, "Pretrain/Loss (Raw)": 1.9119466543197632, "Pretrain/Step": 13947, "Pretrain/Step Time": 8.494164124131203} +{"Pretrain/Learning Rate": 8.884286499673691e-06, "Pretrain/Loss": 1.9874966144561768, "Pretrain/Loss (Raw)": 1.7756884098052979, "Pretrain/Step": 13948, "Pretrain/Step Time": 8.493632387369871} +{"Pretrain/Learning Rate": 8.881041319844422e-06, "Pretrain/Loss": 1.9870853424072266, "Pretrain/Loss (Raw)": 1.7356369495391846, "Pretrain/Step": 13949, "Pretrain/Step Time": 8.493188871070743} +{"Pretrain/Learning Rate": 8.87779660479397e-06, "Pretrain/Loss": 1.9869356155395508, "Pretrain/Loss (Raw)": 1.909057378768921, "Pretrain/Step": 13950, "Pretrain/Step Time": 8.491510521620512} +{"Pretrain/Learning Rate": 8.874552354615881e-06, "Pretrain/Loss": 1.9855401515960693, "Pretrain/Loss (Raw)": 1.951136589050293, "Pretrain/Step": 13951, "Pretrain/Step Time": 8.494212545454502} +{"Pretrain/Learning Rate": 8.871308569403716e-06, "Pretrain/Loss": 1.9850448369979858, "Pretrain/Loss (Raw)": 1.8872708082199097, "Pretrain/Step": 13952, "Pretrain/Step Time": 8.50006141141057} +{"Pretrain/Learning Rate": 8.868065249250998e-06, "Pretrain/Loss": 1.9815030097961426, "Pretrain/Loss (Raw)": 1.867808222770691, "Pretrain/Step": 13953, "Pretrain/Step Time": 8.490690354257822} +{"Pretrain/Learning Rate": 8.864822394251238e-06, "Pretrain/Loss": 1.9798280000686646, "Pretrain/Loss (Raw)": 1.6686556339263916, "Pretrain/Step": 13954, "Pretrain/Step Time": 8.491737332195044} +{"Pretrain/Learning Rate": 8.861580004497957e-06, "Pretrain/Loss": 1.9806079864501953, "Pretrain/Loss (Raw)": 2.073535203933716, "Pretrain/Step": 13955, "Pretrain/Step Time": 8.490862675011158} +{"Pretrain/Learning Rate": 8.858338080084633e-06, "Pretrain/Loss": 1.9807722568511963, "Pretrain/Loss (Raw)": 2.033510208129883, "Pretrain/Step": 13956, "Pretrain/Step Time": 8.487842377275229} +{"Pretrain/Learning Rate": 8.855096621104757e-06, "Pretrain/Loss": 1.9838988780975342, "Pretrain/Loss (Raw)": 2.425907850265503, "Pretrain/Step": 13957, "Pretrain/Step Time": 8.485580360516906} +{"Pretrain/Learning Rate": 8.851855627651793e-06, "Pretrain/Loss": 1.9809656143188477, "Pretrain/Loss (Raw)": 1.8085780143737793, "Pretrain/Step": 13958, "Pretrain/Step Time": 8.487005481496453} +{"Pretrain/Learning Rate": 8.848615099819173e-06, "Pretrain/Loss": 1.9808409214019775, "Pretrain/Loss (Raw)": 1.9847553968429565, "Pretrain/Step": 13959, "Pretrain/Step Time": 8.486190410330892} +{"Pretrain/Learning Rate": 8.845375037700366e-06, "Pretrain/Loss": 1.9807820320129395, "Pretrain/Loss (Raw)": 1.9907240867614746, "Pretrain/Step": 13960, "Pretrain/Step Time": 8.48000793904066} +{"Pretrain/Learning Rate": 8.842135441388771e-06, "Pretrain/Loss": 1.9817709922790527, "Pretrain/Loss (Raw)": 2.1831841468811035, "Pretrain/Step": 13961, "Pretrain/Step Time": 8.484548704698682} +{"Pretrain/Learning Rate": 8.838896310977818e-06, "Pretrain/Loss": 1.9819616079330444, "Pretrain/Loss (Raw)": 1.7433927059173584, "Pretrain/Step": 13962, "Pretrain/Step Time": 8.48388822004199} +{"Pretrain/Learning Rate": 8.835657646560896e-06, "Pretrain/Loss": 1.9812616109848022, "Pretrain/Loss (Raw)": 1.8415601253509521, "Pretrain/Step": 13963, "Pretrain/Step Time": 8.483015108853579} +{"Pretrain/Learning Rate": 8.832419448231383e-06, "Pretrain/Loss": 1.9817159175872803, "Pretrain/Loss (Raw)": 2.1303956508636475, "Pretrain/Step": 13964, "Pretrain/Step Time": 8.480948437005281} +{"Pretrain/Learning Rate": 8.829181716082666e-06, "Pretrain/Loss": 1.9828919172286987, "Pretrain/Loss (Raw)": 2.012073516845703, "Pretrain/Step": 13965, "Pretrain/Step Time": 8.478754064068198} +{"Pretrain/Learning Rate": 8.825944450208088e-06, "Pretrain/Loss": 1.9818615913391113, "Pretrain/Loss (Raw)": 1.8718773126602173, "Pretrain/Step": 13966, "Pretrain/Step Time": 8.4769432451576} +{"Pretrain/Learning Rate": 8.822707650701003e-06, "Pretrain/Loss": 1.9806864261627197, "Pretrain/Loss (Raw)": 1.9765892028808594, "Pretrain/Step": 13967, "Pretrain/Step Time": 8.47797967121005} +{"Pretrain/Learning Rate": 8.819471317654746e-06, "Pretrain/Loss": 1.9805681705474854, "Pretrain/Loss (Raw)": 1.865787386894226, "Pretrain/Step": 13968, "Pretrain/Step Time": 8.47368979267776} +{"Pretrain/Learning Rate": 8.816235451162614e-06, "Pretrain/Loss": 1.9829927682876587, "Pretrain/Loss (Raw)": 1.9807699918746948, "Pretrain/Step": 13969, "Pretrain/Step Time": 8.477027768269181} +{"Pretrain/Learning Rate": 8.813000051317932e-06, "Pretrain/Loss": 1.9830801486968994, "Pretrain/Loss (Raw)": 2.0931315422058105, "Pretrain/Step": 13970, "Pretrain/Step Time": 8.475592104718089} +{"Pretrain/Learning Rate": 8.809765118213976e-06, "Pretrain/Loss": 1.983656644821167, "Pretrain/Loss (Raw)": 2.093740224838257, "Pretrain/Step": 13971, "Pretrain/Step Time": 8.475299587473273} +{"Pretrain/Learning Rate": 8.806530651944036e-06, "Pretrain/Loss": 1.9846028089523315, "Pretrain/Loss (Raw)": 2.24118709564209, "Pretrain/Step": 13972, "Pretrain/Step Time": 8.481027299538255} +{"Pretrain/Learning Rate": 8.80329665260137e-06, "Pretrain/Loss": 1.985342025756836, "Pretrain/Loss (Raw)": 1.907646656036377, "Pretrain/Step": 13973, "Pretrain/Step Time": 8.476484650745988} +{"Pretrain/Learning Rate": 8.80006312027922e-06, "Pretrain/Loss": 1.9882941246032715, "Pretrain/Loss (Raw)": 2.2885842323303223, "Pretrain/Step": 13974, "Pretrain/Step Time": 8.476459922268987} +{"Pretrain/Learning Rate": 8.796830055070837e-06, "Pretrain/Loss": 1.9896209239959717, "Pretrain/Loss (Raw)": 1.942972183227539, "Pretrain/Step": 13975, "Pretrain/Step Time": 8.476765591651201} +{"Pretrain/Learning Rate": 8.793597457069427e-06, "Pretrain/Loss": 1.9885740280151367, "Pretrain/Loss (Raw)": 1.944601058959961, "Pretrain/Step": 13976, "Pretrain/Step Time": 8.469978414475918} +{"Pretrain/Learning Rate": 8.790365326368223e-06, "Pretrain/Loss": 1.9838557243347168, "Pretrain/Loss (Raw)": 1.7906371355056763, "Pretrain/Step": 13977, "Pretrain/Step Time": 8.471505854278803} +{"Pretrain/Learning Rate": 8.787133663060401e-06, "Pretrain/Loss": 1.9857008457183838, "Pretrain/Loss (Raw)": 1.930899977684021, "Pretrain/Step": 13978, "Pretrain/Step Time": 8.470051296055317} +{"Pretrain/Learning Rate": 8.783902467239147e-06, "Pretrain/Loss": 1.9860050678253174, "Pretrain/Loss (Raw)": 1.8678205013275146, "Pretrain/Step": 13979, "Pretrain/Step Time": 8.469780568033457} +{"Pretrain/Learning Rate": 8.78067173899764e-06, "Pretrain/Loss": 1.9891983270645142, "Pretrain/Loss (Raw)": 2.1076693534851074, "Pretrain/Step": 13980, "Pretrain/Step Time": 8.469204913824797} +{"Pretrain/Learning Rate": 8.777441478429022e-06, "Pretrain/Loss": 1.987118124961853, "Pretrain/Loss (Raw)": 1.8713501691818237, "Pretrain/Step": 13981, "Pretrain/Step Time": 8.467358078807592} +{"Pretrain/Learning Rate": 8.774211685626448e-06, "Pretrain/Loss": 1.9870672225952148, "Pretrain/Loss (Raw)": 1.9761300086975098, "Pretrain/Step": 13982, "Pretrain/Step Time": 8.465486973524094} +{"Pretrain/Learning Rate": 8.770982360683046e-06, "Pretrain/Loss": 1.9884555339813232, "Pretrain/Loss (Raw)": 2.053682565689087, "Pretrain/Step": 13983, "Pretrain/Step Time": 8.465191714465618} +{"Pretrain/Learning Rate": 8.767753503691917e-06, "Pretrain/Loss": 1.9875035285949707, "Pretrain/Loss (Raw)": 1.7750701904296875, "Pretrain/Step": 13984, "Pretrain/Step Time": 8.464640570804477} +{"Pretrain/Learning Rate": 8.76452511474618e-06, "Pretrain/Loss": 1.9897059202194214, "Pretrain/Loss (Raw)": 2.0298759937286377, "Pretrain/Step": 13985, "Pretrain/Step Time": 8.462105123326182} +{"Pretrain/Learning Rate": 8.761297193938919e-06, "Pretrain/Loss": 1.991390347480774, "Pretrain/Loss (Raw)": 2.089242696762085, "Pretrain/Step": 13986, "Pretrain/Step Time": 8.460991956293583} +{"Pretrain/Learning Rate": 8.758069741363204e-06, "Pretrain/Loss": 1.99423086643219, "Pretrain/Loss (Raw)": 2.3873519897460938, "Pretrain/Step": 13987, "Pretrain/Step Time": 8.460512207821012} +{"Pretrain/Learning Rate": 8.754842757112088e-06, "Pretrain/Loss": 1.995078206062317, "Pretrain/Loss (Raw)": 2.029428005218506, "Pretrain/Step": 13988, "Pretrain/Step Time": 8.4661430940032} +{"Pretrain/Learning Rate": 8.751616241278641e-06, "Pretrain/Loss": 1.9944480657577515, "Pretrain/Loss (Raw)": 2.0328001976013184, "Pretrain/Step": 13989, "Pretrain/Step Time": 8.467344945296645} +{"Pretrain/Learning Rate": 8.748390193955874e-06, "Pretrain/Loss": 1.996974229812622, "Pretrain/Loss (Raw)": 2.210693120956421, "Pretrain/Step": 13990, "Pretrain/Step Time": 8.46179098263383} +{"Pretrain/Learning Rate": 8.745164615236832e-06, "Pretrain/Loss": 1.998223066329956, "Pretrain/Loss (Raw)": 2.019364595413208, "Pretrain/Step": 13991, "Pretrain/Step Time": 8.466531321406364} +{"Pretrain/Learning Rate": 8.741939505214506e-06, "Pretrain/Loss": 1.995162010192871, "Pretrain/Loss (Raw)": 1.6508222818374634, "Pretrain/Step": 13992, "Pretrain/Step Time": 8.461922101676464} +{"Pretrain/Learning Rate": 8.738714863981883e-06, "Pretrain/Loss": 1.9955387115478516, "Pretrain/Loss (Raw)": 2.080890417098999, "Pretrain/Step": 13993, "Pretrain/Step Time": 8.465896664187312} +{"Pretrain/Learning Rate": 8.735490691631965e-06, "Pretrain/Loss": 1.9934983253479004, "Pretrain/Loss (Raw)": 1.948425531387329, "Pretrain/Step": 13994, "Pretrain/Step Time": 8.470134621486068} +{"Pretrain/Learning Rate": 8.732266988257695e-06, "Pretrain/Loss": 1.997236967086792, "Pretrain/Loss (Raw)": 2.443966865539551, "Pretrain/Step": 13995, "Pretrain/Step Time": 8.470323136076331} +{"Pretrain/Learning Rate": 8.729043753952051e-06, "Pretrain/Loss": 1.998199462890625, "Pretrain/Loss (Raw)": 2.1271893978118896, "Pretrain/Step": 13996, "Pretrain/Step Time": 8.46942520327866} +{"Pretrain/Learning Rate": 8.725820988807958e-06, "Pretrain/Loss": 1.998471736907959, "Pretrain/Loss (Raw)": 1.872580885887146, "Pretrain/Step": 13997, "Pretrain/Step Time": 8.468469114974141} +{"Pretrain/Learning Rate": 8.722598692918335e-06, "Pretrain/Loss": 1.9969465732574463, "Pretrain/Loss (Raw)": 1.875063419342041, "Pretrain/Step": 13998, "Pretrain/Step Time": 8.468322364613414} +{"Pretrain/Learning Rate": 8.719376866376114e-06, "Pretrain/Loss": 1.9959008693695068, "Pretrain/Loss (Raw)": 2.0189409255981445, "Pretrain/Step": 13999, "Pretrain/Step Time": 8.46974466368556} +{"Pretrain/Learning Rate": 8.716155509274177e-06, "Pretrain/Loss": 1.9959638118743896, "Pretrain/Loss (Raw)": 2.1296329498291016, "Pretrain/Step": 14000, "Pretrain/Step Time": 8.469994738698006} +{"Pretrain/Learning Rate": 8.712934621705421e-06, "Pretrain/Loss": 1.9928957223892212, "Pretrain/Loss (Raw)": 1.6040704250335693, "Pretrain/Step": 14001, "Pretrain/Step Time": 8.46631241030991} +{"Pretrain/Learning Rate": 8.709714203762717e-06, "Pretrain/Loss": 1.9954254627227783, "Pretrain/Loss (Raw)": 1.9900039434432983, "Pretrain/Step": 14002, "Pretrain/Step Time": 8.464641734957695} +{"Pretrain/Learning Rate": 8.70649425553891e-06, "Pretrain/Loss": 1.9956927299499512, "Pretrain/Loss (Raw)": 1.9294803142547607, "Pretrain/Step": 14003, "Pretrain/Step Time": 8.465380724519491} +{"Pretrain/Learning Rate": 8.703274777126863e-06, "Pretrain/Loss": 1.9936959743499756, "Pretrain/Loss (Raw)": 1.8713691234588623, "Pretrain/Step": 14004, "Pretrain/Step Time": 8.465673565864563} +{"Pretrain/Learning Rate": 8.700055768619392e-06, "Pretrain/Loss": 1.9938359260559082, "Pretrain/Loss (Raw)": 1.9057692289352417, "Pretrain/Step": 14005, "Pretrain/Step Time": 8.463086614385247} +{"Pretrain/Learning Rate": 8.696837230109332e-06, "Pretrain/Loss": 1.9932479858398438, "Pretrain/Loss (Raw)": 2.000603675842285, "Pretrain/Step": 14006, "Pretrain/Step Time": 8.465828092768788} +{"Pretrain/Learning Rate": 8.693619161689473e-06, "Pretrain/Loss": 1.995073676109314, "Pretrain/Loss (Raw)": 2.2408785820007324, "Pretrain/Step": 14007, "Pretrain/Step Time": 8.45937523059547} +{"Pretrain/Learning Rate": 8.690401563452605e-06, "Pretrain/Loss": 1.9951785802841187, "Pretrain/Loss (Raw)": 1.9914833307266235, "Pretrain/Step": 14008, "Pretrain/Step Time": 8.45614280179143} +{"Pretrain/Learning Rate": 8.687184435491519e-06, "Pretrain/Loss": 1.995759129524231, "Pretrain/Loss (Raw)": 1.7360520362854004, "Pretrain/Step": 14009, "Pretrain/Step Time": 8.462360732257366} +{"Pretrain/Learning Rate": 8.68396777789896e-06, "Pretrain/Loss": 1.993544101715088, "Pretrain/Loss (Raw)": 2.1628410816192627, "Pretrain/Step": 14010, "Pretrain/Step Time": 8.467167479917407} +{"Pretrain/Learning Rate": 8.680751590767699e-06, "Pretrain/Loss": 1.9931658506393433, "Pretrain/Loss (Raw)": 1.969539999961853, "Pretrain/Step": 14011, "Pretrain/Step Time": 8.464306991547346} +{"Pretrain/Learning Rate": 8.67753587419046e-06, "Pretrain/Loss": 1.9886796474456787, "Pretrain/Loss (Raw)": 1.8503698110580444, "Pretrain/Step": 14012, "Pretrain/Step Time": 8.46549261175096} +{"Pretrain/Learning Rate": 8.674320628259957e-06, "Pretrain/Loss": 1.9868862628936768, "Pretrain/Loss (Raw)": 1.8778496980667114, "Pretrain/Step": 14013, "Pretrain/Step Time": 8.465279957279563} +{"Pretrain/Learning Rate": 8.671105853068922e-06, "Pretrain/Loss": 1.986364722251892, "Pretrain/Loss (Raw)": 1.925384283065796, "Pretrain/Step": 14014, "Pretrain/Step Time": 8.462448569014668} +{"Pretrain/Learning Rate": 8.667891548710028e-06, "Pretrain/Loss": 1.9857128858566284, "Pretrain/Loss (Raw)": 2.0196433067321777, "Pretrain/Step": 14015, "Pretrain/Step Time": 8.4657989628613} +{"Pretrain/Learning Rate": 8.664677715275977e-06, "Pretrain/Loss": 1.9857593774795532, "Pretrain/Loss (Raw)": 2.2288098335266113, "Pretrain/Step": 14016, "Pretrain/Step Time": 8.459798304364085} +{"Pretrain/Learning Rate": 8.661464352859428e-06, "Pretrain/Loss": 1.9869266748428345, "Pretrain/Loss (Raw)": 2.089242696762085, "Pretrain/Step": 14017, "Pretrain/Step Time": 8.456093143671751} +{"Pretrain/Learning Rate": 8.65825146155303e-06, "Pretrain/Loss": 1.9889373779296875, "Pretrain/Loss (Raw)": 2.060863494873047, "Pretrain/Step": 14018, "Pretrain/Step Time": 8.459091244265437} +{"Pretrain/Learning Rate": 8.655039041449436e-06, "Pretrain/Loss": 1.989380955696106, "Pretrain/Loss (Raw)": 2.0121588706970215, "Pretrain/Step": 14019, "Pretrain/Step Time": 8.455457279458642} +{"Pretrain/Learning Rate": 8.651827092641262e-06, "Pretrain/Loss": 1.9872944355010986, "Pretrain/Loss (Raw)": 1.8246089220046997, "Pretrain/Step": 14020, "Pretrain/Step Time": 8.460340993478894} +{"Pretrain/Learning Rate": 8.648615615221138e-06, "Pretrain/Loss": 1.9868526458740234, "Pretrain/Loss (Raw)": 2.075713872909546, "Pretrain/Step": 14021, "Pretrain/Step Time": 8.463151402771473} +{"Pretrain/Learning Rate": 8.645404609281654e-06, "Pretrain/Loss": 1.9864776134490967, "Pretrain/Loss (Raw)": 2.1688899993896484, "Pretrain/Step": 14022, "Pretrain/Step Time": 8.460858723148704} +{"Pretrain/Learning Rate": 8.64219407491539e-06, "Pretrain/Loss": 1.9888559579849243, "Pretrain/Loss (Raw)": 2.2279715538024902, "Pretrain/Step": 14023, "Pretrain/Step Time": 8.455545354634523} +{"Pretrain/Learning Rate": 8.63898401221494e-06, "Pretrain/Loss": 1.9858087301254272, "Pretrain/Loss (Raw)": 1.869032382965088, "Pretrain/Step": 14024, "Pretrain/Step Time": 8.458510380238295} +{"Pretrain/Learning Rate": 8.635774421272844e-06, "Pretrain/Loss": 1.9837040901184082, "Pretrain/Loss (Raw)": 1.896752953529358, "Pretrain/Step": 14025, "Pretrain/Step Time": 8.449688270688057} +{"Pretrain/Learning Rate": 8.632565302181664e-06, "Pretrain/Loss": 1.9813306331634521, "Pretrain/Loss (Raw)": 1.8178855180740356, "Pretrain/Step": 14026, "Pretrain/Step Time": 8.452587995678186} +{"Pretrain/Learning Rate": 8.629356655033924e-06, "Pretrain/Loss": 1.9817200899124146, "Pretrain/Loss (Raw)": 1.908058524131775, "Pretrain/Step": 14027, "Pretrain/Step Time": 8.457614349201322} +{"Pretrain/Learning Rate": 8.626148479922136e-06, "Pretrain/Loss": 1.9830008745193481, "Pretrain/Loss (Raw)": 2.2182905673980713, "Pretrain/Step": 14028, "Pretrain/Step Time": 8.457398986443877} +{"Pretrain/Learning Rate": 8.622940776938824e-06, "Pretrain/Loss": 1.982271671295166, "Pretrain/Loss (Raw)": 2.036607503890991, "Pretrain/Step": 14029, "Pretrain/Step Time": 8.457045273855329} +{"Pretrain/Learning Rate": 8.619733546176458e-06, "Pretrain/Loss": 1.9826078414916992, "Pretrain/Loss (Raw)": 2.022420644760132, "Pretrain/Step": 14030, "Pretrain/Step Time": 8.45678373426199} +{"Pretrain/Learning Rate": 8.616526787727538e-06, "Pretrain/Loss": 1.984673023223877, "Pretrain/Loss (Raw)": 1.8643707036972046, "Pretrain/Step": 14031, "Pretrain/Step Time": 8.451892152428627} +{"Pretrain/Learning Rate": 8.613320501684519e-06, "Pretrain/Loss": 1.9841820001602173, "Pretrain/Loss (Raw)": 1.8724299669265747, "Pretrain/Step": 14032, "Pretrain/Step Time": 8.448581581935287} +{"Pretrain/Learning Rate": 8.610114688139842e-06, "Pretrain/Loss": 1.9861061573028564, "Pretrain/Loss (Raw)": 2.1379501819610596, "Pretrain/Step": 14033, "Pretrain/Step Time": 8.45148585550487} +{"Pretrain/Learning Rate": 8.606909347185963e-06, "Pretrain/Loss": 1.9862991571426392, "Pretrain/Loss (Raw)": 1.9923452138900757, "Pretrain/Step": 14034, "Pretrain/Step Time": 8.451593892648816} +{"Pretrain/Learning Rate": 8.60370447891529e-06, "Pretrain/Loss": 1.9858161211013794, "Pretrain/Loss (Raw)": 1.9339442253112793, "Pretrain/Step": 14035, "Pretrain/Step Time": 8.451098522171378} +{"Pretrain/Learning Rate": 8.600500083420243e-06, "Pretrain/Loss": 1.9877820014953613, "Pretrain/Loss (Raw)": 1.9905718564987183, "Pretrain/Step": 14036, "Pretrain/Step Time": 8.451044416055083} +{"Pretrain/Learning Rate": 8.597296160793219e-06, "Pretrain/Loss": 1.9897785186767578, "Pretrain/Loss (Raw)": 1.9609774351119995, "Pretrain/Step": 14037, "Pretrain/Step Time": 8.454770198091865} +{"Pretrain/Learning Rate": 8.594092711126588e-06, "Pretrain/Loss": 1.9905726909637451, "Pretrain/Loss (Raw)": 1.9641761779785156, "Pretrain/Step": 14038, "Pretrain/Step Time": 8.451187258586287} +{"Pretrain/Learning Rate": 8.590889734512739e-06, "Pretrain/Loss": 1.992513656616211, "Pretrain/Loss (Raw)": 2.194658041000366, "Pretrain/Step": 14039, "Pretrain/Step Time": 8.448514632880688} +{"Pretrain/Learning Rate": 8.587687231044007e-06, "Pretrain/Loss": 1.9918017387390137, "Pretrain/Loss (Raw)": 1.8935668468475342, "Pretrain/Step": 14040, "Pretrain/Step Time": 8.44415608793497} +{"Pretrain/Learning Rate": 8.58448520081275e-06, "Pretrain/Loss": 1.9902024269104004, "Pretrain/Loss (Raw)": 2.089956760406494, "Pretrain/Step": 14041, "Pretrain/Step Time": 8.442172652110457} +{"Pretrain/Learning Rate": 8.58128364391129e-06, "Pretrain/Loss": 1.988114833831787, "Pretrain/Loss (Raw)": 1.9237524271011353, "Pretrain/Step": 14042, "Pretrain/Step Time": 8.440948547795415} +{"Pretrain/Learning Rate": 8.578082560431935e-06, "Pretrain/Loss": 1.9891316890716553, "Pretrain/Loss (Raw)": 2.040060520172119, "Pretrain/Step": 14043, "Pretrain/Step Time": 8.439897349104285} +{"Pretrain/Learning Rate": 8.574881950467001e-06, "Pretrain/Loss": 1.98689866065979, "Pretrain/Loss (Raw)": 1.8261497020721436, "Pretrain/Step": 14044, "Pretrain/Step Time": 8.444872004911304} +{"Pretrain/Learning Rate": 8.571681814108759e-06, "Pretrain/Loss": 1.986946940422058, "Pretrain/Loss (Raw)": 2.0000147819519043, "Pretrain/Step": 14045, "Pretrain/Step Time": 8.447285238653421} +{"Pretrain/Learning Rate": 8.568482151449498e-06, "Pretrain/Loss": 1.9871971607208252, "Pretrain/Loss (Raw)": 2.017205238342285, "Pretrain/Step": 14046, "Pretrain/Step Time": 8.443529361858964} +{"Pretrain/Learning Rate": 8.565282962581472e-06, "Pretrain/Loss": 1.9871668815612793, "Pretrain/Loss (Raw)": 2.0404393672943115, "Pretrain/Step": 14047, "Pretrain/Step Time": 8.446343587711453} +{"Pretrain/Learning Rate": 8.562084247596916e-06, "Pretrain/Loss": 1.988901138305664, "Pretrain/Loss (Raw)": 2.3904051780700684, "Pretrain/Step": 14048, "Pretrain/Step Time": 8.44383572973311} +{"Pretrain/Learning Rate": 8.558886006588082e-06, "Pretrain/Loss": 1.98857581615448, "Pretrain/Loss (Raw)": 1.8435146808624268, "Pretrain/Step": 14049, "Pretrain/Step Time": 8.442944049835205} +{"Pretrain/Learning Rate": 8.555688239647172e-06, "Pretrain/Loss": 1.9908716678619385, "Pretrain/Loss (Raw)": 2.2222092151641846, "Pretrain/Step": 14050, "Pretrain/Step Time": 8.439517686143517} +{"Pretrain/Learning Rate": 8.552490946866406e-06, "Pretrain/Loss": 1.9904489517211914, "Pretrain/Loss (Raw)": 2.0140011310577393, "Pretrain/Step": 14051, "Pretrain/Step Time": 8.441661182790995} +{"Pretrain/Learning Rate": 8.549294128337961e-06, "Pretrain/Loss": 1.9878793954849243, "Pretrain/Loss (Raw)": 1.7159438133239746, "Pretrain/Step": 14052, "Pretrain/Step Time": 8.442470232024789} +{"Pretrain/Learning Rate": 8.546097784154034e-06, "Pretrain/Loss": 1.9903405904769897, "Pretrain/Loss (Raw)": 2.167144775390625, "Pretrain/Step": 14053, "Pretrain/Step Time": 8.440001526847482} +{"Pretrain/Learning Rate": 8.542901914406773e-06, "Pretrain/Loss": 1.9874122142791748, "Pretrain/Loss (Raw)": 1.9422475099563599, "Pretrain/Step": 14054, "Pretrain/Step Time": 8.43949775584042} +{"Pretrain/Learning Rate": 8.539706519188329e-06, "Pretrain/Loss": 1.9891915321350098, "Pretrain/Loss (Raw)": 2.013000011444092, "Pretrain/Step": 14055, "Pretrain/Step Time": 8.43756559304893} +{"Pretrain/Learning Rate": 8.536511598590852e-06, "Pretrain/Loss": 1.991513967514038, "Pretrain/Loss (Raw)": 2.226135015487671, "Pretrain/Step": 14056, "Pretrain/Step Time": 8.436307666823268} +{"Pretrain/Learning Rate": 8.533317152706447e-06, "Pretrain/Loss": 1.9937891960144043, "Pretrain/Loss (Raw)": 1.9188679456710815, "Pretrain/Step": 14057, "Pretrain/Step Time": 8.429822539910674} +{"Pretrain/Learning Rate": 8.530123181627245e-06, "Pretrain/Loss": 1.9925179481506348, "Pretrain/Loss (Raw)": 1.8372846841812134, "Pretrain/Step": 14058, "Pretrain/Step Time": 8.434238661080599} +{"Pretrain/Learning Rate": 8.526929685445328e-06, "Pretrain/Loss": 1.9943280220031738, "Pretrain/Loss (Raw)": 2.0961740016937256, "Pretrain/Step": 14059, "Pretrain/Step Time": 8.438275655731559} +{"Pretrain/Learning Rate": 8.523736664252771e-06, "Pretrain/Loss": 1.9947773218154907, "Pretrain/Loss (Raw)": 1.9930559396743774, "Pretrain/Step": 14060, "Pretrain/Step Time": 8.4365258757025} +{"Pretrain/Learning Rate": 8.520544118141663e-06, "Pretrain/Loss": 1.9941916465759277, "Pretrain/Loss (Raw)": 1.9141303300857544, "Pretrain/Step": 14061, "Pretrain/Step Time": 8.437841191887856} +{"Pretrain/Learning Rate": 8.517352047204041e-06, "Pretrain/Loss": 1.9935734272003174, "Pretrain/Loss (Raw)": 1.9668980836868286, "Pretrain/Step": 14062, "Pretrain/Step Time": 8.439621141180396} +{"Pretrain/Learning Rate": 8.514160451531957e-06, "Pretrain/Loss": 1.9930119514465332, "Pretrain/Loss (Raw)": 2.0115442276000977, "Pretrain/Step": 14063, "Pretrain/Step Time": 8.43881930038333} +{"Pretrain/Learning Rate": 8.510969331217439e-06, "Pretrain/Loss": 1.9926849603652954, "Pretrain/Loss (Raw)": 2.0334906578063965, "Pretrain/Step": 14064, "Pretrain/Step Time": 8.436857342720032} +{"Pretrain/Learning Rate": 8.507778686352488e-06, "Pretrain/Loss": 1.9919861555099487, "Pretrain/Loss (Raw)": 1.8990824222564697, "Pretrain/Step": 14065, "Pretrain/Step Time": 8.432468883693218} +{"Pretrain/Learning Rate": 8.50458851702912e-06, "Pretrain/Loss": 1.9936507940292358, "Pretrain/Loss (Raw)": 1.9993653297424316, "Pretrain/Step": 14066, "Pretrain/Step Time": 8.426207294687629} +{"Pretrain/Learning Rate": 8.501398823339304e-06, "Pretrain/Loss": 1.9943268299102783, "Pretrain/Loss (Raw)": 2.0593531131744385, "Pretrain/Step": 14067, "Pretrain/Step Time": 8.431157881394029} +{"Pretrain/Learning Rate": 8.498209605375029e-06, "Pretrain/Loss": 1.9919698238372803, "Pretrain/Loss (Raw)": 1.8572938442230225, "Pretrain/Step": 14068, "Pretrain/Step Time": 8.43348179012537} +{"Pretrain/Learning Rate": 8.49502086322825e-06, "Pretrain/Loss": 1.9912896156311035, "Pretrain/Loss (Raw)": 1.971534252166748, "Pretrain/Step": 14069, "Pretrain/Step Time": 8.432350035756826} +{"Pretrain/Learning Rate": 8.49183259699091e-06, "Pretrain/Loss": 1.991834282875061, "Pretrain/Loss (Raw)": 1.9984065294265747, "Pretrain/Step": 14070, "Pretrain/Step Time": 8.433047287166119} +{"Pretrain/Learning Rate": 8.488644806754936e-06, "Pretrain/Loss": 1.9937914609909058, "Pretrain/Loss (Raw)": 1.8956706523895264, "Pretrain/Step": 14071, "Pretrain/Step Time": 8.43130512163043} +{"Pretrain/Learning Rate": 8.485457492612242e-06, "Pretrain/Loss": 1.9918732643127441, "Pretrain/Loss (Raw)": 2.095637798309326, "Pretrain/Step": 14072, "Pretrain/Step Time": 8.429133731871843} +{"Pretrain/Learning Rate": 8.482270654654751e-06, "Pretrain/Loss": 1.9917092323303223, "Pretrain/Loss (Raw)": 1.943607211112976, "Pretrain/Step": 14073, "Pretrain/Step Time": 8.426996361464262} +{"Pretrain/Learning Rate": 8.479084292974328e-06, "Pretrain/Loss": 1.9897350072860718, "Pretrain/Loss (Raw)": 1.92362642288208, "Pretrain/Step": 14074, "Pretrain/Step Time": 8.42439641058445} +{"Pretrain/Learning Rate": 8.475898407662874e-06, "Pretrain/Loss": 1.9906730651855469, "Pretrain/Loss (Raw)": 2.0320231914520264, "Pretrain/Step": 14075, "Pretrain/Step Time": 8.424997353926301} +{"Pretrain/Learning Rate": 8.472712998812241e-06, "Pretrain/Loss": 1.9927749633789062, "Pretrain/Loss (Raw)": 2.044724941253662, "Pretrain/Step": 14076, "Pretrain/Step Time": 8.428915686905384} +{"Pretrain/Learning Rate": 8.469528066514268e-06, "Pretrain/Loss": 1.994910717010498, "Pretrain/Loss (Raw)": 2.009016990661621, "Pretrain/Step": 14077, "Pretrain/Step Time": 8.424808010458946} +{"Pretrain/Learning Rate": 8.466343610860808e-06, "Pretrain/Loss": 1.996996283531189, "Pretrain/Loss (Raw)": 2.176018238067627, "Pretrain/Step": 14078, "Pretrain/Step Time": 8.429325196892023} +{"Pretrain/Learning Rate": 8.463159631943669e-06, "Pretrain/Loss": 1.9981553554534912, "Pretrain/Loss (Raw)": 2.0994908809661865, "Pretrain/Step": 14079, "Pretrain/Step Time": 8.42639534920454} +{"Pretrain/Learning Rate": 8.459976129854669e-06, "Pretrain/Loss": 1.9994845390319824, "Pretrain/Loss (Raw)": 2.0574114322662354, "Pretrain/Step": 14080, "Pretrain/Step Time": 8.42699883505702} +{"Pretrain/Learning Rate": 8.4567931046856e-06, "Pretrain/Loss": 2.0038199424743652, "Pretrain/Loss (Raw)": 2.4227423667907715, "Pretrain/Step": 14081, "Pretrain/Step Time": 8.428287353366613} +{"Pretrain/Learning Rate": 8.45361055652823e-06, "Pretrain/Loss": 2.0071163177490234, "Pretrain/Loss (Raw)": 2.0906009674072266, "Pretrain/Step": 14082, "Pretrain/Step Time": 8.429943736642599} +{"Pretrain/Learning Rate": 8.450428485474346e-06, "Pretrain/Loss": 2.007009267807007, "Pretrain/Loss (Raw)": 2.059826135635376, "Pretrain/Step": 14083, "Pretrain/Step Time": 8.428841991350055} +{"Pretrain/Learning Rate": 8.44724689161568e-06, "Pretrain/Loss": 2.0060999393463135, "Pretrain/Loss (Raw)": 1.917110800743103, "Pretrain/Step": 14084, "Pretrain/Step Time": 8.436914952471852} +{"Pretrain/Learning Rate": 8.444065775043988e-06, "Pretrain/Loss": 2.003183364868164, "Pretrain/Loss (Raw)": 2.052586793899536, "Pretrain/Step": 14085, "Pretrain/Step Time": 8.441285068169236} +{"Pretrain/Learning Rate": 8.440885135850988e-06, "Pretrain/Loss": 2.0043461322784424, "Pretrain/Loss (Raw)": 1.957411289215088, "Pretrain/Step": 14086, "Pretrain/Step Time": 8.438580609858036} +{"Pretrain/Learning Rate": 8.437704974128386e-06, "Pretrain/Loss": 2.0050909519195557, "Pretrain/Loss (Raw)": 2.080104351043701, "Pretrain/Step": 14087, "Pretrain/Step Time": 8.438828205689788} +{"Pretrain/Learning Rate": 8.43452528996789e-06, "Pretrain/Loss": 2.004899263381958, "Pretrain/Loss (Raw)": 1.9661837816238403, "Pretrain/Step": 14088, "Pretrain/Step Time": 8.441683804616332} +{"Pretrain/Learning Rate": 8.431346083461174e-06, "Pretrain/Loss": 2.0041728019714355, "Pretrain/Loss (Raw)": 2.090169668197632, "Pretrain/Step": 14089, "Pretrain/Step Time": 8.439258916303515} +{"Pretrain/Learning Rate": 8.42816735469992e-06, "Pretrain/Loss": 2.004720687866211, "Pretrain/Loss (Raw)": 1.8135372400283813, "Pretrain/Step": 14090, "Pretrain/Step Time": 8.438329368829727} +{"Pretrain/Learning Rate": 8.42498910377578e-06, "Pretrain/Loss": 2.0058345794677734, "Pretrain/Loss (Raw)": 1.9841411113739014, "Pretrain/Step": 14091, "Pretrain/Step Time": 8.437566293403506} +{"Pretrain/Learning Rate": 8.421811330780386e-06, "Pretrain/Loss": 2.002915143966675, "Pretrain/Loss (Raw)": 1.756711483001709, "Pretrain/Step": 14092, "Pretrain/Step Time": 8.446858471259475} +{"Pretrain/Learning Rate": 8.418634035805384e-06, "Pretrain/Loss": 2.002462863922119, "Pretrain/Loss (Raw)": 1.954176664352417, "Pretrain/Step": 14093, "Pretrain/Step Time": 8.441689336672425} +{"Pretrain/Learning Rate": 8.415457218942372e-06, "Pretrain/Loss": 2.004002571105957, "Pretrain/Loss (Raw)": 2.0689618587493896, "Pretrain/Step": 14094, "Pretrain/Step Time": 8.442111479118466} +{"Pretrain/Learning Rate": 8.412280880282966e-06, "Pretrain/Loss": 2.0039796829223633, "Pretrain/Loss (Raw)": 1.9736396074295044, "Pretrain/Step": 14095, "Pretrain/Step Time": 8.44209017418325} +{"Pretrain/Learning Rate": 8.409105019918748e-06, "Pretrain/Loss": 2.0056676864624023, "Pretrain/Loss (Raw)": 2.081861734390259, "Pretrain/Step": 14096, "Pretrain/Step Time": 8.442962367087603} +{"Pretrain/Learning Rate": 8.405929637941285e-06, "Pretrain/Loss": 2.005049705505371, "Pretrain/Loss (Raw)": 1.901652455329895, "Pretrain/Step": 14097, "Pretrain/Step Time": 8.435766527429223} +{"Pretrain/Learning Rate": 8.402754734442148e-06, "Pretrain/Loss": 2.0029568672180176, "Pretrain/Loss (Raw)": 1.825269341468811, "Pretrain/Step": 14098, "Pretrain/Step Time": 8.441307976841927} +{"Pretrain/Learning Rate": 8.39958030951287e-06, "Pretrain/Loss": 2.0028252601623535, "Pretrain/Loss (Raw)": 2.076897621154785, "Pretrain/Step": 14099, "Pretrain/Step Time": 8.442415652796626} +{"Pretrain/Learning Rate": 8.396406363245002e-06, "Pretrain/Loss": 2.0007152557373047, "Pretrain/Loss (Raw)": 1.9710917472839355, "Pretrain/Step": 14100, "Pretrain/Step Time": 8.438286671414971} +{"Pretrain/Learning Rate": 8.39323289573005e-06, "Pretrain/Loss": 2.0021510124206543, "Pretrain/Loss (Raw)": 2.0914478302001953, "Pretrain/Step": 14101, "Pretrain/Step Time": 8.445530839264393} +{"Pretrain/Learning Rate": 8.390059907059512e-06, "Pretrain/Loss": 1.9993741512298584, "Pretrain/Loss (Raw)": 1.9331486225128174, "Pretrain/Step": 14102, "Pretrain/Step Time": 8.446603870019317} +{"Pretrain/Learning Rate": 8.386887397324897e-06, "Pretrain/Loss": 2.0007925033569336, "Pretrain/Loss (Raw)": 2.1245131492614746, "Pretrain/Step": 14103, "Pretrain/Step Time": 8.445704016834497} +{"Pretrain/Learning Rate": 8.383715366617662e-06, "Pretrain/Loss": 2.0012166500091553, "Pretrain/Loss (Raw)": 1.998900055885315, "Pretrain/Step": 14104, "Pretrain/Step Time": 8.444060640409589} +{"Pretrain/Learning Rate": 8.380543815029291e-06, "Pretrain/Loss": 2.0010886192321777, "Pretrain/Loss (Raw)": 1.7742488384246826, "Pretrain/Step": 14105, "Pretrain/Step Time": 8.447588078677654} +{"Pretrain/Learning Rate": 8.377372742651221e-06, "Pretrain/Loss": 2.0009915828704834, "Pretrain/Loss (Raw)": 1.9184807538986206, "Pretrain/Step": 14106, "Pretrain/Step Time": 8.446151923388243} +{"Pretrain/Learning Rate": 8.374202149574884e-06, "Pretrain/Loss": 2.0020861625671387, "Pretrain/Loss (Raw)": 2.0078957080841064, "Pretrain/Step": 14107, "Pretrain/Step Time": 8.448630956932902} +{"Pretrain/Learning Rate": 8.371032035891716e-06, "Pretrain/Loss": 1.9978957176208496, "Pretrain/Loss (Raw)": 1.571298599243164, "Pretrain/Step": 14108, "Pretrain/Step Time": 8.44958596676588} +{"Pretrain/Learning Rate": 8.367862401693104e-06, "Pretrain/Loss": 1.9983484745025635, "Pretrain/Loss (Raw)": 1.929327130317688, "Pretrain/Step": 14109, "Pretrain/Step Time": 8.450464500114322} +{"Pretrain/Learning Rate": 8.364693247070468e-06, "Pretrain/Loss": 1.9996243715286255, "Pretrain/Loss (Raw)": 2.139432191848755, "Pretrain/Step": 14110, "Pretrain/Step Time": 8.451486896723509} +{"Pretrain/Learning Rate": 8.361524572115174e-06, "Pretrain/Loss": 1.9986793994903564, "Pretrain/Loss (Raw)": 1.932715892791748, "Pretrain/Step": 14111, "Pretrain/Step Time": 8.446709556505084} +{"Pretrain/Learning Rate": 8.35835637691858e-06, "Pretrain/Loss": 2.0009708404541016, "Pretrain/Loss (Raw)": 2.068358898162842, "Pretrain/Step": 14112, "Pretrain/Step Time": 8.45115908794105} +{"Pretrain/Learning Rate": 8.355188661572056e-06, "Pretrain/Loss": 1.9996297359466553, "Pretrain/Loss (Raw)": 1.858247995376587, "Pretrain/Step": 14113, "Pretrain/Step Time": 8.451988223940134} +{"Pretrain/Learning Rate": 8.352021426166926e-06, "Pretrain/Loss": 1.999830961227417, "Pretrain/Loss (Raw)": 2.1149978637695312, "Pretrain/Step": 14114, "Pretrain/Step Time": 8.453118279576302} +{"Pretrain/Learning Rate": 8.348854670794532e-06, "Pretrain/Loss": 1.995978832244873, "Pretrain/Loss (Raw)": 1.8942654132843018, "Pretrain/Step": 14115, "Pretrain/Step Time": 8.455399829894304} +{"Pretrain/Learning Rate": 8.345688395546164e-06, "Pretrain/Loss": 1.9965741634368896, "Pretrain/Loss (Raw)": 2.1056385040283203, "Pretrain/Step": 14116, "Pretrain/Step Time": 8.453374212607741} +{"Pretrain/Learning Rate": 8.34252260051314e-06, "Pretrain/Loss": 1.998023271560669, "Pretrain/Loss (Raw)": 2.2182984352111816, "Pretrain/Step": 14117, "Pretrain/Step Time": 8.456254709511995} +{"Pretrain/Learning Rate": 8.339357285786734e-06, "Pretrain/Loss": 1.9970650672912598, "Pretrain/Loss (Raw)": 2.088029146194458, "Pretrain/Step": 14118, "Pretrain/Step Time": 8.459052201360464} +{"Pretrain/Learning Rate": 8.336192451458208e-06, "Pretrain/Loss": 1.9972418546676636, "Pretrain/Loss (Raw)": 2.0419983863830566, "Pretrain/Step": 14119, "Pretrain/Step Time": 8.454001724720001} +{"Pretrain/Learning Rate": 8.333028097618834e-06, "Pretrain/Loss": 1.999634027481079, "Pretrain/Loss (Raw)": 1.957025408744812, "Pretrain/Step": 14120, "Pretrain/Step Time": 8.45257362164557} +{"Pretrain/Learning Rate": 8.329864224359835e-06, "Pretrain/Loss": 1.9976555109024048, "Pretrain/Loss (Raw)": 1.8276454210281372, "Pretrain/Step": 14121, "Pretrain/Step Time": 8.450819624587893} +{"Pretrain/Learning Rate": 8.32670083177246e-06, "Pretrain/Loss": 1.9988280534744263, "Pretrain/Loss (Raw)": 2.098496198654175, "Pretrain/Step": 14122, "Pretrain/Step Time": 8.44782673753798} +{"Pretrain/Learning Rate": 8.323537919947914e-06, "Pretrain/Loss": 1.995615839958191, "Pretrain/Loss (Raw)": 2.032801389694214, "Pretrain/Step": 14123, "Pretrain/Step Time": 8.450708854943514} +{"Pretrain/Learning Rate": 8.320375488977383e-06, "Pretrain/Loss": 1.997054100036621, "Pretrain/Loss (Raw)": 2.311296224594116, "Pretrain/Step": 14124, "Pretrain/Step Time": 8.455449141561985} +{"Pretrain/Learning Rate": 8.317213538952076e-06, "Pretrain/Loss": 2.000159978866577, "Pretrain/Loss (Raw)": 2.2701399326324463, "Pretrain/Step": 14125, "Pretrain/Step Time": 8.453370828181505} +{"Pretrain/Learning Rate": 8.314052069963149e-06, "Pretrain/Loss": 1.999176263809204, "Pretrain/Loss (Raw)": 1.7491346597671509, "Pretrain/Step": 14126, "Pretrain/Step Time": 8.456340646371245} +{"Pretrain/Learning Rate": 8.310891082101776e-06, "Pretrain/Loss": 1.9987003803253174, "Pretrain/Loss (Raw)": 1.9580204486846924, "Pretrain/Step": 14127, "Pretrain/Step Time": 8.454182542860508} +{"Pretrain/Learning Rate": 8.307730575459094e-06, "Pretrain/Loss": 1.998502492904663, "Pretrain/Loss (Raw)": 2.1043121814727783, "Pretrain/Step": 14128, "Pretrain/Step Time": 8.447823150083423} +{"Pretrain/Learning Rate": 8.304570550126225e-06, "Pretrain/Loss": 2.001741886138916, "Pretrain/Loss (Raw)": 2.0187268257141113, "Pretrain/Step": 14129, "Pretrain/Step Time": 8.452185798436403} +{"Pretrain/Learning Rate": 8.301411006194304e-06, "Pretrain/Loss": 2.002329111099243, "Pretrain/Loss (Raw)": 2.065155267715454, "Pretrain/Step": 14130, "Pretrain/Step Time": 8.453942783176899} +{"Pretrain/Learning Rate": 8.298251943754415e-06, "Pretrain/Loss": 2.0025112628936768, "Pretrain/Loss (Raw)": 1.952797532081604, "Pretrain/Step": 14131, "Pretrain/Step Time": 8.456729106605053} +{"Pretrain/Learning Rate": 8.295093362897665e-06, "Pretrain/Loss": 2.0037803649902344, "Pretrain/Loss (Raw)": 2.0338358879089355, "Pretrain/Step": 14132, "Pretrain/Step Time": 8.456103026866913} +{"Pretrain/Learning Rate": 8.291935263715123e-06, "Pretrain/Loss": 2.0041704177856445, "Pretrain/Loss (Raw)": 1.955688238143921, "Pretrain/Step": 14133, "Pretrain/Step Time": 8.46226936019957} +{"Pretrain/Learning Rate": 8.288777646297841e-06, "Pretrain/Loss": 2.0024123191833496, "Pretrain/Loss (Raw)": 1.7755345106124878, "Pretrain/Step": 14134, "Pretrain/Step Time": 8.464058227837086} +{"Pretrain/Learning Rate": 8.285620510736883e-06, "Pretrain/Loss": 2.0004053115844727, "Pretrain/Loss (Raw)": 1.983980655670166, "Pretrain/Step": 14135, "Pretrain/Step Time": 8.466509168967605} +{"Pretrain/Learning Rate": 8.282463857123266e-06, "Pretrain/Loss": 2.000938653945923, "Pretrain/Loss (Raw)": 2.0597782135009766, "Pretrain/Step": 14136, "Pretrain/Step Time": 8.468770882114768} +{"Pretrain/Learning Rate": 8.279307685548026e-06, "Pretrain/Loss": 2.003842353820801, "Pretrain/Loss (Raw)": 2.1077311038970947, "Pretrain/Step": 14137, "Pretrain/Step Time": 8.461923092603683} +{"Pretrain/Learning Rate": 8.276151996102164e-06, "Pretrain/Loss": 2.0044517517089844, "Pretrain/Loss (Raw)": 2.2408154010772705, "Pretrain/Step": 14138, "Pretrain/Step Time": 8.45760951563716} +{"Pretrain/Learning Rate": 8.27299678887666e-06, "Pretrain/Loss": 2.005025625228882, "Pretrain/Loss (Raw)": 2.0430185794830322, "Pretrain/Step": 14139, "Pretrain/Step Time": 8.460472382605076} +{"Pretrain/Learning Rate": 8.26984206396251e-06, "Pretrain/Loss": 2.006598949432373, "Pretrain/Loss (Raw)": 2.051741123199463, "Pretrain/Step": 14140, "Pretrain/Step Time": 8.461418822407722} +{"Pretrain/Learning Rate": 8.266687821450661e-06, "Pretrain/Loss": 2.008054733276367, "Pretrain/Loss (Raw)": 2.064194440841675, "Pretrain/Step": 14141, "Pretrain/Step Time": 8.462787061929703} +{"Pretrain/Learning Rate": 8.263534061432082e-06, "Pretrain/Loss": 2.0080204010009766, "Pretrain/Loss (Raw)": 1.9210127592086792, "Pretrain/Step": 14142, "Pretrain/Step Time": 8.466833898797631} +{"Pretrain/Learning Rate": 8.2603807839977e-06, "Pretrain/Loss": 2.009291410446167, "Pretrain/Loss (Raw)": 2.182311534881592, "Pretrain/Step": 14143, "Pretrain/Step Time": 8.462854405865073} +{"Pretrain/Learning Rate": 8.257227989238427e-06, "Pretrain/Loss": 2.0093812942504883, "Pretrain/Loss (Raw)": 2.240337610244751, "Pretrain/Step": 14144, "Pretrain/Step Time": 8.466224597766995} +{"Pretrain/Learning Rate": 8.254075677245194e-06, "Pretrain/Loss": 2.0100317001342773, "Pretrain/Loss (Raw)": 2.172473192214966, "Pretrain/Step": 14145, "Pretrain/Step Time": 8.466478575021029} +{"Pretrain/Learning Rate": 8.250923848108874e-06, "Pretrain/Loss": 2.0093889236450195, "Pretrain/Loss (Raw)": 1.978586196899414, "Pretrain/Step": 14146, "Pretrain/Step Time": 8.467819774523377} +{"Pretrain/Learning Rate": 8.247772501920365e-06, "Pretrain/Loss": 2.009274482727051, "Pretrain/Loss (Raw)": 1.9974881410598755, "Pretrain/Step": 14147, "Pretrain/Step Time": 8.470037763938308} +{"Pretrain/Learning Rate": 8.244621638770527e-06, "Pretrain/Loss": 2.011875867843628, "Pretrain/Loss (Raw)": 2.15761137008667, "Pretrain/Step": 14148, "Pretrain/Step Time": 8.466755401343107} +{"Pretrain/Learning Rate": 8.241471258750203e-06, "Pretrain/Loss": 2.012157440185547, "Pretrain/Loss (Raw)": 2.111739158630371, "Pretrain/Step": 14149, "Pretrain/Step Time": 8.469409560784698} +{"Pretrain/Learning Rate": 8.238321361950253e-06, "Pretrain/Loss": 2.011711597442627, "Pretrain/Loss (Raw)": 2.1118226051330566, "Pretrain/Step": 14150, "Pretrain/Step Time": 8.47164361923933} +{"Pretrain/Learning Rate": 8.23517194846148e-06, "Pretrain/Loss": 2.0106358528137207, "Pretrain/Loss (Raw)": 2.0902955532073975, "Pretrain/Step": 14151, "Pretrain/Step Time": 8.472252337262034} +{"Pretrain/Learning Rate": 8.232023018374709e-06, "Pretrain/Loss": 2.0085930824279785, "Pretrain/Loss (Raw)": 1.607568383216858, "Pretrain/Step": 14152, "Pretrain/Step Time": 8.47027100250125} +{"Pretrain/Learning Rate": 8.22887457178074e-06, "Pretrain/Loss": 2.00846529006958, "Pretrain/Loss (Raw)": 1.8803542852401733, "Pretrain/Step": 14153, "Pretrain/Step Time": 8.470212053507566} +{"Pretrain/Learning Rate": 8.225726608770346e-06, "Pretrain/Loss": 2.010072708129883, "Pretrain/Loss (Raw)": 2.0236480236053467, "Pretrain/Step": 14154, "Pretrain/Step Time": 8.469479471445084} +{"Pretrain/Learning Rate": 8.222579129434302e-06, "Pretrain/Loss": 2.010113477706909, "Pretrain/Loss (Raw)": 1.9132940769195557, "Pretrain/Step": 14155, "Pretrain/Step Time": 8.46549192070961} +{"Pretrain/Learning Rate": 8.219432133863353e-06, "Pretrain/Loss": 2.0118298530578613, "Pretrain/Loss (Raw)": 2.4379663467407227, "Pretrain/Step": 14156, "Pretrain/Step Time": 8.46620661765337} +{"Pretrain/Learning Rate": 8.216285622148256e-06, "Pretrain/Loss": 2.011070489883423, "Pretrain/Loss (Raw)": 1.939415693283081, "Pretrain/Step": 14157, "Pretrain/Step Time": 8.465292731299996} +{"Pretrain/Learning Rate": 8.213139594379727e-06, "Pretrain/Loss": 2.0129475593566895, "Pretrain/Loss (Raw)": 2.2627058029174805, "Pretrain/Step": 14158, "Pretrain/Step Time": 8.467599904164672} +{"Pretrain/Learning Rate": 8.209994050648487e-06, "Pretrain/Loss": 2.015512466430664, "Pretrain/Loss (Raw)": 2.1926708221435547, "Pretrain/Step": 14159, "Pretrain/Step Time": 8.464992828667164} +{"Pretrain/Learning Rate": 8.206848991045235e-06, "Pretrain/Loss": 2.0160861015319824, "Pretrain/Loss (Raw)": 1.945854902267456, "Pretrain/Step": 14160, "Pretrain/Step Time": 8.468276022002101} +{"Pretrain/Learning Rate": 8.203704415660646e-06, "Pretrain/Loss": 2.0150833129882812, "Pretrain/Loss (Raw)": 2.0095930099487305, "Pretrain/Step": 14161, "Pretrain/Step Time": 8.460643652826548} +{"Pretrain/Learning Rate": 8.200560324585407e-06, "Pretrain/Loss": 2.0156121253967285, "Pretrain/Loss (Raw)": 2.060044050216675, "Pretrain/Step": 14162, "Pretrain/Step Time": 8.463213143870234} +{"Pretrain/Learning Rate": 8.197416717910162e-06, "Pretrain/Loss": 2.014127016067505, "Pretrain/Loss (Raw)": 1.7438181638717651, "Pretrain/Step": 14163, "Pretrain/Step Time": 8.461929500102997} +{"Pretrain/Learning Rate": 8.194273595725566e-06, "Pretrain/Loss": 2.01397705078125, "Pretrain/Loss (Raw)": 1.9714088439941406, "Pretrain/Step": 14164, "Pretrain/Step Time": 8.465332543477416} +{"Pretrain/Learning Rate": 8.191130958122246e-06, "Pretrain/Loss": 2.0145716667175293, "Pretrain/Loss (Raw)": 2.037066698074341, "Pretrain/Step": 14165, "Pretrain/Step Time": 8.461468720808625} +{"Pretrain/Learning Rate": 8.187988805190804e-06, "Pretrain/Loss": 2.0190536975860596, "Pretrain/Loss (Raw)": 2.5378828048706055, "Pretrain/Step": 14166, "Pretrain/Step Time": 8.46334134414792} +{"Pretrain/Learning Rate": 8.184847137021864e-06, "Pretrain/Loss": 2.016047477722168, "Pretrain/Loss (Raw)": 1.8098711967468262, "Pretrain/Step": 14167, "Pretrain/Step Time": 8.471373395994306} +{"Pretrain/Learning Rate": 8.181705953705993e-06, "Pretrain/Loss": 2.0174765586853027, "Pretrain/Loss (Raw)": 2.076474189758301, "Pretrain/Step": 14168, "Pretrain/Step Time": 8.470527712255716} +{"Pretrain/Learning Rate": 8.178565255333783e-06, "Pretrain/Loss": 2.016254425048828, "Pretrain/Loss (Raw)": 1.9335038661956787, "Pretrain/Step": 14169, "Pretrain/Step Time": 8.469451190903783} +{"Pretrain/Learning Rate": 8.175425041995788e-06, "Pretrain/Loss": 2.0183043479919434, "Pretrain/Loss (Raw)": 2.186164379119873, "Pretrain/Step": 14170, "Pretrain/Step Time": 8.469955917447805} +{"Pretrain/Learning Rate": 8.17228531378254e-06, "Pretrain/Loss": 2.01932954788208, "Pretrain/Loss (Raw)": 2.1712753772735596, "Pretrain/Step": 14171, "Pretrain/Step Time": 8.472697470337152} +{"Pretrain/Learning Rate": 8.169146070784594e-06, "Pretrain/Loss": 2.021390914916992, "Pretrain/Loss (Raw)": 2.0900230407714844, "Pretrain/Step": 14172, "Pretrain/Step Time": 8.468648005276918} +{"Pretrain/Learning Rate": 8.166007313092448e-06, "Pretrain/Loss": 2.022327423095703, "Pretrain/Loss (Raw)": 2.1198675632476807, "Pretrain/Step": 14173, "Pretrain/Step Time": 8.468542102724314} +{"Pretrain/Learning Rate": 8.162869040796616e-06, "Pretrain/Loss": 2.0231480598449707, "Pretrain/Loss (Raw)": 2.1222519874572754, "Pretrain/Step": 14174, "Pretrain/Step Time": 8.470636870712042} +{"Pretrain/Learning Rate": 8.15973125398759e-06, "Pretrain/Loss": 2.0212738513946533, "Pretrain/Loss (Raw)": 1.8005397319793701, "Pretrain/Step": 14175, "Pretrain/Step Time": 8.46962483972311} +{"Pretrain/Learning Rate": 8.156593952755834e-06, "Pretrain/Loss": 2.018200397491455, "Pretrain/Loss (Raw)": 1.9970276355743408, "Pretrain/Step": 14176, "Pretrain/Step Time": 8.46992307715118} +{"Pretrain/Learning Rate": 8.153457137191826e-06, "Pretrain/Loss": 2.0190367698669434, "Pretrain/Loss (Raw)": 1.9505338668823242, "Pretrain/Step": 14177, "Pretrain/Step Time": 8.471931034699082} +{"Pretrain/Learning Rate": 8.150320807385997e-06, "Pretrain/Loss": 2.0181665420532227, "Pretrain/Loss (Raw)": 2.1108438968658447, "Pretrain/Step": 14178, "Pretrain/Step Time": 8.474116180092096} +{"Pretrain/Learning Rate": 8.147184963428798e-06, "Pretrain/Loss": 2.01723575592041, "Pretrain/Loss (Raw)": 1.8948432207107544, "Pretrain/Step": 14179, "Pretrain/Step Time": 8.472162988036871} +{"Pretrain/Learning Rate": 8.144049605410637e-06, "Pretrain/Loss": 2.01889705657959, "Pretrain/Loss (Raw)": 1.9285961389541626, "Pretrain/Step": 14180, "Pretrain/Step Time": 8.472667349502444} +{"Pretrain/Learning Rate": 8.140914733421918e-06, "Pretrain/Loss": 2.0167245864868164, "Pretrain/Loss (Raw)": 1.8890619277954102, "Pretrain/Step": 14181, "Pretrain/Step Time": 8.481692384928465} +{"Pretrain/Learning Rate": 8.137780347553042e-06, "Pretrain/Loss": 2.017298698425293, "Pretrain/Loss (Raw)": 2.015737295150757, "Pretrain/Step": 14182, "Pretrain/Step Time": 8.487574208527803} +{"Pretrain/Learning Rate": 8.13464644789438e-06, "Pretrain/Loss": 2.016745090484619, "Pretrain/Loss (Raw)": 1.9421329498291016, "Pretrain/Step": 14183, "Pretrain/Step Time": 8.486621499061584} +{"Pretrain/Learning Rate": 8.131513034536304e-06, "Pretrain/Loss": 2.0148186683654785, "Pretrain/Loss (Raw)": 1.9795880317687988, "Pretrain/Step": 14184, "Pretrain/Step Time": 8.488619595766068} +{"Pretrain/Learning Rate": 8.128380107569148e-06, "Pretrain/Loss": 2.015791416168213, "Pretrain/Loss (Raw)": 2.0433831214904785, "Pretrain/Step": 14185, "Pretrain/Step Time": 8.48655609227717} +{"Pretrain/Learning Rate": 8.12524766708327e-06, "Pretrain/Loss": 2.015549659729004, "Pretrain/Loss (Raw)": 1.8063362836837769, "Pretrain/Step": 14186, "Pretrain/Step Time": 8.479998202994466} +{"Pretrain/Learning Rate": 8.122115713168976e-06, "Pretrain/Loss": 2.014880657196045, "Pretrain/Loss (Raw)": 2.0105409622192383, "Pretrain/Step": 14187, "Pretrain/Step Time": 8.476562282070518} +{"Pretrain/Learning Rate": 8.11898424591657e-06, "Pretrain/Loss": 2.015986442565918, "Pretrain/Loss (Raw)": 2.134594202041626, "Pretrain/Step": 14188, "Pretrain/Step Time": 8.477123912423849} +{"Pretrain/Learning Rate": 8.115853265416362e-06, "Pretrain/Loss": 2.017512321472168, "Pretrain/Loss (Raw)": 2.109426498413086, "Pretrain/Step": 14189, "Pretrain/Step Time": 8.477979503571987} +{"Pretrain/Learning Rate": 8.112722771758613e-06, "Pretrain/Loss": 2.019411563873291, "Pretrain/Loss (Raw)": 2.2100019454956055, "Pretrain/Step": 14190, "Pretrain/Step Time": 8.476029504090548} +{"Pretrain/Learning Rate": 8.109592765033608e-06, "Pretrain/Loss": 2.018352746963501, "Pretrain/Loss (Raw)": 1.8760195970535278, "Pretrain/Step": 14191, "Pretrain/Step Time": 8.47895091213286} +{"Pretrain/Learning Rate": 8.106463245331585e-06, "Pretrain/Loss": 2.0184292793273926, "Pretrain/Loss (Raw)": 2.0432724952697754, "Pretrain/Step": 14192, "Pretrain/Step Time": 8.479232368990779} +{"Pretrain/Learning Rate": 8.103334212742783e-06, "Pretrain/Loss": 2.019106388092041, "Pretrain/Loss (Raw)": 1.9857722520828247, "Pretrain/Step": 14193, "Pretrain/Step Time": 8.483078919351101} +{"Pretrain/Learning Rate": 8.100205667357433e-06, "Pretrain/Loss": 2.0180301666259766, "Pretrain/Loss (Raw)": 1.8615872859954834, "Pretrain/Step": 14194, "Pretrain/Step Time": 8.48735080473125} +{"Pretrain/Learning Rate": 8.09707760926573e-06, "Pretrain/Loss": 2.017831802368164, "Pretrain/Loss (Raw)": 2.0339698791503906, "Pretrain/Step": 14195, "Pretrain/Step Time": 8.482628034427762} +{"Pretrain/Learning Rate": 8.093950038557884e-06, "Pretrain/Loss": 2.0202534198760986, "Pretrain/Loss (Raw)": 2.1672658920288086, "Pretrain/Step": 14196, "Pretrain/Step Time": 8.480401404201984} +{"Pretrain/Learning Rate": 8.090822955324076e-06, "Pretrain/Loss": 2.0208444595336914, "Pretrain/Loss (Raw)": 2.0471882820129395, "Pretrain/Step": 14197, "Pretrain/Step Time": 8.484822053462267} +{"Pretrain/Learning Rate": 8.087696359654456e-06, "Pretrain/Loss": 2.0198636054992676, "Pretrain/Loss (Raw)": 1.8728408813476562, "Pretrain/Step": 14198, "Pretrain/Step Time": 8.485849184915423} +{"Pretrain/Learning Rate": 8.084570251639201e-06, "Pretrain/Loss": 2.0192477703094482, "Pretrain/Loss (Raw)": 1.8168699741363525, "Pretrain/Step": 14199, "Pretrain/Step Time": 8.484345154836774} +{"Pretrain/Learning Rate": 8.081444631368425e-06, "Pretrain/Loss": 2.016920328140259, "Pretrain/Loss (Raw)": 1.7977136373519897, "Pretrain/Step": 14200, "Pretrain/Step Time": 8.489429360255599} +{"Pretrain/Learning Rate": 8.07831949893228e-06, "Pretrain/Loss": 2.0165798664093018, "Pretrain/Loss (Raw)": 1.900028109550476, "Pretrain/Step": 14201, "Pretrain/Step Time": 8.48454780317843} +{"Pretrain/Learning Rate": 8.075194854420859e-06, "Pretrain/Loss": 2.01651668548584, "Pretrain/Loss (Raw)": 1.9155408143997192, "Pretrain/Step": 14202, "Pretrain/Step Time": 8.486519394442439} +{"Pretrain/Learning Rate": 8.072070697924255e-06, "Pretrain/Loss": 2.017463207244873, "Pretrain/Loss (Raw)": 2.153181791305542, "Pretrain/Step": 14203, "Pretrain/Step Time": 8.488361362367868} +{"Pretrain/Learning Rate": 8.06894702953257e-06, "Pretrain/Loss": 2.01706600189209, "Pretrain/Loss (Raw)": 1.9938914775848389, "Pretrain/Step": 14204, "Pretrain/Step Time": 8.487237500026822} +{"Pretrain/Learning Rate": 8.065823849335851e-06, "Pretrain/Loss": 2.016188144683838, "Pretrain/Loss (Raw)": 1.896632194519043, "Pretrain/Step": 14205, "Pretrain/Step Time": 8.486528173089027} +{"Pretrain/Learning Rate": 8.062701157424174e-06, "Pretrain/Loss": 2.0166103839874268, "Pretrain/Loss (Raw)": 2.230072259902954, "Pretrain/Step": 14206, "Pretrain/Step Time": 8.484004773199558} +{"Pretrain/Learning Rate": 8.059578953887568e-06, "Pretrain/Loss": 2.0162885189056396, "Pretrain/Loss (Raw)": 2.058298110961914, "Pretrain/Step": 14207, "Pretrain/Step Time": 8.483643088489771} +{"Pretrain/Learning Rate": 8.056457238816051e-06, "Pretrain/Loss": 2.0155911445617676, "Pretrain/Loss (Raw)": 1.9681599140167236, "Pretrain/Step": 14208, "Pretrain/Step Time": 8.48097725957632} +{"Pretrain/Learning Rate": 8.053336012299657e-06, "Pretrain/Loss": 2.0116701126098633, "Pretrain/Loss (Raw)": 1.9208227396011353, "Pretrain/Step": 14209, "Pretrain/Step Time": 8.484192250296474} +{"Pretrain/Learning Rate": 8.05021527442836e-06, "Pretrain/Loss": 2.009554862976074, "Pretrain/Loss (Raw)": 1.8198564052581787, "Pretrain/Step": 14210, "Pretrain/Step Time": 8.479179630056024} +{"Pretrain/Learning Rate": 8.047095025292168e-06, "Pretrain/Loss": 2.008229970932007, "Pretrain/Loss (Raw)": 1.8902465105056763, "Pretrain/Step": 14211, "Pretrain/Step Time": 8.481777800247073} +{"Pretrain/Learning Rate": 8.043975264981038e-06, "Pretrain/Loss": 2.009225368499756, "Pretrain/Loss (Raw)": 2.0445001125335693, "Pretrain/Step": 14212, "Pretrain/Step Time": 8.479037968441844} +{"Pretrain/Learning Rate": 8.040855993584922e-06, "Pretrain/Loss": 2.0079660415649414, "Pretrain/Loss (Raw)": 1.8913960456848145, "Pretrain/Step": 14213, "Pretrain/Step Time": 8.475785521790385} +{"Pretrain/Learning Rate": 8.037737211193775e-06, "Pretrain/Loss": 2.007751226425171, "Pretrain/Loss (Raw)": 1.929913878440857, "Pretrain/Step": 14214, "Pretrain/Step Time": 8.479696780443192} +{"Pretrain/Learning Rate": 8.03461891789751e-06, "Pretrain/Loss": 2.0064351558685303, "Pretrain/Loss (Raw)": 1.9116623401641846, "Pretrain/Step": 14215, "Pretrain/Step Time": 8.478139882907271} +{"Pretrain/Learning Rate": 8.031501113786054e-06, "Pretrain/Loss": 2.007932424545288, "Pretrain/Loss (Raw)": 2.1578335762023926, "Pretrain/Step": 14216, "Pretrain/Step Time": 8.476117599755526} +{"Pretrain/Learning Rate": 8.028383798949304e-06, "Pretrain/Loss": 2.006441593170166, "Pretrain/Loss (Raw)": 1.8993340730667114, "Pretrain/Step": 14217, "Pretrain/Step Time": 8.47674653120339} +{"Pretrain/Learning Rate": 8.025266973477136e-06, "Pretrain/Loss": 2.008236885070801, "Pretrain/Loss (Raw)": 2.0433363914489746, "Pretrain/Step": 14218, "Pretrain/Step Time": 8.47921922057867} +{"Pretrain/Learning Rate": 8.022150637459436e-06, "Pretrain/Loss": 2.0054373741149902, "Pretrain/Loss (Raw)": 1.6258361339569092, "Pretrain/Step": 14219, "Pretrain/Step Time": 8.479842465370893} +{"Pretrain/Learning Rate": 8.019034790986043e-06, "Pretrain/Loss": 2.0065155029296875, "Pretrain/Loss (Raw)": 1.8946843147277832, "Pretrain/Step": 14220, "Pretrain/Step Time": 8.477246411144733} +{"Pretrain/Learning Rate": 8.015919434146821e-06, "Pretrain/Loss": 2.005115032196045, "Pretrain/Loss (Raw)": 1.7749078273773193, "Pretrain/Step": 14221, "Pretrain/Step Time": 8.478484310209751} +{"Pretrain/Learning Rate": 8.01280456703159e-06, "Pretrain/Loss": 2.0034918785095215, "Pretrain/Loss (Raw)": 1.861200213432312, "Pretrain/Step": 14222, "Pretrain/Step Time": 8.478591922670603} +{"Pretrain/Learning Rate": 8.009690189730157e-06, "Pretrain/Loss": 2.0025248527526855, "Pretrain/Loss (Raw)": 1.8498862981796265, "Pretrain/Step": 14223, "Pretrain/Step Time": 8.476793782785535} +{"Pretrain/Learning Rate": 8.006576302332335e-06, "Pretrain/Loss": 2.0022647380828857, "Pretrain/Loss (Raw)": 2.0485475063323975, "Pretrain/Step": 14224, "Pretrain/Step Time": 8.477504428476095} +{"Pretrain/Learning Rate": 8.0034629049279e-06, "Pretrain/Loss": 2.004262924194336, "Pretrain/Loss (Raw)": 2.1574275493621826, "Pretrain/Step": 14225, "Pretrain/Step Time": 8.476855009794235} +{"Pretrain/Learning Rate": 8.000349997606634e-06, "Pretrain/Loss": 2.0050599575042725, "Pretrain/Loss (Raw)": 1.9272764921188354, "Pretrain/Step": 14226, "Pretrain/Step Time": 8.475547770038247} +{"Pretrain/Learning Rate": 7.997237580458297e-06, "Pretrain/Loss": 2.002859592437744, "Pretrain/Loss (Raw)": 1.7952702045440674, "Pretrain/Step": 14227, "Pretrain/Step Time": 8.4751460198313} +{"Pretrain/Learning Rate": 7.994125653572618e-06, "Pretrain/Loss": 2.006861925125122, "Pretrain/Loss (Raw)": 2.4833834171295166, "Pretrain/Step": 14228, "Pretrain/Step Time": 8.473065918311477} +{"Pretrain/Learning Rate": 7.991014217039347e-06, "Pretrain/Loss": 2.007551670074463, "Pretrain/Loss (Raw)": 2.1797330379486084, "Pretrain/Step": 14229, "Pretrain/Step Time": 8.477528976276517} +{"Pretrain/Learning Rate": 7.98790327094818e-06, "Pretrain/Loss": 2.0075583457946777, "Pretrain/Loss (Raw)": 1.9339839220046997, "Pretrain/Step": 14230, "Pretrain/Step Time": 8.476213470101357} +{"Pretrain/Learning Rate": 7.98479281538884e-06, "Pretrain/Loss": 2.0060713291168213, "Pretrain/Loss (Raw)": 1.934185266494751, "Pretrain/Step": 14231, "Pretrain/Step Time": 8.473103513941169} +{"Pretrain/Learning Rate": 7.981682850451002e-06, "Pretrain/Loss": 2.0062637329101562, "Pretrain/Loss (Raw)": 2.0235254764556885, "Pretrain/Step": 14232, "Pretrain/Step Time": 8.473381765186787} +{"Pretrain/Learning Rate": 7.978573376224335e-06, "Pretrain/Loss": 2.00862979888916, "Pretrain/Loss (Raw)": 2.0771119594573975, "Pretrain/Step": 14233, "Pretrain/Step Time": 8.471807422116399} +{"Pretrain/Learning Rate": 7.975464392798515e-06, "Pretrain/Loss": 2.0089762210845947, "Pretrain/Loss (Raw)": 1.9628245830535889, "Pretrain/Step": 14234, "Pretrain/Step Time": 8.471418308094144} +{"Pretrain/Learning Rate": 7.972355900263168e-06, "Pretrain/Loss": 2.00815749168396, "Pretrain/Loss (Raw)": 1.9031113386154175, "Pretrain/Step": 14235, "Pretrain/Step Time": 8.477542510256171} +{"Pretrain/Learning Rate": 7.96924789870794e-06, "Pretrain/Loss": 2.011688709259033, "Pretrain/Loss (Raw)": 2.023287773132324, "Pretrain/Step": 14236, "Pretrain/Step Time": 8.477791406214237} +{"Pretrain/Learning Rate": 7.966140388222448e-06, "Pretrain/Loss": 2.013422966003418, "Pretrain/Loss (Raw)": 2.151304006576538, "Pretrain/Step": 14237, "Pretrain/Step Time": 8.475597213953733} +{"Pretrain/Learning Rate": 7.963033368896286e-06, "Pretrain/Loss": 2.012474536895752, "Pretrain/Loss (Raw)": 2.0180411338806152, "Pretrain/Step": 14238, "Pretrain/Step Time": 8.475304594263434} +{"Pretrain/Learning Rate": 7.959926840819048e-06, "Pretrain/Loss": 2.014012575149536, "Pretrain/Loss (Raw)": 2.1295979022979736, "Pretrain/Step": 14239, "Pretrain/Step Time": 8.478123376145959} +{"Pretrain/Learning Rate": 7.9568208040803e-06, "Pretrain/Loss": 2.0131731033325195, "Pretrain/Loss (Raw)": 1.9608603715896606, "Pretrain/Step": 14240, "Pretrain/Step Time": 8.474774483591318} +{"Pretrain/Learning Rate": 7.953715258769617e-06, "Pretrain/Loss": 2.014645576477051, "Pretrain/Loss (Raw)": 2.046774387359619, "Pretrain/Step": 14241, "Pretrain/Step Time": 8.480074115097523} +{"Pretrain/Learning Rate": 7.95061020497653e-06, "Pretrain/Loss": 2.0129690170288086, "Pretrain/Loss (Raw)": 1.9003673791885376, "Pretrain/Step": 14242, "Pretrain/Step Time": 8.481129689142108} +{"Pretrain/Learning Rate": 7.947505642790586e-06, "Pretrain/Loss": 2.014009475708008, "Pretrain/Loss (Raw)": 2.027482748031616, "Pretrain/Step": 14243, "Pretrain/Step Time": 8.483932968229055} +{"Pretrain/Learning Rate": 7.944401572301296e-06, "Pretrain/Loss": 2.012517213821411, "Pretrain/Loss (Raw)": 1.9146021604537964, "Pretrain/Step": 14244, "Pretrain/Step Time": 8.478999871760607} +{"Pretrain/Learning Rate": 7.941297993598155e-06, "Pretrain/Loss": 2.008523464202881, "Pretrain/Loss (Raw)": 1.7070893049240112, "Pretrain/Step": 14245, "Pretrain/Step Time": 8.476892309263349} +{"Pretrain/Learning Rate": 7.938194906770669e-06, "Pretrain/Loss": 2.0043628215789795, "Pretrain/Loss (Raw)": 1.555467963218689, "Pretrain/Step": 14246, "Pretrain/Step Time": 8.479555839672685} +{"Pretrain/Learning Rate": 7.935092311908297e-06, "Pretrain/Loss": 2.003312587738037, "Pretrain/Loss (Raw)": 1.9075661897659302, "Pretrain/Step": 14247, "Pretrain/Step Time": 8.479519203305244} +{"Pretrain/Learning Rate": 7.931990209100516e-06, "Pretrain/Loss": 2.002851963043213, "Pretrain/Loss (Raw)": 1.8980592489242554, "Pretrain/Step": 14248, "Pretrain/Step Time": 8.483418121933937} +{"Pretrain/Learning Rate": 7.928888598436756e-06, "Pretrain/Loss": 2.0052571296691895, "Pretrain/Loss (Raw)": 2.135528564453125, "Pretrain/Step": 14249, "Pretrain/Step Time": 8.480894519016147} +{"Pretrain/Learning Rate": 7.925787480006469e-06, "Pretrain/Loss": 2.003821611404419, "Pretrain/Loss (Raw)": 1.9147523641586304, "Pretrain/Step": 14250, "Pretrain/Step Time": 8.485223822295666} +{"Pretrain/Learning Rate": 7.922686853899064e-06, "Pretrain/Loss": 2.0046017169952393, "Pretrain/Loss (Raw)": 2.1326534748077393, "Pretrain/Step": 14251, "Pretrain/Step Time": 8.482659053057432} +{"Pretrain/Learning Rate": 7.919586720203934e-06, "Pretrain/Loss": 2.001851797103882, "Pretrain/Loss (Raw)": 1.9592945575714111, "Pretrain/Step": 14252, "Pretrain/Step Time": 8.479965936392546} +{"Pretrain/Learning Rate": 7.91648707901049e-06, "Pretrain/Loss": 2.0003087520599365, "Pretrain/Loss (Raw)": 2.0726311206817627, "Pretrain/Step": 14253, "Pretrain/Step Time": 8.481136981397867} +{"Pretrain/Learning Rate": 7.91338793040809e-06, "Pretrain/Loss": 2.000208616256714, "Pretrain/Loss (Raw)": 1.736309289932251, "Pretrain/Step": 14254, "Pretrain/Step Time": 8.479131629690528} +{"Pretrain/Learning Rate": 7.91028927448611e-06, "Pretrain/Loss": 2.001171588897705, "Pretrain/Loss (Raw)": 2.081296443939209, "Pretrain/Step": 14255, "Pretrain/Step Time": 8.476776130497456} +{"Pretrain/Learning Rate": 7.907191111333892e-06, "Pretrain/Loss": 1.9989451169967651, "Pretrain/Loss (Raw)": 1.819309949874878, "Pretrain/Step": 14256, "Pretrain/Step Time": 8.481005232781172} +{"Pretrain/Learning Rate": 7.90409344104076e-06, "Pretrain/Loss": 1.9990261793136597, "Pretrain/Loss (Raw)": 2.029125452041626, "Pretrain/Step": 14257, "Pretrain/Step Time": 8.476890433579683} +{"Pretrain/Learning Rate": 7.900996263696053e-06, "Pretrain/Loss": 1.9973983764648438, "Pretrain/Loss (Raw)": 1.8567841053009033, "Pretrain/Step": 14258, "Pretrain/Step Time": 8.477449286729097} +{"Pretrain/Learning Rate": 7.897899579389054e-06, "Pretrain/Loss": 1.9985663890838623, "Pretrain/Loss (Raw)": 2.1023037433624268, "Pretrain/Step": 14259, "Pretrain/Step Time": 8.47503755800426} +{"Pretrain/Learning Rate": 7.894803388209073e-06, "Pretrain/Loss": 1.997776985168457, "Pretrain/Loss (Raw)": 1.9327887296676636, "Pretrain/Step": 14260, "Pretrain/Step Time": 8.475069159641862} +{"Pretrain/Learning Rate": 7.891707690245379e-06, "Pretrain/Loss": 1.997570276260376, "Pretrain/Loss (Raw)": 1.9292488098144531, "Pretrain/Step": 14261, "Pretrain/Step Time": 8.470807453617454} +{"Pretrain/Learning Rate": 7.888612485587225e-06, "Pretrain/Loss": 1.9982593059539795, "Pretrain/Loss (Raw)": 1.8637129068374634, "Pretrain/Step": 14262, "Pretrain/Step Time": 8.4710743278265} +{"Pretrain/Learning Rate": 7.885517774323875e-06, "Pretrain/Loss": 1.9981577396392822, "Pretrain/Loss (Raw)": 1.9709720611572266, "Pretrain/Step": 14263, "Pretrain/Step Time": 8.467957323417068} +{"Pretrain/Learning Rate": 7.882423556544547e-06, "Pretrain/Loss": 1.9954050779342651, "Pretrain/Loss (Raw)": 1.7074435949325562, "Pretrain/Step": 14264, "Pretrain/Step Time": 8.467288734391332} +{"Pretrain/Learning Rate": 7.879329832338474e-06, "Pretrain/Loss": 1.9951869249343872, "Pretrain/Loss (Raw)": 2.0798139572143555, "Pretrain/Step": 14265, "Pretrain/Step Time": 8.473839309066534} +{"Pretrain/Learning Rate": 7.876236601794858e-06, "Pretrain/Loss": 1.9952785968780518, "Pretrain/Loss (Raw)": 2.252542734146118, "Pretrain/Step": 14266, "Pretrain/Step Time": 8.474109388887882} +{"Pretrain/Learning Rate": 7.873143865002882e-06, "Pretrain/Loss": 1.9932366609573364, "Pretrain/Loss (Raw)": 1.7816485166549683, "Pretrain/Step": 14267, "Pretrain/Step Time": 8.477812187746167} +{"Pretrain/Learning Rate": 7.870051622051735e-06, "Pretrain/Loss": 1.9908416271209717, "Pretrain/Loss (Raw)": 1.7451802492141724, "Pretrain/Step": 14268, "Pretrain/Step Time": 8.475076459348202} +{"Pretrain/Learning Rate": 7.866959873030566e-06, "Pretrain/Loss": 1.9906985759735107, "Pretrain/Loss (Raw)": 2.0458736419677734, "Pretrain/Step": 14269, "Pretrain/Step Time": 8.475869690999389} +{"Pretrain/Learning Rate": 7.863868618028539e-06, "Pretrain/Loss": 1.9913437366485596, "Pretrain/Loss (Raw)": 2.0035946369171143, "Pretrain/Step": 14270, "Pretrain/Step Time": 8.474371949210763} +{"Pretrain/Learning Rate": 7.860777857134782e-06, "Pretrain/Loss": 1.9897565841674805, "Pretrain/Loss (Raw)": 1.979162573814392, "Pretrain/Step": 14271, "Pretrain/Step Time": 8.476997021585703} +{"Pretrain/Learning Rate": 7.857687590438404e-06, "Pretrain/Loss": 1.9881478548049927, "Pretrain/Loss (Raw)": 2.0344202518463135, "Pretrain/Step": 14272, "Pretrain/Step Time": 8.47334909439087} +{"Pretrain/Learning Rate": 7.854597818028524e-06, "Pretrain/Loss": 1.9877671003341675, "Pretrain/Loss (Raw)": 2.12373948097229, "Pretrain/Step": 14273, "Pretrain/Step Time": 8.474586544558406} +{"Pretrain/Learning Rate": 7.851508539994227e-06, "Pretrain/Loss": 1.9885001182556152, "Pretrain/Loss (Raw)": 2.0724220275878906, "Pretrain/Step": 14274, "Pretrain/Step Time": 8.476114269345999} +{"Pretrain/Learning Rate": 7.848419756424596e-06, "Pretrain/Loss": 1.9914791584014893, "Pretrain/Loss (Raw)": 2.3787944316864014, "Pretrain/Step": 14275, "Pretrain/Step Time": 8.474423022940755} +{"Pretrain/Learning Rate": 7.845331467408692e-06, "Pretrain/Loss": 1.9885671138763428, "Pretrain/Loss (Raw)": 1.78486967086792, "Pretrain/Step": 14276, "Pretrain/Step Time": 8.479432741180062} +{"Pretrain/Learning Rate": 7.842243673035555e-06, "Pretrain/Loss": 1.985541582107544, "Pretrain/Loss (Raw)": 1.7244868278503418, "Pretrain/Step": 14277, "Pretrain/Step Time": 8.477261360734701} +{"Pretrain/Learning Rate": 7.839156373394233e-06, "Pretrain/Loss": 1.985901951789856, "Pretrain/Loss (Raw)": 2.1579389572143555, "Pretrain/Step": 14278, "Pretrain/Step Time": 8.473606122657657} +{"Pretrain/Learning Rate": 7.836069568573732e-06, "Pretrain/Loss": 1.9863226413726807, "Pretrain/Loss (Raw)": 2.144148826599121, "Pretrain/Step": 14279, "Pretrain/Step Time": 8.477743385359645} +{"Pretrain/Learning Rate": 7.832983258663074e-06, "Pretrain/Loss": 1.9890716075897217, "Pretrain/Loss (Raw)": 1.959428310394287, "Pretrain/Step": 14280, "Pretrain/Step Time": 8.47828815318644} +{"Pretrain/Learning Rate": 7.829897443751241e-06, "Pretrain/Loss": 1.9896531105041504, "Pretrain/Loss (Raw)": 1.954795241355896, "Pretrain/Step": 14281, "Pretrain/Step Time": 8.479359885677695} +{"Pretrain/Learning Rate": 7.826812123927202e-06, "Pretrain/Loss": 1.9898462295532227, "Pretrain/Loss (Raw)": 2.048374652862549, "Pretrain/Step": 14282, "Pretrain/Step Time": 8.487166618928313} +{"Pretrain/Learning Rate": 7.823727299279937e-06, "Pretrain/Loss": 1.9905627965927124, "Pretrain/Loss (Raw)": 2.0049960613250732, "Pretrain/Step": 14283, "Pretrain/Step Time": 8.485685298219323} +{"Pretrain/Learning Rate": 7.82064296989838e-06, "Pretrain/Loss": 1.9844255447387695, "Pretrain/Loss (Raw)": 1.6523948907852173, "Pretrain/Step": 14284, "Pretrain/Step Time": 8.490321712568402} +{"Pretrain/Learning Rate": 7.81755913587148e-06, "Pretrain/Loss": 1.9847577810287476, "Pretrain/Loss (Raw)": 1.9819494485855103, "Pretrain/Step": 14285, "Pretrain/Step Time": 8.490455659106374} +{"Pretrain/Learning Rate": 7.814475797288152e-06, "Pretrain/Loss": 1.9806382656097412, "Pretrain/Loss (Raw)": 1.7354017496109009, "Pretrain/Step": 14286, "Pretrain/Step Time": 8.489725038409233} +{"Pretrain/Learning Rate": 7.811392954237287e-06, "Pretrain/Loss": 1.9781091213226318, "Pretrain/Loss (Raw)": 1.8689426183700562, "Pretrain/Step": 14287, "Pretrain/Step Time": 8.487821839749813} +{"Pretrain/Learning Rate": 7.808310606807798e-06, "Pretrain/Loss": 1.9764999151229858, "Pretrain/Loss (Raw)": 1.7398719787597656, "Pretrain/Step": 14288, "Pretrain/Step Time": 8.489595821127295} +{"Pretrain/Learning Rate": 7.805228755088548e-06, "Pretrain/Loss": 1.9757795333862305, "Pretrain/Loss (Raw)": 1.9173824787139893, "Pretrain/Step": 14289, "Pretrain/Step Time": 8.496464546769857} +{"Pretrain/Learning Rate": 7.802147399168411e-06, "Pretrain/Loss": 1.975633978843689, "Pretrain/Loss (Raw)": 2.041425943374634, "Pretrain/Step": 14290, "Pretrain/Step Time": 8.488823372870684} +{"Pretrain/Learning Rate": 7.799066539136229e-06, "Pretrain/Loss": 1.9758224487304688, "Pretrain/Loss (Raw)": 1.7679500579833984, "Pretrain/Step": 14291, "Pretrain/Step Time": 8.493286469951272} +{"Pretrain/Learning Rate": 7.795986175080832e-06, "Pretrain/Loss": 1.9762324094772339, "Pretrain/Loss (Raw)": 2.023874521255493, "Pretrain/Step": 14292, "Pretrain/Step Time": 8.487460309639573} +{"Pretrain/Learning Rate": 7.792906307091052e-06, "Pretrain/Loss": 1.9782859086990356, "Pretrain/Loss (Raw)": 2.2999112606048584, "Pretrain/Step": 14293, "Pretrain/Step Time": 8.48777049407363} +{"Pretrain/Learning Rate": 7.789826935255681e-06, "Pretrain/Loss": 1.9737374782562256, "Pretrain/Loss (Raw)": 1.955684781074524, "Pretrain/Step": 14294, "Pretrain/Step Time": 8.492461860179901} +{"Pretrain/Learning Rate": 7.786748059663526e-06, "Pretrain/Loss": 1.9754444360733032, "Pretrain/Loss (Raw)": 2.028359889984131, "Pretrain/Step": 14295, "Pretrain/Step Time": 8.484001033008099} +{"Pretrain/Learning Rate": 7.783669680403357e-06, "Pretrain/Loss": 1.9750475883483887, "Pretrain/Loss (Raw)": 2.025676965713501, "Pretrain/Step": 14296, "Pretrain/Step Time": 8.483975861221552} +{"Pretrain/Learning Rate": 7.780591797563928e-06, "Pretrain/Loss": 1.9761989116668701, "Pretrain/Loss (Raw)": 2.080880641937256, "Pretrain/Step": 14297, "Pretrain/Step Time": 8.484605319797993} +{"Pretrain/Learning Rate": 7.777514411234003e-06, "Pretrain/Loss": 1.9743528366088867, "Pretrain/Loss (Raw)": 1.9498671293258667, "Pretrain/Step": 14298, "Pretrain/Step Time": 8.491191525012255} +{"Pretrain/Learning Rate": 7.774437521502301e-06, "Pretrain/Loss": 1.9740686416625977, "Pretrain/Loss (Raw)": 2.1348893642425537, "Pretrain/Step": 14299, "Pretrain/Step Time": 8.48730531707406} +{"Pretrain/Learning Rate": 7.771361128457557e-06, "Pretrain/Loss": 1.9723831415176392, "Pretrain/Loss (Raw)": 1.874281883239746, "Pretrain/Step": 14300, "Pretrain/Step Time": 8.487792497500777} +{"Pretrain/Learning Rate": 7.768285232188469e-06, "Pretrain/Loss": 1.9710376262664795, "Pretrain/Loss (Raw)": 1.9476468563079834, "Pretrain/Step": 14301, "Pretrain/Step Time": 8.488542517647147} +{"Pretrain/Learning Rate": 7.765209832783723e-06, "Pretrain/Loss": 1.9704985618591309, "Pretrain/Loss (Raw)": 2.053248405456543, "Pretrain/Step": 14302, "Pretrain/Step Time": 8.483901843428612} +{"Pretrain/Learning Rate": 7.762134930332008e-06, "Pretrain/Loss": 1.9718410968780518, "Pretrain/Loss (Raw)": 1.9723893404006958, "Pretrain/Step": 14303, "Pretrain/Step Time": 8.484320312738419} +{"Pretrain/Learning Rate": 7.759060524921975e-06, "Pretrain/Loss": 1.9723790884017944, "Pretrain/Loss (Raw)": 2.065885305404663, "Pretrain/Step": 14304, "Pretrain/Step Time": 8.485160153359175} +{"Pretrain/Learning Rate": 7.755986616642283e-06, "Pretrain/Loss": 1.969799518585205, "Pretrain/Loss (Raw)": 1.6203490495681763, "Pretrain/Step": 14305, "Pretrain/Step Time": 8.487955287098885} +{"Pretrain/Learning Rate": 7.752913205581561e-06, "Pretrain/Loss": 1.9694541692733765, "Pretrain/Loss (Raw)": 2.066633462905884, "Pretrain/Step": 14306, "Pretrain/Step Time": 8.48636632785201} +{"Pretrain/Learning Rate": 7.74984029182842e-06, "Pretrain/Loss": 1.9696166515350342, "Pretrain/Loss (Raw)": 1.915648341178894, "Pretrain/Step": 14307, "Pretrain/Step Time": 8.490173552185297} +{"Pretrain/Learning Rate": 7.746767875471484e-06, "Pretrain/Loss": 1.9702883958816528, "Pretrain/Loss (Raw)": 2.014570474624634, "Pretrain/Step": 14308, "Pretrain/Step Time": 8.488118898123503} +{"Pretrain/Learning Rate": 7.743695956599323e-06, "Pretrain/Loss": 1.9725899696350098, "Pretrain/Loss (Raw)": 2.1836609840393066, "Pretrain/Step": 14309, "Pretrain/Step Time": 8.478890085592866} +{"Pretrain/Learning Rate": 7.740624535300534e-06, "Pretrain/Loss": 1.9734337329864502, "Pretrain/Loss (Raw)": 2.1237497329711914, "Pretrain/Step": 14310, "Pretrain/Step Time": 8.47494749724865} +{"Pretrain/Learning Rate": 7.737553611663667e-06, "Pretrain/Loss": 1.9717189073562622, "Pretrain/Loss (Raw)": 1.7226340770721436, "Pretrain/Step": 14311, "Pretrain/Step Time": 8.479345463216305} +{"Pretrain/Learning Rate": 7.734483185777267e-06, "Pretrain/Loss": 1.972581386566162, "Pretrain/Loss (Raw)": 2.0899863243103027, "Pretrain/Step": 14312, "Pretrain/Step Time": 8.480277525261045} +{"Pretrain/Learning Rate": 7.73141325772988e-06, "Pretrain/Loss": 1.9726792573928833, "Pretrain/Loss (Raw)": 2.0559000968933105, "Pretrain/Step": 14313, "Pretrain/Step Time": 8.479038462042809} +{"Pretrain/Learning Rate": 7.72834382761001e-06, "Pretrain/Loss": 1.9733729362487793, "Pretrain/Loss (Raw)": 1.895121455192566, "Pretrain/Step": 14314, "Pretrain/Step Time": 8.483102671802044} +{"Pretrain/Learning Rate": 7.725274895506177e-06, "Pretrain/Loss": 1.9736828804016113, "Pretrain/Loss (Raw)": 2.0502219200134277, "Pretrain/Step": 14315, "Pretrain/Step Time": 8.483436420559883} +{"Pretrain/Learning Rate": 7.722206461506865e-06, "Pretrain/Loss": 1.9729599952697754, "Pretrain/Loss (Raw)": 2.042059898376465, "Pretrain/Step": 14316, "Pretrain/Step Time": 8.483185114338994} +{"Pretrain/Learning Rate": 7.719138525700542e-06, "Pretrain/Loss": 1.9727613925933838, "Pretrain/Loss (Raw)": 2.0840237140655518, "Pretrain/Step": 14317, "Pretrain/Step Time": 8.481132673099637} +{"Pretrain/Learning Rate": 7.716071088175685e-06, "Pretrain/Loss": 1.9713730812072754, "Pretrain/Loss (Raw)": 2.032296895980835, "Pretrain/Step": 14318, "Pretrain/Step Time": 8.48154733888805} +{"Pretrain/Learning Rate": 7.713004149020727e-06, "Pretrain/Loss": 1.97220778465271, "Pretrain/Loss (Raw)": 1.9828648567199707, "Pretrain/Step": 14319, "Pretrain/Step Time": 8.47777896001935} +{"Pretrain/Learning Rate": 7.709937708324116e-06, "Pretrain/Loss": 1.97304105758667, "Pretrain/Loss (Raw)": 2.1499195098876953, "Pretrain/Step": 14320, "Pretrain/Step Time": 8.481188217177987} +{"Pretrain/Learning Rate": 7.706871766174253e-06, "Pretrain/Loss": 1.972895622253418, "Pretrain/Loss (Raw)": 1.9671565294265747, "Pretrain/Step": 14321, "Pretrain/Step Time": 8.481795579195023} +{"Pretrain/Learning Rate": 7.703806322659572e-06, "Pretrain/Loss": 1.9723327159881592, "Pretrain/Loss (Raw)": 1.7895314693450928, "Pretrain/Step": 14322, "Pretrain/Step Time": 8.478887250646949} +{"Pretrain/Learning Rate": 7.70074137786842e-06, "Pretrain/Loss": 1.9713865518569946, "Pretrain/Loss (Raw)": 1.9128568172454834, "Pretrain/Step": 14323, "Pretrain/Step Time": 8.47864618897438} +{"Pretrain/Learning Rate": 7.697676931889208e-06, "Pretrain/Loss": 1.972435712814331, "Pretrain/Loss (Raw)": 2.301564931869507, "Pretrain/Step": 14324, "Pretrain/Step Time": 8.482694437727332} +{"Pretrain/Learning Rate": 7.694612984810282e-06, "Pretrain/Loss": 1.9716295003890991, "Pretrain/Loss (Raw)": 1.943999171257019, "Pretrain/Step": 14325, "Pretrain/Step Time": 8.480570785701275} +{"Pretrain/Learning Rate": 7.691549536719982e-06, "Pretrain/Loss": 1.9722410440444946, "Pretrain/Loss (Raw)": 1.9511231184005737, "Pretrain/Step": 14326, "Pretrain/Step Time": 8.477734254673123} +{"Pretrain/Learning Rate": 7.688486587706661e-06, "Pretrain/Loss": 1.973254680633545, "Pretrain/Loss (Raw)": 1.9466137886047363, "Pretrain/Step": 14327, "Pretrain/Step Time": 8.482736872509122} +{"Pretrain/Learning Rate": 7.685424137858615e-06, "Pretrain/Loss": 1.9747016429901123, "Pretrain/Loss (Raw)": 1.9829175472259521, "Pretrain/Step": 14328, "Pretrain/Step Time": 8.47987014055252} +{"Pretrain/Learning Rate": 7.682362187264167e-06, "Pretrain/Loss": 1.9770228862762451, "Pretrain/Loss (Raw)": 2.197143793106079, "Pretrain/Step": 14329, "Pretrain/Step Time": 8.482830645516515} +{"Pretrain/Learning Rate": 7.679300736011596e-06, "Pretrain/Loss": 1.976898193359375, "Pretrain/Loss (Raw)": 1.899574875831604, "Pretrain/Step": 14330, "Pretrain/Step Time": 8.487184608355165} +{"Pretrain/Learning Rate": 7.676239784189174e-06, "Pretrain/Loss": 1.975951910018921, "Pretrain/Loss (Raw)": 2.0320653915405273, "Pretrain/Step": 14331, "Pretrain/Step Time": 8.486260630190372} +{"Pretrain/Learning Rate": 7.67317933188517e-06, "Pretrain/Loss": 1.9772634506225586, "Pretrain/Loss (Raw)": 2.1617591381073, "Pretrain/Step": 14332, "Pretrain/Step Time": 8.484682450070977} +{"Pretrain/Learning Rate": 7.670119379187816e-06, "Pretrain/Loss": 1.9794440269470215, "Pretrain/Loss (Raw)": 2.175760507583618, "Pretrain/Step": 14333, "Pretrain/Step Time": 8.490415377542377} +{"Pretrain/Learning Rate": 7.667059926185363e-06, "Pretrain/Loss": 1.9762523174285889, "Pretrain/Loss (Raw)": 1.821528673171997, "Pretrain/Step": 14334, "Pretrain/Step Time": 8.486969530582428} +{"Pretrain/Learning Rate": 7.664000972966018e-06, "Pretrain/Loss": 1.9771983623504639, "Pretrain/Loss (Raw)": 2.179389476776123, "Pretrain/Step": 14335, "Pretrain/Step Time": 8.488939663395286} +{"Pretrain/Learning Rate": 7.660942519617975e-06, "Pretrain/Loss": 1.9764529466629028, "Pretrain/Loss (Raw)": 1.8727474212646484, "Pretrain/Step": 14336, "Pretrain/Step Time": 8.487631294876337} +{"Pretrain/Learning Rate": 7.65788456622944e-06, "Pretrain/Loss": 1.9768383502960205, "Pretrain/Loss (Raw)": 1.9701520204544067, "Pretrain/Step": 14337, "Pretrain/Step Time": 8.48696056380868} +{"Pretrain/Learning Rate": 7.65482711288857e-06, "Pretrain/Loss": 1.9778072834014893, "Pretrain/Loss (Raw)": 1.9438728094100952, "Pretrain/Step": 14338, "Pretrain/Step Time": 8.486463099718094} +{"Pretrain/Learning Rate": 7.65177015968354e-06, "Pretrain/Loss": 1.9764758348464966, "Pretrain/Loss (Raw)": 1.7198363542556763, "Pretrain/Step": 14339, "Pretrain/Step Time": 8.487602228298783} +{"Pretrain/Learning Rate": 7.64871370670249e-06, "Pretrain/Loss": 1.9759838581085205, "Pretrain/Loss (Raw)": 1.981519341468811, "Pretrain/Step": 14340, "Pretrain/Step Time": 8.483343962579966} +{"Pretrain/Learning Rate": 7.645657754033538e-06, "Pretrain/Loss": 1.9777230024337769, "Pretrain/Loss (Raw)": 2.1140143871307373, "Pretrain/Step": 14341, "Pretrain/Step Time": 8.482436776161194} +{"Pretrain/Learning Rate": 7.642602301764821e-06, "Pretrain/Loss": 1.9798343181610107, "Pretrain/Loss (Raw)": 2.200150966644287, "Pretrain/Step": 14342, "Pretrain/Step Time": 8.479953778907657} +{"Pretrain/Learning Rate": 7.639547349984419e-06, "Pretrain/Loss": 1.9800975322723389, "Pretrain/Loss (Raw)": 1.9453665018081665, "Pretrain/Step": 14343, "Pretrain/Step Time": 8.482098210602999} +{"Pretrain/Learning Rate": 7.63649289878044e-06, "Pretrain/Loss": 1.9794251918792725, "Pretrain/Loss (Raw)": 2.071772575378418, "Pretrain/Step": 14344, "Pretrain/Step Time": 8.485958948731422} +{"Pretrain/Learning Rate": 7.633438948240948e-06, "Pretrain/Loss": 1.978560447692871, "Pretrain/Loss (Raw)": 1.7886470556259155, "Pretrain/Step": 14345, "Pretrain/Step Time": 8.484346725046635} +{"Pretrain/Learning Rate": 7.630385498453996e-06, "Pretrain/Loss": 1.977601408958435, "Pretrain/Loss (Raw)": 1.9205663204193115, "Pretrain/Step": 14346, "Pretrain/Step Time": 8.483235538005829} +{"Pretrain/Learning Rate": 7.627332549507638e-06, "Pretrain/Loss": 1.981032133102417, "Pretrain/Loss (Raw)": 2.064997434616089, "Pretrain/Step": 14347, "Pretrain/Step Time": 8.488665837794542} +{"Pretrain/Learning Rate": 7.624280101489892e-06, "Pretrain/Loss": 1.9784979820251465, "Pretrain/Loss (Raw)": 1.5702868700027466, "Pretrain/Step": 14348, "Pretrain/Step Time": 8.482513340190053} +{"Pretrain/Learning Rate": 7.621228154488788e-06, "Pretrain/Loss": 1.9801857471466064, "Pretrain/Loss (Raw)": 1.9909532070159912, "Pretrain/Step": 14349, "Pretrain/Step Time": 8.481609208509326} +{"Pretrain/Learning Rate": 7.61817670859232e-06, "Pretrain/Loss": 1.9809165000915527, "Pretrain/Loss (Raw)": 1.954724669456482, "Pretrain/Step": 14350, "Pretrain/Step Time": 8.486679112538695} +{"Pretrain/Learning Rate": 7.615125763888464e-06, "Pretrain/Loss": 1.9818609952926636, "Pretrain/Loss (Raw)": 1.97078537940979, "Pretrain/Step": 14351, "Pretrain/Step Time": 8.484847767278552} +{"Pretrain/Learning Rate": 7.6120753204652114e-06, "Pretrain/Loss": 1.9807424545288086, "Pretrain/Loss (Raw)": 1.9053939580917358, "Pretrain/Step": 14352, "Pretrain/Step Time": 8.48854648321867} +{"Pretrain/Learning Rate": 7.6090253784104974e-06, "Pretrain/Loss": 1.9800258874893188, "Pretrain/Loss (Raw)": 2.065694570541382, "Pretrain/Step": 14353, "Pretrain/Step Time": 8.491727964952588} +{"Pretrain/Learning Rate": 7.605975937812288e-06, "Pretrain/Loss": 1.984987735748291, "Pretrain/Loss (Raw)": 2.5623879432678223, "Pretrain/Step": 14354, "Pretrain/Step Time": 8.488597363233566} +{"Pretrain/Learning Rate": 7.6029269987585e-06, "Pretrain/Loss": 1.9866714477539062, "Pretrain/Loss (Raw)": 2.0107932090759277, "Pretrain/Step": 14355, "Pretrain/Step Time": 8.492681048810482} +{"Pretrain/Learning Rate": 7.599878561337037e-06, "Pretrain/Loss": 1.9827299118041992, "Pretrain/Loss (Raw)": 1.978857398033142, "Pretrain/Step": 14356, "Pretrain/Step Time": 8.49196078069508} +{"Pretrain/Learning Rate": 7.5968306256358205e-06, "Pretrain/Loss": 1.982086181640625, "Pretrain/Loss (Raw)": 2.0973434448242188, "Pretrain/Step": 14357, "Pretrain/Step Time": 8.488019093871117} +{"Pretrain/Learning Rate": 7.593783191742715e-06, "Pretrain/Loss": 1.983985424041748, "Pretrain/Loss (Raw)": 2.177088737487793, "Pretrain/Step": 14358, "Pretrain/Step Time": 8.49111987836659} +{"Pretrain/Learning Rate": 7.59073625974561e-06, "Pretrain/Loss": 1.9837695360183716, "Pretrain/Loss (Raw)": 1.906548023223877, "Pretrain/Step": 14359, "Pretrain/Step Time": 8.495355689898133} +{"Pretrain/Learning Rate": 7.587689829732353e-06, "Pretrain/Loss": 1.98274564743042, "Pretrain/Loss (Raw)": 1.8924665451049805, "Pretrain/Step": 14360, "Pretrain/Step Time": 8.495165634900331} +{"Pretrain/Learning Rate": 7.584643901790775e-06, "Pretrain/Loss": 1.9805409908294678, "Pretrain/Loss (Raw)": 1.7949347496032715, "Pretrain/Step": 14361, "Pretrain/Step Time": 8.494150491431355} +{"Pretrain/Learning Rate": 7.58159847600872e-06, "Pretrain/Loss": 1.9775636196136475, "Pretrain/Loss (Raw)": 1.5816984176635742, "Pretrain/Step": 14362, "Pretrain/Step Time": 8.492673303931952} +{"Pretrain/Learning Rate": 7.5785535524739884e-06, "Pretrain/Loss": 1.9770030975341797, "Pretrain/Loss (Raw)": 1.831368327140808, "Pretrain/Step": 14363, "Pretrain/Step Time": 8.488900547847152} +{"Pretrain/Learning Rate": 7.575509131274389e-06, "Pretrain/Loss": 1.974381923675537, "Pretrain/Loss (Raw)": 1.6877665519714355, "Pretrain/Step": 14364, "Pretrain/Step Time": 8.492052214220166} +{"Pretrain/Learning Rate": 7.572465212497703e-06, "Pretrain/Loss": 1.974252700805664, "Pretrain/Loss (Raw)": 2.1347734928131104, "Pretrain/Step": 14365, "Pretrain/Step Time": 8.492932191118598} +{"Pretrain/Learning Rate": 7.569421796231688e-06, "Pretrain/Loss": 1.9737690687179565, "Pretrain/Loss (Raw)": 1.9561313390731812, "Pretrain/Step": 14366, "Pretrain/Step Time": 8.492328528314829} +{"Pretrain/Learning Rate": 7.566378882564115e-06, "Pretrain/Loss": 1.9731125831604004, "Pretrain/Loss (Raw)": 2.0455799102783203, "Pretrain/Step": 14367, "Pretrain/Step Time": 8.495079459622502} +{"Pretrain/Learning Rate": 7.56333647158271e-06, "Pretrain/Loss": 1.9724924564361572, "Pretrain/Loss (Raw)": 1.8814730644226074, "Pretrain/Step": 14368, "Pretrain/Step Time": 8.494493702426553} +{"Pretrain/Learning Rate": 7.5602945633752146e-06, "Pretrain/Loss": 1.9722691774368286, "Pretrain/Loss (Raw)": 2.018205165863037, "Pretrain/Step": 14369, "Pretrain/Step Time": 8.489810822531581} +{"Pretrain/Learning Rate": 7.557253158029329e-06, "Pretrain/Loss": 1.973123550415039, "Pretrain/Loss (Raw)": 2.0097172260284424, "Pretrain/Step": 14370, "Pretrain/Step Time": 8.490251991897821} +{"Pretrain/Learning Rate": 7.554212255632745e-06, "Pretrain/Loss": 1.9735968112945557, "Pretrain/Loss (Raw)": 2.0880637168884277, "Pretrain/Step": 14371, "Pretrain/Step Time": 8.486243974417448} +{"Pretrain/Learning Rate": 7.551171856273162e-06, "Pretrain/Loss": 1.9743773937225342, "Pretrain/Loss (Raw)": 2.0145158767700195, "Pretrain/Step": 14372, "Pretrain/Step Time": 8.48876191675663} +{"Pretrain/Learning Rate": 7.548131960038226e-06, "Pretrain/Loss": 1.976714849472046, "Pretrain/Loss (Raw)": 2.0062851905822754, "Pretrain/Step": 14373, "Pretrain/Step Time": 8.491247154772282} +{"Pretrain/Learning Rate": 7.545092567015613e-06, "Pretrain/Loss": 1.9800710678100586, "Pretrain/Loss (Raw)": 1.9850720167160034, "Pretrain/Step": 14374, "Pretrain/Step Time": 8.487082857638597} +{"Pretrain/Learning Rate": 7.542053677292951e-06, "Pretrain/Loss": 1.9820584058761597, "Pretrain/Loss (Raw)": 2.1619274616241455, "Pretrain/Step": 14375, "Pretrain/Step Time": 8.48391668125987} +{"Pretrain/Learning Rate": 7.539015290957857e-06, "Pretrain/Loss": 1.9844133853912354, "Pretrain/Loss (Raw)": 2.1995139122009277, "Pretrain/Step": 14376, "Pretrain/Step Time": 8.483091700822115} +{"Pretrain/Learning Rate": 7.535977408097955e-06, "Pretrain/Loss": 1.9856109619140625, "Pretrain/Loss (Raw)": 2.2888200283050537, "Pretrain/Step": 14377, "Pretrain/Step Time": 8.488281918689609} +{"Pretrain/Learning Rate": 7.5329400288008225e-06, "Pretrain/Loss": 1.9884918928146362, "Pretrain/Loss (Raw)": 2.283518075942993, "Pretrain/Step": 14378, "Pretrain/Step Time": 8.484474835917354} +{"Pretrain/Learning Rate": 7.529903153154061e-06, "Pretrain/Loss": 1.9880192279815674, "Pretrain/Loss (Raw)": 2.072141408920288, "Pretrain/Step": 14379, "Pretrain/Step Time": 8.482207037508488} +{"Pretrain/Learning Rate": 7.526866781245228e-06, "Pretrain/Loss": 1.9888923168182373, "Pretrain/Loss (Raw)": 2.071051597595215, "Pretrain/Step": 14380, "Pretrain/Step Time": 8.489525951445103} +{"Pretrain/Learning Rate": 7.523830913161864e-06, "Pretrain/Loss": 1.9891278743743896, "Pretrain/Loss (Raw)": 2.1027681827545166, "Pretrain/Step": 14381, "Pretrain/Step Time": 8.49113536812365} +{"Pretrain/Learning Rate": 7.5207955489915245e-06, "Pretrain/Loss": 1.990657925605774, "Pretrain/Loss (Raw)": 1.9321712255477905, "Pretrain/Step": 14382, "Pretrain/Step Time": 8.491473311558366} +{"Pretrain/Learning Rate": 7.517760688821715e-06, "Pretrain/Loss": 1.9898476600646973, "Pretrain/Loss (Raw)": 1.9775608777999878, "Pretrain/Step": 14383, "Pretrain/Step Time": 8.493100874125957} +{"Pretrain/Learning Rate": 7.5147263327399574e-06, "Pretrain/Loss": 1.9919664859771729, "Pretrain/Loss (Raw)": 2.090522527694702, "Pretrain/Step": 14384, "Pretrain/Step Time": 8.489297142252326} +{"Pretrain/Learning Rate": 7.511692480833735e-06, "Pretrain/Loss": 1.9889650344848633, "Pretrain/Loss (Raw)": 1.6449546813964844, "Pretrain/Step": 14385, "Pretrain/Step Time": 8.492486417293549} +{"Pretrain/Learning Rate": 7.508659133190537e-06, "Pretrain/Loss": 1.989745855331421, "Pretrain/Loss (Raw)": 1.9567477703094482, "Pretrain/Step": 14386, "Pretrain/Step Time": 8.48805252276361} +{"Pretrain/Learning Rate": 7.505626289897824e-06, "Pretrain/Loss": 1.9871211051940918, "Pretrain/Loss (Raw)": 1.7663111686706543, "Pretrain/Step": 14387, "Pretrain/Step Time": 8.486670607700944} +{"Pretrain/Learning Rate": 7.502593951043036e-06, "Pretrain/Loss": 1.9879581928253174, "Pretrain/Loss (Raw)": 2.0399303436279297, "Pretrain/Step": 14388, "Pretrain/Step Time": 8.489442935213447} +{"Pretrain/Learning Rate": 7.499562116713624e-06, "Pretrain/Loss": 1.9881150722503662, "Pretrain/Loss (Raw)": 1.949340581893921, "Pretrain/Step": 14389, "Pretrain/Step Time": 8.490246191620827} +{"Pretrain/Learning Rate": 7.496530786996994e-06, "Pretrain/Loss": 1.9878720045089722, "Pretrain/Loss (Raw)": 1.832606315612793, "Pretrain/Step": 14390, "Pretrain/Step Time": 8.485699275508523} +{"Pretrain/Learning Rate": 7.493499961980568e-06, "Pretrain/Loss": 1.9884731769561768, "Pretrain/Loss (Raw)": 2.047905921936035, "Pretrain/Step": 14391, "Pretrain/Step Time": 8.487589079886675} +{"Pretrain/Learning Rate": 7.49046964175173e-06, "Pretrain/Loss": 1.9906196594238281, "Pretrain/Loss (Raw)": 1.9822009801864624, "Pretrain/Step": 14392, "Pretrain/Step Time": 8.48862281627953} +{"Pretrain/Learning Rate": 7.487439826397846e-06, "Pretrain/Loss": 1.9905188083648682, "Pretrain/Loss (Raw)": 2.0669076442718506, "Pretrain/Step": 14393, "Pretrain/Step Time": 8.489573834463954} +{"Pretrain/Learning Rate": 7.484410516006299e-06, "Pretrain/Loss": 1.9882280826568604, "Pretrain/Loss (Raw)": 1.959338903427124, "Pretrain/Step": 14394, "Pretrain/Step Time": 8.489920940250158} +{"Pretrain/Learning Rate": 7.481381710664418e-06, "Pretrain/Loss": 1.9888758659362793, "Pretrain/Loss (Raw)": 1.864553689956665, "Pretrain/Step": 14395, "Pretrain/Step Time": 8.487022308632731} +{"Pretrain/Learning Rate": 7.478353410459554e-06, "Pretrain/Loss": 1.990959644317627, "Pretrain/Loss (Raw)": 2.011906623840332, "Pretrain/Step": 14396, "Pretrain/Step Time": 8.492704482749104} +{"Pretrain/Learning Rate": 7.475325615479017e-06, "Pretrain/Loss": 1.992194652557373, "Pretrain/Loss (Raw)": 2.20395827293396, "Pretrain/Step": 14397, "Pretrain/Step Time": 8.491800969466567} +{"Pretrain/Learning Rate": 7.472298325810103e-06, "Pretrain/Loss": 1.992067813873291, "Pretrain/Loss (Raw)": 1.9873480796813965, "Pretrain/Step": 14398, "Pretrain/Step Time": 8.49265805631876} +{"Pretrain/Learning Rate": 7.469271541540121e-06, "Pretrain/Loss": 1.9909121990203857, "Pretrain/Loss (Raw)": 1.8312456607818604, "Pretrain/Step": 14399, "Pretrain/Step Time": 8.494010979309678} +{"Pretrain/Learning Rate": 7.466245262756327e-06, "Pretrain/Loss": 1.9906041622161865, "Pretrain/Loss (Raw)": 1.9949870109558105, "Pretrain/Step": 14400, "Pretrain/Step Time": 8.49273981153965} +{"Pretrain/Learning Rate": 7.463219489545997e-06, "Pretrain/Loss": 1.9887676239013672, "Pretrain/Loss (Raw)": 1.8886828422546387, "Pretrain/Step": 14401, "Pretrain/Step Time": 8.490848930552602} +{"Pretrain/Learning Rate": 7.460194221996372e-06, "Pretrain/Loss": 1.9892598390579224, "Pretrain/Loss (Raw)": 2.13542103767395, "Pretrain/Step": 14402, "Pretrain/Step Time": 8.485144117847085} +{"Pretrain/Learning Rate": 7.457169460194671e-06, "Pretrain/Loss": 1.985214114189148, "Pretrain/Loss (Raw)": 1.8609282970428467, "Pretrain/Step": 14403, "Pretrain/Step Time": 8.485595110803843} +{"Pretrain/Learning Rate": 7.454145204228133e-06, "Pretrain/Loss": 1.9873170852661133, "Pretrain/Loss (Raw)": 2.0540475845336914, "Pretrain/Step": 14404, "Pretrain/Step Time": 8.477761041373014} +{"Pretrain/Learning Rate": 7.451121454183941e-06, "Pretrain/Loss": 1.9900381565093994, "Pretrain/Loss (Raw)": 2.0727901458740234, "Pretrain/Step": 14405, "Pretrain/Step Time": 8.478203663602471} +{"Pretrain/Learning Rate": 7.448098210149304e-06, "Pretrain/Loss": 1.9887157678604126, "Pretrain/Loss (Raw)": 1.9886726140975952, "Pretrain/Step": 14406, "Pretrain/Step Time": 8.479018969461322} +{"Pretrain/Learning Rate": 7.445075472211369e-06, "Pretrain/Loss": 1.986510992050171, "Pretrain/Loss (Raw)": 1.8619378805160522, "Pretrain/Step": 14407, "Pretrain/Step Time": 8.472898215055466} +{"Pretrain/Learning Rate": 7.4420532404573115e-06, "Pretrain/Loss": 1.986328125, "Pretrain/Loss (Raw)": 1.936017632484436, "Pretrain/Step": 14408, "Pretrain/Step Time": 8.472678257152438} +{"Pretrain/Learning Rate": 7.439031514974273e-06, "Pretrain/Loss": 1.9853832721710205, "Pretrain/Loss (Raw)": 1.833861231803894, "Pretrain/Step": 14409, "Pretrain/Step Time": 8.470156962051988} +{"Pretrain/Learning Rate": 7.436010295849374e-06, "Pretrain/Loss": 1.9844520092010498, "Pretrain/Loss (Raw)": 1.9291764497756958, "Pretrain/Step": 14410, "Pretrain/Step Time": 8.472545195370913} +{"Pretrain/Learning Rate": 7.432989583169744e-06, "Pretrain/Loss": 1.9840788841247559, "Pretrain/Loss (Raw)": 1.9572153091430664, "Pretrain/Step": 14411, "Pretrain/Step Time": 8.47380580380559} +{"Pretrain/Learning Rate": 7.4299693770224695e-06, "Pretrain/Loss": 1.9867322444915771, "Pretrain/Loss (Raw)": 1.9920471906661987, "Pretrain/Step": 14412, "Pretrain/Step Time": 8.470449268817902} +{"Pretrain/Learning Rate": 7.426949677494647e-06, "Pretrain/Loss": 1.9874374866485596, "Pretrain/Loss (Raw)": 2.0722179412841797, "Pretrain/Step": 14413, "Pretrain/Step Time": 8.47049785964191} +{"Pretrain/Learning Rate": 7.4239304846733415e-06, "Pretrain/Loss": 1.9897122383117676, "Pretrain/Loss (Raw)": 2.0265676975250244, "Pretrain/Step": 14414, "Pretrain/Step Time": 8.474268382415175} +{"Pretrain/Learning Rate": 7.420911798645605e-06, "Pretrain/Loss": 1.9895893335342407, "Pretrain/Loss (Raw)": 1.8532094955444336, "Pretrain/Step": 14415, "Pretrain/Step Time": 8.477943655103445} +{"Pretrain/Learning Rate": 7.417893619498492e-06, "Pretrain/Loss": 1.9913294315338135, "Pretrain/Loss (Raw)": 1.9626121520996094, "Pretrain/Step": 14416, "Pretrain/Step Time": 8.476486660540104} +{"Pretrain/Learning Rate": 7.414875947319014e-06, "Pretrain/Loss": 1.9924520254135132, "Pretrain/Loss (Raw)": 2.061062812805176, "Pretrain/Step": 14417, "Pretrain/Step Time": 8.472342059016228} +{"Pretrain/Learning Rate": 7.4118587821941975e-06, "Pretrain/Loss": 1.9930098056793213, "Pretrain/Loss (Raw)": 2.1128101348876953, "Pretrain/Step": 14418, "Pretrain/Step Time": 8.477041259407997} +{"Pretrain/Learning Rate": 7.408842124211035e-06, "Pretrain/Loss": 1.9956437349319458, "Pretrain/Loss (Raw)": 2.105112314224243, "Pretrain/Step": 14419, "Pretrain/Step Time": 8.47417671047151} +{"Pretrain/Learning Rate": 7.405825973456501e-06, "Pretrain/Loss": 1.993509292602539, "Pretrain/Loss (Raw)": 1.750659465789795, "Pretrain/Step": 14420, "Pretrain/Step Time": 8.47749699279666} +{"Pretrain/Learning Rate": 7.402810330017579e-06, "Pretrain/Loss": 1.9909484386444092, "Pretrain/Loss (Raw)": 1.9721287488937378, "Pretrain/Step": 14421, "Pretrain/Step Time": 8.475985992699862} +{"Pretrain/Learning Rate": 7.39979519398121e-06, "Pretrain/Loss": 1.9907846450805664, "Pretrain/Loss (Raw)": 1.9346981048583984, "Pretrain/Step": 14422, "Pretrain/Step Time": 8.477398924529552} +{"Pretrain/Learning Rate": 7.396780565434347e-06, "Pretrain/Loss": 1.988708734512329, "Pretrain/Loss (Raw)": 1.7626557350158691, "Pretrain/Step": 14423, "Pretrain/Step Time": 8.47748669795692} +{"Pretrain/Learning Rate": 7.3937664444639065e-06, "Pretrain/Loss": 1.9894218444824219, "Pretrain/Loss (Raw)": 2.116971015930176, "Pretrain/Step": 14424, "Pretrain/Step Time": 8.473792558535933} +{"Pretrain/Learning Rate": 7.3907528311567885e-06, "Pretrain/Loss": 1.9861938953399658, "Pretrain/Loss (Raw)": 1.6676884889602661, "Pretrain/Step": 14425, "Pretrain/Step Time": 8.47633315064013} +{"Pretrain/Learning Rate": 7.38773972559991e-06, "Pretrain/Loss": 1.9848361015319824, "Pretrain/Loss (Raw)": 1.7760810852050781, "Pretrain/Step": 14426, "Pretrain/Step Time": 8.472796943038702} +{"Pretrain/Learning Rate": 7.384727127880131e-06, "Pretrain/Loss": 1.9836865663528442, "Pretrain/Loss (Raw)": 1.9877349138259888, "Pretrain/Step": 14427, "Pretrain/Step Time": 8.474912596866488} +{"Pretrain/Learning Rate": 7.381715038084336e-06, "Pretrain/Loss": 1.983162522315979, "Pretrain/Loss (Raw)": 1.8072079420089722, "Pretrain/Step": 14428, "Pretrain/Step Time": 8.474139403551817} +{"Pretrain/Learning Rate": 7.3787034562993686e-06, "Pretrain/Loss": 1.9844837188720703, "Pretrain/Loss (Raw)": 2.1167550086975098, "Pretrain/Step": 14429, "Pretrain/Step Time": 8.477735942229629} +{"Pretrain/Learning Rate": 7.375692382612057e-06, "Pretrain/Loss": 1.9845224618911743, "Pretrain/Loss (Raw)": 2.0582058429718018, "Pretrain/Step": 14430, "Pretrain/Step Time": 8.481065947562456} +{"Pretrain/Learning Rate": 7.372681817109237e-06, "Pretrain/Loss": 1.9828684329986572, "Pretrain/Loss (Raw)": 1.7606866359710693, "Pretrain/Step": 14431, "Pretrain/Step Time": 8.480341782793403} +{"Pretrain/Learning Rate": 7.369671759877705e-06, "Pretrain/Loss": 1.9815940856933594, "Pretrain/Loss (Raw)": 1.9027572870254517, "Pretrain/Step": 14432, "Pretrain/Step Time": 8.478737154975533} +{"Pretrain/Learning Rate": 7.366662211004266e-06, "Pretrain/Loss": 1.9844619035720825, "Pretrain/Loss (Raw)": 1.9874327182769775, "Pretrain/Step": 14433, "Pretrain/Step Time": 8.475412709638476} +{"Pretrain/Learning Rate": 7.363653170575691e-06, "Pretrain/Loss": 1.9836660623550415, "Pretrain/Loss (Raw)": 1.9647624492645264, "Pretrain/Step": 14434, "Pretrain/Step Time": 8.47493970580399} +{"Pretrain/Learning Rate": 7.3606446386787375e-06, "Pretrain/Loss": 1.9832062721252441, "Pretrain/Loss (Raw)": 1.8568103313446045, "Pretrain/Step": 14435, "Pretrain/Step Time": 8.470362456515431} +{"Pretrain/Learning Rate": 7.3576366154001655e-06, "Pretrain/Loss": 1.9828805923461914, "Pretrain/Loss (Raw)": 1.9728829860687256, "Pretrain/Step": 14436, "Pretrain/Step Time": 8.469864420592785} +{"Pretrain/Learning Rate": 7.354629100826699e-06, "Pretrain/Loss": 1.9826487302780151, "Pretrain/Loss (Raw)": 2.1539764404296875, "Pretrain/Step": 14437, "Pretrain/Step Time": 8.46999347768724} +{"Pretrain/Learning Rate": 7.351622095045072e-06, "Pretrain/Loss": 1.9812620878219604, "Pretrain/Loss (Raw)": 1.9462417364120483, "Pretrain/Step": 14438, "Pretrain/Step Time": 8.472756084054708} +{"Pretrain/Learning Rate": 7.348615598141981e-06, "Pretrain/Loss": 1.9841210842132568, "Pretrain/Loss (Raw)": 2.0885894298553467, "Pretrain/Step": 14439, "Pretrain/Step Time": 8.466903902590275} +{"Pretrain/Learning Rate": 7.345609610204105e-06, "Pretrain/Loss": 1.9847474098205566, "Pretrain/Loss (Raw)": 2.1701622009277344, "Pretrain/Step": 14440, "Pretrain/Step Time": 8.469138884916902} +{"Pretrain/Learning Rate": 7.34260413131814e-06, "Pretrain/Loss": 1.9848617315292358, "Pretrain/Loss (Raw)": 2.0705418586730957, "Pretrain/Step": 14441, "Pretrain/Step Time": 8.468001570552588} +{"Pretrain/Learning Rate": 7.339599161570729e-06, "Pretrain/Loss": 1.9865906238555908, "Pretrain/Loss (Raw)": 2.116419792175293, "Pretrain/Step": 14442, "Pretrain/Step Time": 8.468425802886486} +{"Pretrain/Learning Rate": 7.336594701048535e-06, "Pretrain/Loss": 1.9871456623077393, "Pretrain/Loss (Raw)": 2.121253728866577, "Pretrain/Step": 14443, "Pretrain/Step Time": 8.469602029770613} +{"Pretrain/Learning Rate": 7.333590749838182e-06, "Pretrain/Loss": 1.986358404159546, "Pretrain/Loss (Raw)": 1.9413015842437744, "Pretrain/Step": 14444, "Pretrain/Step Time": 8.474459763616323} +{"Pretrain/Learning Rate": 7.3305873080262765e-06, "Pretrain/Loss": 1.9850473403930664, "Pretrain/Loss (Raw)": 1.916202187538147, "Pretrain/Step": 14445, "Pretrain/Step Time": 8.477458480745554} +{"Pretrain/Learning Rate": 7.327584375699436e-06, "Pretrain/Loss": 1.9847383499145508, "Pretrain/Loss (Raw)": 1.9927481412887573, "Pretrain/Step": 14446, "Pretrain/Step Time": 8.479252276942134} +{"Pretrain/Learning Rate": 7.3245819529442375e-06, "Pretrain/Loss": 1.9835491180419922, "Pretrain/Loss (Raw)": 1.830653429031372, "Pretrain/Step": 14447, "Pretrain/Step Time": 8.478660851716995} +{"Pretrain/Learning Rate": 7.321580039847262e-06, "Pretrain/Loss": 1.9822344779968262, "Pretrain/Loss (Raw)": 1.981634259223938, "Pretrain/Step": 14448, "Pretrain/Step Time": 8.476766569539905} +{"Pretrain/Learning Rate": 7.318578636495057e-06, "Pretrain/Loss": 1.9834654331207275, "Pretrain/Loss (Raw)": 2.1247098445892334, "Pretrain/Step": 14449, "Pretrain/Step Time": 8.47357220761478} +{"Pretrain/Learning Rate": 7.315577742974181e-06, "Pretrain/Loss": 1.9853166341781616, "Pretrain/Loss (Raw)": 2.026491641998291, "Pretrain/Step": 14450, "Pretrain/Step Time": 8.476699445396662} +{"Pretrain/Learning Rate": 7.312577359371156e-06, "Pretrain/Loss": 1.985020399093628, "Pretrain/Loss (Raw)": 1.8749182224273682, "Pretrain/Step": 14451, "Pretrain/Step Time": 8.478500939905643} +{"Pretrain/Learning Rate": 7.3095774857724846e-06, "Pretrain/Loss": 1.9820945262908936, "Pretrain/Loss (Raw)": 1.9270716905593872, "Pretrain/Step": 14452, "Pretrain/Step Time": 8.471622226759791} +{"Pretrain/Learning Rate": 7.306578122264681e-06, "Pretrain/Loss": 1.9838409423828125, "Pretrain/Loss (Raw)": 2.167538642883301, "Pretrain/Step": 14453, "Pretrain/Step Time": 8.46862805634737} +{"Pretrain/Learning Rate": 7.3035792689342185e-06, "Pretrain/Loss": 1.9842592477798462, "Pretrain/Loss (Raw)": 2.0046725273132324, "Pretrain/Step": 14454, "Pretrain/Step Time": 8.47070673853159} +{"Pretrain/Learning Rate": 7.300580925867581e-06, "Pretrain/Loss": 1.984969139099121, "Pretrain/Loss (Raw)": 2.037466287612915, "Pretrain/Step": 14455, "Pretrain/Step Time": 8.464930905029178} +{"Pretrain/Learning Rate": 7.297583093151214e-06, "Pretrain/Loss": 1.983615756034851, "Pretrain/Loss (Raw)": 1.8096985816955566, "Pretrain/Step": 14456, "Pretrain/Step Time": 8.465064661577344} +{"Pretrain/Learning Rate": 7.294585770871551e-06, "Pretrain/Loss": 1.9816704988479614, "Pretrain/Loss (Raw)": 1.9481509923934937, "Pretrain/Step": 14457, "Pretrain/Step Time": 8.465581312775612} +{"Pretrain/Learning Rate": 7.291588959115034e-06, "Pretrain/Loss": 1.9830936193466187, "Pretrain/Loss (Raw)": 2.0817267894744873, "Pretrain/Step": 14458, "Pretrain/Step Time": 8.45856680162251} +{"Pretrain/Learning Rate": 7.28859265796806e-06, "Pretrain/Loss": 1.983191967010498, "Pretrain/Loss (Raw)": 2.0446479320526123, "Pretrain/Step": 14459, "Pretrain/Step Time": 8.46243755146861} +{"Pretrain/Learning Rate": 7.2855968675170365e-06, "Pretrain/Loss": 1.980823040008545, "Pretrain/Loss (Raw)": 1.8585543632507324, "Pretrain/Step": 14460, "Pretrain/Step Time": 8.463225476443768} +{"Pretrain/Learning Rate": 7.282601587848339e-06, "Pretrain/Loss": 1.9794965982437134, "Pretrain/Loss (Raw)": 2.005964994430542, "Pretrain/Step": 14461, "Pretrain/Step Time": 8.460537744686007} +{"Pretrain/Learning Rate": 7.279606819048329e-06, "Pretrain/Loss": 1.9806783199310303, "Pretrain/Loss (Raw)": 1.9727882146835327, "Pretrain/Step": 14462, "Pretrain/Step Time": 8.464435013011098} +{"Pretrain/Learning Rate": 7.276612561203372e-06, "Pretrain/Loss": 1.9786860942840576, "Pretrain/Loss (Raw)": 1.924373745918274, "Pretrain/Step": 14463, "Pretrain/Step Time": 8.463375566527247} +{"Pretrain/Learning Rate": 7.273618814399788e-06, "Pretrain/Loss": 1.9801771640777588, "Pretrain/Loss (Raw)": 2.0636239051818848, "Pretrain/Step": 14464, "Pretrain/Step Time": 8.464950926601887} +{"Pretrain/Learning Rate": 7.270625578723919e-06, "Pretrain/Loss": 1.980927586555481, "Pretrain/Loss (Raw)": 2.0661940574645996, "Pretrain/Step": 14465, "Pretrain/Step Time": 8.461906272917986} +{"Pretrain/Learning Rate": 7.267632854262061e-06, "Pretrain/Loss": 1.9806232452392578, "Pretrain/Loss (Raw)": 1.9049195051193237, "Pretrain/Step": 14466, "Pretrain/Step Time": 8.467564892023802} +{"Pretrain/Learning Rate": 7.264640641100503e-06, "Pretrain/Loss": 1.9811534881591797, "Pretrain/Loss (Raw)": 1.787696123123169, "Pretrain/Step": 14467, "Pretrain/Step Time": 8.464279791340232} +{"Pretrain/Learning Rate": 7.261648939325536e-06, "Pretrain/Loss": 1.9824579954147339, "Pretrain/Loss (Raw)": 2.1485142707824707, "Pretrain/Step": 14468, "Pretrain/Step Time": 8.466719139367342} +{"Pretrain/Learning Rate": 7.258657749023412e-06, "Pretrain/Loss": 1.9816336631774902, "Pretrain/Loss (Raw)": 2.008484363555908, "Pretrain/Step": 14469, "Pretrain/Step Time": 8.467526726424694} +{"Pretrain/Learning Rate": 7.255667070280389e-06, "Pretrain/Loss": 1.9790130853652954, "Pretrain/Loss (Raw)": 1.864736557006836, "Pretrain/Step": 14470, "Pretrain/Step Time": 8.466478414833546} +{"Pretrain/Learning Rate": 7.2526769031827006e-06, "Pretrain/Loss": 1.9779973030090332, "Pretrain/Loss (Raw)": 1.8153384923934937, "Pretrain/Step": 14471, "Pretrain/Step Time": 8.467981580644846} +{"Pretrain/Learning Rate": 7.249687247816553e-06, "Pretrain/Loss": 1.9774079322814941, "Pretrain/Loss (Raw)": 1.996335506439209, "Pretrain/Step": 14472, "Pretrain/Step Time": 8.463641613721848} +{"Pretrain/Learning Rate": 7.246698104268168e-06, "Pretrain/Loss": 1.9789814949035645, "Pretrain/Loss (Raw)": 1.9900530576705933, "Pretrain/Step": 14473, "Pretrain/Step Time": 8.468162322416902} +{"Pretrain/Learning Rate": 7.243709472623719e-06, "Pretrain/Loss": 1.9797319173812866, "Pretrain/Loss (Raw)": 2.0166332721710205, "Pretrain/Step": 14474, "Pretrain/Step Time": 8.464662278071046} +{"Pretrain/Learning Rate": 7.240721352969402e-06, "Pretrain/Loss": 1.9777084589004517, "Pretrain/Loss (Raw)": 1.8059874773025513, "Pretrain/Step": 14475, "Pretrain/Step Time": 8.464542025700212} +{"Pretrain/Learning Rate": 7.2377337453913615e-06, "Pretrain/Loss": 1.981221079826355, "Pretrain/Loss (Raw)": 2.0199201107025146, "Pretrain/Step": 14476, "Pretrain/Step Time": 8.466264130547643} +{"Pretrain/Learning Rate": 7.23474664997574e-06, "Pretrain/Loss": 1.9823285341262817, "Pretrain/Loss (Raw)": 2.132699728012085, "Pretrain/Step": 14477, "Pretrain/Step Time": 8.469094637781382} +{"Pretrain/Learning Rate": 7.231760066808682e-06, "Pretrain/Loss": 1.9834647178649902, "Pretrain/Loss (Raw)": 2.100160837173462, "Pretrain/Step": 14478, "Pretrain/Step Time": 8.467075133696198} +{"Pretrain/Learning Rate": 7.228773995976293e-06, "Pretrain/Loss": 1.9842967987060547, "Pretrain/Loss (Raw)": 2.077275514602661, "Pretrain/Step": 14479, "Pretrain/Step Time": 8.472761331126094} +{"Pretrain/Learning Rate": 7.225788437564682e-06, "Pretrain/Loss": 1.9839508533477783, "Pretrain/Loss (Raw)": 1.8611239194869995, "Pretrain/Step": 14480, "Pretrain/Step Time": 8.4721715785563} +{"Pretrain/Learning Rate": 7.2228033916599325e-06, "Pretrain/Loss": 1.982426404953003, "Pretrain/Loss (Raw)": 1.8705538511276245, "Pretrain/Step": 14481, "Pretrain/Step Time": 8.47002099826932} +{"Pretrain/Learning Rate": 7.219818858348107e-06, "Pretrain/Loss": 1.9806336164474487, "Pretrain/Loss (Raw)": 2.3329219818115234, "Pretrain/Step": 14482, "Pretrain/Step Time": 8.470991218462586} +{"Pretrain/Learning Rate": 7.216834837715278e-06, "Pretrain/Loss": 1.980759620666504, "Pretrain/Loss (Raw)": 2.026916980743408, "Pretrain/Step": 14483, "Pretrain/Step Time": 8.467649286612868} +{"Pretrain/Learning Rate": 7.213851329847474e-06, "Pretrain/Loss": 1.9820420742034912, "Pretrain/Loss (Raw)": 2.1430153846740723, "Pretrain/Step": 14484, "Pretrain/Step Time": 8.47340009920299} +{"Pretrain/Learning Rate": 7.210868334830734e-06, "Pretrain/Loss": 1.9818377494812012, "Pretrain/Loss (Raw)": 2.071188449859619, "Pretrain/Step": 14485, "Pretrain/Step Time": 8.467120729386806} +{"Pretrain/Learning Rate": 7.207885852751065e-06, "Pretrain/Loss": 1.980381727218628, "Pretrain/Loss (Raw)": 1.9907251596450806, "Pretrain/Step": 14486, "Pretrain/Step Time": 8.463366838172078} +{"Pretrain/Learning Rate": 7.204903883694459e-06, "Pretrain/Loss": 1.9812967777252197, "Pretrain/Loss (Raw)": 2.0236637592315674, "Pretrain/Step": 14487, "Pretrain/Step Time": 8.463146295398474} +{"Pretrain/Learning Rate": 7.2019224277469126e-06, "Pretrain/Loss": 1.9818280935287476, "Pretrain/Loss (Raw)": 1.9604848623275757, "Pretrain/Step": 14488, "Pretrain/Step Time": 8.46419908106327} +{"Pretrain/Learning Rate": 7.198941484994376e-06, "Pretrain/Loss": 1.9842376708984375, "Pretrain/Loss (Raw)": 2.1033554077148438, "Pretrain/Step": 14489, "Pretrain/Step Time": 8.461311653256416} +{"Pretrain/Learning Rate": 7.1959610555228295e-06, "Pretrain/Loss": 1.9863715171813965, "Pretrain/Loss (Raw)": 1.8548436164855957, "Pretrain/Step": 14490, "Pretrain/Step Time": 8.46409785374999} +{"Pretrain/Learning Rate": 7.192981139418181e-06, "Pretrain/Loss": 1.988417625427246, "Pretrain/Loss (Raw)": 2.0932562351226807, "Pretrain/Step": 14491, "Pretrain/Step Time": 8.469649756327271} +{"Pretrain/Learning Rate": 7.190001736766374e-06, "Pretrain/Loss": 1.9919217824935913, "Pretrain/Loss (Raw)": 2.136312246322632, "Pretrain/Step": 14492, "Pretrain/Step Time": 8.465041194111109} +{"Pretrain/Learning Rate": 7.187022847653313e-06, "Pretrain/Loss": 1.9896880388259888, "Pretrain/Loss (Raw)": 1.8488490581512451, "Pretrain/Step": 14493, "Pretrain/Step Time": 8.464588463306427} +{"Pretrain/Learning Rate": 7.184044472164883e-06, "Pretrain/Loss": 1.9904208183288574, "Pretrain/Loss (Raw)": 2.049933433532715, "Pretrain/Step": 14494, "Pretrain/Step Time": 8.46659872867167} +{"Pretrain/Learning Rate": 7.1810666103869775e-06, "Pretrain/Loss": 1.9896633625030518, "Pretrain/Loss (Raw)": 1.9486111402511597, "Pretrain/Step": 14495, "Pretrain/Step Time": 8.465390380471945} +{"Pretrain/Learning Rate": 7.178089262405449e-06, "Pretrain/Loss": 1.9907711744308472, "Pretrain/Loss (Raw)": 2.023287773132324, "Pretrain/Step": 14496, "Pretrain/Step Time": 8.466480251401663} +{"Pretrain/Learning Rate": 7.175112428306157e-06, "Pretrain/Loss": 1.9907079935073853, "Pretrain/Loss (Raw)": 2.010098934173584, "Pretrain/Step": 14497, "Pretrain/Step Time": 8.471479322761297} +{"Pretrain/Learning Rate": 7.172136108174937e-06, "Pretrain/Loss": 1.991727352142334, "Pretrain/Loss (Raw)": 2.1401984691619873, "Pretrain/Step": 14498, "Pretrain/Step Time": 8.466938266530633} +{"Pretrain/Learning Rate": 7.1691603020975935e-06, "Pretrain/Loss": 1.9929523468017578, "Pretrain/Loss (Raw)": 2.244871139526367, "Pretrain/Step": 14499, "Pretrain/Step Time": 8.469604171812534} +{"Pretrain/Learning Rate": 7.166185010159953e-06, "Pretrain/Loss": 1.9919936656951904, "Pretrain/Loss (Raw)": 1.8918007612228394, "Pretrain/Step": 14500, "Pretrain/Step Time": 8.469063410535455} +{"Pretrain/Learning Rate": 7.163210232447787e-06, "Pretrain/Loss": 1.990096092224121, "Pretrain/Loss (Raw)": 1.763377070426941, "Pretrain/Step": 14501, "Pretrain/Step Time": 8.467928593978286} +{"Pretrain/Learning Rate": 7.160235969046888e-06, "Pretrain/Loss": 1.988505482673645, "Pretrain/Loss (Raw)": 1.7814985513687134, "Pretrain/Step": 14502, "Pretrain/Step Time": 8.466444332152605} +{"Pretrain/Learning Rate": 7.157262220043007e-06, "Pretrain/Loss": 1.9871277809143066, "Pretrain/Loss (Raw)": 1.9855704307556152, "Pretrain/Step": 14503, "Pretrain/Step Time": 8.47561303153634} +{"Pretrain/Learning Rate": 7.1542889855218845e-06, "Pretrain/Loss": 1.985368251800537, "Pretrain/Loss (Raw)": 1.9743047952651978, "Pretrain/Step": 14504, "Pretrain/Step Time": 8.471384465694427} +{"Pretrain/Learning Rate": 7.151316265569269e-06, "Pretrain/Loss": 1.983572244644165, "Pretrain/Loss (Raw)": 2.058908700942993, "Pretrain/Step": 14505, "Pretrain/Step Time": 8.468811159953475} +{"Pretrain/Learning Rate": 7.1483440602708565e-06, "Pretrain/Loss": 1.98341703414917, "Pretrain/Loss (Raw)": 2.263667106628418, "Pretrain/Step": 14506, "Pretrain/Step Time": 8.46667111478746} +{"Pretrain/Learning Rate": 7.145372369712367e-06, "Pretrain/Loss": 1.9799182415008545, "Pretrain/Loss (Raw)": 1.6242915391921997, "Pretrain/Step": 14507, "Pretrain/Step Time": 8.472328329458833} +{"Pretrain/Learning Rate": 7.142401193979476e-06, "Pretrain/Loss": 1.9788070917129517, "Pretrain/Loss (Raw)": 1.9288341999053955, "Pretrain/Step": 14508, "Pretrain/Step Time": 8.464070374146104} +{"Pretrain/Learning Rate": 7.139430533157851e-06, "Pretrain/Loss": 1.9769630432128906, "Pretrain/Loss (Raw)": 1.866729974746704, "Pretrain/Step": 14509, "Pretrain/Step Time": 8.460079979151487} +{"Pretrain/Learning Rate": 7.136460387333166e-06, "Pretrain/Loss": 1.978426218032837, "Pretrain/Loss (Raw)": 2.119452953338623, "Pretrain/Step": 14510, "Pretrain/Step Time": 8.459408268332481} +{"Pretrain/Learning Rate": 7.133490756591044e-06, "Pretrain/Loss": 1.9796439409255981, "Pretrain/Loss (Raw)": 2.1334264278411865, "Pretrain/Step": 14511, "Pretrain/Step Time": 8.462186379358172} +{"Pretrain/Learning Rate": 7.130521641017127e-06, "Pretrain/Loss": 1.9790281057357788, "Pretrain/Loss (Raw)": 2.0116961002349854, "Pretrain/Step": 14512, "Pretrain/Step Time": 8.46594600751996} +{"Pretrain/Learning Rate": 7.127553040697022e-06, "Pretrain/Loss": 1.9822372198104858, "Pretrain/Loss (Raw)": 2.0557212829589844, "Pretrain/Step": 14513, "Pretrain/Step Time": 8.466713450849056} +{"Pretrain/Learning Rate": 7.124584955716318e-06, "Pretrain/Loss": 1.982985019683838, "Pretrain/Loss (Raw)": 2.0524699687957764, "Pretrain/Step": 14514, "Pretrain/Step Time": 8.468324052169919} +{"Pretrain/Learning Rate": 7.121617386160614e-06, "Pretrain/Loss": 1.9830827713012695, "Pretrain/Loss (Raw)": 1.7788176536560059, "Pretrain/Step": 14515, "Pretrain/Step Time": 8.471201680600643} +{"Pretrain/Learning Rate": 7.1186503321154616e-06, "Pretrain/Loss": 1.9826526641845703, "Pretrain/Loss (Raw)": 1.9848849773406982, "Pretrain/Step": 14516, "Pretrain/Step Time": 8.471786370500922} +{"Pretrain/Learning Rate": 7.115683793666428e-06, "Pretrain/Loss": 1.9825880527496338, "Pretrain/Loss (Raw)": 1.941075086593628, "Pretrain/Step": 14517, "Pretrain/Step Time": 8.467860732227564} +{"Pretrain/Learning Rate": 7.112717770899039e-06, "Pretrain/Loss": 1.9820083379745483, "Pretrain/Loss (Raw)": 1.7583860158920288, "Pretrain/Step": 14518, "Pretrain/Step Time": 8.471464600414038} +{"Pretrain/Learning Rate": 7.1097522638988276e-06, "Pretrain/Loss": 1.9829251766204834, "Pretrain/Loss (Raw)": 2.165264129638672, "Pretrain/Step": 14519, "Pretrain/Step Time": 8.4724110532552} +{"Pretrain/Learning Rate": 7.1067872727513e-06, "Pretrain/Loss": 1.9837594032287598, "Pretrain/Loss (Raw)": 2.0889792442321777, "Pretrain/Step": 14520, "Pretrain/Step Time": 8.473532408475876} +{"Pretrain/Learning Rate": 7.103822797541939e-06, "Pretrain/Loss": 1.9837069511413574, "Pretrain/Loss (Raw)": 2.0602047443389893, "Pretrain/Step": 14521, "Pretrain/Step Time": 8.464752092957497} +{"Pretrain/Learning Rate": 7.100858838356242e-06, "Pretrain/Loss": 1.9842419624328613, "Pretrain/Loss (Raw)": 2.0277984142303467, "Pretrain/Step": 14522, "Pretrain/Step Time": 8.468767043203115} +{"Pretrain/Learning Rate": 7.097895395279652e-06, "Pretrain/Loss": 1.9860377311706543, "Pretrain/Loss (Raw)": 2.094411611557007, "Pretrain/Step": 14523, "Pretrain/Step Time": 8.468866379931569} +{"Pretrain/Learning Rate": 7.094932468397636e-06, "Pretrain/Loss": 1.9865840673446655, "Pretrain/Loss (Raw)": 2.081860303878784, "Pretrain/Step": 14524, "Pretrain/Step Time": 8.46446349658072} +{"Pretrain/Learning Rate": 7.091970057795622e-06, "Pretrain/Loss": 1.982997179031372, "Pretrain/Loss (Raw)": 1.744836449623108, "Pretrain/Step": 14525, "Pretrain/Step Time": 8.46608455106616} +{"Pretrain/Learning Rate": 7.089008163559019e-06, "Pretrain/Loss": 1.9829552173614502, "Pretrain/Loss (Raw)": 1.981965184211731, "Pretrain/Step": 14526, "Pretrain/Step Time": 8.464510668069124} +{"Pretrain/Learning Rate": 7.0860467857732456e-06, "Pretrain/Loss": 1.9853459596633911, "Pretrain/Loss (Raw)": 2.1372644901275635, "Pretrain/Step": 14527, "Pretrain/Step Time": 8.463632322847843} +{"Pretrain/Learning Rate": 7.083085924523675e-06, "Pretrain/Loss": 1.9851247072219849, "Pretrain/Loss (Raw)": 1.9666677713394165, "Pretrain/Step": 14528, "Pretrain/Step Time": 8.470628241077065} +{"Pretrain/Learning Rate": 7.0801255798957025e-06, "Pretrain/Loss": 1.9841632843017578, "Pretrain/Loss (Raw)": 1.7656177282333374, "Pretrain/Step": 14529, "Pretrain/Step Time": 8.469244226813316} +{"Pretrain/Learning Rate": 7.077165751974674e-06, "Pretrain/Loss": 1.9826966524124146, "Pretrain/Loss (Raw)": 1.9476854801177979, "Pretrain/Step": 14530, "Pretrain/Step Time": 8.472876759245992} +{"Pretrain/Learning Rate": 7.074206440845929e-06, "Pretrain/Loss": 1.9847428798675537, "Pretrain/Loss (Raw)": 2.1228415966033936, "Pretrain/Step": 14531, "Pretrain/Step Time": 8.475080313161016} +{"Pretrain/Learning Rate": 7.071247646594814e-06, "Pretrain/Loss": 1.9853317737579346, "Pretrain/Loss (Raw)": 2.1294288635253906, "Pretrain/Step": 14532, "Pretrain/Step Time": 8.481527538970113} +{"Pretrain/Learning Rate": 7.068289369306625e-06, "Pretrain/Loss": 1.9859012365341187, "Pretrain/Loss (Raw)": 2.1456961631774902, "Pretrain/Step": 14533, "Pretrain/Step Time": 8.478193366900086} +{"Pretrain/Learning Rate": 7.065331609066677e-06, "Pretrain/Loss": 1.9864580631256104, "Pretrain/Loss (Raw)": 2.059931516647339, "Pretrain/Step": 14534, "Pretrain/Step Time": 8.478159694001079} +{"Pretrain/Learning Rate": 7.06237436596025e-06, "Pretrain/Loss": 1.9874719381332397, "Pretrain/Loss (Raw)": 1.9917148351669312, "Pretrain/Step": 14535, "Pretrain/Step Time": 8.48492969200015} +{"Pretrain/Learning Rate": 7.059417640072608e-06, "Pretrain/Loss": 1.986851692199707, "Pretrain/Loss (Raw)": 1.8566373586654663, "Pretrain/Step": 14536, "Pretrain/Step Time": 8.482728192582726} +{"Pretrain/Learning Rate": 7.056461431489015e-06, "Pretrain/Loss": 1.9901988506317139, "Pretrain/Loss (Raw)": 2.2622971534729004, "Pretrain/Step": 14537, "Pretrain/Step Time": 8.486113540828228} +{"Pretrain/Learning Rate": 7.053505740294703e-06, "Pretrain/Loss": 1.990426778793335, "Pretrain/Loss (Raw)": 1.9583425521850586, "Pretrain/Step": 14538, "Pretrain/Step Time": 8.48021780140698} +{"Pretrain/Learning Rate": 7.050550566574907e-06, "Pretrain/Loss": 1.9929916858673096, "Pretrain/Loss (Raw)": 2.285536289215088, "Pretrain/Step": 14539, "Pretrain/Step Time": 8.477400610223413} +{"Pretrain/Learning Rate": 7.047595910414831e-06, "Pretrain/Loss": 1.9943678379058838, "Pretrain/Loss (Raw)": 2.168184518814087, "Pretrain/Step": 14540, "Pretrain/Step Time": 8.475311046466231} +{"Pretrain/Learning Rate": 7.044641771899665e-06, "Pretrain/Loss": 1.993567943572998, "Pretrain/Loss (Raw)": 1.9698402881622314, "Pretrain/Step": 14541, "Pretrain/Step Time": 8.480286300182343} +{"Pretrain/Learning Rate": 7.041688151114603e-06, "Pretrain/Loss": 1.9933116436004639, "Pretrain/Loss (Raw)": 1.9937567710876465, "Pretrain/Step": 14542, "Pretrain/Step Time": 8.476838437840343} +{"Pretrain/Learning Rate": 7.038735048144795e-06, "Pretrain/Loss": 1.993688941001892, "Pretrain/Loss (Raw)": 1.9015049934387207, "Pretrain/Step": 14543, "Pretrain/Step Time": 8.476365284994245} +{"Pretrain/Learning Rate": 7.0357824630754106e-06, "Pretrain/Loss": 1.9940037727355957, "Pretrain/Loss (Raw)": 2.0029189586639404, "Pretrain/Step": 14544, "Pretrain/Step Time": 8.477569170296192} +{"Pretrain/Learning Rate": 7.032830395991574e-06, "Pretrain/Loss": 1.9944953918457031, "Pretrain/Loss (Raw)": 2.123979330062866, "Pretrain/Step": 14545, "Pretrain/Step Time": 8.483186900615692} +{"Pretrain/Learning Rate": 7.029878846978397e-06, "Pretrain/Loss": 1.9933133125305176, "Pretrain/Loss (Raw)": 1.9614982604980469, "Pretrain/Step": 14546, "Pretrain/Step Time": 8.481322575360537} +{"Pretrain/Learning Rate": 7.026927816121004e-06, "Pretrain/Loss": 1.9940831661224365, "Pretrain/Loss (Raw)": 2.203672409057617, "Pretrain/Step": 14547, "Pretrain/Step Time": 8.481437489390373} +{"Pretrain/Learning Rate": 7.0239773035044695e-06, "Pretrain/Loss": 1.9945755004882812, "Pretrain/Loss (Raw)": 1.813659429550171, "Pretrain/Step": 14548, "Pretrain/Step Time": 8.480553902685642} +{"Pretrain/Learning Rate": 7.021027309213887e-06, "Pretrain/Loss": 1.9955799579620361, "Pretrain/Loss (Raw)": 2.1007137298583984, "Pretrain/Step": 14549, "Pretrain/Step Time": 8.481296427547932} +{"Pretrain/Learning Rate": 7.018077833334305e-06, "Pretrain/Loss": 1.9958970546722412, "Pretrain/Loss (Raw)": 1.9752793312072754, "Pretrain/Step": 14550, "Pretrain/Step Time": 8.474668961018324} +{"Pretrain/Learning Rate": 7.015128875950766e-06, "Pretrain/Loss": 2.0025901794433594, "Pretrain/Loss (Raw)": 2.6193976402282715, "Pretrain/Step": 14551, "Pretrain/Step Time": 8.476404698565602} +{"Pretrain/Learning Rate": 7.012180437148313e-06, "Pretrain/Loss": 2.002230167388916, "Pretrain/Loss (Raw)": 2.070849895477295, "Pretrain/Step": 14552, "Pretrain/Step Time": 8.48041545972228} +{"Pretrain/Learning Rate": 7.0092325170119515e-06, "Pretrain/Loss": 2.0059030055999756, "Pretrain/Loss (Raw)": 2.1378173828125, "Pretrain/Step": 14553, "Pretrain/Step Time": 8.478192079812288} +{"Pretrain/Learning Rate": 7.006285115626696e-06, "Pretrain/Loss": 2.00740909576416, "Pretrain/Loss (Raw)": 1.968862771987915, "Pretrain/Step": 14554, "Pretrain/Step Time": 8.478448782116175} +{"Pretrain/Learning Rate": 7.003338233077522e-06, "Pretrain/Loss": 2.0082271099090576, "Pretrain/Loss (Raw)": 2.0924575328826904, "Pretrain/Step": 14555, "Pretrain/Step Time": 8.479177083820105} +{"Pretrain/Learning Rate": 7.000391869449397e-06, "Pretrain/Loss": 2.009720802307129, "Pretrain/Loss (Raw)": 1.9983832836151123, "Pretrain/Step": 14556, "Pretrain/Step Time": 8.480404894798994} +{"Pretrain/Learning Rate": 6.99744602482729e-06, "Pretrain/Loss": 2.0082640647888184, "Pretrain/Loss (Raw)": 1.9303003549575806, "Pretrain/Step": 14557, "Pretrain/Step Time": 8.473379772156477} +{"Pretrain/Learning Rate": 6.994500699296128e-06, "Pretrain/Loss": 2.0050783157348633, "Pretrain/Loss (Raw)": 1.6504333019256592, "Pretrain/Step": 14558, "Pretrain/Step Time": 8.473765704780817} +{"Pretrain/Learning Rate": 6.991555892940854e-06, "Pretrain/Loss": 2.0065345764160156, "Pretrain/Loss (Raw)": 1.9470746517181396, "Pretrain/Step": 14559, "Pretrain/Step Time": 8.47407404705882} +{"Pretrain/Learning Rate": 6.9886116058463705e-06, "Pretrain/Loss": 2.0080251693725586, "Pretrain/Loss (Raw)": 2.0935912132263184, "Pretrain/Step": 14560, "Pretrain/Step Time": 8.478349374607205} +{"Pretrain/Learning Rate": 6.9856678380975675e-06, "Pretrain/Loss": 2.0085813999176025, "Pretrain/Loss (Raw)": 2.0585994720458984, "Pretrain/Step": 14561, "Pretrain/Step Time": 8.47987555153668} +{"Pretrain/Learning Rate": 6.982724589779338e-06, "Pretrain/Loss": 2.0068092346191406, "Pretrain/Loss (Raw)": 1.737931251525879, "Pretrain/Step": 14562, "Pretrain/Step Time": 8.48104726523161} +{"Pretrain/Learning Rate": 6.9797818609765395e-06, "Pretrain/Loss": 2.0092852115631104, "Pretrain/Loss (Raw)": 2.173743486404419, "Pretrain/Step": 14563, "Pretrain/Step Time": 8.482072815299034} +{"Pretrain/Learning Rate": 6.976839651774034e-06, "Pretrain/Loss": 2.008718967437744, "Pretrain/Loss (Raw)": 1.9003783464431763, "Pretrain/Step": 14564, "Pretrain/Step Time": 8.485138250514865} +{"Pretrain/Learning Rate": 6.97389796225665e-06, "Pretrain/Loss": 2.0062975883483887, "Pretrain/Loss (Raw)": 1.8440829515457153, "Pretrain/Step": 14565, "Pretrain/Step Time": 8.48646260984242} +{"Pretrain/Learning Rate": 6.970956792509204e-06, "Pretrain/Loss": 2.0073602199554443, "Pretrain/Loss (Raw)": 2.0822348594665527, "Pretrain/Step": 14566, "Pretrain/Step Time": 8.48340499214828} +{"Pretrain/Learning Rate": 6.968016142616518e-06, "Pretrain/Loss": 2.0038304328918457, "Pretrain/Loss (Raw)": 1.6367839574813843, "Pretrain/Step": 14567, "Pretrain/Step Time": 8.484618062153459} +{"Pretrain/Learning Rate": 6.965076012663366e-06, "Pretrain/Loss": 2.001126766204834, "Pretrain/Loss (Raw)": 1.82407546043396, "Pretrain/Step": 14568, "Pretrain/Step Time": 8.480723051354289} +{"Pretrain/Learning Rate": 6.96213640273454e-06, "Pretrain/Loss": 1.9995087385177612, "Pretrain/Loss (Raw)": 1.8634297847747803, "Pretrain/Step": 14569, "Pretrain/Step Time": 8.481343742460012} +{"Pretrain/Learning Rate": 6.959197312914797e-06, "Pretrain/Loss": 1.9971290826797485, "Pretrain/Loss (Raw)": 1.8118475675582886, "Pretrain/Step": 14570, "Pretrain/Step Time": 8.480648161843419} +{"Pretrain/Learning Rate": 6.9562587432888735e-06, "Pretrain/Loss": 2.000565767288208, "Pretrain/Loss (Raw)": 2.5611355304718018, "Pretrain/Step": 14571, "Pretrain/Step Time": 8.480863312259316} +{"Pretrain/Learning Rate": 6.953320693941517e-06, "Pretrain/Loss": 2.0007541179656982, "Pretrain/Loss (Raw)": 1.965415120124817, "Pretrain/Step": 14572, "Pretrain/Step Time": 8.472572892904282} +{"Pretrain/Learning Rate": 6.9503831649574275e-06, "Pretrain/Loss": 2.0028719902038574, "Pretrain/Loss (Raw)": 2.1873056888580322, "Pretrain/Step": 14573, "Pretrain/Step Time": 8.474498771131039} +{"Pretrain/Learning Rate": 6.94744615642133e-06, "Pretrain/Loss": 2.002213954925537, "Pretrain/Loss (Raw)": 1.9084959030151367, "Pretrain/Step": 14574, "Pretrain/Step Time": 8.472239293158054} +{"Pretrain/Learning Rate": 6.944509668417884e-06, "Pretrain/Loss": 2.002944231033325, "Pretrain/Loss (Raw)": 1.9241442680358887, "Pretrain/Step": 14575, "Pretrain/Step Time": 8.47208064980805} +{"Pretrain/Learning Rate": 6.941573701031778e-06, "Pretrain/Loss": 2.003150701522827, "Pretrain/Loss (Raw)": 2.0080666542053223, "Pretrain/Step": 14576, "Pretrain/Step Time": 8.472784606739879} +{"Pretrain/Learning Rate": 6.9386382543476655e-06, "Pretrain/Loss": 2.003652572631836, "Pretrain/Loss (Raw)": 2.188910722732544, "Pretrain/Step": 14577, "Pretrain/Step Time": 8.472669856622815} +{"Pretrain/Learning Rate": 6.93570332845018e-06, "Pretrain/Loss": 2.003970146179199, "Pretrain/Loss (Raw)": 2.0671913623809814, "Pretrain/Step": 14578, "Pretrain/Step Time": 8.478437528014183} +{"Pretrain/Learning Rate": 6.93276892342396e-06, "Pretrain/Loss": 2.0054898262023926, "Pretrain/Loss (Raw)": 2.0694148540496826, "Pretrain/Step": 14579, "Pretrain/Step Time": 8.480631669983268} +{"Pretrain/Learning Rate": 6.929835039353605e-06, "Pretrain/Loss": 2.004944324493408, "Pretrain/Loss (Raw)": 1.8572602272033691, "Pretrain/Step": 14580, "Pretrain/Step Time": 8.483145456761122} +{"Pretrain/Learning Rate": 6.926901676323724e-06, "Pretrain/Loss": 2.004397392272949, "Pretrain/Loss (Raw)": 2.0975286960601807, "Pretrain/Step": 14581, "Pretrain/Step Time": 8.486928090453148} +{"Pretrain/Learning Rate": 6.923968834418887e-06, "Pretrain/Loss": 2.005812644958496, "Pretrain/Loss (Raw)": 2.185800790786743, "Pretrain/Step": 14582, "Pretrain/Step Time": 8.488343443721533} +{"Pretrain/Learning Rate": 6.921036513723672e-06, "Pretrain/Loss": 2.0038976669311523, "Pretrain/Loss (Raw)": 1.7923392057418823, "Pretrain/Step": 14583, "Pretrain/Step Time": 8.488464295864105} +{"Pretrain/Learning Rate": 6.918104714322626e-06, "Pretrain/Loss": 2.005833148956299, "Pretrain/Loss (Raw)": 2.057490110397339, "Pretrain/Step": 14584, "Pretrain/Step Time": 8.490013999864459} +{"Pretrain/Learning Rate": 6.915173436300273e-06, "Pretrain/Loss": 2.0064852237701416, "Pretrain/Loss (Raw)": 2.031580686569214, "Pretrain/Step": 14585, "Pretrain/Step Time": 8.488990243524313} +{"Pretrain/Learning Rate": 6.912242679741157e-06, "Pretrain/Loss": 2.00559139251709, "Pretrain/Loss (Raw)": 1.9673117399215698, "Pretrain/Step": 14586, "Pretrain/Step Time": 8.490370085462928} +{"Pretrain/Learning Rate": 6.909312444729763e-06, "Pretrain/Loss": 2.006481647491455, "Pretrain/Loss (Raw)": 2.1586172580718994, "Pretrain/Step": 14587, "Pretrain/Step Time": 8.48309189081192} +{"Pretrain/Learning Rate": 6.906382731350597e-06, "Pretrain/Loss": 2.0115437507629395, "Pretrain/Loss (Raw)": 2.506483316421509, "Pretrain/Step": 14588, "Pretrain/Step Time": 8.483683083206415} +{"Pretrain/Learning Rate": 6.9034535396881314e-06, "Pretrain/Loss": 2.0126445293426514, "Pretrain/Loss (Raw)": 2.1468749046325684, "Pretrain/Step": 14589, "Pretrain/Step Time": 8.483120081946254} +{"Pretrain/Learning Rate": 6.900524869826819e-06, "Pretrain/Loss": 2.0130109786987305, "Pretrain/Loss (Raw)": 2.019702672958374, "Pretrain/Step": 14590, "Pretrain/Step Time": 8.490079810842872} +{"Pretrain/Learning Rate": 6.897596721851118e-06, "Pretrain/Loss": 2.0133113861083984, "Pretrain/Loss (Raw)": 1.9628456830978394, "Pretrain/Step": 14591, "Pretrain/Step Time": 8.488792899996042} +{"Pretrain/Learning Rate": 6.8946690958454495e-06, "Pretrain/Loss": 2.0121889114379883, "Pretrain/Loss (Raw)": 1.919939637184143, "Pretrain/Step": 14592, "Pretrain/Step Time": 8.49050130136311} +{"Pretrain/Learning Rate": 6.891741991894238e-06, "Pretrain/Loss": 2.01353120803833, "Pretrain/Loss (Raw)": 2.2380056381225586, "Pretrain/Step": 14593, "Pretrain/Step Time": 8.488826544955373} +{"Pretrain/Learning Rate": 6.888815410081883e-06, "Pretrain/Loss": 2.015270471572876, "Pretrain/Loss (Raw)": 2.1275503635406494, "Pretrain/Step": 14594, "Pretrain/Step Time": 8.492107519879937} +{"Pretrain/Learning Rate": 6.885889350492761e-06, "Pretrain/Loss": 2.017383575439453, "Pretrain/Loss (Raw)": 2.058151960372925, "Pretrain/Step": 14595, "Pretrain/Step Time": 8.496852116659284} +{"Pretrain/Learning Rate": 6.8829638132112576e-06, "Pretrain/Loss": 2.015552520751953, "Pretrain/Loss (Raw)": 1.9141489267349243, "Pretrain/Step": 14596, "Pretrain/Step Time": 8.497079556807876} +{"Pretrain/Learning Rate": 6.880038798321711e-06, "Pretrain/Loss": 2.0198140144348145, "Pretrain/Loss (Raw)": 2.5539231300354004, "Pretrain/Step": 14597, "Pretrain/Step Time": 8.49727083556354} +{"Pretrain/Learning Rate": 6.877114305908483e-06, "Pretrain/Loss": 2.019932270050049, "Pretrain/Loss (Raw)": 1.8798949718475342, "Pretrain/Step": 14598, "Pretrain/Step Time": 8.493726186454296} +{"Pretrain/Learning Rate": 6.874190336055885e-06, "Pretrain/Loss": 2.018890142440796, "Pretrain/Loss (Raw)": 1.6819530725479126, "Pretrain/Step": 14599, "Pretrain/Step Time": 8.493684750050306} +{"Pretrain/Learning Rate": 6.871266888848227e-06, "Pretrain/Loss": 2.018857002258301, "Pretrain/Loss (Raw)": 1.99207603931427, "Pretrain/Step": 14600, "Pretrain/Step Time": 8.492350678890944} +{"Pretrain/Learning Rate": 6.868343964369811e-06, "Pretrain/Loss": 2.018824577331543, "Pretrain/Loss (Raw)": 1.985937237739563, "Pretrain/Step": 14601, "Pretrain/Step Time": 8.490593848749995} +{"Pretrain/Learning Rate": 6.86542156270491e-06, "Pretrain/Loss": 2.0166854858398438, "Pretrain/Loss (Raw)": 1.7428032159805298, "Pretrain/Step": 14602, "Pretrain/Step Time": 8.494046965613961} +{"Pretrain/Learning Rate": 6.862499683937803e-06, "Pretrain/Loss": 2.019817590713501, "Pretrain/Loss (Raw)": 2.2069263458251953, "Pretrain/Step": 14603, "Pretrain/Step Time": 8.490638388320804} +{"Pretrain/Learning Rate": 6.85957832815273e-06, "Pretrain/Loss": 2.0198466777801514, "Pretrain/Loss (Raw)": 2.0236217975616455, "Pretrain/Step": 14604, "Pretrain/Step Time": 8.488210355862975} +{"Pretrain/Learning Rate": 6.856657495433921e-06, "Pretrain/Loss": 2.0184597969055176, "Pretrain/Loss (Raw)": 1.955187201499939, "Pretrain/Step": 14605, "Pretrain/Step Time": 8.486340465024114} +{"Pretrain/Learning Rate": 6.853737185865608e-06, "Pretrain/Loss": 2.0173392295837402, "Pretrain/Loss (Raw)": 1.9567261934280396, "Pretrain/Step": 14606, "Pretrain/Step Time": 8.4826895352453} +{"Pretrain/Learning Rate": 6.8508173995319865e-06, "Pretrain/Loss": 2.017563581466675, "Pretrain/Loss (Raw)": 2.105985403060913, "Pretrain/Step": 14607, "Pretrain/Step Time": 8.479738241061568} +{"Pretrain/Learning Rate": 6.847898136517256e-06, "Pretrain/Loss": 2.0162272453308105, "Pretrain/Loss (Raw)": 1.6900876760482788, "Pretrain/Step": 14608, "Pretrain/Step Time": 8.478681886568666} +{"Pretrain/Learning Rate": 6.844979396905587e-06, "Pretrain/Loss": 2.0173351764678955, "Pretrain/Loss (Raw)": 2.012369155883789, "Pretrain/Step": 14609, "Pretrain/Step Time": 8.477862194180489} +{"Pretrain/Learning Rate": 6.842061180781134e-06, "Pretrain/Loss": 2.0144202709198, "Pretrain/Loss (Raw)": 1.9597985744476318, "Pretrain/Step": 14610, "Pretrain/Step Time": 8.481167510151863} +{"Pretrain/Learning Rate": 6.8391434882280506e-06, "Pretrain/Loss": 2.0123000144958496, "Pretrain/Loss (Raw)": 1.7555283308029175, "Pretrain/Step": 14611, "Pretrain/Step Time": 8.479967826977372} +{"Pretrain/Learning Rate": 6.836226319330455e-06, "Pretrain/Loss": 2.006772518157959, "Pretrain/Loss (Raw)": 1.4354835748672485, "Pretrain/Step": 14612, "Pretrain/Step Time": 8.477610284462571} +{"Pretrain/Learning Rate": 6.8333096741724775e-06, "Pretrain/Loss": 2.005016803741455, "Pretrain/Loss (Raw)": 1.8464614152908325, "Pretrain/Step": 14613, "Pretrain/Step Time": 8.484230807051063} +{"Pretrain/Learning Rate": 6.830393552838207e-06, "Pretrain/Loss": 2.0055644512176514, "Pretrain/Loss (Raw)": 2.0608279705047607, "Pretrain/Step": 14614, "Pretrain/Step Time": 8.48203032836318} +{"Pretrain/Learning Rate": 6.827477955411723e-06, "Pretrain/Loss": 2.0055971145629883, "Pretrain/Loss (Raw)": 2.02783203125, "Pretrain/Step": 14615, "Pretrain/Step Time": 8.486784625798464} +{"Pretrain/Learning Rate": 6.824562881977112e-06, "Pretrain/Loss": 2.0052971839904785, "Pretrain/Loss (Raw)": 1.9220969676971436, "Pretrain/Step": 14616, "Pretrain/Step Time": 8.485392939299345} +{"Pretrain/Learning Rate": 6.821648332618405e-06, "Pretrain/Loss": 2.004619836807251, "Pretrain/Loss (Raw)": 2.016690731048584, "Pretrain/Step": 14617, "Pretrain/Step Time": 8.492246629670262} +{"Pretrain/Learning Rate": 6.818734307419664e-06, "Pretrain/Loss": 2.0058813095092773, "Pretrain/Loss (Raw)": 2.016270875930786, "Pretrain/Step": 14618, "Pretrain/Step Time": 8.487246247008443} +{"Pretrain/Learning Rate": 6.815820806464901e-06, "Pretrain/Loss": 2.005725622177124, "Pretrain/Loss (Raw)": 2.0733518600463867, "Pretrain/Step": 14619, "Pretrain/Step Time": 8.483653247356415} +{"Pretrain/Learning Rate": 6.8129078298381196e-06, "Pretrain/Loss": 2.00642466545105, "Pretrain/Loss (Raw)": 2.2257742881774902, "Pretrain/Step": 14620, "Pretrain/Step Time": 8.482535215094686} +{"Pretrain/Learning Rate": 6.809995377623327e-06, "Pretrain/Loss": 2.006503105163574, "Pretrain/Loss (Raw)": 1.85891592502594, "Pretrain/Step": 14621, "Pretrain/Step Time": 8.485585812479258} +{"Pretrain/Learning Rate": 6.807083449904486e-06, "Pretrain/Loss": 2.0065248012542725, "Pretrain/Loss (Raw)": 2.0526864528656006, "Pretrain/Step": 14622, "Pretrain/Step Time": 8.48398819193244} +{"Pretrain/Learning Rate": 6.804172046765578e-06, "Pretrain/Loss": 2.008831739425659, "Pretrain/Loss (Raw)": 2.2439041137695312, "Pretrain/Step": 14623, "Pretrain/Step Time": 8.484248269349337} +{"Pretrain/Learning Rate": 6.80126116829054e-06, "Pretrain/Loss": 2.0076169967651367, "Pretrain/Loss (Raw)": 1.8678159713745117, "Pretrain/Step": 14624, "Pretrain/Step Time": 8.482642589136958} +{"Pretrain/Learning Rate": 6.7983508145633e-06, "Pretrain/Loss": 2.008491039276123, "Pretrain/Loss (Raw)": 2.121983289718628, "Pretrain/Step": 14625, "Pretrain/Step Time": 8.480976676568389} +{"Pretrain/Learning Rate": 6.7954409856677916e-06, "Pretrain/Loss": 2.0056650638580322, "Pretrain/Loss (Raw)": 1.7784324884414673, "Pretrain/Step": 14626, "Pretrain/Step Time": 8.483650336042047} +{"Pretrain/Learning Rate": 6.7925316816879e-06, "Pretrain/Loss": 2.001887798309326, "Pretrain/Loss (Raw)": 1.7614365816116333, "Pretrain/Step": 14627, "Pretrain/Step Time": 8.47951008938253} +{"Pretrain/Learning Rate": 6.789622902707532e-06, "Pretrain/Loss": 2.0018420219421387, "Pretrain/Loss (Raw)": 1.8859072923660278, "Pretrain/Step": 14628, "Pretrain/Step Time": 8.480920124799013} +{"Pretrain/Learning Rate": 6.7867146488105465e-06, "Pretrain/Loss": 2.0037431716918945, "Pretrain/Loss (Raw)": 2.006741523742676, "Pretrain/Step": 14629, "Pretrain/Step Time": 8.48284056223929} +{"Pretrain/Learning Rate": 6.783806920080798e-06, "Pretrain/Loss": 2.0042359828948975, "Pretrain/Loss (Raw)": 1.844538927078247, "Pretrain/Step": 14630, "Pretrain/Step Time": 8.487805809825659} +{"Pretrain/Learning Rate": 6.7808997166021455e-06, "Pretrain/Loss": 2.0039210319519043, "Pretrain/Loss (Raw)": 1.945286750793457, "Pretrain/Step": 14631, "Pretrain/Step Time": 8.481758708134294} +{"Pretrain/Learning Rate": 6.777993038458397e-06, "Pretrain/Loss": 2.0056166648864746, "Pretrain/Loss (Raw)": 2.19134259223938, "Pretrain/Step": 14632, "Pretrain/Step Time": 8.484335826709867} +{"Pretrain/Learning Rate": 6.775086885733381e-06, "Pretrain/Loss": 2.00335955619812, "Pretrain/Loss (Raw)": 1.770005226135254, "Pretrain/Step": 14633, "Pretrain/Step Time": 8.48430578224361} +{"Pretrain/Learning Rate": 6.772181258510884e-06, "Pretrain/Loss": 2.0010299682617188, "Pretrain/Loss (Raw)": 1.965478777885437, "Pretrain/Step": 14634, "Pretrain/Step Time": 8.488672632724047} +{"Pretrain/Learning Rate": 6.769276156874688e-06, "Pretrain/Loss": 2.0043795108795166, "Pretrain/Loss (Raw)": 2.0530340671539307, "Pretrain/Step": 14635, "Pretrain/Step Time": 8.490163208916783} +{"Pretrain/Learning Rate": 6.766371580908567e-06, "Pretrain/Loss": 2.0066895484924316, "Pretrain/Loss (Raw)": 2.2245001792907715, "Pretrain/Step": 14636, "Pretrain/Step Time": 8.490418111905456} +{"Pretrain/Learning Rate": 6.7634675306962605e-06, "Pretrain/Loss": 2.0061075687408447, "Pretrain/Loss (Raw)": 1.7922453880310059, "Pretrain/Step": 14637, "Pretrain/Step Time": 8.494679855182767} +{"Pretrain/Learning Rate": 6.760564006321518e-06, "Pretrain/Loss": 2.0071892738342285, "Pretrain/Loss (Raw)": 2.2578964233398438, "Pretrain/Step": 14638, "Pretrain/Step Time": 8.492725813761353} +{"Pretrain/Learning Rate": 6.757661007868057e-06, "Pretrain/Loss": 2.004983901977539, "Pretrain/Loss (Raw)": 1.851166009902954, "Pretrain/Step": 14639, "Pretrain/Step Time": 8.490182846784592} +{"Pretrain/Learning Rate": 6.754758535419573e-06, "Pretrain/Loss": 2.002944231033325, "Pretrain/Loss (Raw)": 1.7505985498428345, "Pretrain/Step": 14640, "Pretrain/Step Time": 8.491979515179992} +{"Pretrain/Learning Rate": 6.751856589059771e-06, "Pretrain/Loss": 2.0018653869628906, "Pretrain/Loss (Raw)": 1.9176228046417236, "Pretrain/Step": 14641, "Pretrain/Step Time": 8.490089893341064} +{"Pretrain/Learning Rate": 6.748955168872312e-06, "Pretrain/Loss": 2.0014140605926514, "Pretrain/Loss (Raw)": 1.9946951866149902, "Pretrain/Step": 14642, "Pretrain/Step Time": 8.491847056895494} +{"Pretrain/Learning Rate": 6.7460542749408745e-06, "Pretrain/Loss": 2.002152442932129, "Pretrain/Loss (Raw)": 1.8733633756637573, "Pretrain/Step": 14643, "Pretrain/Step Time": 8.489298110827804} +{"Pretrain/Learning Rate": 6.743153907349093e-06, "Pretrain/Loss": 2.004894256591797, "Pretrain/Loss (Raw)": 2.335829734802246, "Pretrain/Step": 14644, "Pretrain/Step Time": 8.48690153285861} +{"Pretrain/Learning Rate": 6.7402540661805905e-06, "Pretrain/Loss": 2.0059709548950195, "Pretrain/Loss (Raw)": 2.078887939453125, "Pretrain/Step": 14645, "Pretrain/Step Time": 8.493250641971827} +{"Pretrain/Learning Rate": 6.737354751518996e-06, "Pretrain/Loss": 2.0083141326904297, "Pretrain/Loss (Raw)": 2.05830454826355, "Pretrain/Step": 14646, "Pretrain/Step Time": 8.492604663595557} +{"Pretrain/Learning Rate": 6.734455963447894e-06, "Pretrain/Loss": 2.007274627685547, "Pretrain/Loss (Raw)": 2.0322275161743164, "Pretrain/Step": 14647, "Pretrain/Step Time": 8.494195124134421} +{"Pretrain/Learning Rate": 6.731557702050889e-06, "Pretrain/Loss": 2.009082317352295, "Pretrain/Loss (Raw)": 2.3203318119049072, "Pretrain/Step": 14648, "Pretrain/Step Time": 8.49109815992415} +{"Pretrain/Learning Rate": 6.728659967411538e-06, "Pretrain/Loss": 2.008103370666504, "Pretrain/Loss (Raw)": 1.9349089860916138, "Pretrain/Step": 14649, "Pretrain/Step Time": 8.493943579494953} +{"Pretrain/Learning Rate": 6.725762759613388e-06, "Pretrain/Loss": 2.0079293251037598, "Pretrain/Loss (Raw)": 2.0055124759674072, "Pretrain/Step": 14650, "Pretrain/Step Time": 8.490184331312776} +{"Pretrain/Learning Rate": 6.722866078739995e-06, "Pretrain/Loss": 2.0032567977905273, "Pretrain/Loss (Raw)": 1.4963514804840088, "Pretrain/Step": 14651, "Pretrain/Step Time": 8.491155166178942} +{"Pretrain/Learning Rate": 6.719969924874866e-06, "Pretrain/Loss": 2.0034942626953125, "Pretrain/Loss (Raw)": 2.112253189086914, "Pretrain/Step": 14652, "Pretrain/Step Time": 8.48957421258092} +{"Pretrain/Learning Rate": 6.717074298101528e-06, "Pretrain/Loss": 2.004929780960083, "Pretrain/Loss (Raw)": 1.928578495979309, "Pretrain/Step": 14653, "Pretrain/Step Time": 8.489510683342814} +{"Pretrain/Learning Rate": 6.714179198503454e-06, "Pretrain/Loss": 2.005465269088745, "Pretrain/Loss (Raw)": 2.050509452819824, "Pretrain/Step": 14654, "Pretrain/Step Time": 8.486857203766704} +{"Pretrain/Learning Rate": 6.711284626164138e-06, "Pretrain/Loss": 2.005047082901001, "Pretrain/Loss (Raw)": 2.083740234375, "Pretrain/Step": 14655, "Pretrain/Step Time": 8.488546524196863} +{"Pretrain/Learning Rate": 6.70839058116704e-06, "Pretrain/Loss": 2.0049192905426025, "Pretrain/Loss (Raw)": 1.9502915143966675, "Pretrain/Step": 14656, "Pretrain/Step Time": 8.485834021121264} +{"Pretrain/Learning Rate": 6.705497063595595e-06, "Pretrain/Loss": 2.005805015563965, "Pretrain/Loss (Raw)": 1.8789993524551392, "Pretrain/Step": 14657, "Pretrain/Step Time": 8.487177724018693} +{"Pretrain/Learning Rate": 6.702604073533261e-06, "Pretrain/Loss": 2.0050606727600098, "Pretrain/Loss (Raw)": 1.8524097204208374, "Pretrain/Step": 14658, "Pretrain/Step Time": 8.488166468217969} +{"Pretrain/Learning Rate": 6.699711611063425e-06, "Pretrain/Loss": 2.002004861831665, "Pretrain/Loss (Raw)": 1.7317053079605103, "Pretrain/Step": 14659, "Pretrain/Step Time": 8.485425304621458} +{"Pretrain/Learning Rate": 6.696819676269514e-06, "Pretrain/Loss": 2.0006608963012695, "Pretrain/Loss (Raw)": 1.9574129581451416, "Pretrain/Step": 14660, "Pretrain/Step Time": 8.482162769883871} +{"Pretrain/Learning Rate": 6.6939282692348944e-06, "Pretrain/Loss": 2.0002784729003906, "Pretrain/Loss (Raw)": 2.09674072265625, "Pretrain/Step": 14661, "Pretrain/Step Time": 8.478270625695586} +{"Pretrain/Learning Rate": 6.691037390042956e-06, "Pretrain/Loss": 1.9991239309310913, "Pretrain/Loss (Raw)": 1.9121448993682861, "Pretrain/Step": 14662, "Pretrain/Step Time": 8.485305856913328} +{"Pretrain/Learning Rate": 6.688147038777045e-06, "Pretrain/Loss": 1.9975686073303223, "Pretrain/Loss (Raw)": 1.7926340103149414, "Pretrain/Step": 14663, "Pretrain/Step Time": 8.480496561154723} +{"Pretrain/Learning Rate": 6.685257215520501e-06, "Pretrain/Loss": 1.9985438585281372, "Pretrain/Loss (Raw)": 1.981446623802185, "Pretrain/Step": 14664, "Pretrain/Step Time": 8.48246100358665} +{"Pretrain/Learning Rate": 6.6823679203566604e-06, "Pretrain/Loss": 1.9963587522506714, "Pretrain/Loss (Raw)": 1.9826170206069946, "Pretrain/Step": 14665, "Pretrain/Step Time": 8.479818481951952} +{"Pretrain/Learning Rate": 6.679479153368823e-06, "Pretrain/Loss": 1.9964227676391602, "Pretrain/Loss (Raw)": 1.9665364027023315, "Pretrain/Step": 14666, "Pretrain/Step Time": 8.478718359023333} +{"Pretrain/Learning Rate": 6.676590914640293e-06, "Pretrain/Loss": 1.9925438165664673, "Pretrain/Loss (Raw)": 1.7890434265136719, "Pretrain/Step": 14667, "Pretrain/Step Time": 8.482139967381954} +{"Pretrain/Learning Rate": 6.673703204254347e-06, "Pretrain/Loss": 1.9908146858215332, "Pretrain/Loss (Raw)": 1.946851372718811, "Pretrain/Step": 14668, "Pretrain/Step Time": 8.485910810530186} +{"Pretrain/Learning Rate": 6.670816022294246e-06, "Pretrain/Loss": 1.9894654750823975, "Pretrain/Loss (Raw)": 1.7971361875534058, "Pretrain/Step": 14669, "Pretrain/Step Time": 8.485098710283637} +{"Pretrain/Learning Rate": 6.667929368843248e-06, "Pretrain/Loss": 1.989965558052063, "Pretrain/Loss (Raw)": 2.057769536972046, "Pretrain/Step": 14670, "Pretrain/Step Time": 8.484794931486249} +{"Pretrain/Learning Rate": 6.665043243984576e-06, "Pretrain/Loss": 1.9907622337341309, "Pretrain/Loss (Raw)": 2.0034782886505127, "Pretrain/Step": 14671, "Pretrain/Step Time": 8.483381247147918} +{"Pretrain/Learning Rate": 6.662157647801465e-06, "Pretrain/Loss": 1.9915993213653564, "Pretrain/Loss (Raw)": 2.110064744949341, "Pretrain/Step": 14672, "Pretrain/Step Time": 8.484542215242982} +{"Pretrain/Learning Rate": 6.659272580377113e-06, "Pretrain/Loss": 1.9915565252304077, "Pretrain/Loss (Raw)": 2.1185052394866943, "Pretrain/Step": 14673, "Pretrain/Step Time": 8.484392281621695} +{"Pretrain/Learning Rate": 6.656388041794695e-06, "Pretrain/Loss": 1.9887502193450928, "Pretrain/Loss (Raw)": 1.6022818088531494, "Pretrain/Step": 14674, "Pretrain/Step Time": 8.484789663925767} +{"Pretrain/Learning Rate": 6.653504032137406e-06, "Pretrain/Loss": 1.9876879453659058, "Pretrain/Loss (Raw)": 2.067707061767578, "Pretrain/Step": 14675, "Pretrain/Step Time": 8.485493775457144} +{"Pretrain/Learning Rate": 6.650620551488387e-06, "Pretrain/Loss": 1.9892656803131104, "Pretrain/Loss (Raw)": 2.015606164932251, "Pretrain/Step": 14676, "Pretrain/Step Time": 8.48446754552424} +{"Pretrain/Learning Rate": 6.647737599930798e-06, "Pretrain/Loss": 1.9881675243377686, "Pretrain/Loss (Raw)": 1.9601577520370483, "Pretrain/Step": 14677, "Pretrain/Step Time": 8.484263500198722} +{"Pretrain/Learning Rate": 6.644855177547757e-06, "Pretrain/Loss": 1.9887032508850098, "Pretrain/Loss (Raw)": 2.043851852416992, "Pretrain/Step": 14678, "Pretrain/Step Time": 8.485078852623701} +{"Pretrain/Learning Rate": 6.641973284422371e-06, "Pretrain/Loss": 1.9829394817352295, "Pretrain/Loss (Raw)": 1.8816229104995728, "Pretrain/Step": 14679, "Pretrain/Step Time": 8.491623664274812} +{"Pretrain/Learning Rate": 6.63909192063775e-06, "Pretrain/Loss": 1.9827020168304443, "Pretrain/Loss (Raw)": 2.04046368598938, "Pretrain/Step": 14680, "Pretrain/Step Time": 8.490948840975761} +{"Pretrain/Learning Rate": 6.636211086276961e-06, "Pretrain/Loss": 1.981727123260498, "Pretrain/Loss (Raw)": 2.0130341053009033, "Pretrain/Step": 14681, "Pretrain/Step Time": 8.495744640007615} +{"Pretrain/Learning Rate": 6.633330781423089e-06, "Pretrain/Loss": 1.9821298122406006, "Pretrain/Loss (Raw)": 2.020408868789673, "Pretrain/Step": 14682, "Pretrain/Step Time": 8.490582201629877} +{"Pretrain/Learning Rate": 6.630451006159174e-06, "Pretrain/Loss": 1.9817391633987427, "Pretrain/Loss (Raw)": 2.0424537658691406, "Pretrain/Step": 14683, "Pretrain/Step Time": 8.49066005460918} +{"Pretrain/Learning Rate": 6.627571760568249e-06, "Pretrain/Loss": 1.9829680919647217, "Pretrain/Loss (Raw)": 2.1556739807128906, "Pretrain/Step": 14684, "Pretrain/Step Time": 8.489579949527979} +{"Pretrain/Learning Rate": 6.6246930447333485e-06, "Pretrain/Loss": 1.9838001728057861, "Pretrain/Loss (Raw)": 2.036818742752075, "Pretrain/Step": 14685, "Pretrain/Step Time": 8.491293981671333} +{"Pretrain/Learning Rate": 6.621814858737463e-06, "Pretrain/Loss": 1.9869211912155151, "Pretrain/Loss (Raw)": 2.049919843673706, "Pretrain/Step": 14686, "Pretrain/Step Time": 8.492584584280849} +{"Pretrain/Learning Rate": 6.618937202663597e-06, "Pretrain/Loss": 1.988224983215332, "Pretrain/Loss (Raw)": 2.1139514446258545, "Pretrain/Step": 14687, "Pretrain/Step Time": 8.492162637412548} +{"Pretrain/Learning Rate": 6.6160600765947184e-06, "Pretrain/Loss": 1.9869740009307861, "Pretrain/Loss (Raw)": 1.9334726333618164, "Pretrain/Step": 14688, "Pretrain/Step Time": 8.494990136474371} +{"Pretrain/Learning Rate": 6.61318348061378e-06, "Pretrain/Loss": 1.9842621088027954, "Pretrain/Loss (Raw)": 1.711479902267456, "Pretrain/Step": 14689, "Pretrain/Step Time": 8.491194888949394} +{"Pretrain/Learning Rate": 6.610307414803743e-06, "Pretrain/Loss": 1.9868559837341309, "Pretrain/Loss (Raw)": 2.0699307918548584, "Pretrain/Step": 14690, "Pretrain/Step Time": 8.493339901790023} +{"Pretrain/Learning Rate": 6.607431879247519e-06, "Pretrain/Loss": 1.9847861528396606, "Pretrain/Loss (Raw)": 1.9088164567947388, "Pretrain/Step": 14691, "Pretrain/Step Time": 8.496208511292934} +{"Pretrain/Learning Rate": 6.60455687402804e-06, "Pretrain/Loss": 1.9856711626052856, "Pretrain/Loss (Raw)": 2.013659954071045, "Pretrain/Step": 14692, "Pretrain/Step Time": 8.493069153279066} +{"Pretrain/Learning Rate": 6.601682399228193e-06, "Pretrain/Loss": 1.9880733489990234, "Pretrain/Loss (Raw)": 2.151559591293335, "Pretrain/Step": 14693, "Pretrain/Step Time": 8.492895431816578} +{"Pretrain/Learning Rate": 6.598808454930858e-06, "Pretrain/Loss": 1.9870364665985107, "Pretrain/Loss (Raw)": 1.9495176076889038, "Pretrain/Step": 14694, "Pretrain/Step Time": 8.491447059437633} +{"Pretrain/Learning Rate": 6.5959350412189175e-06, "Pretrain/Loss": 1.9904968738555908, "Pretrain/Loss (Raw)": 2.079713821411133, "Pretrain/Step": 14695, "Pretrain/Step Time": 8.493039168417454} +{"Pretrain/Learning Rate": 6.593062158175206e-06, "Pretrain/Loss": 1.9927093982696533, "Pretrain/Loss (Raw)": 2.107271432876587, "Pretrain/Step": 14696, "Pretrain/Step Time": 8.492448430508375} +{"Pretrain/Learning Rate": 6.590189805882582e-06, "Pretrain/Loss": 1.9943292140960693, "Pretrain/Loss (Raw)": 2.070774793624878, "Pretrain/Step": 14697, "Pretrain/Step Time": 8.4961994048208} +{"Pretrain/Learning Rate": 6.587317984423855e-06, "Pretrain/Loss": 1.9968550205230713, "Pretrain/Loss (Raw)": 2.1351423263549805, "Pretrain/Step": 14698, "Pretrain/Step Time": 8.494672568514943} +{"Pretrain/Learning Rate": 6.584446693881826e-06, "Pretrain/Loss": 1.9918179512023926, "Pretrain/Loss (Raw)": 1.9163999557495117, "Pretrain/Step": 14699, "Pretrain/Step Time": 8.494505137205124} +{"Pretrain/Learning Rate": 6.581575934339304e-06, "Pretrain/Loss": 1.9918272495269775, "Pretrain/Loss (Raw)": 1.966603398323059, "Pretrain/Step": 14700, "Pretrain/Step Time": 8.494761925190687} +{"Pretrain/Learning Rate": 6.578705705879046e-06, "Pretrain/Loss": 1.9890975952148438, "Pretrain/Loss (Raw)": 1.8379125595092773, "Pretrain/Step": 14701, "Pretrain/Step Time": 8.493635084480047} +{"Pretrain/Learning Rate": 6.575836008583833e-06, "Pretrain/Loss": 1.9930932521820068, "Pretrain/Loss (Raw)": 2.4199326038360596, "Pretrain/Step": 14702, "Pretrain/Step Time": 8.493913684040308} +{"Pretrain/Learning Rate": 6.572966842536399e-06, "Pretrain/Loss": 1.9959893226623535, "Pretrain/Loss (Raw)": 2.2948527336120605, "Pretrain/Step": 14703, "Pretrain/Step Time": 8.495634945109487} +{"Pretrain/Learning Rate": 6.570098207819467e-06, "Pretrain/Loss": 1.9947435855865479, "Pretrain/Loss (Raw)": 1.8486076593399048, "Pretrain/Step": 14704, "Pretrain/Step Time": 8.497114269062877} +{"Pretrain/Learning Rate": 6.5672301045157706e-06, "Pretrain/Loss": 1.9948649406433105, "Pretrain/Loss (Raw)": 2.204439163208008, "Pretrain/Step": 14705, "Pretrain/Step Time": 8.494135590270162} +{"Pretrain/Learning Rate": 6.56436253270799e-06, "Pretrain/Loss": 1.9925289154052734, "Pretrain/Loss (Raw)": 1.7681912183761597, "Pretrain/Step": 14706, "Pretrain/Step Time": 8.486855186522007} +{"Pretrain/Learning Rate": 6.561495492478828e-06, "Pretrain/Loss": 1.9911372661590576, "Pretrain/Loss (Raw)": 1.89128839969635, "Pretrain/Step": 14707, "Pretrain/Step Time": 8.491309363394976} +{"Pretrain/Learning Rate": 6.5586289839109475e-06, "Pretrain/Loss": 1.9928762912750244, "Pretrain/Loss (Raw)": 2.0798487663269043, "Pretrain/Step": 14708, "Pretrain/Step Time": 8.492651661857963} +{"Pretrain/Learning Rate": 6.5557630070869904e-06, "Pretrain/Loss": 1.9923425912857056, "Pretrain/Loss (Raw)": 2.0292134284973145, "Pretrain/Step": 14709, "Pretrain/Step Time": 8.490326413884759} +{"Pretrain/Learning Rate": 6.552897562089611e-06, "Pretrain/Loss": 1.9917266368865967, "Pretrain/Loss (Raw)": 2.106959819793701, "Pretrain/Step": 14710, "Pretrain/Step Time": 8.489786326885223} +{"Pretrain/Learning Rate": 6.55003264900142e-06, "Pretrain/Loss": 1.9951932430267334, "Pretrain/Loss (Raw)": 2.2360575199127197, "Pretrain/Step": 14711, "Pretrain/Step Time": 8.49215098656714} +{"Pretrain/Learning Rate": 6.547168267905038e-06, "Pretrain/Loss": 1.9942487478256226, "Pretrain/Loss (Raw)": 1.9365935325622559, "Pretrain/Step": 14712, "Pretrain/Step Time": 8.488702040165663} +{"Pretrain/Learning Rate": 6.544304418883051e-06, "Pretrain/Loss": 1.9939818382263184, "Pretrain/Loss (Raw)": 1.9974225759506226, "Pretrain/Step": 14713, "Pretrain/Step Time": 8.49283492192626} +{"Pretrain/Learning Rate": 6.541441102018028e-06, "Pretrain/Loss": 1.994951605796814, "Pretrain/Loss (Raw)": 2.0914387702941895, "Pretrain/Step": 14714, "Pretrain/Step Time": 8.490092191845179} +{"Pretrain/Learning Rate": 6.538578317392549e-06, "Pretrain/Loss": 1.9938994646072388, "Pretrain/Loss (Raw)": 2.0239412784576416, "Pretrain/Step": 14715, "Pretrain/Step Time": 8.492945918813348} +{"Pretrain/Learning Rate": 6.535716065089139e-06, "Pretrain/Loss": 1.9891033172607422, "Pretrain/Loss (Raw)": 1.8925601243972778, "Pretrain/Step": 14716, "Pretrain/Step Time": 8.494974425062537} +{"Pretrain/Learning Rate": 6.532854345190348e-06, "Pretrain/Loss": 1.9871618747711182, "Pretrain/Loss (Raw)": 1.8983758687973022, "Pretrain/Step": 14717, "Pretrain/Step Time": 8.493880057707429} +{"Pretrain/Learning Rate": 6.529993157778675e-06, "Pretrain/Loss": 1.9843661785125732, "Pretrain/Loss (Raw)": 1.6618616580963135, "Pretrain/Step": 14718, "Pretrain/Step Time": 8.489733485504985} +{"Pretrain/Learning Rate": 6.5271325029366364e-06, "Pretrain/Loss": 1.9840717315673828, "Pretrain/Loss (Raw)": 1.9251738786697388, "Pretrain/Step": 14719, "Pretrain/Step Time": 8.496024733409286} +{"Pretrain/Learning Rate": 6.52427238074671e-06, "Pretrain/Loss": 1.985257863998413, "Pretrain/Loss (Raw)": 2.071746826171875, "Pretrain/Step": 14720, "Pretrain/Step Time": 8.491893844678998} +{"Pretrain/Learning Rate": 6.521412791291359e-06, "Pretrain/Loss": 1.982431411743164, "Pretrain/Loss (Raw)": 1.876226782798767, "Pretrain/Step": 14721, "Pretrain/Step Time": 8.497151808813214} +{"Pretrain/Learning Rate": 6.518553734653049e-06, "Pretrain/Loss": 1.981786847114563, "Pretrain/Loss (Raw)": 2.0450472831726074, "Pretrain/Step": 14722, "Pretrain/Step Time": 8.492294972762465} +{"Pretrain/Learning Rate": 6.515695210914208e-06, "Pretrain/Loss": 1.982137680053711, "Pretrain/Loss (Raw)": 2.1030690670013428, "Pretrain/Step": 14723, "Pretrain/Step Time": 8.491547854617238} +{"Pretrain/Learning Rate": 6.51283722015727e-06, "Pretrain/Loss": 1.9831745624542236, "Pretrain/Loss (Raw)": 2.04683780670166, "Pretrain/Step": 14724, "Pretrain/Step Time": 8.491678452119231} +{"Pretrain/Learning Rate": 6.509979762464641e-06, "Pretrain/Loss": 1.978908896446228, "Pretrain/Loss (Raw)": 2.0079402923583984, "Pretrain/Step": 14725, "Pretrain/Step Time": 8.488071609288454} +{"Pretrain/Learning Rate": 6.5071228379187e-06, "Pretrain/Loss": 1.9793211221694946, "Pretrain/Loss (Raw)": 1.9326553344726562, "Pretrain/Step": 14726, "Pretrain/Step Time": 8.491295281797647} +{"Pretrain/Learning Rate": 6.504266446601845e-06, "Pretrain/Loss": 1.9818469285964966, "Pretrain/Loss (Raw)": 2.0052666664123535, "Pretrain/Step": 14727, "Pretrain/Step Time": 8.487931920215487} +{"Pretrain/Learning Rate": 6.501410588596421e-06, "Pretrain/Loss": 1.9798463582992554, "Pretrain/Loss (Raw)": 1.7359862327575684, "Pretrain/Step": 14728, "Pretrain/Step Time": 8.490129042416811} +{"Pretrain/Learning Rate": 6.49855526398479e-06, "Pretrain/Loss": 1.980514645576477, "Pretrain/Loss (Raw)": 2.0714855194091797, "Pretrain/Step": 14729, "Pretrain/Step Time": 8.486780058592558} +{"Pretrain/Learning Rate": 6.495700472849275e-06, "Pretrain/Loss": 1.9813222885131836, "Pretrain/Loss (Raw)": 1.8461898565292358, "Pretrain/Step": 14730, "Pretrain/Step Time": 8.486005062237382} +{"Pretrain/Learning Rate": 6.492846215272183e-06, "Pretrain/Loss": 1.979247808456421, "Pretrain/Loss (Raw)": 1.9413933753967285, "Pretrain/Step": 14731, "Pretrain/Step Time": 8.4878947455436} +{"Pretrain/Learning Rate": 6.489992491335834e-06, "Pretrain/Loss": 1.9776852130889893, "Pretrain/Loss (Raw)": 1.823586344718933, "Pretrain/Step": 14732, "Pretrain/Step Time": 8.492438225075603} +{"Pretrain/Learning Rate": 6.487139301122491e-06, "Pretrain/Loss": 1.9788644313812256, "Pretrain/Loss (Raw)": 2.1061463356018066, "Pretrain/Step": 14733, "Pretrain/Step Time": 8.491121370345354} +{"Pretrain/Learning Rate": 6.484286644714446e-06, "Pretrain/Loss": 1.9810019731521606, "Pretrain/Loss (Raw)": 2.230323553085327, "Pretrain/Step": 14734, "Pretrain/Step Time": 8.495029345154762} +{"Pretrain/Learning Rate": 6.481434522193943e-06, "Pretrain/Loss": 1.977252721786499, "Pretrain/Loss (Raw)": 1.6260972023010254, "Pretrain/Step": 14735, "Pretrain/Step Time": 8.493005501106381} +{"Pretrain/Learning Rate": 6.4785829336432156e-06, "Pretrain/Loss": 1.9789750576019287, "Pretrain/Loss (Raw)": 1.9105353355407715, "Pretrain/Step": 14736, "Pretrain/Step Time": 8.494431352242827} +{"Pretrain/Learning Rate": 6.475731879144495e-06, "Pretrain/Loss": 1.9765957593917847, "Pretrain/Loss (Raw)": 1.7078169584274292, "Pretrain/Step": 14737, "Pretrain/Step Time": 8.496784618124366} +{"Pretrain/Learning Rate": 6.472881358779983e-06, "Pretrain/Loss": 1.9764859676361084, "Pretrain/Loss (Raw)": 1.945754885673523, "Pretrain/Step": 14738, "Pretrain/Step Time": 8.495783207938075} +{"Pretrain/Learning Rate": 6.470031372631882e-06, "Pretrain/Loss": 1.9782350063323975, "Pretrain/Loss (Raw)": 1.979398488998413, "Pretrain/Step": 14739, "Pretrain/Step Time": 8.497338756918907} +{"Pretrain/Learning Rate": 6.467181920782364e-06, "Pretrain/Loss": 1.9820899963378906, "Pretrain/Loss (Raw)": 1.9289181232452393, "Pretrain/Step": 14740, "Pretrain/Step Time": 8.494540594518185} +{"Pretrain/Learning Rate": 6.464333003313583e-06, "Pretrain/Loss": 1.982689619064331, "Pretrain/Loss (Raw)": 1.9232141971588135, "Pretrain/Step": 14741, "Pretrain/Step Time": 8.488448655232787} +{"Pretrain/Learning Rate": 6.4614846203077e-06, "Pretrain/Loss": 1.982649326324463, "Pretrain/Loss (Raw)": 2.055670738220215, "Pretrain/Step": 14742, "Pretrain/Step Time": 8.494116814807057} +{"Pretrain/Learning Rate": 6.458636771846841e-06, "Pretrain/Loss": 1.9823439121246338, "Pretrain/Loss (Raw)": 1.9887434244155884, "Pretrain/Step": 14743, "Pretrain/Step Time": 8.48589302226901} +{"Pretrain/Learning Rate": 6.45578945801312e-06, "Pretrain/Loss": 1.9831812381744385, "Pretrain/Loss (Raw)": 2.029261589050293, "Pretrain/Step": 14744, "Pretrain/Step Time": 8.4880879111588} +{"Pretrain/Learning Rate": 6.452942678888626e-06, "Pretrain/Loss": 1.9823858737945557, "Pretrain/Loss (Raw)": 1.9148902893066406, "Pretrain/Step": 14745, "Pretrain/Step Time": 8.486221740022302} +{"Pretrain/Learning Rate": 6.450096434555466e-06, "Pretrain/Loss": 1.9799634218215942, "Pretrain/Loss (Raw)": 1.706199049949646, "Pretrain/Step": 14746, "Pretrain/Step Time": 8.490015847608447} +{"Pretrain/Learning Rate": 6.4472507250956994e-06, "Pretrain/Loss": 1.978981375694275, "Pretrain/Loss (Raw)": 1.9476572275161743, "Pretrain/Step": 14747, "Pretrain/Step Time": 8.486652078107} +{"Pretrain/Learning Rate": 6.44440555059137e-06, "Pretrain/Loss": 1.9771525859832764, "Pretrain/Loss (Raw)": 1.9916895627975464, "Pretrain/Step": 14748, "Pretrain/Step Time": 8.491710362955928} +{"Pretrain/Learning Rate": 6.441560911124534e-06, "Pretrain/Loss": 1.9792399406433105, "Pretrain/Loss (Raw)": 2.126089572906494, "Pretrain/Step": 14749, "Pretrain/Step Time": 8.487776432186365} +{"Pretrain/Learning Rate": 6.438716806777195e-06, "Pretrain/Loss": 1.9800434112548828, "Pretrain/Loss (Raw)": 2.1555185317993164, "Pretrain/Step": 14750, "Pretrain/Step Time": 8.487694811075926} +{"Pretrain/Learning Rate": 6.435873237631385e-06, "Pretrain/Loss": 1.977754831314087, "Pretrain/Loss (Raw)": 1.9509812593460083, "Pretrain/Step": 14751, "Pretrain/Step Time": 8.486178556457162} +{"Pretrain/Learning Rate": 6.43303020376908e-06, "Pretrain/Loss": 1.9783449172973633, "Pretrain/Loss (Raw)": 1.943345308303833, "Pretrain/Step": 14752, "Pretrain/Step Time": 8.487575106322765} +{"Pretrain/Learning Rate": 6.430187705272253e-06, "Pretrain/Loss": 1.9752686023712158, "Pretrain/Loss (Raw)": 1.7282170057296753, "Pretrain/Step": 14753, "Pretrain/Step Time": 8.4860023483634} +{"Pretrain/Learning Rate": 6.427345742222882e-06, "Pretrain/Loss": 1.9778525829315186, "Pretrain/Loss (Raw)": 2.1091697216033936, "Pretrain/Step": 14754, "Pretrain/Step Time": 8.490915514528751} +{"Pretrain/Learning Rate": 6.424504314702895e-06, "Pretrain/Loss": 1.97946298122406, "Pretrain/Loss (Raw)": 1.967579960823059, "Pretrain/Step": 14755, "Pretrain/Step Time": 8.490971894934773} +{"Pretrain/Learning Rate": 6.421663422794239e-06, "Pretrain/Loss": 1.9813570976257324, "Pretrain/Loss (Raw)": 2.128361463546753, "Pretrain/Step": 14756, "Pretrain/Step Time": 8.492797626182437} +{"Pretrain/Learning Rate": 6.418823066578819e-06, "Pretrain/Loss": 1.9793126583099365, "Pretrain/Loss (Raw)": 1.745038628578186, "Pretrain/Step": 14757, "Pretrain/Step Time": 8.492469487711787} +{"Pretrain/Learning Rate": 6.415983246138532e-06, "Pretrain/Loss": 1.9808484315872192, "Pretrain/Loss (Raw)": 2.0411288738250732, "Pretrain/Step": 14758, "Pretrain/Step Time": 8.48771489970386} +{"Pretrain/Learning Rate": 6.4131439615552735e-06, "Pretrain/Loss": 1.982027530670166, "Pretrain/Loss (Raw)": 2.096198558807373, "Pretrain/Step": 14759, "Pretrain/Step Time": 8.485728926956654} +{"Pretrain/Learning Rate": 6.4103052129109e-06, "Pretrain/Loss": 1.9794738292694092, "Pretrain/Loss (Raw)": 1.864464282989502, "Pretrain/Step": 14760, "Pretrain/Step Time": 8.491572281345725} +{"Pretrain/Learning Rate": 6.407467000287276e-06, "Pretrain/Loss": 1.9805045127868652, "Pretrain/Loss (Raw)": 1.901938796043396, "Pretrain/Step": 14761, "Pretrain/Step Time": 8.492036957293749} +{"Pretrain/Learning Rate": 6.404629323766237e-06, "Pretrain/Loss": 1.9835830926895142, "Pretrain/Loss (Raw)": 2.3595385551452637, "Pretrain/Step": 14762, "Pretrain/Step Time": 8.492397118359804} +{"Pretrain/Learning Rate": 6.401792183429594e-06, "Pretrain/Loss": 1.982046365737915, "Pretrain/Loss (Raw)": 1.8563421964645386, "Pretrain/Step": 14763, "Pretrain/Step Time": 8.486081490293145} +{"Pretrain/Learning Rate": 6.39895557935917e-06, "Pretrain/Loss": 1.9800200462341309, "Pretrain/Loss (Raw)": 1.965133547782898, "Pretrain/Step": 14764, "Pretrain/Step Time": 8.485215401276946} +{"Pretrain/Learning Rate": 6.3961195116367416e-06, "Pretrain/Loss": 1.9802508354187012, "Pretrain/Loss (Raw)": 1.8217748403549194, "Pretrain/Step": 14765, "Pretrain/Step Time": 8.485794207081199} +{"Pretrain/Learning Rate": 6.393283980344097e-06, "Pretrain/Loss": 1.9773180484771729, "Pretrain/Loss (Raw)": 1.8825175762176514, "Pretrain/Step": 14766, "Pretrain/Step Time": 8.488735653460026} +{"Pretrain/Learning Rate": 6.3904489855629965e-06, "Pretrain/Loss": 1.978601098060608, "Pretrain/Loss (Raw)": 2.015377998352051, "Pretrain/Step": 14767, "Pretrain/Step Time": 8.486954011023045} +{"Pretrain/Learning Rate": 6.3876145273751716e-06, "Pretrain/Loss": 1.980936050415039, "Pretrain/Loss (Raw)": 2.049480438232422, "Pretrain/Step": 14768, "Pretrain/Step Time": 8.486764257773757} +{"Pretrain/Learning Rate": 6.384780605862367e-06, "Pretrain/Loss": 1.9804186820983887, "Pretrain/Loss (Raw)": 1.8513871431350708, "Pretrain/Step": 14769, "Pretrain/Step Time": 8.487010549753904} +{"Pretrain/Learning Rate": 6.381947221106282e-06, "Pretrain/Loss": 1.980902910232544, "Pretrain/Loss (Raw)": 2.0566799640655518, "Pretrain/Step": 14770, "Pretrain/Step Time": 8.486505331471562} +{"Pretrain/Learning Rate": 6.379114373188635e-06, "Pretrain/Loss": 1.9813079833984375, "Pretrain/Loss (Raw)": 1.925203800201416, "Pretrain/Step": 14771, "Pretrain/Step Time": 8.48872670903802} +{"Pretrain/Learning Rate": 6.376282062191097e-06, "Pretrain/Loss": 1.9785345792770386, "Pretrain/Loss (Raw)": 1.980846643447876, "Pretrain/Step": 14772, "Pretrain/Step Time": 8.487408047541976} +{"Pretrain/Learning Rate": 6.373450288195329e-06, "Pretrain/Loss": 1.9772963523864746, "Pretrain/Loss (Raw)": 1.9203985929489136, "Pretrain/Step": 14773, "Pretrain/Step Time": 8.484699772670865} +{"Pretrain/Learning Rate": 6.370619051283e-06, "Pretrain/Loss": 1.9761545658111572, "Pretrain/Loss (Raw)": 1.9121662378311157, "Pretrain/Step": 14774, "Pretrain/Step Time": 8.489173546433449} +{"Pretrain/Learning Rate": 6.367788351535728e-06, "Pretrain/Loss": 1.9775351285934448, "Pretrain/Loss (Raw)": 2.2089171409606934, "Pretrain/Step": 14775, "Pretrain/Step Time": 8.486289452761412} +{"Pretrain/Learning Rate": 6.364958189035153e-06, "Pretrain/Loss": 1.974782943725586, "Pretrain/Loss (Raw)": 1.9680607318878174, "Pretrain/Step": 14776, "Pretrain/Step Time": 8.48605152964592} +{"Pretrain/Learning Rate": 6.362128563862871e-06, "Pretrain/Loss": 1.9735009670257568, "Pretrain/Loss (Raw)": 1.7708081007003784, "Pretrain/Step": 14777, "Pretrain/Step Time": 8.487312750890851} +{"Pretrain/Learning Rate": 6.359299476100466e-06, "Pretrain/Loss": 1.9732964038848877, "Pretrain/Loss (Raw)": 1.979338526725769, "Pretrain/Step": 14778, "Pretrain/Step Time": 8.493184173479676} +{"Pretrain/Learning Rate": 6.356470925829528e-06, "Pretrain/Loss": 1.9774802923202515, "Pretrain/Loss (Raw)": 2.031886577606201, "Pretrain/Step": 14779, "Pretrain/Step Time": 8.491672040894628} +{"Pretrain/Learning Rate": 6.353642913131599e-06, "Pretrain/Loss": 1.9755254983901978, "Pretrain/Loss (Raw)": 1.8620415925979614, "Pretrain/Step": 14780, "Pretrain/Step Time": 8.493416018784046} +{"Pretrain/Learning Rate": 6.350815438088239e-06, "Pretrain/Loss": 1.975450873374939, "Pretrain/Loss (Raw)": 1.9190281629562378, "Pretrain/Step": 14781, "Pretrain/Step Time": 8.498372634872794} +{"Pretrain/Learning Rate": 6.347988500780963e-06, "Pretrain/Loss": 1.9748742580413818, "Pretrain/Loss (Raw)": 1.9767143726348877, "Pretrain/Step": 14782, "Pretrain/Step Time": 8.505188999697566} +{"Pretrain/Learning Rate": 6.345162101291297e-06, "Pretrain/Loss": 1.9738682508468628, "Pretrain/Loss (Raw)": 1.954959511756897, "Pretrain/Step": 14783, "Pretrain/Step Time": 8.503546718508005} +{"Pretrain/Learning Rate": 6.34233623970073e-06, "Pretrain/Loss": 1.9771678447723389, "Pretrain/Loss (Raw)": 2.3726277351379395, "Pretrain/Step": 14784, "Pretrain/Step Time": 8.504973832517862} +{"Pretrain/Learning Rate": 6.339510916090738e-06, "Pretrain/Loss": 1.9745954275131226, "Pretrain/Loss (Raw)": 1.54974365234375, "Pretrain/Step": 14785, "Pretrain/Step Time": 8.505188262090087} +{"Pretrain/Learning Rate": 6.336686130542802e-06, "Pretrain/Loss": 1.9770689010620117, "Pretrain/Loss (Raw)": 2.1690142154693604, "Pretrain/Step": 14786, "Pretrain/Step Time": 8.504790343344212} +{"Pretrain/Learning Rate": 6.333861883138356e-06, "Pretrain/Loss": 1.9795894622802734, "Pretrain/Loss (Raw)": 2.0543315410614014, "Pretrain/Step": 14787, "Pretrain/Step Time": 8.505361814051867} +{"Pretrain/Learning Rate": 6.3310381739588535e-06, "Pretrain/Loss": 1.978592872619629, "Pretrain/Loss (Raw)": 1.8298516273498535, "Pretrain/Step": 14788, "Pretrain/Step Time": 8.506420141085982} +{"Pretrain/Learning Rate": 6.328215003085702e-06, "Pretrain/Loss": 1.978114128112793, "Pretrain/Loss (Raw)": 2.035463333129883, "Pretrain/Step": 14789, "Pretrain/Step Time": 8.507994189858437} +{"Pretrain/Learning Rate": 6.325392370600303e-06, "Pretrain/Loss": 1.9786200523376465, "Pretrain/Loss (Raw)": 1.9769092798233032, "Pretrain/Step": 14790, "Pretrain/Step Time": 8.503934066742659} +{"Pretrain/Learning Rate": 6.322570276584056e-06, "Pretrain/Loss": 1.9813365936279297, "Pretrain/Loss (Raw)": 2.140327215194702, "Pretrain/Step": 14791, "Pretrain/Step Time": 8.504672579467297} +{"Pretrain/Learning Rate": 6.319748721118321e-06, "Pretrain/Loss": 1.9824159145355225, "Pretrain/Loss (Raw)": 2.11961030960083, "Pretrain/Step": 14792, "Pretrain/Step Time": 8.502463871613145} +{"Pretrain/Learning Rate": 6.31692770428447e-06, "Pretrain/Loss": 1.9792481660842896, "Pretrain/Loss (Raw)": 1.577144742012024, "Pretrain/Step": 14793, "Pretrain/Step Time": 8.505225354805589} +{"Pretrain/Learning Rate": 6.31410722616384e-06, "Pretrain/Loss": 1.9791654348373413, "Pretrain/Loss (Raw)": 1.955955147743225, "Pretrain/Step": 14794, "Pretrain/Step Time": 8.50107747502625} +{"Pretrain/Learning Rate": 6.311287286837747e-06, "Pretrain/Loss": 1.9807140827178955, "Pretrain/Loss (Raw)": 1.9872585535049438, "Pretrain/Step": 14795, "Pretrain/Step Time": 8.500236358493567} +{"Pretrain/Learning Rate": 6.308467886387517e-06, "Pretrain/Loss": 1.9803152084350586, "Pretrain/Loss (Raw)": 1.8957972526550293, "Pretrain/Step": 14796, "Pretrain/Step Time": 8.49730233848095} +{"Pretrain/Learning Rate": 6.3056490248944306e-06, "Pretrain/Loss": 1.9812443256378174, "Pretrain/Loss (Raw)": 1.9160678386688232, "Pretrain/Step": 14797, "Pretrain/Step Time": 8.496967965736985} +{"Pretrain/Learning Rate": 6.302830702439785e-06, "Pretrain/Loss": 1.9791665077209473, "Pretrain/Loss (Raw)": 1.7918275594711304, "Pretrain/Step": 14798, "Pretrain/Step Time": 8.49847169779241} +{"Pretrain/Learning Rate": 6.300012919104836e-06, "Pretrain/Loss": 1.9787707328796387, "Pretrain/Loss (Raw)": 1.9528017044067383, "Pretrain/Step": 14799, "Pretrain/Step Time": 8.49944351054728} +{"Pretrain/Learning Rate": 6.297195674970824e-06, "Pretrain/Loss": 1.9777789115905762, "Pretrain/Loss (Raw)": 1.9831092357635498, "Pretrain/Step": 14800, "Pretrain/Step Time": 8.497624495998025} +{"Pretrain/Learning Rate": 6.2943789701189946e-06, "Pretrain/Loss": 1.9773173332214355, "Pretrain/Loss (Raw)": 2.0594160556793213, "Pretrain/Step": 14801, "Pretrain/Step Time": 8.49330890737474} +{"Pretrain/Learning Rate": 6.291562804630558e-06, "Pretrain/Loss": 1.9818291664123535, "Pretrain/Loss (Raw)": 2.1798043251037598, "Pretrain/Step": 14802, "Pretrain/Step Time": 8.49527688510716} +{"Pretrain/Learning Rate": 6.288747178586724e-06, "Pretrain/Loss": 1.9818381071090698, "Pretrain/Loss (Raw)": 2.0688557624816895, "Pretrain/Step": 14803, "Pretrain/Step Time": 8.493997855111957} +{"Pretrain/Learning Rate": 6.285932092068675e-06, "Pretrain/Loss": 1.9815242290496826, "Pretrain/Loss (Raw)": 1.9754254817962646, "Pretrain/Step": 14804, "Pretrain/Step Time": 8.498035952448845} +{"Pretrain/Learning Rate": 6.283117545157574e-06, "Pretrain/Loss": 1.9817261695861816, "Pretrain/Loss (Raw)": 1.98600172996521, "Pretrain/Step": 14805, "Pretrain/Step Time": 8.498559799045324} +{"Pretrain/Learning Rate": 6.280303537934593e-06, "Pretrain/Loss": 1.9830983877182007, "Pretrain/Loss (Raw)": 2.219507932662964, "Pretrain/Step": 14806, "Pretrain/Step Time": 8.503433898091316} +{"Pretrain/Learning Rate": 6.277490070480854e-06, "Pretrain/Loss": 1.9820148944854736, "Pretrain/Loss (Raw)": 1.7429399490356445, "Pretrain/Step": 14807, "Pretrain/Step Time": 8.495582781732082} +{"Pretrain/Learning Rate": 6.274677142877497e-06, "Pretrain/Loss": 1.9802738428115845, "Pretrain/Loss (Raw)": 1.8176014423370361, "Pretrain/Step": 14808, "Pretrain/Step Time": 8.499181345105171} +{"Pretrain/Learning Rate": 6.271864755205625e-06, "Pretrain/Loss": 1.9796885251998901, "Pretrain/Loss (Raw)": 1.9381111860275269, "Pretrain/Step": 14809, "Pretrain/Step Time": 8.491885248571634} +{"Pretrain/Learning Rate": 6.269052907546325e-06, "Pretrain/Loss": 1.9753403663635254, "Pretrain/Loss (Raw)": 1.463837742805481, "Pretrain/Step": 14810, "Pretrain/Step Time": 8.493332628160715} +{"Pretrain/Learning Rate": 6.266241599980685e-06, "Pretrain/Loss": 1.9770927429199219, "Pretrain/Loss (Raw)": 2.2667531967163086, "Pretrain/Step": 14811, "Pretrain/Step Time": 8.490666514262557} +{"Pretrain/Learning Rate": 6.263430832589756e-06, "Pretrain/Loss": 1.9762928485870361, "Pretrain/Loss (Raw)": 2.0532941818237305, "Pretrain/Step": 14812, "Pretrain/Step Time": 8.493192439898849} +{"Pretrain/Learning Rate": 6.260620605454595e-06, "Pretrain/Loss": 1.9756901264190674, "Pretrain/Loss (Raw)": 1.9596816301345825, "Pretrain/Step": 14813, "Pretrain/Step Time": 8.491310019046068} +{"Pretrain/Learning Rate": 6.257810918656232e-06, "Pretrain/Loss": 1.9762914180755615, "Pretrain/Loss (Raw)": 2.12689208984375, "Pretrain/Step": 14814, "Pretrain/Step Time": 8.494403943419456} +{"Pretrain/Learning Rate": 6.255001772275671e-06, "Pretrain/Loss": 1.9757425785064697, "Pretrain/Loss (Raw)": 2.0436766147613525, "Pretrain/Step": 14815, "Pretrain/Step Time": 8.493479333817959} +{"Pretrain/Learning Rate": 6.2521931663939246e-06, "Pretrain/Loss": 1.9752376079559326, "Pretrain/Loss (Raw)": 1.86884343624115, "Pretrain/Step": 14816, "Pretrain/Step Time": 8.49456981010735} +{"Pretrain/Learning Rate": 6.249385101091967e-06, "Pretrain/Loss": 1.97854745388031, "Pretrain/Loss (Raw)": 2.1351397037506104, "Pretrain/Step": 14817, "Pretrain/Step Time": 8.493066843599081} +{"Pretrain/Learning Rate": 6.246577576450777e-06, "Pretrain/Loss": 1.9774858951568604, "Pretrain/Loss (Raw)": 1.9340497255325317, "Pretrain/Step": 14818, "Pretrain/Step Time": 8.489600272849202} +{"Pretrain/Learning Rate": 6.243770592551304e-06, "Pretrain/Loss": 1.9827871322631836, "Pretrain/Loss (Raw)": 2.5873801708221436, "Pretrain/Step": 14819, "Pretrain/Step Time": 8.487760983407497} +{"Pretrain/Learning Rate": 6.2409641494744735e-06, "Pretrain/Loss": 1.9817261695861816, "Pretrain/Loss (Raw)": 1.8778395652770996, "Pretrain/Step": 14820, "Pretrain/Step Time": 8.48832624964416} +{"Pretrain/Learning Rate": 6.238158247301229e-06, "Pretrain/Loss": 1.9800307750701904, "Pretrain/Loss (Raw)": 1.9345661401748657, "Pretrain/Step": 14821, "Pretrain/Step Time": 8.491054572165012} +{"Pretrain/Learning Rate": 6.2353528861124555e-06, "Pretrain/Loss": 1.9797922372817993, "Pretrain/Loss (Raw)": 1.918988823890686, "Pretrain/Step": 14822, "Pretrain/Step Time": 8.49455264955759} +{"Pretrain/Learning Rate": 6.23254806598906e-06, "Pretrain/Loss": 1.9789578914642334, "Pretrain/Loss (Raw)": 1.9729108810424805, "Pretrain/Step": 14823, "Pretrain/Step Time": 8.49355460330844} +{"Pretrain/Learning Rate": 6.229743787011913e-06, "Pretrain/Loss": 1.9754385948181152, "Pretrain/Loss (Raw)": 1.6567953824996948, "Pretrain/Step": 14824, "Pretrain/Step Time": 8.49958904646337} +{"Pretrain/Learning Rate": 6.2269400492618615e-06, "Pretrain/Loss": 1.974714994430542, "Pretrain/Loss (Raw)": 1.978170394897461, "Pretrain/Step": 14825, "Pretrain/Step Time": 8.494013097137213} +{"Pretrain/Learning Rate": 6.22413685281977e-06, "Pretrain/Loss": 1.9739564657211304, "Pretrain/Loss (Raw)": 2.0380449295043945, "Pretrain/Step": 14826, "Pretrain/Step Time": 8.497845593839884} +{"Pretrain/Learning Rate": 6.221334197766454e-06, "Pretrain/Loss": 1.9736754894256592, "Pretrain/Loss (Raw)": 1.8804279565811157, "Pretrain/Step": 14827, "Pretrain/Step Time": 8.497826378792524} +{"Pretrain/Learning Rate": 6.218532084182729e-06, "Pretrain/Loss": 1.9735959768295288, "Pretrain/Loss (Raw)": 1.956429362297058, "Pretrain/Step": 14828, "Pretrain/Step Time": 8.500389486551285} +{"Pretrain/Learning Rate": 6.215730512149384e-06, "Pretrain/Loss": 1.9745266437530518, "Pretrain/Loss (Raw)": 1.9570387601852417, "Pretrain/Step": 14829, "Pretrain/Step Time": 8.499250005930662} +{"Pretrain/Learning Rate": 6.212929481747215e-06, "Pretrain/Loss": 1.9684760570526123, "Pretrain/Loss (Raw)": 1.645466685295105, "Pretrain/Step": 14830, "Pretrain/Step Time": 8.502098139375448} +{"Pretrain/Learning Rate": 6.2101289930569796e-06, "Pretrain/Loss": 1.9681651592254639, "Pretrain/Loss (Raw)": 2.255054235458374, "Pretrain/Step": 14831, "Pretrain/Step Time": 8.502157472074032} +{"Pretrain/Learning Rate": 6.207329046159424e-06, "Pretrain/Loss": 1.9686150550842285, "Pretrain/Loss (Raw)": 1.9061789512634277, "Pretrain/Step": 14832, "Pretrain/Step Time": 8.49959060922265} +{"Pretrain/Learning Rate": 6.204529641135293e-06, "Pretrain/Loss": 1.9673936367034912, "Pretrain/Loss (Raw)": 2.0481183528900146, "Pretrain/Step": 14833, "Pretrain/Step Time": 8.503566594794393} +{"Pretrain/Learning Rate": 6.20173077806529e-06, "Pretrain/Loss": 1.9694448709487915, "Pretrain/Loss (Raw)": 2.0307421684265137, "Pretrain/Step": 14834, "Pretrain/Step Time": 8.502416430041194} +{"Pretrain/Learning Rate": 6.19893245703014e-06, "Pretrain/Loss": 1.969668984413147, "Pretrain/Loss (Raw)": 1.9199771881103516, "Pretrain/Step": 14835, "Pretrain/Step Time": 8.498416487127542} +{"Pretrain/Learning Rate": 6.1961346781105154e-06, "Pretrain/Loss": 1.9686459302902222, "Pretrain/Loss (Raw)": 1.948880672454834, "Pretrain/Step": 14836, "Pretrain/Step Time": 8.50037563405931} +{"Pretrain/Learning Rate": 6.193337441387087e-06, "Pretrain/Loss": 1.968931794166565, "Pretrain/Loss (Raw)": 2.0658280849456787, "Pretrain/Step": 14837, "Pretrain/Step Time": 8.501266058534384} +{"Pretrain/Learning Rate": 6.1905407469405205e-06, "Pretrain/Loss": 1.9653114080429077, "Pretrain/Loss (Raw)": 1.6435432434082031, "Pretrain/Step": 14838, "Pretrain/Step Time": 8.498841725289822} +{"Pretrain/Learning Rate": 6.187744594851444e-06, "Pretrain/Loss": 1.9626245498657227, "Pretrain/Loss (Raw)": 1.8921431303024292, "Pretrain/Step": 14839, "Pretrain/Step Time": 8.498200399801135} +{"Pretrain/Learning Rate": 6.1849489852005e-06, "Pretrain/Loss": 1.9619832038879395, "Pretrain/Loss (Raw)": 1.854498267173767, "Pretrain/Step": 14840, "Pretrain/Step Time": 8.503051159903407} +{"Pretrain/Learning Rate": 6.182153918068287e-06, "Pretrain/Loss": 1.9621254205703735, "Pretrain/Loss (Raw)": 2.0156261920928955, "Pretrain/Step": 14841, "Pretrain/Step Time": 8.495975591242313} +{"Pretrain/Learning Rate": 6.179359393535392e-06, "Pretrain/Loss": 1.9576663970947266, "Pretrain/Loss (Raw)": 1.520671010017395, "Pretrain/Step": 14842, "Pretrain/Step Time": 8.498250003904104} +{"Pretrain/Learning Rate": 6.1765654116824115e-06, "Pretrain/Loss": 1.95746910572052, "Pretrain/Loss (Raw)": 1.9987053871154785, "Pretrain/Step": 14843, "Pretrain/Step Time": 8.497318126261234} +{"Pretrain/Learning Rate": 6.173771972589887e-06, "Pretrain/Loss": 1.9595084190368652, "Pretrain/Loss (Raw)": 2.1535849571228027, "Pretrain/Step": 14844, "Pretrain/Step Time": 8.493524329736829} +{"Pretrain/Learning Rate": 6.170979076338384e-06, "Pretrain/Loss": 1.9614676237106323, "Pretrain/Loss (Raw)": 2.1491644382476807, "Pretrain/Step": 14845, "Pretrain/Step Time": 8.494351407513022} +{"Pretrain/Learning Rate": 6.16818672300842e-06, "Pretrain/Loss": 1.964942455291748, "Pretrain/Loss (Raw)": 2.106626272201538, "Pretrain/Step": 14846, "Pretrain/Step Time": 8.49286101385951} +{"Pretrain/Learning Rate": 6.165394912680522e-06, "Pretrain/Loss": 1.965624213218689, "Pretrain/Loss (Raw)": 2.0124411582946777, "Pretrain/Step": 14847, "Pretrain/Step Time": 8.488879982382059} +{"Pretrain/Learning Rate": 6.162603645435186e-06, "Pretrain/Loss": 1.9659925699234009, "Pretrain/Loss (Raw)": 2.118898630142212, "Pretrain/Step": 14848, "Pretrain/Step Time": 8.489774962887168} +{"Pretrain/Learning Rate": 6.159812921352886e-06, "Pretrain/Loss": 1.9666633605957031, "Pretrain/Loss (Raw)": 1.962097406387329, "Pretrain/Step": 14849, "Pretrain/Step Time": 8.489571649581194} +{"Pretrain/Learning Rate": 6.157022740514107e-06, "Pretrain/Loss": 1.9656341075897217, "Pretrain/Loss (Raw)": 1.9133012294769287, "Pretrain/Step": 14850, "Pretrain/Step Time": 8.490482749417424} +{"Pretrain/Learning Rate": 6.154233102999285e-06, "Pretrain/Loss": 1.9654566049575806, "Pretrain/Loss (Raw)": 2.0803465843200684, "Pretrain/Step": 14851, "Pretrain/Step Time": 8.488545387983322} +{"Pretrain/Learning Rate": 6.1514440088888735e-06, "Pretrain/Loss": 1.9655914306640625, "Pretrain/Loss (Raw)": 2.064084768295288, "Pretrain/Step": 14852, "Pretrain/Step Time": 8.487949673086405} +{"Pretrain/Learning Rate": 6.1486554582632884e-06, "Pretrain/Loss": 1.965139627456665, "Pretrain/Loss (Raw)": 1.9501227140426636, "Pretrain/Step": 14853, "Pretrain/Step Time": 8.48871349915862} +{"Pretrain/Learning Rate": 6.145867451202925e-06, "Pretrain/Loss": 1.966111421585083, "Pretrain/Loss (Raw)": 2.0570428371429443, "Pretrain/Step": 14854, "Pretrain/Step Time": 8.495186759158969} +{"Pretrain/Learning Rate": 6.143079987788191e-06, "Pretrain/Loss": 1.9665703773498535, "Pretrain/Loss (Raw)": 2.063992977142334, "Pretrain/Step": 14855, "Pretrain/Step Time": 8.498861348256469} +{"Pretrain/Learning Rate": 6.140293068099443e-06, "Pretrain/Loss": 1.9687390327453613, "Pretrain/Loss (Raw)": 2.0135936737060547, "Pretrain/Step": 14856, "Pretrain/Step Time": 8.497106175869703} +{"Pretrain/Learning Rate": 6.1375066922170575e-06, "Pretrain/Loss": 1.9705743789672852, "Pretrain/Loss (Raw)": 2.3064048290252686, "Pretrain/Step": 14857, "Pretrain/Step Time": 8.501387497410178} +{"Pretrain/Learning Rate": 6.134720860221371e-06, "Pretrain/Loss": 1.9713971614837646, "Pretrain/Loss (Raw)": 1.9515033960342407, "Pretrain/Step": 14858, "Pretrain/Step Time": 8.499145017936826} +{"Pretrain/Learning Rate": 6.131935572192699e-06, "Pretrain/Loss": 1.973556637763977, "Pretrain/Loss (Raw)": 2.217806339263916, "Pretrain/Step": 14859, "Pretrain/Step Time": 8.496757688000798} +{"Pretrain/Learning Rate": 6.129150828211372e-06, "Pretrain/Loss": 1.973639726638794, "Pretrain/Loss (Raw)": 1.8342257738113403, "Pretrain/Step": 14860, "Pretrain/Step Time": 8.496459230780602} +{"Pretrain/Learning Rate": 6.1263666283576715e-06, "Pretrain/Loss": 1.9731478691101074, "Pretrain/Loss (Raw)": 2.0431995391845703, "Pretrain/Step": 14861, "Pretrain/Step Time": 8.496365536004305} +{"Pretrain/Learning Rate": 6.123582972711891e-06, "Pretrain/Loss": 1.971951961517334, "Pretrain/Loss (Raw)": 2.077235698699951, "Pretrain/Step": 14862, "Pretrain/Step Time": 8.493155788630247} +{"Pretrain/Learning Rate": 6.12079986135429e-06, "Pretrain/Loss": 1.9752116203308105, "Pretrain/Loss (Raw)": 2.0433342456817627, "Pretrain/Step": 14863, "Pretrain/Step Time": 8.495206218212843} +{"Pretrain/Learning Rate": 6.118017294365105e-06, "Pretrain/Loss": 1.9744144678115845, "Pretrain/Loss (Raw)": 1.8084983825683594, "Pretrain/Step": 14864, "Pretrain/Step Time": 8.494433933869004} +{"Pretrain/Learning Rate": 6.11523527182459e-06, "Pretrain/Loss": 1.9740092754364014, "Pretrain/Loss (Raw)": 1.6559431552886963, "Pretrain/Step": 14865, "Pretrain/Step Time": 8.494417889043689} +{"Pretrain/Learning Rate": 6.112453793812947e-06, "Pretrain/Loss": 1.9741687774658203, "Pretrain/Loss (Raw)": 1.9661916494369507, "Pretrain/Step": 14866, "Pretrain/Step Time": 8.49529404938221} +{"Pretrain/Learning Rate": 6.1096728604103895e-06, "Pretrain/Loss": 1.974327564239502, "Pretrain/Loss (Raw)": 1.9997111558914185, "Pretrain/Step": 14867, "Pretrain/Step Time": 8.49258903414011} +{"Pretrain/Learning Rate": 6.106892471697098e-06, "Pretrain/Loss": 1.973815679550171, "Pretrain/Loss (Raw)": 1.8633953332901, "Pretrain/Step": 14868, "Pretrain/Step Time": 8.49426314048469} +{"Pretrain/Learning Rate": 6.104112627753239e-06, "Pretrain/Loss": 1.9787805080413818, "Pretrain/Loss (Raw)": 2.5587215423583984, "Pretrain/Step": 14869, "Pretrain/Step Time": 8.498804351314902} +{"Pretrain/Learning Rate": 6.101333328658976e-06, "Pretrain/Loss": 1.9776819944381714, "Pretrain/Loss (Raw)": 1.9150558710098267, "Pretrain/Step": 14870, "Pretrain/Step Time": 8.49320867471397} +{"Pretrain/Learning Rate": 6.098554574494436e-06, "Pretrain/Loss": 1.9783143997192383, "Pretrain/Loss (Raw)": 2.069669008255005, "Pretrain/Step": 14871, "Pretrain/Step Time": 8.498035734519362} +{"Pretrain/Learning Rate": 6.095776365339758e-06, "Pretrain/Loss": 1.9786858558654785, "Pretrain/Loss (Raw)": 2.076828718185425, "Pretrain/Step": 14872, "Pretrain/Step Time": 8.498495664447546} +{"Pretrain/Learning Rate": 6.092998701275044e-06, "Pretrain/Loss": 1.9789071083068848, "Pretrain/Loss (Raw)": 1.9432095289230347, "Pretrain/Step": 14873, "Pretrain/Step Time": 8.499667186290026} +{"Pretrain/Learning Rate": 6.090221582380376e-06, "Pretrain/Loss": 1.9800708293914795, "Pretrain/Loss (Raw)": 1.8551571369171143, "Pretrain/Step": 14874, "Pretrain/Step Time": 8.498747177422047} +{"Pretrain/Learning Rate": 6.087445008735846e-06, "Pretrain/Loss": 1.9809600114822388, "Pretrain/Loss (Raw)": 2.0614562034606934, "Pretrain/Step": 14875, "Pretrain/Step Time": 8.495806474238634} +{"Pretrain/Learning Rate": 6.0846689804214955e-06, "Pretrain/Loss": 1.9814716577529907, "Pretrain/Loss (Raw)": 2.0571866035461426, "Pretrain/Step": 14876, "Pretrain/Step Time": 8.493240745738149} +{"Pretrain/Learning Rate": 6.081893497517391e-06, "Pretrain/Loss": 1.980250358581543, "Pretrain/Loss (Raw)": 1.96976637840271, "Pretrain/Step": 14877, "Pretrain/Step Time": 8.497205091640353} +{"Pretrain/Learning Rate": 6.07911856010355e-06, "Pretrain/Loss": 1.9811748266220093, "Pretrain/Loss (Raw)": 2.273851156234741, "Pretrain/Step": 14878, "Pretrain/Step Time": 8.496700249612331} +{"Pretrain/Learning Rate": 6.076344168259981e-06, "Pretrain/Loss": 1.980057954788208, "Pretrain/Loss (Raw)": 1.8080244064331055, "Pretrain/Step": 14879, "Pretrain/Step Time": 8.50143028050661} +{"Pretrain/Learning Rate": 6.073570322066693e-06, "Pretrain/Loss": 1.97935152053833, "Pretrain/Loss (Raw)": 1.852936029434204, "Pretrain/Step": 14880, "Pretrain/Step Time": 8.499056672677398} +{"Pretrain/Learning Rate": 6.070797021603658e-06, "Pretrain/Loss": 1.9803738594055176, "Pretrain/Loss (Raw)": 1.8590673208236694, "Pretrain/Step": 14881, "Pretrain/Step Time": 8.498710315674543} +{"Pretrain/Learning Rate": 6.06802426695085e-06, "Pretrain/Loss": 1.9826629161834717, "Pretrain/Loss (Raw)": 2.402155876159668, "Pretrain/Step": 14882, "Pretrain/Step Time": 8.497616928070784} +{"Pretrain/Learning Rate": 6.06525205818822e-06, "Pretrain/Loss": 1.9837160110473633, "Pretrain/Loss (Raw)": 2.1023740768432617, "Pretrain/Step": 14883, "Pretrain/Step Time": 8.499132353812456} +{"Pretrain/Learning Rate": 6.062480395395689e-06, "Pretrain/Loss": 1.9837403297424316, "Pretrain/Loss (Raw)": 2.1314830780029297, "Pretrain/Step": 14884, "Pretrain/Step Time": 8.4999363347888} +{"Pretrain/Learning Rate": 6.059709278653194e-06, "Pretrain/Loss": 1.9835431575775146, "Pretrain/Loss (Raw)": 1.719804286956787, "Pretrain/Step": 14885, "Pretrain/Step Time": 8.49438227340579} +{"Pretrain/Learning Rate": 6.056938708040622e-06, "Pretrain/Loss": 1.9851467609405518, "Pretrain/Loss (Raw)": 2.2463796138763428, "Pretrain/Step": 14886, "Pretrain/Step Time": 8.495012244209647} +{"Pretrain/Learning Rate": 6.0541686836378755e-06, "Pretrain/Loss": 1.9835586547851562, "Pretrain/Loss (Raw)": 1.8929122686386108, "Pretrain/Step": 14887, "Pretrain/Step Time": 8.495110971853137} +{"Pretrain/Learning Rate": 6.051399205524821e-06, "Pretrain/Loss": 1.985865592956543, "Pretrain/Loss (Raw)": 2.159773111343384, "Pretrain/Step": 14888, "Pretrain/Step Time": 8.487937794998288} +{"Pretrain/Learning Rate": 6.048630273781302e-06, "Pretrain/Loss": 1.9875521659851074, "Pretrain/Loss (Raw)": 2.1178066730499268, "Pretrain/Step": 14889, "Pretrain/Step Time": 8.493442172184587} +{"Pretrain/Learning Rate": 6.045861888487181e-06, "Pretrain/Loss": 1.983473300933838, "Pretrain/Loss (Raw)": 1.837453007698059, "Pretrain/Step": 14890, "Pretrain/Step Time": 8.491628460586071} +{"Pretrain/Learning Rate": 6.043094049722261e-06, "Pretrain/Loss": 1.9866011142730713, "Pretrain/Loss (Raw)": 2.2566914558410645, "Pretrain/Step": 14891, "Pretrain/Step Time": 8.49216614663601} +{"Pretrain/Learning Rate": 6.040326757566367e-06, "Pretrain/Loss": 1.9859832525253296, "Pretrain/Loss (Raw)": 1.8860647678375244, "Pretrain/Step": 14892, "Pretrain/Step Time": 8.492053035646677} +{"Pretrain/Learning Rate": 6.037560012099286e-06, "Pretrain/Loss": 1.9874153137207031, "Pretrain/Loss (Raw)": 2.005077838897705, "Pretrain/Step": 14893, "Pretrain/Step Time": 8.486920597031713} +{"Pretrain/Learning Rate": 6.034793813400785e-06, "Pretrain/Loss": 1.9886651039123535, "Pretrain/Loss (Raw)": 2.0424866676330566, "Pretrain/Step": 14894, "Pretrain/Step Time": 8.483008483424783} +{"Pretrain/Learning Rate": 6.032028161550646e-06, "Pretrain/Loss": 1.9893944263458252, "Pretrain/Loss (Raw)": 2.1087334156036377, "Pretrain/Step": 14895, "Pretrain/Step Time": 8.48624506033957} +{"Pretrain/Learning Rate": 6.029263056628592e-06, "Pretrain/Loss": 1.9901893138885498, "Pretrain/Loss (Raw)": 2.151218891143799, "Pretrain/Step": 14896, "Pretrain/Step Time": 8.48247903957963} +{"Pretrain/Learning Rate": 6.026498498714375e-06, "Pretrain/Loss": 1.9909002780914307, "Pretrain/Loss (Raw)": 1.9423922300338745, "Pretrain/Step": 14897, "Pretrain/Step Time": 8.480490701273084} +{"Pretrain/Learning Rate": 6.023734487887697e-06, "Pretrain/Loss": 1.9898579120635986, "Pretrain/Loss (Raw)": 1.923247218132019, "Pretrain/Step": 14898, "Pretrain/Step Time": 8.482553638517857} +{"Pretrain/Learning Rate": 6.02097102422825e-06, "Pretrain/Loss": 1.9913370609283447, "Pretrain/Loss (Raw)": 2.114539861679077, "Pretrain/Step": 14899, "Pretrain/Step Time": 8.479126522317529} +{"Pretrain/Learning Rate": 6.018208107815732e-06, "Pretrain/Loss": 1.9927012920379639, "Pretrain/Loss (Raw)": 2.1554741859436035, "Pretrain/Step": 14900, "Pretrain/Step Time": 8.487565631046891} +{"Pretrain/Learning Rate": 6.015445738729794e-06, "Pretrain/Loss": 1.9934552907943726, "Pretrain/Loss (Raw)": 2.016899585723877, "Pretrain/Step": 14901, "Pretrain/Step Time": 8.48752073571086} +{"Pretrain/Learning Rate": 6.012683917050102e-06, "Pretrain/Loss": 1.9938628673553467, "Pretrain/Loss (Raw)": 1.9643515348434448, "Pretrain/Step": 14902, "Pretrain/Step Time": 8.480455446988344} +{"Pretrain/Learning Rate": 6.009922642856286e-06, "Pretrain/Loss": 1.992366075515747, "Pretrain/Loss (Raw)": 2.017314910888672, "Pretrain/Step": 14903, "Pretrain/Step Time": 8.480804895982146} +{"Pretrain/Learning Rate": 6.0071619162279545e-06, "Pretrain/Loss": 1.9905292987823486, "Pretrain/Loss (Raw)": 1.7329540252685547, "Pretrain/Step": 14904, "Pretrain/Step Time": 8.48505375161767} +{"Pretrain/Learning Rate": 6.004401737244728e-06, "Pretrain/Loss": 1.9942986965179443, "Pretrain/Loss (Raw)": 2.2533111572265625, "Pretrain/Step": 14905, "Pretrain/Step Time": 8.48309801518917} +{"Pretrain/Learning Rate": 6.00164210598618e-06, "Pretrain/Loss": 1.9963656663894653, "Pretrain/Loss (Raw)": 2.2438981533050537, "Pretrain/Step": 14906, "Pretrain/Step Time": 8.47981097921729} +{"Pretrain/Learning Rate": 5.9988830225318925e-06, "Pretrain/Loss": 1.9943492412567139, "Pretrain/Loss (Raw)": 1.7737880945205688, "Pretrain/Step": 14907, "Pretrain/Step Time": 8.480499275028706} +{"Pretrain/Learning Rate": 5.9961244869614215e-06, "Pretrain/Loss": 1.9956653118133545, "Pretrain/Loss (Raw)": 2.030517816543579, "Pretrain/Step": 14908, "Pretrain/Step Time": 8.480024915188551} +{"Pretrain/Learning Rate": 5.993366499354297e-06, "Pretrain/Loss": 1.9944770336151123, "Pretrain/Loss (Raw)": 1.7669109106063843, "Pretrain/Step": 14909, "Pretrain/Step Time": 8.472433615475893} +{"Pretrain/Learning Rate": 5.990609059790056e-06, "Pretrain/Loss": 1.993247389793396, "Pretrain/Loss (Raw)": 1.8193198442459106, "Pretrain/Step": 14910, "Pretrain/Step Time": 8.467504041269422} +{"Pretrain/Learning Rate": 5.987852168348204e-06, "Pretrain/Loss": 1.9933769702911377, "Pretrain/Loss (Raw)": 1.971540093421936, "Pretrain/Step": 14911, "Pretrain/Step Time": 8.467188833281398} +{"Pretrain/Learning Rate": 5.9850958251082306e-06, "Pretrain/Loss": 1.9903137683868408, "Pretrain/Loss (Raw)": 1.980539321899414, "Pretrain/Step": 14912, "Pretrain/Step Time": 8.464000042527914} +{"Pretrain/Learning Rate": 5.982340030149608e-06, "Pretrain/Loss": 1.9948539733886719, "Pretrain/Loss (Raw)": 2.1308953762054443, "Pretrain/Step": 14913, "Pretrain/Step Time": 8.468042775988579} +{"Pretrain/Learning Rate": 5.979584783551811e-06, "Pretrain/Loss": 1.9954164028167725, "Pretrain/Loss (Raw)": 2.2410123348236084, "Pretrain/Step": 14914, "Pretrain/Step Time": 8.465835526585579} +{"Pretrain/Learning Rate": 5.976830085394269e-06, "Pretrain/Loss": 1.9947338104248047, "Pretrain/Loss (Raw)": 1.9669429063796997, "Pretrain/Step": 14915, "Pretrain/Step Time": 8.471296889707446} +{"Pretrain/Learning Rate": 5.9740759357564315e-06, "Pretrain/Loss": 1.9964359998703003, "Pretrain/Loss (Raw)": 2.04775071144104, "Pretrain/Step": 14916, "Pretrain/Step Time": 8.470998890697956} +{"Pretrain/Learning Rate": 5.971322334717702e-06, "Pretrain/Loss": 1.9972264766693115, "Pretrain/Loss (Raw)": 2.1366262435913086, "Pretrain/Step": 14917, "Pretrain/Step Time": 8.473169516772032} +{"Pretrain/Learning Rate": 5.96856928235747e-06, "Pretrain/Loss": 1.99696683883667, "Pretrain/Loss (Raw)": 1.9436924457550049, "Pretrain/Step": 14918, "Pretrain/Step Time": 8.475259330123663} +{"Pretrain/Learning Rate": 5.965816778755132e-06, "Pretrain/Loss": 1.9990030527114868, "Pretrain/Loss (Raw)": 2.4009413719177246, "Pretrain/Step": 14919, "Pretrain/Step Time": 8.474743032827973} +{"Pretrain/Learning Rate": 5.963064823990044e-06, "Pretrain/Loss": 1.9972193241119385, "Pretrain/Loss (Raw)": 1.8912965059280396, "Pretrain/Step": 14920, "Pretrain/Step Time": 8.475543558597565} +{"Pretrain/Learning Rate": 5.960313418141569e-06, "Pretrain/Loss": 2.0000922679901123, "Pretrain/Loss (Raw)": 1.9448869228363037, "Pretrain/Step": 14921, "Pretrain/Step Time": 8.47462822124362} +{"Pretrain/Learning Rate": 5.957562561289034e-06, "Pretrain/Loss": 2.0010204315185547, "Pretrain/Loss (Raw)": 2.074786901473999, "Pretrain/Step": 14922, "Pretrain/Step Time": 8.478315634652972} +{"Pretrain/Learning Rate": 5.9548122535117515e-06, "Pretrain/Loss": 2.000880241394043, "Pretrain/Loss (Raw)": 1.969286561012268, "Pretrain/Step": 14923, "Pretrain/Step Time": 8.480689998716116} +{"Pretrain/Learning Rate": 5.952062494889038e-06, "Pretrain/Loss": 1.9990136623382568, "Pretrain/Loss (Raw)": 1.6568971872329712, "Pretrain/Step": 14924, "Pretrain/Step Time": 8.479852633550763} +{"Pretrain/Learning Rate": 5.9493132855001685e-06, "Pretrain/Loss": 2.0004055500030518, "Pretrain/Loss (Raw)": 2.0942132472991943, "Pretrain/Step": 14925, "Pretrain/Step Time": 8.475065778940916} +{"Pretrain/Learning Rate": 5.946564625424428e-06, "Pretrain/Loss": 2.002815008163452, "Pretrain/Loss (Raw)": 2.1002392768859863, "Pretrain/Step": 14926, "Pretrain/Step Time": 8.474128268659115} +{"Pretrain/Learning Rate": 5.943816514741063e-06, "Pretrain/Loss": 2.005915403366089, "Pretrain/Loss (Raw)": 2.3496499061584473, "Pretrain/Step": 14927, "Pretrain/Step Time": 8.471755953505635} +{"Pretrain/Learning Rate": 5.941068953529308e-06, "Pretrain/Loss": 2.006577491760254, "Pretrain/Loss (Raw)": 2.0678563117980957, "Pretrain/Step": 14928, "Pretrain/Step Time": 8.470181621611118} +{"Pretrain/Learning Rate": 5.938321941868402e-06, "Pretrain/Loss": 2.0062215328216553, "Pretrain/Loss (Raw)": 2.013864040374756, "Pretrain/Step": 14929, "Pretrain/Step Time": 8.473535098135471} +{"Pretrain/Learning Rate": 5.935575479837538e-06, "Pretrain/Loss": 2.0036516189575195, "Pretrain/Loss (Raw)": 1.850838541984558, "Pretrain/Step": 14930, "Pretrain/Step Time": 8.471655240282416} +{"Pretrain/Learning Rate": 5.932829567515924e-06, "Pretrain/Loss": 2.003157615661621, "Pretrain/Loss (Raw)": 2.0056238174438477, "Pretrain/Step": 14931, "Pretrain/Step Time": 8.472196768969297} +{"Pretrain/Learning Rate": 5.930084204982728e-06, "Pretrain/Loss": 2.003748655319214, "Pretrain/Loss (Raw)": 2.0510928630828857, "Pretrain/Step": 14932, "Pretrain/Step Time": 8.471379820257425} +{"Pretrain/Learning Rate": 5.927339392317099e-06, "Pretrain/Loss": 2.002976894378662, "Pretrain/Loss (Raw)": 1.8872159719467163, "Pretrain/Step": 14933, "Pretrain/Step Time": 8.47241054661572} +{"Pretrain/Learning Rate": 5.924595129598204e-06, "Pretrain/Loss": 2.0002355575561523, "Pretrain/Loss (Raw)": 1.8686063289642334, "Pretrain/Step": 14934, "Pretrain/Step Time": 8.46629630215466} +{"Pretrain/Learning Rate": 5.9218514169051554e-06, "Pretrain/Loss": 2.002209424972534, "Pretrain/Loss (Raw)": 1.9955782890319824, "Pretrain/Step": 14935, "Pretrain/Step Time": 8.476554326713085} +{"Pretrain/Learning Rate": 5.919108254317077e-06, "Pretrain/Loss": 2.0034189224243164, "Pretrain/Loss (Raw)": 1.9724358320236206, "Pretrain/Step": 14936, "Pretrain/Step Time": 8.472441853955388} +{"Pretrain/Learning Rate": 5.91636564191306e-06, "Pretrain/Loss": 2.003310203552246, "Pretrain/Loss (Raw)": 1.9242029190063477, "Pretrain/Step": 14937, "Pretrain/Step Time": 8.47289708815515} +{"Pretrain/Learning Rate": 5.913623579772182e-06, "Pretrain/Loss": 2.0052311420440674, "Pretrain/Loss (Raw)": 1.7097063064575195, "Pretrain/Step": 14938, "Pretrain/Step Time": 8.4776615742594} +{"Pretrain/Learning Rate": 5.910882067973519e-06, "Pretrain/Loss": 2.002883195877075, "Pretrain/Loss (Raw)": 1.9662011861801147, "Pretrain/Step": 14939, "Pretrain/Step Time": 8.480279752984643} +{"Pretrain/Learning Rate": 5.908141106596107e-06, "Pretrain/Loss": 2.002201557159424, "Pretrain/Loss (Raw)": 1.9660532474517822, "Pretrain/Step": 14940, "Pretrain/Step Time": 8.475588263943791} +{"Pretrain/Learning Rate": 5.905400695718994e-06, "Pretrain/Loss": 2.003028631210327, "Pretrain/Loss (Raw)": 2.0655527114868164, "Pretrain/Step": 14941, "Pretrain/Step Time": 8.481180157512426} +{"Pretrain/Learning Rate": 5.902660835421192e-06, "Pretrain/Loss": 2.0055179595947266, "Pretrain/Loss (Raw)": 2.445533275604248, "Pretrain/Step": 14942, "Pretrain/Step Time": 8.473964108154178} +{"Pretrain/Learning Rate": 5.8999215257816955e-06, "Pretrain/Loss": 2.0035808086395264, "Pretrain/Loss (Raw)": 1.7957353591918945, "Pretrain/Step": 14943, "Pretrain/Step Time": 8.478345220908523} +{"Pretrain/Learning Rate": 5.897182766879503e-06, "Pretrain/Loss": 2.0033297538757324, "Pretrain/Loss (Raw)": 1.8366694450378418, "Pretrain/Step": 14944, "Pretrain/Step Time": 8.472899524495006} +{"Pretrain/Learning Rate": 5.894444558793574e-06, "Pretrain/Loss": 2.0038928985595703, "Pretrain/Loss (Raw)": 2.2072482109069824, "Pretrain/Step": 14945, "Pretrain/Step Time": 8.474301975220442} +{"Pretrain/Learning Rate": 5.8917069016028725e-06, "Pretrain/Loss": 2.003782272338867, "Pretrain/Loss (Raw)": 1.9198766946792603, "Pretrain/Step": 14946, "Pretrain/Step Time": 8.473446832969785} +{"Pretrain/Learning Rate": 5.888969795386331e-06, "Pretrain/Loss": 2.0009968280792236, "Pretrain/Loss (Raw)": 2.230844736099243, "Pretrain/Step": 14947, "Pretrain/Step Time": 8.47095474973321} +{"Pretrain/Learning Rate": 5.886233240222869e-06, "Pretrain/Loss": 2.0031118392944336, "Pretrain/Loss (Raw)": 2.1485555171966553, "Pretrain/Step": 14948, "Pretrain/Step Time": 8.474279288202524} +{"Pretrain/Learning Rate": 5.883497236191404e-06, "Pretrain/Loss": 2.0039968490600586, "Pretrain/Loss (Raw)": 2.0478739738464355, "Pretrain/Step": 14949, "Pretrain/Step Time": 8.47525922395289} +{"Pretrain/Learning Rate": 5.880761783370811e-06, "Pretrain/Loss": 2.004652500152588, "Pretrain/Loss (Raw)": 2.002887010574341, "Pretrain/Step": 14950, "Pretrain/Step Time": 8.472345519810915} +{"Pretrain/Learning Rate": 5.878026881839982e-06, "Pretrain/Loss": 2.0032496452331543, "Pretrain/Loss (Raw)": 1.7933539152145386, "Pretrain/Step": 14951, "Pretrain/Step Time": 8.469623755663633} +{"Pretrain/Learning Rate": 5.875292531677767e-06, "Pretrain/Loss": 2.0069339275360107, "Pretrain/Loss (Raw)": 2.1283814907073975, "Pretrain/Step": 14952, "Pretrain/Step Time": 8.472802586853504} +{"Pretrain/Learning Rate": 5.872558732963005e-06, "Pretrain/Loss": 2.00661563873291, "Pretrain/Loss (Raw)": 1.9374340772628784, "Pretrain/Step": 14953, "Pretrain/Step Time": 8.477579722180963} +{"Pretrain/Learning Rate": 5.869825485774533e-06, "Pretrain/Loss": 2.0056674480438232, "Pretrain/Loss (Raw)": 1.9166646003723145, "Pretrain/Step": 14954, "Pretrain/Step Time": 8.471582924947143} +{"Pretrain/Learning Rate": 5.867092790191148e-06, "Pretrain/Loss": 2.010607957839966, "Pretrain/Loss (Raw)": 2.5128333568573, "Pretrain/Step": 14955, "Pretrain/Step Time": 8.469366282224655} +{"Pretrain/Learning Rate": 5.864360646291664e-06, "Pretrain/Loss": 2.0084218978881836, "Pretrain/Loss (Raw)": 1.676584005355835, "Pretrain/Step": 14956, "Pretrain/Step Time": 8.470515659078956} +{"Pretrain/Learning Rate": 5.861629054154852e-06, "Pretrain/Loss": 2.0070691108703613, "Pretrain/Loss (Raw)": 1.7839030027389526, "Pretrain/Step": 14957, "Pretrain/Step Time": 8.469161316752434} +{"Pretrain/Learning Rate": 5.858898013859468e-06, "Pretrain/Loss": 2.010193347930908, "Pretrain/Loss (Raw)": 2.045363426208496, "Pretrain/Step": 14958, "Pretrain/Step Time": 8.46714043803513} +{"Pretrain/Learning Rate": 5.856167525484271e-06, "Pretrain/Loss": 2.0069668292999268, "Pretrain/Loss (Raw)": 1.842063546180725, "Pretrain/Step": 14959, "Pretrain/Step Time": 8.463324511423707} +{"Pretrain/Learning Rate": 5.853437589107983e-06, "Pretrain/Loss": 2.011471748352051, "Pretrain/Loss (Raw)": 2.4828362464904785, "Pretrain/Step": 14960, "Pretrain/Step Time": 8.466668019071221} +{"Pretrain/Learning Rate": 5.85070820480933e-06, "Pretrain/Loss": 2.011716842651367, "Pretrain/Loss (Raw)": 2.0794639587402344, "Pretrain/Step": 14961, "Pretrain/Step Time": 8.466458778828382} +{"Pretrain/Learning Rate": 5.847979372667006e-06, "Pretrain/Loss": 2.010671615600586, "Pretrain/Loss (Raw)": 1.896942377090454, "Pretrain/Step": 14962, "Pretrain/Step Time": 8.465274455025792} +{"Pretrain/Learning Rate": 5.8452510927596875e-06, "Pretrain/Loss": 2.009916067123413, "Pretrain/Loss (Raw)": 1.8232734203338623, "Pretrain/Step": 14963, "Pretrain/Step Time": 8.461958225816488} +{"Pretrain/Learning Rate": 5.842523365166061e-06, "Pretrain/Loss": 2.010063409805298, "Pretrain/Loss (Raw)": 1.9677414894104004, "Pretrain/Step": 14964, "Pretrain/Step Time": 8.460365599021316} +{"Pretrain/Learning Rate": 5.839796189964758e-06, "Pretrain/Loss": 2.0094540119171143, "Pretrain/Loss (Raw)": 1.9878429174423218, "Pretrain/Step": 14965, "Pretrain/Step Time": 8.462008398026228} +{"Pretrain/Learning Rate": 5.837069567234435e-06, "Pretrain/Loss": 2.013277769088745, "Pretrain/Loss (Raw)": 2.1329588890075684, "Pretrain/Step": 14966, "Pretrain/Step Time": 8.463705785572529} +{"Pretrain/Learning Rate": 5.834343497053702e-06, "Pretrain/Loss": 2.0140626430511475, "Pretrain/Loss (Raw)": 1.992621898651123, "Pretrain/Step": 14967, "Pretrain/Step Time": 8.463944092392921} +{"Pretrain/Learning Rate": 5.8316179795011524e-06, "Pretrain/Loss": 2.0155255794525146, "Pretrain/Loss (Raw)": 2.0417587757110596, "Pretrain/Step": 14968, "Pretrain/Step Time": 8.459324143826962} +{"Pretrain/Learning Rate": 5.828893014655396e-06, "Pretrain/Loss": 2.0117335319519043, "Pretrain/Loss (Raw)": 1.5302249193191528, "Pretrain/Step": 14969, "Pretrain/Step Time": 8.472205147147179} +{"Pretrain/Learning Rate": 5.826168602594986e-06, "Pretrain/Loss": 2.015167236328125, "Pretrain/Loss (Raw)": 1.9601985216140747, "Pretrain/Step": 14970, "Pretrain/Step Time": 8.471752529963851} +{"Pretrain/Learning Rate": 5.823444743398495e-06, "Pretrain/Loss": 2.0152699947357178, "Pretrain/Loss (Raw)": 2.0118558406829834, "Pretrain/Step": 14971, "Pretrain/Step Time": 8.476899152621627} +{"Pretrain/Learning Rate": 5.820721437144458e-06, "Pretrain/Loss": 2.0157647132873535, "Pretrain/Loss (Raw)": 2.2169110774993896, "Pretrain/Step": 14972, "Pretrain/Step Time": 8.477446047589183} +{"Pretrain/Learning Rate": 5.817998683911388e-06, "Pretrain/Loss": 2.0150485038757324, "Pretrain/Loss (Raw)": 2.0574710369110107, "Pretrain/Step": 14973, "Pretrain/Step Time": 8.478153327479959} +{"Pretrain/Learning Rate": 5.815276483777812e-06, "Pretrain/Loss": 2.013607978820801, "Pretrain/Loss (Raw)": 1.9222309589385986, "Pretrain/Step": 14974, "Pretrain/Step Time": 8.476551232859492} +{"Pretrain/Learning Rate": 5.812554836822209e-06, "Pretrain/Loss": 2.013645648956299, "Pretrain/Loss (Raw)": 2.017256736755371, "Pretrain/Step": 14975, "Pretrain/Step Time": 8.473596567288041} +{"Pretrain/Learning Rate": 5.809833743123066e-06, "Pretrain/Loss": 2.0126709938049316, "Pretrain/Loss (Raw)": 1.9941822290420532, "Pretrain/Step": 14976, "Pretrain/Step Time": 8.472376680001616} +{"Pretrain/Learning Rate": 5.8071132027588374e-06, "Pretrain/Loss": 2.0119805335998535, "Pretrain/Loss (Raw)": 1.8736761808395386, "Pretrain/Step": 14977, "Pretrain/Step Time": 8.471584301441908} +{"Pretrain/Learning Rate": 5.804393215807966e-06, "Pretrain/Loss": 2.0133323669433594, "Pretrain/Loss (Raw)": 2.086366891860962, "Pretrain/Step": 14978, "Pretrain/Step Time": 8.468227760866284} +{"Pretrain/Learning Rate": 5.801673782348888e-06, "Pretrain/Loss": 2.0141000747680664, "Pretrain/Loss (Raw)": 2.1786015033721924, "Pretrain/Step": 14979, "Pretrain/Step Time": 8.47014743834734} +{"Pretrain/Learning Rate": 5.7989549024600075e-06, "Pretrain/Loss": 2.01524019241333, "Pretrain/Loss (Raw)": 2.2100236415863037, "Pretrain/Step": 14980, "Pretrain/Step Time": 8.46556731313467} +{"Pretrain/Learning Rate": 5.796236576219732e-06, "Pretrain/Loss": 2.0169215202331543, "Pretrain/Loss (Raw)": 2.165363311767578, "Pretrain/Step": 14981, "Pretrain/Step Time": 8.473216386511922} +{"Pretrain/Learning Rate": 5.7935188037064325e-06, "Pretrain/Loss": 2.016645669937134, "Pretrain/Loss (Raw)": 2.0217034816741943, "Pretrain/Step": 14982, "Pretrain/Step Time": 8.469886034727097} +{"Pretrain/Learning Rate": 5.7908015849984845e-06, "Pretrain/Loss": 2.016303062438965, "Pretrain/Loss (Raw)": 2.020136833190918, "Pretrain/Step": 14983, "Pretrain/Step Time": 8.466629102826118} +{"Pretrain/Learning Rate": 5.7880849201742305e-06, "Pretrain/Loss": 2.0149121284484863, "Pretrain/Loss (Raw)": 1.8355575799942017, "Pretrain/Step": 14984, "Pretrain/Step Time": 8.46854156628251} +{"Pretrain/Learning Rate": 5.785368809311997e-06, "Pretrain/Loss": 2.0125412940979004, "Pretrain/Loss (Raw)": 2.002958059310913, "Pretrain/Step": 14985, "Pretrain/Step Time": 8.46811537258327} +{"Pretrain/Learning Rate": 5.782653252490117e-06, "Pretrain/Loss": 2.0127716064453125, "Pretrain/Loss (Raw)": 1.9809640645980835, "Pretrain/Step": 14986, "Pretrain/Step Time": 8.471374530345201} +{"Pretrain/Learning Rate": 5.779938249786876e-06, "Pretrain/Loss": 2.011505365371704, "Pretrain/Loss (Raw)": 2.0557339191436768, "Pretrain/Step": 14987, "Pretrain/Step Time": 8.472265439108014} +{"Pretrain/Learning Rate": 5.777223801280571e-06, "Pretrain/Loss": 2.0125598907470703, "Pretrain/Loss (Raw)": 1.9692051410675049, "Pretrain/Step": 14988, "Pretrain/Step Time": 8.469241343438625} +{"Pretrain/Learning Rate": 5.774509907049469e-06, "Pretrain/Loss": 2.009706735610962, "Pretrain/Loss (Raw)": 1.6779805421829224, "Pretrain/Step": 14989, "Pretrain/Step Time": 8.47198154591024} +{"Pretrain/Learning Rate": 5.771796567171814e-06, "Pretrain/Loss": 2.008423328399658, "Pretrain/Loss (Raw)": 1.9129550457000732, "Pretrain/Step": 14990, "Pretrain/Step Time": 8.471844708546996} +{"Pretrain/Learning Rate": 5.769083781725854e-06, "Pretrain/Loss": 2.0082316398620605, "Pretrain/Loss (Raw)": 2.0188190937042236, "Pretrain/Step": 14991, "Pretrain/Step Time": 8.4722082298249} +{"Pretrain/Learning Rate": 5.7663715507898005e-06, "Pretrain/Loss": 2.0106894969940186, "Pretrain/Loss (Raw)": 2.1231114864349365, "Pretrain/Step": 14992, "Pretrain/Step Time": 8.467831026762724} +{"Pretrain/Learning Rate": 5.763659874441874e-06, "Pretrain/Loss": 2.0124499797821045, "Pretrain/Loss (Raw)": 1.8812675476074219, "Pretrain/Step": 14993, "Pretrain/Step Time": 8.471087476238608} +{"Pretrain/Learning Rate": 5.760948752760254e-06, "Pretrain/Loss": 2.011167049407959, "Pretrain/Loss (Raw)": 1.8019973039627075, "Pretrain/Step": 14994, "Pretrain/Step Time": 8.470691338181496} +{"Pretrain/Learning Rate": 5.758238185823112e-06, "Pretrain/Loss": 2.010575532913208, "Pretrain/Loss (Raw)": 1.9239784479141235, "Pretrain/Step": 14995, "Pretrain/Step Time": 8.472523653879762} +{"Pretrain/Learning Rate": 5.755528173708607e-06, "Pretrain/Loss": 2.010054111480713, "Pretrain/Loss (Raw)": 1.7966341972351074, "Pretrain/Step": 14996, "Pretrain/Step Time": 8.475968500599265} +{"Pretrain/Learning Rate": 5.752818716494873e-06, "Pretrain/Loss": 2.0061724185943604, "Pretrain/Loss (Raw)": 2.061882495880127, "Pretrain/Step": 14997, "Pretrain/Step Time": 8.471784414723516} +{"Pretrain/Learning Rate": 5.7501098142600514e-06, "Pretrain/Loss": 2.009845733642578, "Pretrain/Loss (Raw)": 2.385240316390991, "Pretrain/Step": 14998, "Pretrain/Step Time": 8.477892324328423} +{"Pretrain/Learning Rate": 5.7474014670822365e-06, "Pretrain/Loss": 2.0096254348754883, "Pretrain/Loss (Raw)": 2.041471004486084, "Pretrain/Step": 14999, "Pretrain/Step Time": 8.479362294077873} +{"Pretrain/Learning Rate": 5.744693675039536e-06, "Pretrain/Loss": 2.009040355682373, "Pretrain/Loss (Raw)": 2.0019690990448, "Pretrain/Step": 15000, "Pretrain/Step Time": 8.477536017075181} +{"Pretrain/Learning Rate": 5.741986438210017e-06, "Pretrain/Loss": 2.009990930557251, "Pretrain/Loss (Raw)": 2.064866781234741, "Pretrain/Step": 15001, "Pretrain/Step Time": 9.520096836611629} +{"Pretrain/Learning Rate": 5.7392797566717396e-06, "Pretrain/Loss": 2.01295804977417, "Pretrain/Loss (Raw)": 2.234926700592041, "Pretrain/Step": 15002, "Pretrain/Step Time": 9.525117477402091} +{"Pretrain/Learning Rate": 5.736573630502756e-06, "Pretrain/Loss": 2.011986255645752, "Pretrain/Loss (Raw)": 1.937096357345581, "Pretrain/Step": 15003, "Pretrain/Step Time": 9.528366081416607} +{"Pretrain/Learning Rate": 5.733868059781086e-06, "Pretrain/Loss": 2.010637044906616, "Pretrain/Loss (Raw)": 1.8844565153121948, "Pretrain/Step": 15004, "Pretrain/Step Time": 9.525785900652409} +{"Pretrain/Learning Rate": 5.731163044584756e-06, "Pretrain/Loss": 2.010291576385498, "Pretrain/Loss (Raw)": 1.9255282878875732, "Pretrain/Step": 15005, "Pretrain/Step Time": 9.523766852915287} +{"Pretrain/Learning Rate": 5.728458584991755e-06, "Pretrain/Loss": 2.0089077949523926, "Pretrain/Loss (Raw)": 2.0967776775360107, "Pretrain/Step": 15006, "Pretrain/Step Time": 9.527796491980553} +{"Pretrain/Learning Rate": 5.725754681080059e-06, "Pretrain/Loss": 2.0092062950134277, "Pretrain/Loss (Raw)": 1.8462191820144653, "Pretrain/Step": 15007, "Pretrain/Step Time": 9.521468218415976} +{"Pretrain/Learning Rate": 5.7230513329276454e-06, "Pretrain/Loss": 2.0110244750976562, "Pretrain/Loss (Raw)": 2.0856595039367676, "Pretrain/Step": 15008, "Pretrain/Step Time": 9.51985471881926} +{"Pretrain/Learning Rate": 5.720348540612453e-06, "Pretrain/Loss": 2.011486530303955, "Pretrain/Loss (Raw)": 1.9181917905807495, "Pretrain/Step": 15009, "Pretrain/Step Time": 9.518236104398966} +{"Pretrain/Learning Rate": 5.7176463042124235e-06, "Pretrain/Loss": 2.0086634159088135, "Pretrain/Loss (Raw)": 2.0408194065093994, "Pretrain/Step": 15010, "Pretrain/Step Time": 9.519331689924002} +{"Pretrain/Learning Rate": 5.714944623805468e-06, "Pretrain/Loss": 2.0096383094787598, "Pretrain/Loss (Raw)": 2.227139472961426, "Pretrain/Step": 15011, "Pretrain/Step Time": 9.517799386754632} +{"Pretrain/Learning Rate": 5.7122434994694854e-06, "Pretrain/Loss": 2.0093564987182617, "Pretrain/Loss (Raw)": 2.09541392326355, "Pretrain/Step": 15012, "Pretrain/Step Time": 9.513183573260903} +{"Pretrain/Learning Rate": 5.709542931282372e-06, "Pretrain/Loss": 2.01078200340271, "Pretrain/Loss (Raw)": 1.9022786617279053, "Pretrain/Step": 15013, "Pretrain/Step Time": 9.515149058774114} +{"Pretrain/Learning Rate": 5.706842919321981e-06, "Pretrain/Loss": 2.0095150470733643, "Pretrain/Loss (Raw)": 2.084219217300415, "Pretrain/Step": 15014, "Pretrain/Step Time": 9.516613364219666} +{"Pretrain/Learning Rate": 5.704143463666179e-06, "Pretrain/Loss": 2.0107264518737793, "Pretrain/Loss (Raw)": 2.0479774475097656, "Pretrain/Step": 15015, "Pretrain/Step Time": 9.518186109140515} +{"Pretrain/Learning Rate": 5.701444564392799e-06, "Pretrain/Loss": 2.0099236965179443, "Pretrain/Loss (Raw)": 2.057029962539673, "Pretrain/Step": 15016, "Pretrain/Step Time": 9.523160576820374} +{"Pretrain/Learning Rate": 5.6987462215796535e-06, "Pretrain/Loss": 2.0102851390838623, "Pretrain/Loss (Raw)": 2.1640567779541016, "Pretrain/Step": 15017, "Pretrain/Step Time": 9.51993502303958} +{"Pretrain/Learning Rate": 5.696048435304563e-06, "Pretrain/Loss": 2.0099432468414307, "Pretrain/Loss (Raw)": 1.7936770915985107, "Pretrain/Step": 15018, "Pretrain/Step Time": 9.519714897498488} +{"Pretrain/Learning Rate": 5.693351205645297e-06, "Pretrain/Loss": 2.0091910362243652, "Pretrain/Loss (Raw)": 2.160416841506958, "Pretrain/Step": 15019, "Pretrain/Step Time": 9.52366709895432} +{"Pretrain/Learning Rate": 5.6906545326796485e-06, "Pretrain/Loss": 2.010350227355957, "Pretrain/Loss (Raw)": 2.034456491470337, "Pretrain/Step": 15020, "Pretrain/Step Time": 9.525830905884504} +{"Pretrain/Learning Rate": 5.687958416485361e-06, "Pretrain/Loss": 2.0109763145446777, "Pretrain/Loss (Raw)": 2.085190534591675, "Pretrain/Step": 15021, "Pretrain/Step Time": 9.52519134990871} +{"Pretrain/Learning Rate": 5.685262857140175e-06, "Pretrain/Loss": 2.0096378326416016, "Pretrain/Loss (Raw)": 1.8711882829666138, "Pretrain/Step": 15022, "Pretrain/Step Time": 9.52718405239284} +{"Pretrain/Learning Rate": 5.682567854721824e-06, "Pretrain/Loss": 2.008563280105591, "Pretrain/Loss (Raw)": 1.971181035041809, "Pretrain/Step": 15023, "Pretrain/Step Time": 9.52941682189703} +{"Pretrain/Learning Rate": 5.679873409308003e-06, "Pretrain/Loss": 2.007288932800293, "Pretrain/Loss (Raw)": 1.9881209135055542, "Pretrain/Step": 15024, "Pretrain/Step Time": 9.531088285148144} +{"Pretrain/Learning Rate": 5.677179520976422e-06, "Pretrain/Loss": 2.0053505897521973, "Pretrain/Loss (Raw)": 1.6942741870880127, "Pretrain/Step": 15025, "Pretrain/Step Time": 9.532371940091252} +{"Pretrain/Learning Rate": 5.674486189804748e-06, "Pretrain/Loss": 2.0050575733184814, "Pretrain/Loss (Raw)": 1.885727047920227, "Pretrain/Step": 15026, "Pretrain/Step Time": 9.529704773798585} +{"Pretrain/Learning Rate": 5.671793415870633e-06, "Pretrain/Loss": 2.003866672515869, "Pretrain/Loss (Raw)": 1.9621117115020752, "Pretrain/Step": 15027, "Pretrain/Step Time": 9.53531870432198} +{"Pretrain/Learning Rate": 5.669101199251733e-06, "Pretrain/Loss": 2.0051188468933105, "Pretrain/Loss (Raw)": 2.3157448768615723, "Pretrain/Step": 15028, "Pretrain/Step Time": 9.52765391767025} +{"Pretrain/Learning Rate": 5.666409540025672e-06, "Pretrain/Loss": 2.002631902694702, "Pretrain/Loss (Raw)": 1.6985745429992676, "Pretrain/Step": 15029, "Pretrain/Step Time": 9.526049751788378} +{"Pretrain/Learning Rate": 5.663718438270066e-06, "Pretrain/Loss": 2.002974271774292, "Pretrain/Loss (Raw)": 2.008181571960449, "Pretrain/Step": 15030, "Pretrain/Step Time": 9.526049140840769} +{"Pretrain/Learning Rate": 5.661027894062507e-06, "Pretrain/Loss": 2.001610279083252, "Pretrain/Loss (Raw)": 1.8427391052246094, "Pretrain/Step": 15031, "Pretrain/Step Time": 9.531502006575465} +{"Pretrain/Learning Rate": 5.6583379074805685e-06, "Pretrain/Loss": 2.0039796829223633, "Pretrain/Loss (Raw)": 2.0362133979797363, "Pretrain/Step": 15032, "Pretrain/Step Time": 9.528216369450092} +{"Pretrain/Learning Rate": 5.65564847860183e-06, "Pretrain/Loss": 2.002509117126465, "Pretrain/Loss (Raw)": 2.0650827884674072, "Pretrain/Step": 15033, "Pretrain/Step Time": 9.53139384649694} +{"Pretrain/Learning Rate": 5.652959607503822e-06, "Pretrain/Loss": 2.0005674362182617, "Pretrain/Loss (Raw)": 1.9953577518463135, "Pretrain/Step": 15034, "Pretrain/Step Time": 9.530160004273057} +{"Pretrain/Learning Rate": 5.650271294264095e-06, "Pretrain/Loss": 2.00323486328125, "Pretrain/Loss (Raw)": 2.1152074337005615, "Pretrain/Step": 15035, "Pretrain/Step Time": 9.527928026393056} +{"Pretrain/Learning Rate": 5.647583538960153e-06, "Pretrain/Loss": 2.0027711391448975, "Pretrain/Loss (Raw)": 1.9711735248565674, "Pretrain/Step": 15036, "Pretrain/Step Time": 9.52606645040214} +{"Pretrain/Learning Rate": 5.644896341669489e-06, "Pretrain/Loss": 2.006347417831421, "Pretrain/Loss (Raw)": 2.224675416946411, "Pretrain/Step": 15037, "Pretrain/Step Time": 9.531464217230678} +{"Pretrain/Learning Rate": 5.642209702469603e-06, "Pretrain/Loss": 2.007373332977295, "Pretrain/Loss (Raw)": 1.9506040811538696, "Pretrain/Step": 15038, "Pretrain/Step Time": 9.529527690261602} +{"Pretrain/Learning Rate": 5.639523621437945e-06, "Pretrain/Loss": 2.0085740089416504, "Pretrain/Loss (Raw)": 2.125274658203125, "Pretrain/Step": 15039, "Pretrain/Step Time": 9.52777167968452} +{"Pretrain/Learning Rate": 5.636838098651984e-06, "Pretrain/Loss": 2.0074288845062256, "Pretrain/Loss (Raw)": 1.8339505195617676, "Pretrain/Step": 15040, "Pretrain/Step Time": 9.526879526674747} +{"Pretrain/Learning Rate": 5.634153134189143e-06, "Pretrain/Loss": 2.008514642715454, "Pretrain/Loss (Raw)": 2.2698774337768555, "Pretrain/Step": 15041, "Pretrain/Step Time": 9.520889297127724} +{"Pretrain/Learning Rate": 5.631468728126843e-06, "Pretrain/Loss": 2.0071282386779785, "Pretrain/Loss (Raw)": 2.0635311603546143, "Pretrain/Step": 15042, "Pretrain/Step Time": 9.522149674594402} +{"Pretrain/Learning Rate": 5.6287848805424895e-06, "Pretrain/Loss": 2.0062851905822754, "Pretrain/Loss (Raw)": 1.859074592590332, "Pretrain/Step": 15043, "Pretrain/Step Time": 9.517025904729962} +{"Pretrain/Learning Rate": 5.626101591513466e-06, "Pretrain/Loss": 2.004061460494995, "Pretrain/Loss (Raw)": 1.7630802392959595, "Pretrain/Step": 15044, "Pretrain/Step Time": 9.516148874536157} +{"Pretrain/Learning Rate": 5.62341886111715e-06, "Pretrain/Loss": 2.0023441314697266, "Pretrain/Loss (Raw)": 1.9168412685394287, "Pretrain/Step": 15045, "Pretrain/Step Time": 9.517342157661915} +{"Pretrain/Learning Rate": 5.620736689430891e-06, "Pretrain/Loss": 2.002560615539551, "Pretrain/Loss (Raw)": 1.9713667631149292, "Pretrain/Step": 15046, "Pretrain/Step Time": 9.514742972329259} +{"Pretrain/Learning Rate": 5.618055076532022e-06, "Pretrain/Loss": 2.0015106201171875, "Pretrain/Loss (Raw)": 2.266535758972168, "Pretrain/Step": 15047, "Pretrain/Step Time": 9.513522641733289} +{"Pretrain/Learning Rate": 5.61537402249788e-06, "Pretrain/Loss": 2.0053625106811523, "Pretrain/Loss (Raw)": 2.384340524673462, "Pretrain/Step": 15048, "Pretrain/Step Time": 9.522750215604901} +{"Pretrain/Learning Rate": 5.612693527405755e-06, "Pretrain/Loss": 2.005525588989258, "Pretrain/Loss (Raw)": 1.9657644033432007, "Pretrain/Step": 15049, "Pretrain/Step Time": 9.525113517418504} +{"Pretrain/Learning Rate": 5.6100135913329495e-06, "Pretrain/Loss": 2.0051395893096924, "Pretrain/Loss (Raw)": 2.025386333465576, "Pretrain/Step": 15050, "Pretrain/Step Time": 9.522475123405457} +{"Pretrain/Learning Rate": 5.607334214356727e-06, "Pretrain/Loss": 2.0052895545959473, "Pretrain/Loss (Raw)": 1.988471508026123, "Pretrain/Step": 15051, "Pretrain/Step Time": 9.520830120891333} +{"Pretrain/Learning Rate": 5.604655396554359e-06, "Pretrain/Loss": 2.008863925933838, "Pretrain/Loss (Raw)": 2.114424705505371, "Pretrain/Step": 15052, "Pretrain/Step Time": 9.527416940778494} +{"Pretrain/Learning Rate": 5.601977138003081e-06, "Pretrain/Loss": 2.0072879791259766, "Pretrain/Loss (Raw)": 1.8925144672393799, "Pretrain/Step": 15053, "Pretrain/Step Time": 9.530655136331916} +{"Pretrain/Learning Rate": 5.599299438780109e-06, "Pretrain/Loss": 2.0059685707092285, "Pretrain/Loss (Raw)": 1.931334376335144, "Pretrain/Step": 15054, "Pretrain/Step Time": 9.5294917114079} +{"Pretrain/Learning Rate": 5.59662229896267e-06, "Pretrain/Loss": 2.0032286643981934, "Pretrain/Loss (Raw)": 1.9989447593688965, "Pretrain/Step": 15055, "Pretrain/Step Time": 9.52962726354599} +{"Pretrain/Learning Rate": 5.593945718627941e-06, "Pretrain/Loss": 2.0033631324768066, "Pretrain/Loss (Raw)": 2.0850751399993896, "Pretrain/Step": 15056, "Pretrain/Step Time": 9.527632733806968} +{"Pretrain/Learning Rate": 5.591269697853113e-06, "Pretrain/Loss": 2.0039145946502686, "Pretrain/Loss (Raw)": 2.084437131881714, "Pretrain/Step": 15057, "Pretrain/Step Time": 9.525432685390115} +{"Pretrain/Learning Rate": 5.588594236715341e-06, "Pretrain/Loss": 2.003871202468872, "Pretrain/Loss (Raw)": 1.8452885150909424, "Pretrain/Step": 15058, "Pretrain/Step Time": 9.523322839289904} +{"Pretrain/Learning Rate": 5.585919335291762e-06, "Pretrain/Loss": 2.0030252933502197, "Pretrain/Loss (Raw)": 1.8973631858825684, "Pretrain/Step": 15059, "Pretrain/Step Time": 9.52442024834454} +{"Pretrain/Learning Rate": 5.583244993659523e-06, "Pretrain/Loss": 1.9938557147979736, "Pretrain/Loss (Raw)": 0.8773626685142517, "Pretrain/Step": 15060, "Pretrain/Step Time": 9.520923301577568} +{"Pretrain/Learning Rate": 5.580571211895716e-06, "Pretrain/Loss": 1.9944744110107422, "Pretrain/Loss (Raw)": 1.9664331674575806, "Pretrain/Step": 15061, "Pretrain/Step Time": 9.520029282197356} +{"Pretrain/Learning Rate": 5.577897990077458e-06, "Pretrain/Loss": 1.9953774213790894, "Pretrain/Loss (Raw)": 1.984168291091919, "Pretrain/Step": 15062, "Pretrain/Step Time": 9.523519963026047} +{"Pretrain/Learning Rate": 5.575225328281819e-06, "Pretrain/Loss": 1.9968934059143066, "Pretrain/Loss (Raw)": 2.1896371841430664, "Pretrain/Step": 15063, "Pretrain/Step Time": 9.515099016949534} +{"Pretrain/Learning Rate": 5.572553226585856e-06, "Pretrain/Loss": 1.9978885650634766, "Pretrain/Loss (Raw)": 2.0998008251190186, "Pretrain/Step": 15064, "Pretrain/Step Time": 9.516755666583776} +{"Pretrain/Learning Rate": 5.569881685066633e-06, "Pretrain/Loss": 1.9989289045333862, "Pretrain/Loss (Raw)": 2.057382583618164, "Pretrain/Step": 15065, "Pretrain/Step Time": 9.521903334185481} +{"Pretrain/Learning Rate": 5.567210703801168e-06, "Pretrain/Loss": 2.0002970695495605, "Pretrain/Loss (Raw)": 1.8848364353179932, "Pretrain/Step": 15066, "Pretrain/Step Time": 9.520575638860464} +{"Pretrain/Learning Rate": 5.56454028286649e-06, "Pretrain/Loss": 2.000694513320923, "Pretrain/Loss (Raw)": 2.017066240310669, "Pretrain/Step": 15067, "Pretrain/Step Time": 9.521898491308093} +{"Pretrain/Learning Rate": 5.5618704223395905e-06, "Pretrain/Loss": 2.002004861831665, "Pretrain/Loss (Raw)": 2.1337647438049316, "Pretrain/Step": 15068, "Pretrain/Step Time": 9.522912761196494} +{"Pretrain/Learning Rate": 5.55920112229745e-06, "Pretrain/Loss": 2.002548933029175, "Pretrain/Loss (Raw)": 2.1352078914642334, "Pretrain/Step": 15069, "Pretrain/Step Time": 9.518992096185684} +{"Pretrain/Learning Rate": 5.5565323828170455e-06, "Pretrain/Loss": 1.9996509552001953, "Pretrain/Loss (Raw)": 2.074580669403076, "Pretrain/Step": 15070, "Pretrain/Step Time": 9.519144918769598} +{"Pretrain/Learning Rate": 5.5538642039753145e-06, "Pretrain/Loss": 2.0010621547698975, "Pretrain/Loss (Raw)": 1.9763879776000977, "Pretrain/Step": 15071, "Pretrain/Step Time": 9.51509640365839} +{"Pretrain/Learning Rate": 5.551196585849211e-06, "Pretrain/Loss": 2.0030558109283447, "Pretrain/Loss (Raw)": 2.0918378829956055, "Pretrain/Step": 15072, "Pretrain/Step Time": 9.51326153986156} +{"Pretrain/Learning Rate": 5.548529528515642e-06, "Pretrain/Loss": 2.002443313598633, "Pretrain/Loss (Raw)": 2.1288657188415527, "Pretrain/Step": 15073, "Pretrain/Step Time": 9.512084882706404} +{"Pretrain/Learning Rate": 5.545863032051504e-06, "Pretrain/Loss": 2.002723217010498, "Pretrain/Loss (Raw)": 1.9557002782821655, "Pretrain/Step": 15074, "Pretrain/Step Time": 9.515318792313337} +{"Pretrain/Learning Rate": 5.543197096533698e-06, "Pretrain/Loss": 1.999518871307373, "Pretrain/Loss (Raw)": 1.8206884860992432, "Pretrain/Step": 15075, "Pretrain/Step Time": 9.515097109600902} +{"Pretrain/Learning Rate": 5.54053172203908e-06, "Pretrain/Loss": 1.9983186721801758, "Pretrain/Loss (Raw)": 1.994895577430725, "Pretrain/Step": 15076, "Pretrain/Step Time": 9.512732377275825} +{"Pretrain/Learning Rate": 5.537866908644521e-06, "Pretrain/Loss": 1.9979544878005981, "Pretrain/Loss (Raw)": 2.0012834072113037, "Pretrain/Step": 15077, "Pretrain/Step Time": 9.507719745859504} +{"Pretrain/Learning Rate": 5.53520265642685e-06, "Pretrain/Loss": 1.9984253644943237, "Pretrain/Loss (Raw)": 2.0631587505340576, "Pretrain/Step": 15078, "Pretrain/Step Time": 9.508533680811524} +{"Pretrain/Learning Rate": 5.5325389654628855e-06, "Pretrain/Loss": 1.9985203742980957, "Pretrain/Loss (Raw)": 1.8055310249328613, "Pretrain/Step": 15079, "Pretrain/Step Time": 9.512770710512996} +{"Pretrain/Learning Rate": 5.529875835829437e-06, "Pretrain/Loss": 1.9973795413970947, "Pretrain/Loss (Raw)": 1.9823414087295532, "Pretrain/Step": 15080, "Pretrain/Step Time": 9.50829622335732} +{"Pretrain/Learning Rate": 5.5272132676032875e-06, "Pretrain/Loss": 1.9977103471755981, "Pretrain/Loss (Raw)": 1.979772686958313, "Pretrain/Step": 15081, "Pretrain/Step Time": 9.507253047078848} +{"Pretrain/Learning Rate": 5.524551260861224e-06, "Pretrain/Loss": 1.9985207319259644, "Pretrain/Loss (Raw)": 2.0203893184661865, "Pretrain/Step": 15082, "Pretrain/Step Time": 9.51271884329617} +{"Pretrain/Learning Rate": 5.521889815679987e-06, "Pretrain/Loss": 1.9956107139587402, "Pretrain/Loss (Raw)": 2.1403462886810303, "Pretrain/Step": 15083, "Pretrain/Step Time": 9.511186074465513} +{"Pretrain/Learning Rate": 5.519228932136333e-06, "Pretrain/Loss": 1.9994926452636719, "Pretrain/Loss (Raw)": 2.1734893321990967, "Pretrain/Step": 15084, "Pretrain/Step Time": 9.510447550565004} +{"Pretrain/Learning Rate": 5.51656861030698e-06, "Pretrain/Loss": 2.001516580581665, "Pretrain/Loss (Raw)": 2.0429697036743164, "Pretrain/Step": 15085, "Pretrain/Step Time": 9.509339544922113} +{"Pretrain/Learning Rate": 5.513908850268628e-06, "Pretrain/Loss": 2.0004124641418457, "Pretrain/Loss (Raw)": 1.904030680656433, "Pretrain/Step": 15086, "Pretrain/Step Time": 9.511678194627166} +{"Pretrain/Learning Rate": 5.511249652097988e-06, "Pretrain/Loss": 2.0019853115081787, "Pretrain/Loss (Raw)": 2.043381690979004, "Pretrain/Step": 15087, "Pretrain/Step Time": 9.511427791789174} +{"Pretrain/Learning Rate": 5.5085910158717165e-06, "Pretrain/Loss": 1.9961873292922974, "Pretrain/Loss (Raw)": 1.7407017946243286, "Pretrain/Step": 15088, "Pretrain/Step Time": 9.511294478550553} +{"Pretrain/Learning Rate": 5.505932941666489e-06, "Pretrain/Loss": 1.9944502115249634, "Pretrain/Loss (Raw)": 1.8571141958236694, "Pretrain/Step": 15089, "Pretrain/Step Time": 9.507454086095095} +{"Pretrain/Learning Rate": 5.5032754295589435e-06, "Pretrain/Loss": 1.994370698928833, "Pretrain/Loss (Raw)": 1.8867688179016113, "Pretrain/Step": 15090, "Pretrain/Step Time": 9.513578789308667} +{"Pretrain/Learning Rate": 5.500618479625699e-06, "Pretrain/Loss": 1.9966156482696533, "Pretrain/Loss (Raw)": 2.1106066703796387, "Pretrain/Step": 15091, "Pretrain/Step Time": 9.510595386847854} +{"Pretrain/Learning Rate": 5.497962091943382e-06, "Pretrain/Loss": 1.9990508556365967, "Pretrain/Loss (Raw)": 2.2794456481933594, "Pretrain/Step": 15092, "Pretrain/Step Time": 9.512433534488082} +{"Pretrain/Learning Rate": 5.495306266588574e-06, "Pretrain/Loss": 1.9984173774719238, "Pretrain/Loss (Raw)": 1.906768560409546, "Pretrain/Step": 15093, "Pretrain/Step Time": 9.509372998028994} +{"Pretrain/Learning Rate": 5.4926510036378634e-06, "Pretrain/Loss": 1.9976726770401, "Pretrain/Loss (Raw)": 2.037644147872925, "Pretrain/Step": 15094, "Pretrain/Step Time": 9.5062544811517} +{"Pretrain/Learning Rate": 5.489996303167813e-06, "Pretrain/Loss": 1.9981142282485962, "Pretrain/Loss (Raw)": 2.049144744873047, "Pretrain/Step": 15095, "Pretrain/Step Time": 9.509407481178641} +{"Pretrain/Learning Rate": 5.487342165254958e-06, "Pretrain/Loss": 1.995699405670166, "Pretrain/Loss (Raw)": 1.7326536178588867, "Pretrain/Step": 15096, "Pretrain/Step Time": 9.515101797878742} +{"Pretrain/Learning Rate": 5.484688589975842e-06, "Pretrain/Loss": 1.9971208572387695, "Pretrain/Loss (Raw)": 1.7121796607971191, "Pretrain/Step": 15097, "Pretrain/Step Time": 9.50760405138135} +{"Pretrain/Learning Rate": 5.482035577406966e-06, "Pretrain/Loss": 1.9948723316192627, "Pretrain/Loss (Raw)": 1.6723835468292236, "Pretrain/Step": 15098, "Pretrain/Step Time": 9.50898844935} +{"Pretrain/Learning Rate": 5.479383127624843e-06, "Pretrain/Loss": 1.9935417175292969, "Pretrain/Loss (Raw)": 1.841539740562439, "Pretrain/Step": 15099, "Pretrain/Step Time": 9.508738994598389} +{"Pretrain/Learning Rate": 5.4767312407059455e-06, "Pretrain/Loss": 1.9921529293060303, "Pretrain/Loss (Raw)": 2.039153814315796, "Pretrain/Step": 15100, "Pretrain/Step Time": 9.511062854900956} +{"Pretrain/Learning Rate": 5.474079916726732e-06, "Pretrain/Loss": 1.9911253452301025, "Pretrain/Loss (Raw)": 1.925918698310852, "Pretrain/Step": 15101, "Pretrain/Step Time": 9.510095164179802} +{"Pretrain/Learning Rate": 5.471429155763669e-06, "Pretrain/Loss": 1.9899659156799316, "Pretrain/Loss (Raw)": 1.7738398313522339, "Pretrain/Step": 15102, "Pretrain/Step Time": 9.510978683829308} +{"Pretrain/Learning Rate": 5.46877895789317e-06, "Pretrain/Loss": 1.9893685579299927, "Pretrain/Loss (Raw)": 1.940775752067566, "Pretrain/Step": 15103, "Pretrain/Step Time": 9.514080710709095} +{"Pretrain/Learning Rate": 5.466129323191668e-06, "Pretrain/Loss": 1.9885063171386719, "Pretrain/Loss (Raw)": 1.8838236331939697, "Pretrain/Step": 15104, "Pretrain/Step Time": 9.516486592590809} +{"Pretrain/Learning Rate": 5.463480251735559e-06, "Pretrain/Loss": 1.9874603748321533, "Pretrain/Loss (Raw)": 1.7398005723953247, "Pretrain/Step": 15105, "Pretrain/Step Time": 9.514928162097931} +{"Pretrain/Learning Rate": 5.460831743601216e-06, "Pretrain/Loss": 1.988528847694397, "Pretrain/Loss (Raw)": 2.223133087158203, "Pretrain/Step": 15106, "Pretrain/Step Time": 9.51469411328435} +{"Pretrain/Learning Rate": 5.458183798865022e-06, "Pretrain/Loss": 1.987706184387207, "Pretrain/Loss (Raw)": 2.0733001232147217, "Pretrain/Step": 15107, "Pretrain/Step Time": 9.512692157179117} +{"Pretrain/Learning Rate": 5.455536417603316e-06, "Pretrain/Loss": 1.986212968826294, "Pretrain/Loss (Raw)": 2.018900156021118, "Pretrain/Step": 15108, "Pretrain/Step Time": 9.514623863622546} +{"Pretrain/Learning Rate": 5.452889599892447e-06, "Pretrain/Loss": 1.9850506782531738, "Pretrain/Loss (Raw)": 2.016583204269409, "Pretrain/Step": 15109, "Pretrain/Step Time": 9.512151818722486} +{"Pretrain/Learning Rate": 5.450243345808726e-06, "Pretrain/Loss": 1.9861688613891602, "Pretrain/Loss (Raw)": 2.1648361682891846, "Pretrain/Step": 15110, "Pretrain/Step Time": 9.508606227114797} +{"Pretrain/Learning Rate": 5.447597655428446e-06, "Pretrain/Loss": 1.9849940538406372, "Pretrain/Loss (Raw)": 1.8697497844696045, "Pretrain/Step": 15111, "Pretrain/Step Time": 9.511035053059459} +{"Pretrain/Learning Rate": 5.4449525288279155e-06, "Pretrain/Loss": 1.9867804050445557, "Pretrain/Loss (Raw)": 2.064218759536743, "Pretrain/Step": 15112, "Pretrain/Step Time": 9.511333672329783} +{"Pretrain/Learning Rate": 5.442307966083385e-06, "Pretrain/Loss": 1.9863133430480957, "Pretrain/Loss (Raw)": 1.9431796073913574, "Pretrain/Step": 15113, "Pretrain/Step Time": 9.511149013414979} +{"Pretrain/Learning Rate": 5.439663967271125e-06, "Pretrain/Loss": 1.9868748188018799, "Pretrain/Loss (Raw)": 2.052825927734375, "Pretrain/Step": 15114, "Pretrain/Step Time": 9.511815203353763} +{"Pretrain/Learning Rate": 5.437020532467357e-06, "Pretrain/Loss": 1.987377405166626, "Pretrain/Loss (Raw)": 2.120073080062866, "Pretrain/Step": 15115, "Pretrain/Step Time": 9.511242559179664} +{"Pretrain/Learning Rate": 5.434377661748319e-06, "Pretrain/Loss": 1.9903829097747803, "Pretrain/Loss (Raw)": 2.353907585144043, "Pretrain/Step": 15116, "Pretrain/Step Time": 9.515291633084416} +{"Pretrain/Learning Rate": 5.431735355190207e-06, "Pretrain/Loss": 1.9923794269561768, "Pretrain/Loss (Raw)": 1.933515191078186, "Pretrain/Step": 15117, "Pretrain/Step Time": 9.513353968039155} +{"Pretrain/Learning Rate": 5.429093612869204e-06, "Pretrain/Loss": 1.993872880935669, "Pretrain/Loss (Raw)": 2.1041195392608643, "Pretrain/Step": 15118, "Pretrain/Step Time": 9.517733110114932} +{"Pretrain/Learning Rate": 5.426452434861498e-06, "Pretrain/Loss": 1.9927196502685547, "Pretrain/Loss (Raw)": 1.871214747428894, "Pretrain/Step": 15119, "Pretrain/Step Time": 9.517314333468676} +{"Pretrain/Learning Rate": 5.423811821243232e-06, "Pretrain/Loss": 1.99196195602417, "Pretrain/Loss (Raw)": 2.0261178016662598, "Pretrain/Step": 15120, "Pretrain/Step Time": 9.517181672155857} +{"Pretrain/Learning Rate": 5.421171772090558e-06, "Pretrain/Loss": 1.9931540489196777, "Pretrain/Loss (Raw)": 2.0338501930236816, "Pretrain/Step": 15121, "Pretrain/Step Time": 9.512577613815665} +{"Pretrain/Learning Rate": 5.4185322874795915e-06, "Pretrain/Loss": 1.993086338043213, "Pretrain/Loss (Raw)": 1.7933419942855835, "Pretrain/Step": 15122, "Pretrain/Step Time": 9.509980900213122} +{"Pretrain/Learning Rate": 5.415893367486438e-06, "Pretrain/Loss": 1.9945248365402222, "Pretrain/Loss (Raw)": 2.1081106662750244, "Pretrain/Step": 15123, "Pretrain/Step Time": 9.509019266813993} +{"Pretrain/Learning Rate": 5.413255012187199e-06, "Pretrain/Loss": 1.996201992034912, "Pretrain/Loss (Raw)": 2.011314868927002, "Pretrain/Step": 15124, "Pretrain/Step Time": 9.504621772095561} +{"Pretrain/Learning Rate": 5.410617221657938e-06, "Pretrain/Loss": 1.9965949058532715, "Pretrain/Loss (Raw)": 2.1121666431427, "Pretrain/Step": 15125, "Pretrain/Step Time": 9.510111432522535} +{"Pretrain/Learning Rate": 5.407979995974727e-06, "Pretrain/Loss": 1.994438648223877, "Pretrain/Loss (Raw)": 2.1092464923858643, "Pretrain/Step": 15126, "Pretrain/Step Time": 9.505937183275819} +{"Pretrain/Learning Rate": 5.4053433352136004e-06, "Pretrain/Loss": 1.9949321746826172, "Pretrain/Loss (Raw)": 2.1046295166015625, "Pretrain/Step": 15127, "Pretrain/Step Time": 9.500418938696384} +{"Pretrain/Learning Rate": 5.4027072394505805e-06, "Pretrain/Loss": 1.9939255714416504, "Pretrain/Loss (Raw)": 1.8731269836425781, "Pretrain/Step": 15128, "Pretrain/Step Time": 9.504544772207737} +{"Pretrain/Learning Rate": 5.400071708761686e-06, "Pretrain/Loss": 1.9927979707717896, "Pretrain/Loss (Raw)": 1.920543909072876, "Pretrain/Step": 15129, "Pretrain/Step Time": 8.462492741644382} +{"Pretrain/Learning Rate": 5.3974367432229e-06, "Pretrain/Loss": 1.991105318069458, "Pretrain/Loss (Raw)": 2.0182604789733887, "Pretrain/Step": 15130, "Pretrain/Step Time": 8.457991443574429} +{"Pretrain/Learning Rate": 5.3948023429102155e-06, "Pretrain/Loss": 1.9945485591888428, "Pretrain/Loss (Raw)": 2.3778326511383057, "Pretrain/Step": 15131, "Pretrain/Step Time": 8.458991708233953} +{"Pretrain/Learning Rate": 5.392168507899584e-06, "Pretrain/Loss": 1.9947830438613892, "Pretrain/Loss (Raw)": 1.9144705533981323, "Pretrain/Step": 15132, "Pretrain/Step Time": 8.46267006546259} +{"Pretrain/Learning Rate": 5.389535238266943e-06, "Pretrain/Loss": 1.9959534406661987, "Pretrain/Loss (Raw)": 2.0753421783447266, "Pretrain/Step": 15133, "Pretrain/Step Time": 8.464508481323719} +{"Pretrain/Learning Rate": 5.386902534088236e-06, "Pretrain/Loss": 1.9942899942398071, "Pretrain/Loss (Raw)": 1.8838589191436768, "Pretrain/Step": 15134, "Pretrain/Step Time": 8.462478019297123} +{"Pretrain/Learning Rate": 5.384270395439364e-06, "Pretrain/Loss": 1.9951393604278564, "Pretrain/Loss (Raw)": 1.954935073852539, "Pretrain/Step": 15135, "Pretrain/Step Time": 8.464786307886243} +{"Pretrain/Learning Rate": 5.381638822396232e-06, "Pretrain/Loss": 1.993973731994629, "Pretrain/Loss (Raw)": 1.9364503622055054, "Pretrain/Step": 15136, "Pretrain/Step Time": 8.468623859807849} +{"Pretrain/Learning Rate": 5.3790078150347145e-06, "Pretrain/Loss": 1.9954922199249268, "Pretrain/Loss (Raw)": 2.1125681400299072, "Pretrain/Step": 15137, "Pretrain/Step Time": 8.467210423201323} +{"Pretrain/Learning Rate": 5.376377373430669e-06, "Pretrain/Loss": 1.9955484867095947, "Pretrain/Loss (Raw)": 2.0480127334594727, "Pretrain/Step": 15138, "Pretrain/Step Time": 8.46396317332983} +{"Pretrain/Learning Rate": 5.373747497659954e-06, "Pretrain/Loss": 1.993025779724121, "Pretrain/Loss (Raw)": 1.904245138168335, "Pretrain/Step": 15139, "Pretrain/Step Time": 8.471206890419126} +{"Pretrain/Learning Rate": 5.3711181877983854e-06, "Pretrain/Loss": 1.9930362701416016, "Pretrain/Loss (Raw)": 2.0967588424682617, "Pretrain/Step": 15140, "Pretrain/Step Time": 8.469519237056375} +{"Pretrain/Learning Rate": 5.368489443921795e-06, "Pretrain/Loss": 1.993537425994873, "Pretrain/Loss (Raw)": 1.9664274454116821, "Pretrain/Step": 15141, "Pretrain/Step Time": 8.468806790187955} +{"Pretrain/Learning Rate": 5.365861266105973e-06, "Pretrain/Loss": 1.9950692653656006, "Pretrain/Loss (Raw)": 2.2802889347076416, "Pretrain/Step": 15142, "Pretrain/Step Time": 8.469596818089485} +{"Pretrain/Learning Rate": 5.363233654426691e-06, "Pretrain/Loss": 1.9919946193695068, "Pretrain/Loss (Raw)": 1.654413104057312, "Pretrain/Step": 15143, "Pretrain/Step Time": 8.470766495913267} +{"Pretrain/Learning Rate": 5.360606608959734e-06, "Pretrain/Loss": 1.9903424978256226, "Pretrain/Loss (Raw)": 1.8455644845962524, "Pretrain/Step": 15144, "Pretrain/Step Time": 8.472632704302669} +{"Pretrain/Learning Rate": 5.357980129780832e-06, "Pretrain/Loss": 1.9890475273132324, "Pretrain/Loss (Raw)": 1.9983102083206177, "Pretrain/Step": 15145, "Pretrain/Step Time": 8.472923915833235} +{"Pretrain/Learning Rate": 5.355354216965733e-06, "Pretrain/Loss": 1.9911185503005981, "Pretrain/Loss (Raw)": 2.0587539672851562, "Pretrain/Step": 15146, "Pretrain/Step Time": 8.471677569672465} +{"Pretrain/Learning Rate": 5.352728870590146e-06, "Pretrain/Loss": 1.9902467727661133, "Pretrain/Loss (Raw)": 2.048830986022949, "Pretrain/Step": 15147, "Pretrain/Step Time": 8.46559520997107} +{"Pretrain/Learning Rate": 5.3501040907297655e-06, "Pretrain/Loss": 1.9913208484649658, "Pretrain/Loss (Raw)": 2.171937942504883, "Pretrain/Step": 15148, "Pretrain/Step Time": 8.47116837464273} +{"Pretrain/Learning Rate": 5.347479877460288e-06, "Pretrain/Loss": 1.990110993385315, "Pretrain/Loss (Raw)": 1.9303233623504639, "Pretrain/Step": 15149, "Pretrain/Step Time": 8.479715077206492} +{"Pretrain/Learning Rate": 5.344856230857368e-06, "Pretrain/Loss": 1.9913766384124756, "Pretrain/Loss (Raw)": 2.0332000255584717, "Pretrain/Step": 15150, "Pretrain/Step Time": 8.47985690459609} +{"Pretrain/Learning Rate": 5.342233150996667e-06, "Pretrain/Loss": 1.9899803400039673, "Pretrain/Loss (Raw)": 1.792446255683899, "Pretrain/Step": 15151, "Pretrain/Step Time": 8.477274803444743} +{"Pretrain/Learning Rate": 5.339610637953818e-06, "Pretrain/Loss": 1.9905357360839844, "Pretrain/Loss (Raw)": 2.0592198371887207, "Pretrain/Step": 15152, "Pretrain/Step Time": 8.476855808869004} +{"Pretrain/Learning Rate": 5.3369886918044285e-06, "Pretrain/Loss": 1.9927971363067627, "Pretrain/Loss (Raw)": 1.9837422370910645, "Pretrain/Step": 15153, "Pretrain/Step Time": 8.474178928881884} +{"Pretrain/Learning Rate": 5.334367312624117e-06, "Pretrain/Loss": 1.9925217628479004, "Pretrain/Loss (Raw)": 1.8504735231399536, "Pretrain/Step": 15154, "Pretrain/Step Time": 8.472275650128722} +{"Pretrain/Learning Rate": 5.331746500488452e-06, "Pretrain/Loss": 1.9923748970031738, "Pretrain/Loss (Raw)": 1.9433170557022095, "Pretrain/Step": 15155, "Pretrain/Step Time": 8.467744337394834} +{"Pretrain/Learning Rate": 5.329126255473018e-06, "Pretrain/Loss": 1.9890623092651367, "Pretrain/Loss (Raw)": 1.8917255401611328, "Pretrain/Step": 15156, "Pretrain/Step Time": 8.469136700034142} +{"Pretrain/Learning Rate": 5.326506577653362e-06, "Pretrain/Loss": 1.992743968963623, "Pretrain/Loss (Raw)": 2.16982102394104, "Pretrain/Step": 15157, "Pretrain/Step Time": 8.472092848271132} +{"Pretrain/Learning Rate": 5.323887467105013e-06, "Pretrain/Loss": 1.9922268390655518, "Pretrain/Loss (Raw)": 1.941988229751587, "Pretrain/Step": 15158, "Pretrain/Step Time": 8.471884466707706} +{"Pretrain/Learning Rate": 5.321268923903505e-06, "Pretrain/Loss": 1.994588851928711, "Pretrain/Loss (Raw)": 2.1450796127319336, "Pretrain/Step": 15159, "Pretrain/Step Time": 8.470674082636833} +{"Pretrain/Learning Rate": 5.318650948124329e-06, "Pretrain/Loss": 1.9936541318893433, "Pretrain/Loss (Raw)": 1.9165712594985962, "Pretrain/Step": 15160, "Pretrain/Step Time": 8.473416056483984} +{"Pretrain/Learning Rate": 5.316033539842985e-06, "Pretrain/Loss": 1.995271921157837, "Pretrain/Loss (Raw)": 2.2721450328826904, "Pretrain/Step": 15161, "Pretrain/Step Time": 8.47219349257648} +{"Pretrain/Learning Rate": 5.313416699134938e-06, "Pretrain/Loss": 1.9941887855529785, "Pretrain/Loss (Raw)": 1.8567296266555786, "Pretrain/Step": 15162, "Pretrain/Step Time": 8.476444162428379} +{"Pretrain/Learning Rate": 5.3108004260756406e-06, "Pretrain/Loss": 1.9937348365783691, "Pretrain/Loss (Raw)": 2.057102918624878, "Pretrain/Step": 15163, "Pretrain/Step Time": 8.479344325140119} +{"Pretrain/Learning Rate": 5.308184720740534e-06, "Pretrain/Loss": 1.9939460754394531, "Pretrain/Loss (Raw)": 1.9982243776321411, "Pretrain/Step": 15164, "Pretrain/Step Time": 8.479344530031085} +{"Pretrain/Learning Rate": 5.30556958320503e-06, "Pretrain/Loss": 1.9924049377441406, "Pretrain/Loss (Raw)": 2.0273919105529785, "Pretrain/Step": 15165, "Pretrain/Step Time": 8.479753658175468} +{"Pretrain/Learning Rate": 5.3029550135445525e-06, "Pretrain/Loss": 1.9919257164001465, "Pretrain/Loss (Raw)": 1.8892732858657837, "Pretrain/Step": 15166, "Pretrain/Step Time": 8.479490671306849} +{"Pretrain/Learning Rate": 5.300341011834475e-06, "Pretrain/Loss": 1.9887442588806152, "Pretrain/Loss (Raw)": 1.7180474996566772, "Pretrain/Step": 15167, "Pretrain/Step Time": 8.484346037730575} +{"Pretrain/Learning Rate": 5.297727578150186e-06, "Pretrain/Loss": 1.9896864891052246, "Pretrain/Loss (Raw)": 1.9545645713806152, "Pretrain/Step": 15168, "Pretrain/Step Time": 8.485216910019517} +{"Pretrain/Learning Rate": 5.295114712567029e-06, "Pretrain/Loss": 1.9894118309020996, "Pretrain/Loss (Raw)": 2.2347097396850586, "Pretrain/Step": 15169, "Pretrain/Step Time": 8.486111043021083} +{"Pretrain/Learning Rate": 5.292502415160344e-06, "Pretrain/Loss": 1.9888513088226318, "Pretrain/Loss (Raw)": 1.9917927980422974, "Pretrain/Step": 15170, "Pretrain/Step Time": 8.485606113448739} +{"Pretrain/Learning Rate": 5.289890686005466e-06, "Pretrain/Loss": 1.9889023303985596, "Pretrain/Loss (Raw)": 1.8656096458435059, "Pretrain/Step": 15171, "Pretrain/Step Time": 8.485640736296773} +{"Pretrain/Learning Rate": 5.287279525177688e-06, "Pretrain/Loss": 1.9925544261932373, "Pretrain/Loss (Raw)": 2.2305502891540527, "Pretrain/Step": 15172, "Pretrain/Step Time": 8.485141810029745} +{"Pretrain/Learning Rate": 5.284668932752313e-06, "Pretrain/Loss": 1.9933559894561768, "Pretrain/Loss (Raw)": 2.0194284915924072, "Pretrain/Step": 15173, "Pretrain/Step Time": 8.482139317318797} +{"Pretrain/Learning Rate": 5.282058908804613e-06, "Pretrain/Loss": 1.993252158164978, "Pretrain/Loss (Raw)": 1.958068609237671, "Pretrain/Step": 15174, "Pretrain/Step Time": 8.48090261220932} +{"Pretrain/Learning Rate": 5.279449453409837e-06, "Pretrain/Loss": 1.9912586212158203, "Pretrain/Loss (Raw)": 2.0113775730133057, "Pretrain/Step": 15175, "Pretrain/Step Time": 8.48216662183404} +{"Pretrain/Learning Rate": 5.27684056664324e-06, "Pretrain/Loss": 1.9867972135543823, "Pretrain/Loss (Raw)": 1.81327223777771, "Pretrain/Step": 15176, "Pretrain/Step Time": 8.476747481152415} +{"Pretrain/Learning Rate": 5.274232248580036e-06, "Pretrain/Loss": 1.9844120740890503, "Pretrain/Loss (Raw)": 1.6604593992233276, "Pretrain/Step": 15177, "Pretrain/Step Time": 8.474470237269998} +{"Pretrain/Learning Rate": 5.2716244992954465e-06, "Pretrain/Loss": 1.984055995941162, "Pretrain/Loss (Raw)": 1.9798167943954468, "Pretrain/Step": 15178, "Pretrain/Step Time": 8.48188179731369} +{"Pretrain/Learning Rate": 5.26901731886465e-06, "Pretrain/Loss": 1.9869567155838013, "Pretrain/Loss (Raw)": 2.3597640991210938, "Pretrain/Step": 15179, "Pretrain/Step Time": 8.480439072474837} +{"Pretrain/Learning Rate": 5.266410707362834e-06, "Pretrain/Loss": 1.9853806495666504, "Pretrain/Loss (Raw)": 1.912691354751587, "Pretrain/Step": 15180, "Pretrain/Step Time": 8.475200444459915} +{"Pretrain/Learning Rate": 5.263804664865155e-06, "Pretrain/Loss": 1.9873967170715332, "Pretrain/Loss (Raw)": 2.150568962097168, "Pretrain/Step": 15181, "Pretrain/Step Time": 8.479470569640398} +{"Pretrain/Learning Rate": 5.2611991914467504e-06, "Pretrain/Loss": 1.9877369403839111, "Pretrain/Loss (Raw)": 1.9748988151550293, "Pretrain/Step": 15182, "Pretrain/Step Time": 8.47910364344716} +{"Pretrain/Learning Rate": 5.2585942871827584e-06, "Pretrain/Loss": 1.9881160259246826, "Pretrain/Loss (Raw)": 2.0474624633789062, "Pretrain/Step": 15183, "Pretrain/Step Time": 8.481010401621461} +{"Pretrain/Learning Rate": 5.255989952148274e-06, "Pretrain/Loss": 1.9870420694351196, "Pretrain/Loss (Raw)": 1.9475990533828735, "Pretrain/Step": 15184, "Pretrain/Step Time": 8.480726025998592} +{"Pretrain/Learning Rate": 5.253386186418411e-06, "Pretrain/Loss": 1.9849684238433838, "Pretrain/Loss (Raw)": 1.8190007209777832, "Pretrain/Step": 15185, "Pretrain/Step Time": 8.48422278277576} +{"Pretrain/Learning Rate": 5.2507829900682345e-06, "Pretrain/Loss": 1.9852275848388672, "Pretrain/Loss (Raw)": 1.8784712553024292, "Pretrain/Step": 15186, "Pretrain/Step Time": 8.481956478208303} +{"Pretrain/Learning Rate": 5.248180363172802e-06, "Pretrain/Loss": 1.9867533445358276, "Pretrain/Loss (Raw)": 2.0926601886749268, "Pretrain/Step": 15187, "Pretrain/Step Time": 8.486866341903806} +{"Pretrain/Learning Rate": 5.245578305807172e-06, "Pretrain/Loss": 1.9957857131958008, "Pretrain/Loss (Raw)": 2.0335075855255127, "Pretrain/Step": 15188, "Pretrain/Step Time": 8.48822626657784} +{"Pretrain/Learning Rate": 5.242976818046358e-06, "Pretrain/Loss": 1.9951977729797363, "Pretrain/Loss (Raw)": 1.8911677598953247, "Pretrain/Step": 15189, "Pretrain/Step Time": 8.489681415259838} +{"Pretrain/Learning Rate": 5.240375899965386e-06, "Pretrain/Loss": 1.9951965808868408, "Pretrain/Loss (Raw)": 1.9840290546417236, "Pretrain/Step": 15190, "Pretrain/Step Time": 8.486981522291899} +{"Pretrain/Learning Rate": 5.237775551639248e-06, "Pretrain/Loss": 1.9926033020019531, "Pretrain/Loss (Raw)": 1.8576865196228027, "Pretrain/Step": 15191, "Pretrain/Step Time": 8.486440848559141} +{"Pretrain/Learning Rate": 5.235175773142911e-06, "Pretrain/Loss": 1.9916043281555176, "Pretrain/Loss (Raw)": 1.9719468355178833, "Pretrain/Step": 15192, "Pretrain/Step Time": 8.486393036320806} +{"Pretrain/Learning Rate": 5.2325765645513556e-06, "Pretrain/Loss": 1.990950345993042, "Pretrain/Loss (Raw)": 1.9736576080322266, "Pretrain/Step": 15193, "Pretrain/Step Time": 8.484831541776657} +{"Pretrain/Learning Rate": 5.229977925939511e-06, "Pretrain/Loss": 1.9917562007904053, "Pretrain/Loss (Raw)": 1.9879976511001587, "Pretrain/Step": 15194, "Pretrain/Step Time": 8.487687783315778} +{"Pretrain/Learning Rate": 5.2273798573823255e-06, "Pretrain/Loss": 1.992148518562317, "Pretrain/Loss (Raw)": 2.067272663116455, "Pretrain/Step": 15195, "Pretrain/Step Time": 8.483675172552466} +{"Pretrain/Learning Rate": 5.224782358954702e-06, "Pretrain/Loss": 1.9911494255065918, "Pretrain/Loss (Raw)": 2.005887508392334, "Pretrain/Step": 15196, "Pretrain/Step Time": 8.485892610624433} +{"Pretrain/Learning Rate": 5.22218543073153e-06, "Pretrain/Loss": 1.989980936050415, "Pretrain/Loss (Raw)": 1.9856433868408203, "Pretrain/Step": 15197, "Pretrain/Step Time": 8.490877818316221} +{"Pretrain/Learning Rate": 5.219589072787709e-06, "Pretrain/Loss": 1.9935367107391357, "Pretrain/Loss (Raw)": 2.5297300815582275, "Pretrain/Step": 15198, "Pretrain/Step Time": 8.490940352901816} +{"Pretrain/Learning Rate": 5.216993285198082e-06, "Pretrain/Loss": 1.9927592277526855, "Pretrain/Loss (Raw)": 1.8768422603607178, "Pretrain/Step": 15199, "Pretrain/Step Time": 8.490589417517185} +{"Pretrain/Learning Rate": 5.214398068037518e-06, "Pretrain/Loss": 1.9910491704940796, "Pretrain/Loss (Raw)": 1.872961163520813, "Pretrain/Step": 15200, "Pretrain/Step Time": 8.494092341512442} +{"Pretrain/Learning Rate": 5.211803421380834e-06, "Pretrain/Loss": 1.989750862121582, "Pretrain/Loss (Raw)": 1.962682843208313, "Pretrain/Step": 15201, "Pretrain/Step Time": 8.497435759752989} +{"Pretrain/Learning Rate": 5.209209345302846e-06, "Pretrain/Loss": 1.9910204410552979, "Pretrain/Loss (Raw)": 2.1182053089141846, "Pretrain/Step": 15202, "Pretrain/Step Time": 8.492876384407282} +{"Pretrain/Learning Rate": 5.206615839878359e-06, "Pretrain/Loss": 1.9932769536972046, "Pretrain/Loss (Raw)": 2.109522819519043, "Pretrain/Step": 15203, "Pretrain/Step Time": 8.493938267230988} +{"Pretrain/Learning Rate": 5.2040229051821435e-06, "Pretrain/Loss": 1.9936692714691162, "Pretrain/Loss (Raw)": 2.045109272003174, "Pretrain/Step": 15204, "Pretrain/Step Time": 8.49424896389246} +{"Pretrain/Learning Rate": 5.201430541288982e-06, "Pretrain/Loss": 1.9939906597137451, "Pretrain/Loss (Raw)": 2.0424158573150635, "Pretrain/Step": 15205, "Pretrain/Step Time": 8.494928028434515} +{"Pretrain/Learning Rate": 5.19883874827361e-06, "Pretrain/Loss": 1.9934978485107422, "Pretrain/Loss (Raw)": 2.000102996826172, "Pretrain/Step": 15206, "Pretrain/Step Time": 8.496123990043998} +{"Pretrain/Learning Rate": 5.19624752621076e-06, "Pretrain/Loss": 1.9939250946044922, "Pretrain/Loss (Raw)": 1.8602060079574585, "Pretrain/Step": 15207, "Pretrain/Step Time": 8.492608185857534} +{"Pretrain/Learning Rate": 5.1936568751751565e-06, "Pretrain/Loss": 1.9947240352630615, "Pretrain/Loss (Raw)": 2.084599018096924, "Pretrain/Step": 15208, "Pretrain/Step Time": 8.4948470890522} +{"Pretrain/Learning Rate": 5.191066795241489e-06, "Pretrain/Loss": 1.9944937229156494, "Pretrain/Loss (Raw)": 1.950287938117981, "Pretrain/Step": 15209, "Pretrain/Step Time": 8.49893600307405} +{"Pretrain/Learning Rate": 5.188477286484452e-06, "Pretrain/Loss": 1.995450496673584, "Pretrain/Loss (Raw)": 2.1428656578063965, "Pretrain/Step": 15210, "Pretrain/Step Time": 8.494273560121655} +{"Pretrain/Learning Rate": 5.1858883489787096e-06, "Pretrain/Loss": 1.9934332370758057, "Pretrain/Loss (Raw)": 1.8821393251419067, "Pretrain/Step": 15211, "Pretrain/Step Time": 8.498304096981883} +{"Pretrain/Learning Rate": 5.183299982798898e-06, "Pretrain/Loss": 1.9898401498794556, "Pretrain/Loss (Raw)": 1.713564157485962, "Pretrain/Step": 15212, "Pretrain/Step Time": 8.496866220608354} +{"Pretrain/Learning Rate": 5.180712188019671e-06, "Pretrain/Loss": 1.9897217750549316, "Pretrain/Loss (Raw)": 2.0278332233428955, "Pretrain/Step": 15213, "Pretrain/Step Time": 8.505234455689788} +{"Pretrain/Learning Rate": 5.178124964715628e-06, "Pretrain/Loss": 1.9902836084365845, "Pretrain/Loss (Raw)": 1.975948452949524, "Pretrain/Step": 15214, "Pretrain/Step Time": 8.500649688765407} +{"Pretrain/Learning Rate": 5.175538312961384e-06, "Pretrain/Loss": 1.9899377822875977, "Pretrain/Loss (Raw)": 1.9991084337234497, "Pretrain/Step": 15215, "Pretrain/Step Time": 8.504763333126903} +{"Pretrain/Learning Rate": 5.1729522328315185e-06, "Pretrain/Loss": 1.9911229610443115, "Pretrain/Loss (Raw)": 1.8924124240875244, "Pretrain/Step": 15216, "Pretrain/Step Time": 8.500660073012114} +{"Pretrain/Learning Rate": 5.170366724400591e-06, "Pretrain/Loss": 1.9911155700683594, "Pretrain/Loss (Raw)": 1.8561612367630005, "Pretrain/Step": 15217, "Pretrain/Step Time": 8.503060813993216} +{"Pretrain/Learning Rate": 5.167781787743167e-06, "Pretrain/Loss": 1.9937678575515747, "Pretrain/Loss (Raw)": 2.2262582778930664, "Pretrain/Step": 15218, "Pretrain/Step Time": 8.498140631243587} +{"Pretrain/Learning Rate": 5.165197422933768e-06, "Pretrain/Loss": 1.9910004138946533, "Pretrain/Loss (Raw)": 1.7563824653625488, "Pretrain/Step": 15219, "Pretrain/Step Time": 8.498857477679849} +{"Pretrain/Learning Rate": 5.162613630046925e-06, "Pretrain/Loss": 1.9861648082733154, "Pretrain/Loss (Raw)": 1.6604728698730469, "Pretrain/Step": 15220, "Pretrain/Step Time": 8.496162958443165} +{"Pretrain/Learning Rate": 5.1600304091571325e-06, "Pretrain/Loss": 1.9879223108291626, "Pretrain/Loss (Raw)": 2.131732940673828, "Pretrain/Step": 15221, "Pretrain/Step Time": 8.501738715916872} +{"Pretrain/Learning Rate": 5.157447760338874e-06, "Pretrain/Loss": 1.9846973419189453, "Pretrain/Loss (Raw)": 1.6248592138290405, "Pretrain/Step": 15222, "Pretrain/Step Time": 8.503335306420922} +{"Pretrain/Learning Rate": 5.154865683666624e-06, "Pretrain/Loss": 1.985048532485962, "Pretrain/Loss (Raw)": 2.0940825939178467, "Pretrain/Step": 15223, "Pretrain/Step Time": 8.500216597691178} +{"Pretrain/Learning Rate": 5.1522841792148254e-06, "Pretrain/Loss": 1.9878995418548584, "Pretrain/Loss (Raw)": 2.0975852012634277, "Pretrain/Step": 15224, "Pretrain/Step Time": 8.49554568901658} +{"Pretrain/Learning Rate": 5.14970324705793e-06, "Pretrain/Loss": 1.9916596412658691, "Pretrain/Loss (Raw)": 2.1934778690338135, "Pretrain/Step": 15225, "Pretrain/Step Time": 8.495643496513367} +{"Pretrain/Learning Rate": 5.1471228872703474e-06, "Pretrain/Loss": 1.9978969097137451, "Pretrain/Loss (Raw)": 2.4707589149475098, "Pretrain/Step": 15226, "Pretrain/Step Time": 8.494597744196653} +{"Pretrain/Learning Rate": 5.144543099926475e-06, "Pretrain/Loss": 1.998561143875122, "Pretrain/Loss (Raw)": 1.9265589714050293, "Pretrain/Step": 15227, "Pretrain/Step Time": 8.49337239190936} +{"Pretrain/Learning Rate": 5.141963885100709e-06, "Pretrain/Loss": 1.9988212585449219, "Pretrain/Loss (Raw)": 2.072439670562744, "Pretrain/Step": 15228, "Pretrain/Step Time": 8.494322821497917} +{"Pretrain/Learning Rate": 5.139385242867409e-06, "Pretrain/Loss": 1.9991693496704102, "Pretrain/Loss (Raw)": 1.9704817533493042, "Pretrain/Step": 15229, "Pretrain/Step Time": 8.498770345002413} +{"Pretrain/Learning Rate": 5.136807173300942e-06, "Pretrain/Loss": 1.9998102188110352, "Pretrain/Loss (Raw)": 1.8558664321899414, "Pretrain/Step": 15230, "Pretrain/Step Time": 8.500989753752947} +{"Pretrain/Learning Rate": 5.134229676475638e-06, "Pretrain/Loss": 1.9995448589324951, "Pretrain/Loss (Raw)": 1.9068021774291992, "Pretrain/Step": 15231, "Pretrain/Step Time": 8.496753972023726} +{"Pretrain/Learning Rate": 5.131652752465812e-06, "Pretrain/Loss": 2.0014877319335938, "Pretrain/Loss (Raw)": 2.1325409412384033, "Pretrain/Step": 15232, "Pretrain/Step Time": 8.497482981532812} +{"Pretrain/Learning Rate": 5.129076401345778e-06, "Pretrain/Loss": 2.004728078842163, "Pretrain/Loss (Raw)": 2.1545331478118896, "Pretrain/Step": 15233, "Pretrain/Step Time": 8.493917156010866} +{"Pretrain/Learning Rate": 5.1265006231898084e-06, "Pretrain/Loss": 2.0018887519836426, "Pretrain/Loss (Raw)": 1.8597261905670166, "Pretrain/Step": 15234, "Pretrain/Step Time": 8.497246900573373} +{"Pretrain/Learning Rate": 5.123925418072195e-06, "Pretrain/Loss": 2.000967502593994, "Pretrain/Loss (Raw)": 1.9553661346435547, "Pretrain/Step": 15235, "Pretrain/Step Time": 8.495211822912097} +{"Pretrain/Learning Rate": 5.121350786067178e-06, "Pretrain/Loss": 2.001235008239746, "Pretrain/Loss (Raw)": 2.0531203746795654, "Pretrain/Step": 15236, "Pretrain/Step Time": 8.49906767718494} +{"Pretrain/Learning Rate": 5.118776727248989e-06, "Pretrain/Loss": 2.0041117668151855, "Pretrain/Loss (Raw)": 2.384840965270996, "Pretrain/Step": 15237, "Pretrain/Step Time": 8.498253162950277} +{"Pretrain/Learning Rate": 5.116203241691866e-06, "Pretrain/Loss": 2.001706600189209, "Pretrain/Loss (Raw)": 1.8569637537002563, "Pretrain/Step": 15238, "Pretrain/Step Time": 8.501059770584106} +{"Pretrain/Learning Rate": 5.1136303294700015e-06, "Pretrain/Loss": 2.0026369094848633, "Pretrain/Loss (Raw)": 1.9888321161270142, "Pretrain/Step": 15239, "Pretrain/Step Time": 8.497863421216607} +{"Pretrain/Learning Rate": 5.111057990657589e-06, "Pretrain/Loss": 2.0027103424072266, "Pretrain/Loss (Raw)": 2.0736083984375, "Pretrain/Step": 15240, "Pretrain/Step Time": 8.496734276413918} +{"Pretrain/Learning Rate": 5.108486225328801e-06, "Pretrain/Loss": 2.004852533340454, "Pretrain/Loss (Raw)": 2.2173802852630615, "Pretrain/Step": 15241, "Pretrain/Step Time": 8.494759146124125} +{"Pretrain/Learning Rate": 5.105915033557784e-06, "Pretrain/Loss": 2.0021884441375732, "Pretrain/Loss (Raw)": 1.7118264436721802, "Pretrain/Step": 15242, "Pretrain/Step Time": 8.500006575137377} +{"Pretrain/Learning Rate": 5.10334441541869e-06, "Pretrain/Loss": 2.002673625946045, "Pretrain/Loss (Raw)": 2.182175397872925, "Pretrain/Step": 15243, "Pretrain/Step Time": 8.49967042170465} +{"Pretrain/Learning Rate": 5.100774370985626e-06, "Pretrain/Loss": 1.9996594190597534, "Pretrain/Loss (Raw)": 1.9680938720703125, "Pretrain/Step": 15244, "Pretrain/Step Time": 8.495872626081109} +{"Pretrain/Learning Rate": 5.098204900332712e-06, "Pretrain/Loss": 1.9988808631896973, "Pretrain/Loss (Raw)": 1.8338578939437866, "Pretrain/Step": 15245, "Pretrain/Step Time": 8.501564463600516} +{"Pretrain/Learning Rate": 5.0956360035340266e-06, "Pretrain/Loss": 1.9986591339111328, "Pretrain/Loss (Raw)": 2.0757360458374023, "Pretrain/Step": 15246, "Pretrain/Step Time": 8.502415301278234} +{"Pretrain/Learning Rate": 5.093067680663649e-06, "Pretrain/Loss": 1.9996917247772217, "Pretrain/Loss (Raw)": 2.0033926963806152, "Pretrain/Step": 15247, "Pretrain/Step Time": 8.501277964562178} +{"Pretrain/Learning Rate": 5.090499931795625e-06, "Pretrain/Loss": 1.998450756072998, "Pretrain/Loss (Raw)": 1.8672637939453125, "Pretrain/Step": 15248, "Pretrain/Step Time": 8.501653300598264} +{"Pretrain/Learning Rate": 5.087932757004005e-06, "Pretrain/Loss": 1.997456669807434, "Pretrain/Loss (Raw)": 1.906607747077942, "Pretrain/Step": 15249, "Pretrain/Step Time": 8.504127847030759} +{"Pretrain/Learning Rate": 5.0853661563628055e-06, "Pretrain/Loss": 1.9993833303451538, "Pretrain/Loss (Raw)": 2.0399563312530518, "Pretrain/Step": 15250, "Pretrain/Step Time": 8.501774901524186} +{"Pretrain/Learning Rate": 5.0828001299460306e-06, "Pretrain/Loss": 1.9986419677734375, "Pretrain/Loss (Raw)": 2.0132102966308594, "Pretrain/Step": 15251, "Pretrain/Step Time": 8.502435557544231} +{"Pretrain/Learning Rate": 5.080234677827678e-06, "Pretrain/Loss": 1.9991886615753174, "Pretrain/Loss (Raw)": 2.081282138824463, "Pretrain/Step": 15252, "Pretrain/Step Time": 8.5042335242033} +{"Pretrain/Learning Rate": 5.077669800081711e-06, "Pretrain/Loss": 1.9967418909072876, "Pretrain/Loss (Raw)": 1.7989994287490845, "Pretrain/Step": 15253, "Pretrain/Step Time": 8.502691173925996} +{"Pretrain/Learning Rate": 5.0751054967820955e-06, "Pretrain/Loss": 1.993225336074829, "Pretrain/Loss (Raw)": 1.659131646156311, "Pretrain/Step": 15254, "Pretrain/Step Time": 8.502256346866488} +{"Pretrain/Learning Rate": 5.07254176800277e-06, "Pretrain/Loss": 1.9916669130325317, "Pretrain/Loss (Raw)": 1.9051339626312256, "Pretrain/Step": 15255, "Pretrain/Step Time": 8.502482321113348} +{"Pretrain/Learning Rate": 5.069978613817644e-06, "Pretrain/Loss": 1.9918022155761719, "Pretrain/Loss (Raw)": 1.8904657363891602, "Pretrain/Step": 15256, "Pretrain/Step Time": 8.50417222455144} +{"Pretrain/Learning Rate": 5.067416034300643e-06, "Pretrain/Loss": 1.9925727844238281, "Pretrain/Loss (Raw)": 2.0191690921783447, "Pretrain/Step": 15257, "Pretrain/Step Time": 8.501832738518715} +{"Pretrain/Learning Rate": 5.064854029525645e-06, "Pretrain/Loss": 1.9959793090820312, "Pretrain/Loss (Raw)": 2.4542956352233887, "Pretrain/Step": 15258, "Pretrain/Step Time": 8.506591586396098} +{"Pretrain/Learning Rate": 5.062292599566532e-06, "Pretrain/Loss": 1.9913105964660645, "Pretrain/Loss (Raw)": 1.7802374362945557, "Pretrain/Step": 15259, "Pretrain/Step Time": 8.504090052098036} +{"Pretrain/Learning Rate": 5.059731744497157e-06, "Pretrain/Loss": 1.9916646480560303, "Pretrain/Loss (Raw)": 1.9598006010055542, "Pretrain/Step": 15260, "Pretrain/Step Time": 8.501129170879722} +{"Pretrain/Learning Rate": 5.057171464391352e-06, "Pretrain/Loss": 1.9922629594802856, "Pretrain/Loss (Raw)": 2.151914358139038, "Pretrain/Step": 15261, "Pretrain/Step Time": 8.500928085297346} +{"Pretrain/Learning Rate": 5.054611759322958e-06, "Pretrain/Loss": 1.9942071437835693, "Pretrain/Loss (Raw)": 2.132721424102783, "Pretrain/Step": 15262, "Pretrain/Step Time": 8.498298212885857} +{"Pretrain/Learning Rate": 5.052052629365767e-06, "Pretrain/Loss": 1.9923564195632935, "Pretrain/Loss (Raw)": 1.7180449962615967, "Pretrain/Step": 15263, "Pretrain/Step Time": 8.502204300835729} +{"Pretrain/Learning Rate": 5.04949407459358e-06, "Pretrain/Loss": 1.9928159713745117, "Pretrain/Loss (Raw)": 1.995254397392273, "Pretrain/Step": 15264, "Pretrain/Step Time": 8.500892950221896} +{"Pretrain/Learning Rate": 5.046936095080171e-06, "Pretrain/Loss": 1.9923114776611328, "Pretrain/Loss (Raw)": 2.0480172634124756, "Pretrain/Step": 15265, "Pretrain/Step Time": 8.5004853438586} +{"Pretrain/Learning Rate": 5.044378690899285e-06, "Pretrain/Loss": 1.990598440170288, "Pretrain/Loss (Raw)": 1.8287333250045776, "Pretrain/Step": 15266, "Pretrain/Step Time": 8.503430174663663} +{"Pretrain/Learning Rate": 5.041821862124677e-06, "Pretrain/Loss": 1.9916014671325684, "Pretrain/Loss (Raw)": 2.032625198364258, "Pretrain/Step": 15267, "Pretrain/Step Time": 8.497953828424215} +{"Pretrain/Learning Rate": 5.03926560883006e-06, "Pretrain/Loss": 1.9912068843841553, "Pretrain/Loss (Raw)": 2.0462472438812256, "Pretrain/Step": 15268, "Pretrain/Step Time": 8.49952981248498} +{"Pretrain/Learning Rate": 5.036709931089156e-06, "Pretrain/Loss": 1.9932223558425903, "Pretrain/Loss (Raw)": 2.2244112491607666, "Pretrain/Step": 15269, "Pretrain/Step Time": 8.500900557264686} +{"Pretrain/Learning Rate": 5.034154828975646e-06, "Pretrain/Loss": 1.9898240566253662, "Pretrain/Loss (Raw)": 1.845306634902954, "Pretrain/Step": 15270, "Pretrain/Step Time": 8.496978601440787} +{"Pretrain/Learning Rate": 5.031600302563202e-06, "Pretrain/Loss": 1.99514639377594, "Pretrain/Loss (Raw)": 2.3356754779815674, "Pretrain/Step": 15271, "Pretrain/Step Time": 8.4985345415771} +{"Pretrain/Learning Rate": 5.0290463519254925e-06, "Pretrain/Loss": 1.9968349933624268, "Pretrain/Loss (Raw)": 2.0616934299468994, "Pretrain/Step": 15272, "Pretrain/Step Time": 8.495215680450201} +{"Pretrain/Learning Rate": 5.026492977136144e-06, "Pretrain/Loss": 1.9978554248809814, "Pretrain/Loss (Raw)": 2.1289408206939697, "Pretrain/Step": 15273, "Pretrain/Step Time": 8.489811746403575} +{"Pretrain/Learning Rate": 5.023940178268799e-06, "Pretrain/Loss": 1.9958105087280273, "Pretrain/Loss (Raw)": 1.7970168590545654, "Pretrain/Step": 15274, "Pretrain/Step Time": 8.497994162142277} +{"Pretrain/Learning Rate": 5.0213879553970555e-06, "Pretrain/Loss": 1.9954360723495483, "Pretrain/Loss (Raw)": 2.0008811950683594, "Pretrain/Step": 15275, "Pretrain/Step Time": 8.498880852013826} +{"Pretrain/Learning Rate": 5.018836308594502e-06, "Pretrain/Loss": 1.9931559562683105, "Pretrain/Loss (Raw)": 1.880092978477478, "Pretrain/Step": 15276, "Pretrain/Step Time": 8.493378793820739} +{"Pretrain/Learning Rate": 5.016285237934723e-06, "Pretrain/Loss": 1.992355465888977, "Pretrain/Loss (Raw)": 1.8278512954711914, "Pretrain/Step": 15277, "Pretrain/Step Time": 8.490786308422685} +{"Pretrain/Learning Rate": 5.013734743491263e-06, "Pretrain/Loss": 1.9918794631958008, "Pretrain/Loss (Raw)": 1.972265601158142, "Pretrain/Step": 15278, "Pretrain/Step Time": 8.49565857835114} +{"Pretrain/Learning Rate": 5.011184825337681e-06, "Pretrain/Loss": 1.9946447610855103, "Pretrain/Loss (Raw)": 2.1464242935180664, "Pretrain/Step": 15279, "Pretrain/Step Time": 8.494905848056078} +{"Pretrain/Learning Rate": 5.008635483547494e-06, "Pretrain/Loss": 1.9939618110656738, "Pretrain/Loss (Raw)": 1.9717947244644165, "Pretrain/Step": 15280, "Pretrain/Step Time": 8.493444204330444} +{"Pretrain/Learning Rate": 5.0060867181942e-06, "Pretrain/Loss": 1.991568922996521, "Pretrain/Loss (Raw)": 1.6774529218673706, "Pretrain/Step": 15281, "Pretrain/Step Time": 8.49624670855701} +{"Pretrain/Learning Rate": 5.003538529351312e-06, "Pretrain/Loss": 1.990554690361023, "Pretrain/Loss (Raw)": 1.720650315284729, "Pretrain/Step": 15282, "Pretrain/Step Time": 8.49676520191133} +{"Pretrain/Learning Rate": 5.000990917092283e-06, "Pretrain/Loss": 1.9953639507293701, "Pretrain/Loss (Raw)": 2.5588977336883545, "Pretrain/Step": 15283, "Pretrain/Step Time": 8.499819338321686} +{"Pretrain/Learning Rate": 4.998443881490592e-06, "Pretrain/Loss": 1.9963994026184082, "Pretrain/Loss (Raw)": 2.02427339553833, "Pretrain/Step": 15284, "Pretrain/Step Time": 8.498494314029813} +{"Pretrain/Learning Rate": 4.995897422619669e-06, "Pretrain/Loss": 1.9947973489761353, "Pretrain/Loss (Raw)": 1.96474289894104, "Pretrain/Step": 15285, "Pretrain/Step Time": 8.495767060667276} +{"Pretrain/Learning Rate": 4.9933515405529375e-06, "Pretrain/Loss": 1.9943807125091553, "Pretrain/Loss (Raw)": 1.8886528015136719, "Pretrain/Step": 15286, "Pretrain/Step Time": 8.495248107239604} +{"Pretrain/Learning Rate": 4.9908062353638155e-06, "Pretrain/Loss": 1.9932490587234497, "Pretrain/Loss (Raw)": 2.000250816345215, "Pretrain/Step": 15287, "Pretrain/Step Time": 8.495560672134161} +{"Pretrain/Learning Rate": 4.988261507125686e-06, "Pretrain/Loss": 1.994035005569458, "Pretrain/Loss (Raw)": 2.017150402069092, "Pretrain/Step": 15288, "Pretrain/Step Time": 8.496345948427916} +{"Pretrain/Learning Rate": 4.985717355911934e-06, "Pretrain/Loss": 1.9909265041351318, "Pretrain/Loss (Raw)": 1.8742650747299194, "Pretrain/Step": 15289, "Pretrain/Step Time": 8.495955439284444} +{"Pretrain/Learning Rate": 4.983173781795911e-06, "Pretrain/Loss": 1.9916049242019653, "Pretrain/Loss (Raw)": 1.9435763359069824, "Pretrain/Step": 15290, "Pretrain/Step Time": 8.49136103130877} +{"Pretrain/Learning Rate": 4.9806307848509565e-06, "Pretrain/Loss": 1.9928466081619263, "Pretrain/Loss (Raw)": 2.216036796569824, "Pretrain/Step": 15291, "Pretrain/Step Time": 8.488105468451977} +{"Pretrain/Learning Rate": 4.9780883651504075e-06, "Pretrain/Loss": 1.9926546812057495, "Pretrain/Loss (Raw)": 1.9736549854278564, "Pretrain/Step": 15292, "Pretrain/Step Time": 8.493150003254414} +{"Pretrain/Learning Rate": 4.975546522767558e-06, "Pretrain/Loss": 1.99306321144104, "Pretrain/Loss (Raw)": 2.079686164855957, "Pretrain/Step": 15293, "Pretrain/Step Time": 8.489055052399635} +{"Pretrain/Learning Rate": 4.973005257775715e-06, "Pretrain/Loss": 1.9953224658966064, "Pretrain/Loss (Raw)": 2.178467035293579, "Pretrain/Step": 15294, "Pretrain/Step Time": 8.493615489453077} +{"Pretrain/Learning Rate": 4.970464570248149e-06, "Pretrain/Loss": 1.9970344305038452, "Pretrain/Loss (Raw)": 1.9371674060821533, "Pretrain/Step": 15295, "Pretrain/Step Time": 8.488496590405703} +{"Pretrain/Learning Rate": 4.967924460258108e-06, "Pretrain/Loss": 1.997444748878479, "Pretrain/Loss (Raw)": 2.007079839706421, "Pretrain/Step": 15296, "Pretrain/Step Time": 8.493261089548469} +{"Pretrain/Learning Rate": 4.9653849278788526e-06, "Pretrain/Loss": 1.9968736171722412, "Pretrain/Loss (Raw)": 2.16162109375, "Pretrain/Step": 15297, "Pretrain/Step Time": 8.493922287598252} +{"Pretrain/Learning Rate": 4.962845973183591e-06, "Pretrain/Loss": 1.9971871376037598, "Pretrain/Loss (Raw)": 2.031914472579956, "Pretrain/Step": 15298, "Pretrain/Step Time": 8.489766113460064} +{"Pretrain/Learning Rate": 4.960307596245548e-06, "Pretrain/Loss": 1.9973065853118896, "Pretrain/Loss (Raw)": 1.8808926343917847, "Pretrain/Step": 15299, "Pretrain/Step Time": 8.49357190169394} +{"Pretrain/Learning Rate": 4.957769797137907e-06, "Pretrain/Loss": 1.9955506324768066, "Pretrain/Loss (Raw)": 2.00580096244812, "Pretrain/Step": 15300, "Pretrain/Step Time": 8.494332516565919} +{"Pretrain/Learning Rate": 4.955232575933841e-06, "Pretrain/Loss": 1.9958630800247192, "Pretrain/Loss (Raw)": 2.05941104888916, "Pretrain/Step": 15301, "Pretrain/Step Time": 8.496593790128827} +{"Pretrain/Learning Rate": 4.952695932706516e-06, "Pretrain/Loss": 1.9967284202575684, "Pretrain/Loss (Raw)": 2.068849563598633, "Pretrain/Step": 15302, "Pretrain/Step Time": 8.494714573025703} +{"Pretrain/Learning Rate": 4.950159867529067e-06, "Pretrain/Loss": 1.996687412261963, "Pretrain/Loss (Raw)": 2.0061116218566895, "Pretrain/Step": 15303, "Pretrain/Step Time": 8.496777540072799} +{"Pretrain/Learning Rate": 4.9476243804746305e-06, "Pretrain/Loss": 1.9963250160217285, "Pretrain/Loss (Raw)": 1.766884446144104, "Pretrain/Step": 15304, "Pretrain/Step Time": 8.495091546326876} +{"Pretrain/Learning Rate": 4.9450894716163096e-06, "Pretrain/Loss": 1.9994232654571533, "Pretrain/Loss (Raw)": 2.0570452213287354, "Pretrain/Step": 15305, "Pretrain/Step Time": 8.498478524386883} +{"Pretrain/Learning Rate": 4.942555141027189e-06, "Pretrain/Loss": 1.9989358186721802, "Pretrain/Loss (Raw)": 1.9174091815948486, "Pretrain/Step": 15306, "Pretrain/Step Time": 8.495731707662344} +{"Pretrain/Learning Rate": 4.940021388780358e-06, "Pretrain/Loss": 1.9954098463058472, "Pretrain/Loss (Raw)": 1.9084515571594238, "Pretrain/Step": 15307, "Pretrain/Step Time": 8.495016137138009} +{"Pretrain/Learning Rate": 4.937488214948863e-06, "Pretrain/Loss": 1.995436191558838, "Pretrain/Loss (Raw)": 1.916068434715271, "Pretrain/Step": 15308, "Pretrain/Step Time": 8.495983965694904} +{"Pretrain/Learning Rate": 4.9349556196057575e-06, "Pretrain/Loss": 1.991933822631836, "Pretrain/Loss (Raw)": 1.702257513999939, "Pretrain/Step": 15309, "Pretrain/Step Time": 8.488149957731366} +{"Pretrain/Learning Rate": 4.93242360282406e-06, "Pretrain/Loss": 1.9911072254180908, "Pretrain/Loss (Raw)": 1.8691074848175049, "Pretrain/Step": 15310, "Pretrain/Step Time": 8.492130298167467} +{"Pretrain/Learning Rate": 4.929892164676778e-06, "Pretrain/Loss": 1.9900375604629517, "Pretrain/Loss (Raw)": 1.9105297327041626, "Pretrain/Step": 15311, "Pretrain/Step Time": 8.49062573350966} +{"Pretrain/Learning Rate": 4.927361305236914e-06, "Pretrain/Loss": 1.989668607711792, "Pretrain/Loss (Raw)": 1.9003651142120361, "Pretrain/Step": 15312, "Pretrain/Step Time": 8.49672805890441} +{"Pretrain/Learning Rate": 4.9248310245774255e-06, "Pretrain/Loss": 1.9911887645721436, "Pretrain/Loss (Raw)": 2.0135865211486816, "Pretrain/Step": 15313, "Pretrain/Step Time": 8.490618078038096} +{"Pretrain/Learning Rate": 4.922301322771292e-06, "Pretrain/Loss": 1.99277663230896, "Pretrain/Loss (Raw)": 2.0817229747772217, "Pretrain/Step": 15314, "Pretrain/Step Time": 8.496112877503037} +{"Pretrain/Learning Rate": 4.91977219989144e-06, "Pretrain/Loss": 1.989745855331421, "Pretrain/Loss (Raw)": 1.7047182321548462, "Pretrain/Step": 15315, "Pretrain/Step Time": 8.489597929641604} +{"Pretrain/Learning Rate": 4.917243656010806e-06, "Pretrain/Loss": 1.9895087480545044, "Pretrain/Loss (Raw)": 2.0031626224517822, "Pretrain/Step": 15316, "Pretrain/Step Time": 8.49218718148768} +{"Pretrain/Learning Rate": 4.914715691202293e-06, "Pretrain/Loss": 1.9902957677841187, "Pretrain/Loss (Raw)": 1.9919006824493408, "Pretrain/Step": 15317, "Pretrain/Step Time": 8.488513050600886} +{"Pretrain/Learning Rate": 4.91218830553879e-06, "Pretrain/Loss": 1.990000605583191, "Pretrain/Loss (Raw)": 1.946250081062317, "Pretrain/Step": 15318, "Pretrain/Step Time": 8.489153543487191} +{"Pretrain/Learning Rate": 4.909661499093182e-06, "Pretrain/Loss": 1.9922258853912354, "Pretrain/Loss (Raw)": 2.1425271034240723, "Pretrain/Step": 15319, "Pretrain/Step Time": 8.494649603962898} +{"Pretrain/Learning Rate": 4.907135271938315e-06, "Pretrain/Loss": 1.9925795793533325, "Pretrain/Loss (Raw)": 2.0172176361083984, "Pretrain/Step": 15320, "Pretrain/Step Time": 8.494777984917164} +{"Pretrain/Learning Rate": 4.904609624147044e-06, "Pretrain/Loss": 1.9918310642242432, "Pretrain/Loss (Raw)": 1.8778393268585205, "Pretrain/Step": 15321, "Pretrain/Step Time": 8.49214200861752} +{"Pretrain/Learning Rate": 4.9020845557921884e-06, "Pretrain/Loss": 1.9918174743652344, "Pretrain/Loss (Raw)": 1.9862595796585083, "Pretrain/Step": 15322, "Pretrain/Step Time": 8.4916816893965} +{"Pretrain/Learning Rate": 4.8995600669465486e-06, "Pretrain/Loss": 1.9918489456176758, "Pretrain/Loss (Raw)": 2.0713112354278564, "Pretrain/Step": 15323, "Pretrain/Step Time": 8.491836654022336} +{"Pretrain/Learning Rate": 4.897036157682933e-06, "Pretrain/Loss": 1.991639256477356, "Pretrain/Loss (Raw)": 1.9790446758270264, "Pretrain/Step": 15324, "Pretrain/Step Time": 8.491337394341826} +{"Pretrain/Learning Rate": 4.894512828074102e-06, "Pretrain/Loss": 1.9906601905822754, "Pretrain/Loss (Raw)": 1.8603135347366333, "Pretrain/Step": 15325, "Pretrain/Step Time": 8.487521141767502} +{"Pretrain/Learning Rate": 4.891990078192823e-06, "Pretrain/Loss": 1.9855456352233887, "Pretrain/Loss (Raw)": 1.8750853538513184, "Pretrain/Step": 15326, "Pretrain/Step Time": 8.488996775820851} +{"Pretrain/Learning Rate": 4.889467908111839e-06, "Pretrain/Loss": 1.9864819049835205, "Pretrain/Loss (Raw)": 1.9966731071472168, "Pretrain/Step": 15327, "Pretrain/Step Time": 8.491030951961875} +{"Pretrain/Learning Rate": 4.886946317903862e-06, "Pretrain/Loss": 1.9873523712158203, "Pretrain/Loss (Raw)": 1.984372615814209, "Pretrain/Step": 15328, "Pretrain/Step Time": 8.488958805799484} +{"Pretrain/Learning Rate": 4.884425307641619e-06, "Pretrain/Loss": 1.9872350692749023, "Pretrain/Loss (Raw)": 1.9476654529571533, "Pretrain/Step": 15329, "Pretrain/Step Time": 8.4913937933743} +{"Pretrain/Learning Rate": 4.881904877397781e-06, "Pretrain/Loss": 1.9846675395965576, "Pretrain/Loss (Raw)": 1.7895698547363281, "Pretrain/Step": 15330, "Pretrain/Step Time": 8.493635231629014} +{"Pretrain/Learning Rate": 4.879385027245048e-06, "Pretrain/Loss": 1.9841797351837158, "Pretrain/Loss (Raw)": 2.0470874309539795, "Pretrain/Step": 15331, "Pretrain/Step Time": 8.493880230933428} +{"Pretrain/Learning Rate": 4.876865757256052e-06, "Pretrain/Loss": 1.9836593866348267, "Pretrain/Loss (Raw)": 1.9785038232803345, "Pretrain/Step": 15332, "Pretrain/Step Time": 8.492680471390486} +{"Pretrain/Learning Rate": 4.874347067503452e-06, "Pretrain/Loss": 1.984634280204773, "Pretrain/Loss (Raw)": 2.167205810546875, "Pretrain/Step": 15333, "Pretrain/Step Time": 8.495932023972273} +{"Pretrain/Learning Rate": 4.871828958059866e-06, "Pretrain/Loss": 1.9858287572860718, "Pretrain/Loss (Raw)": 2.1529886722564697, "Pretrain/Step": 15334, "Pretrain/Step Time": 8.494936924427748} +{"Pretrain/Learning Rate": 4.869311428997894e-06, "Pretrain/Loss": 1.9860470294952393, "Pretrain/Loss (Raw)": 1.8881491422653198, "Pretrain/Step": 15335, "Pretrain/Step Time": 8.496102910488844} +{"Pretrain/Learning Rate": 4.866794480390144e-06, "Pretrain/Loss": 1.9840737581253052, "Pretrain/Loss (Raw)": 1.8320132493972778, "Pretrain/Step": 15336, "Pretrain/Step Time": 8.493320668116212} +{"Pretrain/Learning Rate": 4.864278112309176e-06, "Pretrain/Loss": 1.9865975379943848, "Pretrain/Loss (Raw)": 2.2733349800109863, "Pretrain/Step": 15337, "Pretrain/Step Time": 8.489925015717745} +{"Pretrain/Learning Rate": 4.861762324827562e-06, "Pretrain/Loss": 1.9845037460327148, "Pretrain/Loss (Raw)": 1.874865174293518, "Pretrain/Step": 15338, "Pretrain/Step Time": 8.496668005362153} +{"Pretrain/Learning Rate": 4.859247118017832e-06, "Pretrain/Loss": 1.9850870370864868, "Pretrain/Loss (Raw)": 1.956795573234558, "Pretrain/Step": 15339, "Pretrain/Step Time": 8.494191836565733} +{"Pretrain/Learning Rate": 4.8567324919525095e-06, "Pretrain/Loss": 1.9883936643600464, "Pretrain/Loss (Raw)": 2.1368155479431152, "Pretrain/Step": 15340, "Pretrain/Step Time": 8.497978093102574} +{"Pretrain/Learning Rate": 4.854218446704109e-06, "Pretrain/Loss": 1.9870519638061523, "Pretrain/Loss (Raw)": 1.8560956716537476, "Pretrain/Step": 15341, "Pretrain/Step Time": 8.488432420417666} +{"Pretrain/Learning Rate": 4.851704982345112e-06, "Pretrain/Loss": 1.9876642227172852, "Pretrain/Loss (Raw)": 2.054318428039551, "Pretrain/Step": 15342, "Pretrain/Step Time": 8.489936856552958} +{"Pretrain/Learning Rate": 4.849192098948005e-06, "Pretrain/Loss": 1.9867310523986816, "Pretrain/Loss (Raw)": 1.8796520233154297, "Pretrain/Step": 15343, "Pretrain/Step Time": 8.49414835497737} +{"Pretrain/Learning Rate": 4.846679796585241e-06, "Pretrain/Loss": 1.9876163005828857, "Pretrain/Loss (Raw)": 2.0057389736175537, "Pretrain/Step": 15344, "Pretrain/Step Time": 8.496915804222226} +{"Pretrain/Learning Rate": 4.844168075329247e-06, "Pretrain/Loss": 1.989540696144104, "Pretrain/Loss (Raw)": 2.1024839878082275, "Pretrain/Step": 15345, "Pretrain/Step Time": 8.496346816420555} +{"Pretrain/Learning Rate": 4.841656935252467e-06, "Pretrain/Loss": 1.9872355461120605, "Pretrain/Loss (Raw)": 1.931182861328125, "Pretrain/Step": 15346, "Pretrain/Step Time": 8.494037741795182} +{"Pretrain/Learning Rate": 4.839146376427292e-06, "Pretrain/Loss": 1.9887917041778564, "Pretrain/Loss (Raw)": 1.9555813074111938, "Pretrain/Step": 15347, "Pretrain/Step Time": 8.495083035901189} +{"Pretrain/Learning Rate": 4.836636398926125e-06, "Pretrain/Loss": 1.990502119064331, "Pretrain/Loss (Raw)": 1.8794124126434326, "Pretrain/Step": 15348, "Pretrain/Step Time": 8.496647715568542} +{"Pretrain/Learning Rate": 4.834127002821332e-06, "Pretrain/Loss": 1.9890974760055542, "Pretrain/Loss (Raw)": 1.9519473314285278, "Pretrain/Step": 15349, "Pretrain/Step Time": 8.49289889447391} +{"Pretrain/Learning Rate": 4.831618188185266e-06, "Pretrain/Loss": 1.9916515350341797, "Pretrain/Loss (Raw)": 1.9517689943313599, "Pretrain/Step": 15350, "Pretrain/Step Time": 8.492124216631055} +{"Pretrain/Learning Rate": 4.8291099550902775e-06, "Pretrain/Loss": 1.9902338981628418, "Pretrain/Loss (Raw)": 1.9126248359680176, "Pretrain/Step": 15351, "Pretrain/Step Time": 8.490990763530135} +{"Pretrain/Learning Rate": 4.826602303608676e-06, "Pretrain/Loss": 1.98661208152771, "Pretrain/Loss (Raw)": 1.6339809894561768, "Pretrain/Step": 15352, "Pretrain/Step Time": 8.496402185410261} +{"Pretrain/Learning Rate": 4.824095233812784e-06, "Pretrain/Loss": 1.9868284463882446, "Pretrain/Loss (Raw)": 2.2211859226226807, "Pretrain/Step": 15353, "Pretrain/Step Time": 8.493146853521466} +{"Pretrain/Learning Rate": 4.8215887457748825e-06, "Pretrain/Loss": 1.9834142923355103, "Pretrain/Loss (Raw)": 2.033745050430298, "Pretrain/Step": 15354, "Pretrain/Step Time": 8.49865741096437} +{"Pretrain/Learning Rate": 4.819082839567238e-06, "Pretrain/Loss": 1.9841983318328857, "Pretrain/Loss (Raw)": 2.0268959999084473, "Pretrain/Step": 15355, "Pretrain/Step Time": 8.500138504430652} +{"Pretrain/Learning Rate": 4.816577515262122e-06, "Pretrain/Loss": 1.9834575653076172, "Pretrain/Loss (Raw)": 1.9776338338851929, "Pretrain/Step": 15356, "Pretrain/Step Time": 8.495296774432063} +{"Pretrain/Learning Rate": 4.814072772931755e-06, "Pretrain/Loss": 1.9831233024597168, "Pretrain/Loss (Raw)": 1.9276976585388184, "Pretrain/Step": 15357, "Pretrain/Step Time": 8.493710039183497} +{"Pretrain/Learning Rate": 4.8115686126483765e-06, "Pretrain/Loss": 1.9822373390197754, "Pretrain/Loss (Raw)": 1.7424511909484863, "Pretrain/Step": 15358, "Pretrain/Step Time": 8.488070394843817} +{"Pretrain/Learning Rate": 4.809065034484186e-06, "Pretrain/Loss": 1.9827275276184082, "Pretrain/Loss (Raw)": 1.9695470333099365, "Pretrain/Step": 15359, "Pretrain/Step Time": 8.492106018587947} +{"Pretrain/Learning Rate": 4.806562038511367e-06, "Pretrain/Loss": 1.9819777011871338, "Pretrain/Loss (Raw)": 2.0365684032440186, "Pretrain/Step": 15360, "Pretrain/Step Time": 8.49148390442133} +{"Pretrain/Learning Rate": 4.804059624802098e-06, "Pretrain/Loss": 1.9807789325714111, "Pretrain/Loss (Raw)": 2.0010993480682373, "Pretrain/Step": 15361, "Pretrain/Step Time": 8.496708687394857} +{"Pretrain/Learning Rate": 4.80155779342853e-06, "Pretrain/Loss": 1.9807186126708984, "Pretrain/Loss (Raw)": 1.8520008325576782, "Pretrain/Step": 15362, "Pretrain/Step Time": 8.497121488675475} +{"Pretrain/Learning Rate": 4.79905654446281e-06, "Pretrain/Loss": 1.9804333448410034, "Pretrain/Loss (Raw)": 1.918853998184204, "Pretrain/Step": 15363, "Pretrain/Step Time": 8.499030126258731} +{"Pretrain/Learning Rate": 4.796555877977052e-06, "Pretrain/Loss": 1.9803955554962158, "Pretrain/Loss (Raw)": 2.048295021057129, "Pretrain/Step": 15364, "Pretrain/Step Time": 8.491708893328905} +{"Pretrain/Learning Rate": 4.794055794043359e-06, "Pretrain/Loss": 1.9785572290420532, "Pretrain/Loss (Raw)": 2.1495296955108643, "Pretrain/Step": 15365, "Pretrain/Step Time": 8.494508100673556} +{"Pretrain/Learning Rate": 4.7915562927338256e-06, "Pretrain/Loss": 1.978487253189087, "Pretrain/Loss (Raw)": 1.8480135202407837, "Pretrain/Step": 15366, "Pretrain/Step Time": 8.490751169621944} +{"Pretrain/Learning Rate": 4.789057374120518e-06, "Pretrain/Loss": 1.9774086475372314, "Pretrain/Loss (Raw)": 1.85075843334198, "Pretrain/Step": 15367, "Pretrain/Step Time": 8.494648929685354} +{"Pretrain/Learning Rate": 4.786559038275498e-06, "Pretrain/Loss": 1.9780328273773193, "Pretrain/Loss (Raw)": 2.153503656387329, "Pretrain/Step": 15368, "Pretrain/Step Time": 8.49597630277276} +{"Pretrain/Learning Rate": 4.784061285270797e-06, "Pretrain/Loss": 1.9757035970687866, "Pretrain/Loss (Raw)": 1.9192450046539307, "Pretrain/Step": 15369, "Pretrain/Step Time": 8.496844137087464} +{"Pretrain/Learning Rate": 4.781564115178433e-06, "Pretrain/Loss": 1.9775885343551636, "Pretrain/Loss (Raw)": 1.953094720840454, "Pretrain/Step": 15370, "Pretrain/Step Time": 8.49556246586144} +{"Pretrain/Learning Rate": 4.779067528070422e-06, "Pretrain/Loss": 1.9743421077728271, "Pretrain/Loss (Raw)": 1.7666293382644653, "Pretrain/Step": 15371, "Pretrain/Step Time": 8.497425504028797} +{"Pretrain/Learning Rate": 4.776571524018736e-06, "Pretrain/Loss": 1.9748601913452148, "Pretrain/Loss (Raw)": 2.0343992710113525, "Pretrain/Step": 15372, "Pretrain/Step Time": 8.498706180602312} +{"Pretrain/Learning Rate": 4.77407610309536e-06, "Pretrain/Loss": 1.9756760597229004, "Pretrain/Loss (Raw)": 1.93830406665802, "Pretrain/Step": 15373, "Pretrain/Step Time": 8.491702985018492} +{"Pretrain/Learning Rate": 4.771581265372241e-06, "Pretrain/Loss": 1.976081132888794, "Pretrain/Loss (Raw)": 2.127580404281616, "Pretrain/Step": 15374, "Pretrain/Step Time": 8.49059140495956} +{"Pretrain/Learning Rate": 4.769087010921311e-06, "Pretrain/Loss": 1.9755558967590332, "Pretrain/Loss (Raw)": 1.9361610412597656, "Pretrain/Step": 15375, "Pretrain/Step Time": 8.488589968532324} +{"Pretrain/Learning Rate": 4.766593339814498e-06, "Pretrain/Loss": 1.9768271446228027, "Pretrain/Loss (Raw)": 2.0299813747406006, "Pretrain/Step": 15376, "Pretrain/Step Time": 8.489838918671012} +{"Pretrain/Learning Rate": 4.764100252123702e-06, "Pretrain/Loss": 1.977921962738037, "Pretrain/Loss (Raw)": 2.0467591285705566, "Pretrain/Step": 15377, "Pretrain/Step Time": 8.491572825238109} +{"Pretrain/Learning Rate": 4.761607747920813e-06, "Pretrain/Loss": 1.978752851486206, "Pretrain/Loss (Raw)": 2.1463077068328857, "Pretrain/Step": 15378, "Pretrain/Step Time": 8.496922371909022} +{"Pretrain/Learning Rate": 4.759115827277696e-06, "Pretrain/Loss": 1.9775264263153076, "Pretrain/Loss (Raw)": 1.8562095165252686, "Pretrain/Step": 15379, "Pretrain/Step Time": 8.498547490686178} +{"Pretrain/Learning Rate": 4.756624490266201e-06, "Pretrain/Loss": 1.9773659706115723, "Pretrain/Loss (Raw)": 2.0607454776763916, "Pretrain/Step": 15380, "Pretrain/Step Time": 8.496425811201334} +{"Pretrain/Learning Rate": 4.754133736958172e-06, "Pretrain/Loss": 1.9797899723052979, "Pretrain/Loss (Raw)": 2.10927677154541, "Pretrain/Step": 15381, "Pretrain/Step Time": 8.496237698942423} +{"Pretrain/Learning Rate": 4.75164356742542e-06, "Pretrain/Loss": 1.982412576675415, "Pretrain/Loss (Raw)": 1.9948256015777588, "Pretrain/Step": 15382, "Pretrain/Step Time": 8.498062727972865} +{"Pretrain/Learning Rate": 4.74915398173976e-06, "Pretrain/Loss": 1.9826130867004395, "Pretrain/Loss (Raw)": 1.9307868480682373, "Pretrain/Step": 15383, "Pretrain/Step Time": 8.498304350301623} +{"Pretrain/Learning Rate": 4.746664979972959e-06, "Pretrain/Loss": 1.9828553199768066, "Pretrain/Loss (Raw)": 1.921485185623169, "Pretrain/Step": 15384, "Pretrain/Step Time": 8.490632394328713} +{"Pretrain/Learning Rate": 4.744176562196804e-06, "Pretrain/Loss": 1.9803903102874756, "Pretrain/Loss (Raw)": 1.7036583423614502, "Pretrain/Step": 15385, "Pretrain/Step Time": 8.493136199191213} +{"Pretrain/Learning Rate": 4.741688728483037e-06, "Pretrain/Loss": 1.975578784942627, "Pretrain/Loss (Raw)": 1.8384026288986206, "Pretrain/Step": 15386, "Pretrain/Step Time": 8.490299751982093} +{"Pretrain/Learning Rate": 4.739201478903388e-06, "Pretrain/Loss": 1.977448582649231, "Pretrain/Loss (Raw)": 2.0195810794830322, "Pretrain/Step": 15387, "Pretrain/Step Time": 8.491799335926771} +{"Pretrain/Learning Rate": 4.736714813529589e-06, "Pretrain/Loss": 1.977881908416748, "Pretrain/Loss (Raw)": 2.0152649879455566, "Pretrain/Step": 15388, "Pretrain/Step Time": 8.490122893825173} +{"Pretrain/Learning Rate": 4.734228732433327e-06, "Pretrain/Loss": 1.9760475158691406, "Pretrain/Loss (Raw)": 1.9171221256256104, "Pretrain/Step": 15389, "Pretrain/Step Time": 8.491044539958239} +{"Pretrain/Learning Rate": 4.731743235686301e-06, "Pretrain/Loss": 1.9760890007019043, "Pretrain/Loss (Raw)": 2.138033390045166, "Pretrain/Step": 15390, "Pretrain/Step Time": 8.49296603910625} +{"Pretrain/Learning Rate": 4.729258323360166e-06, "Pretrain/Loss": 1.9775564670562744, "Pretrain/Loss (Raw)": 1.9058725833892822, "Pretrain/Step": 15391, "Pretrain/Step Time": 8.488948283717036} +{"Pretrain/Learning Rate": 4.726773995526576e-06, "Pretrain/Loss": 1.9770185947418213, "Pretrain/Loss (Raw)": 1.9264096021652222, "Pretrain/Step": 15392, "Pretrain/Step Time": 8.48900156468153} +{"Pretrain/Learning Rate": 4.7242902522571715e-06, "Pretrain/Loss": 1.978841781616211, "Pretrain/Loss (Raw)": 2.2813801765441895, "Pretrain/Step": 15393, "Pretrain/Step Time": 8.491858307272196} +{"Pretrain/Learning Rate": 4.7218070936235565e-06, "Pretrain/Loss": 1.9776432514190674, "Pretrain/Loss (Raw)": 1.6753170490264893, "Pretrain/Step": 15394, "Pretrain/Step Time": 8.4866012763232} +{"Pretrain/Learning Rate": 4.719324519697343e-06, "Pretrain/Loss": 1.9774880409240723, "Pretrain/Loss (Raw)": 2.0127604007720947, "Pretrain/Step": 15395, "Pretrain/Step Time": 8.488774038851261} +{"Pretrain/Learning Rate": 4.716842530550114e-06, "Pretrain/Loss": 1.9803998470306396, "Pretrain/Loss (Raw)": 2.418959856033325, "Pretrain/Step": 15396, "Pretrain/Step Time": 8.489051163196564} +{"Pretrain/Learning Rate": 4.7143611262534246e-06, "Pretrain/Loss": 1.97818922996521, "Pretrain/Loss (Raw)": 1.9414535760879517, "Pretrain/Step": 15397, "Pretrain/Step Time": 8.486835945397615} +{"Pretrain/Learning Rate": 4.711880306878838e-06, "Pretrain/Loss": 1.9802663326263428, "Pretrain/Loss (Raw)": 2.11116623878479, "Pretrain/Step": 15398, "Pretrain/Step Time": 8.489476202055812} +{"Pretrain/Learning Rate": 4.709400072497871e-06, "Pretrain/Loss": 1.9774879217147827, "Pretrain/Loss (Raw)": 1.9800362586975098, "Pretrain/Step": 15399, "Pretrain/Step Time": 8.491423422470689} +{"Pretrain/Learning Rate": 4.706920423182059e-06, "Pretrain/Loss": 1.9762983322143555, "Pretrain/Loss (Raw)": 1.909440517425537, "Pretrain/Step": 15400, "Pretrain/Step Time": 8.49000166542828} +{"Pretrain/Learning Rate": 4.704441359002889e-06, "Pretrain/Loss": 1.9736425876617432, "Pretrain/Loss (Raw)": 1.7889938354492188, "Pretrain/Step": 15401, "Pretrain/Step Time": 8.493303438648582} +{"Pretrain/Learning Rate": 4.701962880031841e-06, "Pretrain/Loss": 1.975123643875122, "Pretrain/Loss (Raw)": 1.9866009950637817, "Pretrain/Step": 15402, "Pretrain/Step Time": 8.485840894281864} +{"Pretrain/Learning Rate": 4.699484986340389e-06, "Pretrain/Loss": 1.9758665561676025, "Pretrain/Loss (Raw)": 2.0959601402282715, "Pretrain/Step": 15403, "Pretrain/Step Time": 8.490971339866519} +{"Pretrain/Learning Rate": 4.6970076779999706e-06, "Pretrain/Loss": 1.973822832107544, "Pretrain/Loss (Raw)": 1.618512511253357, "Pretrain/Step": 15404, "Pretrain/Step Time": 8.492960713803768} +{"Pretrain/Learning Rate": 4.6945309550820295e-06, "Pretrain/Loss": 1.9751927852630615, "Pretrain/Loss (Raw)": 2.003217935562134, "Pretrain/Step": 15405, "Pretrain/Step Time": 8.486971458420157} +{"Pretrain/Learning Rate": 4.692054817657973e-06, "Pretrain/Loss": 1.976434350013733, "Pretrain/Loss (Raw)": 2.1311721801757812, "Pretrain/Step": 15406, "Pretrain/Step Time": 8.485286427661777} +{"Pretrain/Learning Rate": 4.689579265799193e-06, "Pretrain/Loss": 1.9762166738510132, "Pretrain/Loss (Raw)": 2.1185569763183594, "Pretrain/Step": 15407, "Pretrain/Step Time": 8.484835367649794} +{"Pretrain/Learning Rate": 4.687104299577086e-06, "Pretrain/Loss": 1.9740480184555054, "Pretrain/Loss (Raw)": 1.694205641746521, "Pretrain/Step": 15408, "Pretrain/Step Time": 8.485109144821763} +{"Pretrain/Learning Rate": 4.684629919062997e-06, "Pretrain/Loss": 1.9761048555374146, "Pretrain/Loss (Raw)": 1.9407262802124023, "Pretrain/Step": 15409, "Pretrain/Step Time": 8.483721662312746} +{"Pretrain/Learning Rate": 4.682156124328291e-06, "Pretrain/Loss": 1.9795029163360596, "Pretrain/Loss (Raw)": 2.155611753463745, "Pretrain/Step": 15410, "Pretrain/Step Time": 8.48930219002068} +{"Pretrain/Learning Rate": 4.679682915444289e-06, "Pretrain/Loss": 1.9748059511184692, "Pretrain/Loss (Raw)": 1.957680344581604, "Pretrain/Step": 15411, "Pretrain/Step Time": 8.487050728872418} +{"Pretrain/Learning Rate": 4.677210292482301e-06, "Pretrain/Loss": 1.9737014770507812, "Pretrain/Loss (Raw)": 1.8828965425491333, "Pretrain/Step": 15412, "Pretrain/Step Time": 8.486946050077677} +{"Pretrain/Learning Rate": 4.674738255513633e-06, "Pretrain/Loss": 1.9741137027740479, "Pretrain/Loss (Raw)": 2.0175156593322754, "Pretrain/Step": 15413, "Pretrain/Step Time": 8.49041673913598} +{"Pretrain/Learning Rate": 4.672266804609552e-06, "Pretrain/Loss": 1.975768804550171, "Pretrain/Loss (Raw)": 2.100507974624634, "Pretrain/Step": 15414, "Pretrain/Step Time": 8.493998439982533} +{"Pretrain/Learning Rate": 4.6697959398413396e-06, "Pretrain/Loss": 1.9766596555709839, "Pretrain/Loss (Raw)": 2.1142725944519043, "Pretrain/Step": 15415, "Pretrain/Step Time": 8.488271741196513} +{"Pretrain/Learning Rate": 4.66732566128022e-06, "Pretrain/Loss": 1.9770599603652954, "Pretrain/Loss (Raw)": 2.068387269973755, "Pretrain/Step": 15416, "Pretrain/Step Time": 8.483746198937297} +{"Pretrain/Learning Rate": 4.664855968997433e-06, "Pretrain/Loss": 1.9783635139465332, "Pretrain/Loss (Raw)": 2.0411198139190674, "Pretrain/Step": 15417, "Pretrain/Step Time": 8.484032163396478} +{"Pretrain/Learning Rate": 4.662386863064194e-06, "Pretrain/Loss": 1.9783989191055298, "Pretrain/Loss (Raw)": 1.9481136798858643, "Pretrain/Step": 15418, "Pretrain/Step Time": 8.484832115471363} +{"Pretrain/Learning Rate": 4.659918343551684e-06, "Pretrain/Loss": 1.976139783859253, "Pretrain/Loss (Raw)": 1.926859974861145, "Pretrain/Step": 15419, "Pretrain/Step Time": 8.487023573368788} +{"Pretrain/Learning Rate": 4.657450410531095e-06, "Pretrain/Loss": 1.9765838384628296, "Pretrain/Loss (Raw)": 2.0304934978485107, "Pretrain/Step": 15420, "Pretrain/Step Time": 8.485804188996553} +{"Pretrain/Learning Rate": 4.654983064073576e-06, "Pretrain/Loss": 1.9805026054382324, "Pretrain/Loss (Raw)": 2.581293821334839, "Pretrain/Step": 15421, "Pretrain/Step Time": 8.484241586178541} +{"Pretrain/Learning Rate": 4.652516304250287e-06, "Pretrain/Loss": 1.980597972869873, "Pretrain/Loss (Raw)": 2.1906697750091553, "Pretrain/Step": 15422, "Pretrain/Step Time": 8.485553851351142} +{"Pretrain/Learning Rate": 4.650050131132344e-06, "Pretrain/Loss": 1.9782614707946777, "Pretrain/Loss (Raw)": 1.6380934715270996, "Pretrain/Step": 15423, "Pretrain/Step Time": 8.487446473911405} +{"Pretrain/Learning Rate": 4.647584544790856e-06, "Pretrain/Loss": 1.9783868789672852, "Pretrain/Loss (Raw)": 2.0231502056121826, "Pretrain/Step": 15424, "Pretrain/Step Time": 8.482325926423073} +{"Pretrain/Learning Rate": 4.645119545296925e-06, "Pretrain/Loss": 1.9767342805862427, "Pretrain/Loss (Raw)": 1.9500733613967896, "Pretrain/Step": 15425, "Pretrain/Step Time": 8.480634268373251} +{"Pretrain/Learning Rate": 4.642655132721615e-06, "Pretrain/Loss": 1.9761931896209717, "Pretrain/Loss (Raw)": 1.9626641273498535, "Pretrain/Step": 15426, "Pretrain/Step Time": 8.487421713769436} +{"Pretrain/Learning Rate": 4.640191307136002e-06, "Pretrain/Loss": 1.9779436588287354, "Pretrain/Loss (Raw)": 2.1049537658691406, "Pretrain/Step": 15427, "Pretrain/Step Time": 8.484793417155743} +{"Pretrain/Learning Rate": 4.637728068611119e-06, "Pretrain/Loss": 1.9781723022460938, "Pretrain/Loss (Raw)": 2.035067081451416, "Pretrain/Step": 15428, "Pretrain/Step Time": 8.4856190495193} +{"Pretrain/Learning Rate": 4.6352654172179845e-06, "Pretrain/Loss": 1.9785404205322266, "Pretrain/Loss (Raw)": 2.1065218448638916, "Pretrain/Step": 15429, "Pretrain/Step Time": 8.48579826951027} +{"Pretrain/Learning Rate": 4.632803353027623e-06, "Pretrain/Loss": 1.9775407314300537, "Pretrain/Loss (Raw)": 1.9409059286117554, "Pretrain/Step": 15430, "Pretrain/Step Time": 8.49023930169642} +{"Pretrain/Learning Rate": 4.630341876111013e-06, "Pretrain/Loss": 1.9756652116775513, "Pretrain/Loss (Raw)": 1.7660421133041382, "Pretrain/Step": 15431, "Pretrain/Step Time": 8.486923798918724} +{"Pretrain/Learning Rate": 4.627880986539143e-06, "Pretrain/Loss": 1.977677822113037, "Pretrain/Loss (Raw)": 2.0244882106781006, "Pretrain/Step": 15432, "Pretrain/Step Time": 8.489956161007285} +{"Pretrain/Learning Rate": 4.625420684382961e-06, "Pretrain/Loss": 1.978481411933899, "Pretrain/Loss (Raw)": 2.1599032878875732, "Pretrain/Step": 15433, "Pretrain/Step Time": 8.4860736168921} +{"Pretrain/Learning Rate": 4.622960969713405e-06, "Pretrain/Loss": 1.9787468910217285, "Pretrain/Loss (Raw)": 1.9514014720916748, "Pretrain/Step": 15434, "Pretrain/Step Time": 8.483803756535053} +{"Pretrain/Learning Rate": 4.620501842601413e-06, "Pretrain/Loss": 1.976731300354004, "Pretrain/Loss (Raw)": 1.650450587272644, "Pretrain/Step": 15435, "Pretrain/Step Time": 8.490435529500246} +{"Pretrain/Learning Rate": 4.6180433031178745e-06, "Pretrain/Loss": 1.9753063917160034, "Pretrain/Loss (Raw)": 1.7336710691452026, "Pretrain/Step": 15436, "Pretrain/Step Time": 8.488825026899576} +{"Pretrain/Learning Rate": 4.615585351333696e-06, "Pretrain/Loss": 1.9792933464050293, "Pretrain/Loss (Raw)": 2.212604522705078, "Pretrain/Step": 15437, "Pretrain/Step Time": 8.492898980155587} +{"Pretrain/Learning Rate": 4.6131279873197455e-06, "Pretrain/Loss": 1.9769870042800903, "Pretrain/Loss (Raw)": 1.5738840103149414, "Pretrain/Step": 15438, "Pretrain/Step Time": 8.492130741477013} +{"Pretrain/Learning Rate": 4.610671211146869e-06, "Pretrain/Loss": 1.977003812789917, "Pretrain/Loss (Raw)": 1.9126741886138916, "Pretrain/Step": 15439, "Pretrain/Step Time": 8.493156120181084} +{"Pretrain/Learning Rate": 4.608215022885923e-06, "Pretrain/Loss": 1.9778791666030884, "Pretrain/Loss (Raw)": 2.012425184249878, "Pretrain/Step": 15440, "Pretrain/Step Time": 8.487219016999006} +{"Pretrain/Learning Rate": 4.6057594226077135e-06, "Pretrain/Loss": 1.9771755933761597, "Pretrain/Loss (Raw)": 1.92352294921875, "Pretrain/Step": 15441, "Pretrain/Step Time": 8.487881312146783} +{"Pretrain/Learning Rate": 4.603304410383061e-06, "Pretrain/Loss": 1.9769721031188965, "Pretrain/Loss (Raw)": 2.0556693077087402, "Pretrain/Step": 15442, "Pretrain/Step Time": 8.484322018921375} +{"Pretrain/Learning Rate": 4.600849986282749e-06, "Pretrain/Loss": 1.9780476093292236, "Pretrain/Loss (Raw)": 1.8423866033554077, "Pretrain/Step": 15443, "Pretrain/Step Time": 8.490118000656366} +{"Pretrain/Learning Rate": 4.5983961503775375e-06, "Pretrain/Loss": 1.978518009185791, "Pretrain/Loss (Raw)": 2.063380241394043, "Pretrain/Step": 15444, "Pretrain/Step Time": 8.48818165436387} +{"Pretrain/Learning Rate": 4.595942902738198e-06, "Pretrain/Loss": 1.9769830703735352, "Pretrain/Loss (Raw)": 1.7954317331314087, "Pretrain/Step": 15445, "Pretrain/Step Time": 8.495410148054361} +{"Pretrain/Learning Rate": 4.593490243435456e-06, "Pretrain/Loss": 1.976909875869751, "Pretrain/Loss (Raw)": 1.9368852376937866, "Pretrain/Step": 15446, "Pretrain/Step Time": 8.495807068422437} +{"Pretrain/Learning Rate": 4.591038172540043e-06, "Pretrain/Loss": 1.9754382371902466, "Pretrain/Loss (Raw)": 1.9541535377502441, "Pretrain/Step": 15447, "Pretrain/Step Time": 8.489839999005198} +{"Pretrain/Learning Rate": 4.5885866901226506e-06, "Pretrain/Loss": 1.9758896827697754, "Pretrain/Loss (Raw)": 2.0749900341033936, "Pretrain/Step": 15448, "Pretrain/Step Time": 8.486595338210464} +{"Pretrain/Learning Rate": 4.586135796253977e-06, "Pretrain/Loss": 1.9771087169647217, "Pretrain/Loss (Raw)": 2.033890724182129, "Pretrain/Step": 15449, "Pretrain/Step Time": 8.488385586068034} +{"Pretrain/Learning Rate": 4.583685491004688e-06, "Pretrain/Loss": 1.976993441581726, "Pretrain/Loss (Raw)": 1.9714986085891724, "Pretrain/Step": 15450, "Pretrain/Step Time": 8.487324699759483} +{"Pretrain/Learning Rate": 4.581235774445431e-06, "Pretrain/Loss": 1.9764995574951172, "Pretrain/Loss (Raw)": 2.0080912113189697, "Pretrain/Step": 15451, "Pretrain/Step Time": 8.490443093702197} +{"Pretrain/Learning Rate": 4.578786646646849e-06, "Pretrain/Loss": 1.97965669631958, "Pretrain/Loss (Raw)": 2.3831536769866943, "Pretrain/Step": 15452, "Pretrain/Step Time": 8.490612359717488} +{"Pretrain/Learning Rate": 4.576338107679553e-06, "Pretrain/Loss": 1.9836210012435913, "Pretrain/Loss (Raw)": 2.36776065826416, "Pretrain/Step": 15453, "Pretrain/Step Time": 8.491825379431248} +{"Pretrain/Learning Rate": 4.573890157614155e-06, "Pretrain/Loss": 1.9840161800384521, "Pretrain/Loss (Raw)": 1.925666332244873, "Pretrain/Step": 15454, "Pretrain/Step Time": 8.491887213662267} +{"Pretrain/Learning Rate": 4.5714427965212384e-06, "Pretrain/Loss": 1.9833378791809082, "Pretrain/Loss (Raw)": 1.9098477363586426, "Pretrain/Step": 15455, "Pretrain/Step Time": 8.48856082931161} +{"Pretrain/Learning Rate": 4.568996024471358e-06, "Pretrain/Loss": 1.9829506874084473, "Pretrain/Loss (Raw)": 1.9348169565200806, "Pretrain/Step": 15456, "Pretrain/Step Time": 8.49357663281262} +{"Pretrain/Learning Rate": 4.566549841535081e-06, "Pretrain/Loss": 1.9824804067611694, "Pretrain/Loss (Raw)": 1.8874566555023193, "Pretrain/Step": 15457, "Pretrain/Step Time": 8.48919327557087} +{"Pretrain/Learning Rate": 4.56410424778293e-06, "Pretrain/Loss": 1.9840173721313477, "Pretrain/Loss (Raw)": 1.9863028526306152, "Pretrain/Step": 15458, "Pretrain/Step Time": 8.488605741411448} +{"Pretrain/Learning Rate": 4.561659243285432e-06, "Pretrain/Loss": 1.9843815565109253, "Pretrain/Loss (Raw)": 2.093705415725708, "Pretrain/Step": 15459, "Pretrain/Step Time": 8.487375508993864} +{"Pretrain/Learning Rate": 4.559214828113082e-06, "Pretrain/Loss": 1.9841309785842896, "Pretrain/Loss (Raw)": 1.9464205503463745, "Pretrain/Step": 15460, "Pretrain/Step Time": 8.48987701535225} +{"Pretrain/Learning Rate": 4.556771002336355e-06, "Pretrain/Loss": 1.982879877090454, "Pretrain/Loss (Raw)": 2.007085084915161, "Pretrain/Step": 15461, "Pretrain/Step Time": 8.48899501748383} +{"Pretrain/Learning Rate": 4.554327766025732e-06, "Pretrain/Loss": 1.9790730476379395, "Pretrain/Loss (Raw)": 1.6656943559646606, "Pretrain/Step": 15462, "Pretrain/Step Time": 8.492949444800615} +{"Pretrain/Learning Rate": 4.5518851192516504e-06, "Pretrain/Loss": 1.9789271354675293, "Pretrain/Loss (Raw)": 1.8694928884506226, "Pretrain/Step": 15463, "Pretrain/Step Time": 8.490750137716532} +{"Pretrain/Learning Rate": 4.549443062084549e-06, "Pretrain/Loss": 1.9814457893371582, "Pretrain/Loss (Raw)": 2.1543772220611572, "Pretrain/Step": 15464, "Pretrain/Step Time": 8.4877725597471} +{"Pretrain/Learning Rate": 4.547001594594841e-06, "Pretrain/Loss": 1.979015588760376, "Pretrain/Loss (Raw)": 1.9622852802276611, "Pretrain/Step": 15465, "Pretrain/Step Time": 8.488642949610949} +{"Pretrain/Learning Rate": 4.544560716852919e-06, "Pretrain/Loss": 1.9788410663604736, "Pretrain/Loss (Raw)": 1.8525093793869019, "Pretrain/Step": 15466, "Pretrain/Step Time": 8.483507359400392} +{"Pretrain/Learning Rate": 4.542120428929175e-06, "Pretrain/Loss": 1.9781904220581055, "Pretrain/Loss (Raw)": 1.8735160827636719, "Pretrain/Step": 15467, "Pretrain/Step Time": 8.487960085272789} +{"Pretrain/Learning Rate": 4.539680730893958e-06, "Pretrain/Loss": 1.9782426357269287, "Pretrain/Loss (Raw)": 2.1434969902038574, "Pretrain/Step": 15468, "Pretrain/Step Time": 8.485692916437984} +{"Pretrain/Learning Rate": 4.5372416228176315e-06, "Pretrain/Loss": 1.979997158050537, "Pretrain/Loss (Raw)": 2.0806758403778076, "Pretrain/Step": 15469, "Pretrain/Step Time": 8.486971497535706} +{"Pretrain/Learning Rate": 4.534803104770516e-06, "Pretrain/Loss": 1.9789044857025146, "Pretrain/Loss (Raw)": 1.9144686460494995, "Pretrain/Step": 15470, "Pretrain/Step Time": 8.486162604764104} +{"Pretrain/Learning Rate": 4.532365176822923e-06, "Pretrain/Loss": 1.9798572063446045, "Pretrain/Loss (Raw)": 2.0016121864318848, "Pretrain/Step": 15471, "Pretrain/Step Time": 8.480247741565108} +{"Pretrain/Learning Rate": 4.529927839045153e-06, "Pretrain/Loss": 1.9802321195602417, "Pretrain/Loss (Raw)": 2.0537185668945312, "Pretrain/Step": 15472, "Pretrain/Step Time": 8.4811592400074} +{"Pretrain/Learning Rate": 4.52749109150748e-06, "Pretrain/Loss": 1.9793040752410889, "Pretrain/Loss (Raw)": 1.983688235282898, "Pretrain/Step": 15473, "Pretrain/Step Time": 8.48595542088151} +{"Pretrain/Learning Rate": 4.525054934280176e-06, "Pretrain/Loss": 1.9818553924560547, "Pretrain/Loss (Raw)": 2.257737636566162, "Pretrain/Step": 15474, "Pretrain/Step Time": 8.487137971445918} +{"Pretrain/Learning Rate": 4.522619367433479e-06, "Pretrain/Loss": 1.98299241065979, "Pretrain/Loss (Raw)": 2.1011412143707275, "Pretrain/Step": 15475, "Pretrain/Step Time": 8.487584110349417} +{"Pretrain/Learning Rate": 4.520184391037608e-06, "Pretrain/Loss": 1.9847769737243652, "Pretrain/Loss (Raw)": 2.1078248023986816, "Pretrain/Step": 15476, "Pretrain/Step Time": 8.48850148357451} +{"Pretrain/Learning Rate": 4.51775000516279e-06, "Pretrain/Loss": 1.9850964546203613, "Pretrain/Loss (Raw)": 1.9928381443023682, "Pretrain/Step": 15477, "Pretrain/Step Time": 8.488607034087181} +{"Pretrain/Learning Rate": 4.515316209879209e-06, "Pretrain/Loss": 1.9854199886322021, "Pretrain/Loss (Raw)": 1.9931889772415161, "Pretrain/Step": 15478, "Pretrain/Step Time": 8.49614212475717} +{"Pretrain/Learning Rate": 4.512883005257046e-06, "Pretrain/Loss": 1.9861092567443848, "Pretrain/Loss (Raw)": 2.0008633136749268, "Pretrain/Step": 15479, "Pretrain/Step Time": 8.495725138112903} +{"Pretrain/Learning Rate": 4.510450391366461e-06, "Pretrain/Loss": 1.987459659576416, "Pretrain/Loss (Raw)": 1.8068287372589111, "Pretrain/Step": 15480, "Pretrain/Step Time": 8.494628209620714} +{"Pretrain/Learning Rate": 4.508018368277589e-06, "Pretrain/Loss": 1.9859552383422852, "Pretrain/Loss (Raw)": 2.0286147594451904, "Pretrain/Step": 15481, "Pretrain/Step Time": 8.49525829963386} +{"Pretrain/Learning Rate": 4.505586936060566e-06, "Pretrain/Loss": 1.9848735332489014, "Pretrain/Loss (Raw)": 1.895269513130188, "Pretrain/Step": 15482, "Pretrain/Step Time": 8.496033689007163} +{"Pretrain/Learning Rate": 4.503156094785491e-06, "Pretrain/Loss": 1.9837889671325684, "Pretrain/Loss (Raw)": 1.8880914449691772, "Pretrain/Step": 15483, "Pretrain/Step Time": 8.49262011051178} +{"Pretrain/Learning Rate": 4.500725844522466e-06, "Pretrain/Loss": 1.9837305545806885, "Pretrain/Loss (Raw)": 1.970162034034729, "Pretrain/Step": 15484, "Pretrain/Step Time": 8.496979869902134} +{"Pretrain/Learning Rate": 4.498296185341561e-06, "Pretrain/Loss": 1.9843885898590088, "Pretrain/Loss (Raw)": 2.0119142532348633, "Pretrain/Step": 15485, "Pretrain/Step Time": 8.492897195741534} +{"Pretrain/Learning Rate": 4.495867117312827e-06, "Pretrain/Loss": 1.9856746196746826, "Pretrain/Loss (Raw)": 1.90705144405365, "Pretrain/Step": 15486, "Pretrain/Step Time": 8.496167480945587} +{"Pretrain/Learning Rate": 4.493438640506317e-06, "Pretrain/Loss": 1.984728455543518, "Pretrain/Loss (Raw)": 1.8484641313552856, "Pretrain/Step": 15487, "Pretrain/Step Time": 8.494746074080467} +{"Pretrain/Learning Rate": 4.49101075499204e-06, "Pretrain/Loss": 1.9835208654403687, "Pretrain/Loss (Raw)": 1.8819981813430786, "Pretrain/Step": 15488, "Pretrain/Step Time": 8.495160324499011} +{"Pretrain/Learning Rate": 4.4885834608400155e-06, "Pretrain/Loss": 1.9834065437316895, "Pretrain/Loss (Raw)": 1.986431360244751, "Pretrain/Step": 15489, "Pretrain/Step Time": 8.495656682178378} +{"Pretrain/Learning Rate": 4.48615675812023e-06, "Pretrain/Loss": 1.983942985534668, "Pretrain/Loss (Raw)": 1.9206758737564087, "Pretrain/Step": 15490, "Pretrain/Step Time": 8.493001772090793} +{"Pretrain/Learning Rate": 4.483730646902645e-06, "Pretrain/Loss": 1.9838621616363525, "Pretrain/Loss (Raw)": 1.9085079431533813, "Pretrain/Step": 15491, "Pretrain/Step Time": 8.494961818680167} +{"Pretrain/Learning Rate": 4.481305127257229e-06, "Pretrain/Loss": 1.9825241565704346, "Pretrain/Loss (Raw)": 1.8770426511764526, "Pretrain/Step": 15492, "Pretrain/Step Time": 8.50112535431981} +{"Pretrain/Learning Rate": 4.4788801992539094e-06, "Pretrain/Loss": 1.9809752702713013, "Pretrain/Loss (Raw)": 1.9512641429901123, "Pretrain/Step": 15493, "Pretrain/Step Time": 8.493467880412936} +{"Pretrain/Learning Rate": 4.4764558629626195e-06, "Pretrain/Loss": 1.983313798904419, "Pretrain/Loss (Raw)": 2.1473450660705566, "Pretrain/Step": 15494, "Pretrain/Step Time": 8.499360477551818} +{"Pretrain/Learning Rate": 4.474032118453259e-06, "Pretrain/Loss": 1.9832303524017334, "Pretrain/Loss (Raw)": 1.840072512626648, "Pretrain/Step": 15495, "Pretrain/Step Time": 8.49657341092825} +{"Pretrain/Learning Rate": 4.471608965795701e-06, "Pretrain/Loss": 1.9816877841949463, "Pretrain/Loss (Raw)": 1.9560651779174805, "Pretrain/Step": 15496, "Pretrain/Step Time": 8.49452037550509} +{"Pretrain/Learning Rate": 4.469186405059839e-06, "Pretrain/Loss": 1.9828474521636963, "Pretrain/Loss (Raw)": 2.0676887035369873, "Pretrain/Step": 15497, "Pretrain/Step Time": 8.495924418792129} +{"Pretrain/Learning Rate": 4.466764436315504e-06, "Pretrain/Loss": 1.982128620147705, "Pretrain/Loss (Raw)": 1.8610707521438599, "Pretrain/Step": 15498, "Pretrain/Step Time": 8.48914828337729} +{"Pretrain/Learning Rate": 4.464343059632553e-06, "Pretrain/Loss": 1.9825282096862793, "Pretrain/Loss (Raw)": 1.8177889585494995, "Pretrain/Step": 15499, "Pretrain/Step Time": 8.488715007901192} +{"Pretrain/Learning Rate": 4.461922275080782e-06, "Pretrain/Loss": 1.9824905395507812, "Pretrain/Loss (Raw)": 2.029561996459961, "Pretrain/Step": 15500, "Pretrain/Step Time": 8.490881146863103} +{"Pretrain/Learning Rate": 4.45950208273001e-06, "Pretrain/Loss": 1.9829365015029907, "Pretrain/Loss (Raw)": 1.9953901767730713, "Pretrain/Step": 15501, "Pretrain/Step Time": 8.490830847993493} +{"Pretrain/Learning Rate": 4.4570824826500155e-06, "Pretrain/Loss": 1.9826030731201172, "Pretrain/Loss (Raw)": 2.0848989486694336, "Pretrain/Step": 15502, "Pretrain/Step Time": 8.488623945042491} +{"Pretrain/Learning Rate": 4.4546634749105614e-06, "Pretrain/Loss": 1.981679916381836, "Pretrain/Loss (Raw)": 1.8180150985717773, "Pretrain/Step": 15503, "Pretrain/Step Time": 8.490898098796606} +{"Pretrain/Learning Rate": 4.4522450595814055e-06, "Pretrain/Loss": 1.980184555053711, "Pretrain/Loss (Raw)": 1.8385642766952515, "Pretrain/Step": 15504, "Pretrain/Step Time": 8.48935329169035} +{"Pretrain/Learning Rate": 4.449827236732276e-06, "Pretrain/Loss": 1.9792588949203491, "Pretrain/Loss (Raw)": 1.9282710552215576, "Pretrain/Step": 15505, "Pretrain/Step Time": 8.485677514225245} +{"Pretrain/Learning Rate": 4.447410006432895e-06, "Pretrain/Loss": 1.9775241613388062, "Pretrain/Loss (Raw)": 1.924267053604126, "Pretrain/Step": 15506, "Pretrain/Step Time": 8.480450134724379} +{"Pretrain/Learning Rate": 4.444993368752956e-06, "Pretrain/Loss": 1.9774004220962524, "Pretrain/Loss (Raw)": 1.8403693437576294, "Pretrain/Step": 15507, "Pretrain/Step Time": 8.485967485234141} +{"Pretrain/Learning Rate": 4.4425773237621395e-06, "Pretrain/Loss": 1.9757146835327148, "Pretrain/Loss (Raw)": 1.8449572324752808, "Pretrain/Step": 15508, "Pretrain/Step Time": 8.487164828926325} +{"Pretrain/Learning Rate": 4.440161871530119e-06, "Pretrain/Loss": 1.9751694202423096, "Pretrain/Loss (Raw)": 2.0394980907440186, "Pretrain/Step": 15509, "Pretrain/Step Time": 8.486899316310883} +{"Pretrain/Learning Rate": 4.43774701212653e-06, "Pretrain/Loss": 1.975935935974121, "Pretrain/Loss (Raw)": 2.0929455757141113, "Pretrain/Step": 15510, "Pretrain/Step Time": 8.486125528812408} +{"Pretrain/Learning Rate": 4.435332745621018e-06, "Pretrain/Loss": 1.9756510257720947, "Pretrain/Loss (Raw)": 1.894311547279358, "Pretrain/Step": 15511, "Pretrain/Step Time": 8.486919730901718} +{"Pretrain/Learning Rate": 4.432919072083183e-06, "Pretrain/Loss": 1.9750616550445557, "Pretrain/Loss (Raw)": 1.8460279703140259, "Pretrain/Step": 15512, "Pretrain/Step Time": 8.491384498775005} +{"Pretrain/Learning Rate": 4.430505991582634e-06, "Pretrain/Loss": 1.974822998046875, "Pretrain/Loss (Raw)": 1.6731348037719727, "Pretrain/Step": 15513, "Pretrain/Step Time": 8.48832387290895} +{"Pretrain/Learning Rate": 4.4280935041889436e-06, "Pretrain/Loss": 1.9719160795211792, "Pretrain/Loss (Raw)": 1.4663101434707642, "Pretrain/Step": 15514, "Pretrain/Step Time": 8.486573871225119} +{"Pretrain/Learning Rate": 4.425681609971668e-06, "Pretrain/Loss": 1.972804069519043, "Pretrain/Loss (Raw)": 2.1332523822784424, "Pretrain/Step": 15515, "Pretrain/Step Time": 8.483822956681252} +{"Pretrain/Learning Rate": 4.423270309000366e-06, "Pretrain/Loss": 1.971930980682373, "Pretrain/Loss (Raw)": 1.9034905433654785, "Pretrain/Step": 15516, "Pretrain/Step Time": 8.488763201981783} +{"Pretrain/Learning Rate": 4.420859601344552e-06, "Pretrain/Loss": 1.9724416732788086, "Pretrain/Loss (Raw)": 1.982506513595581, "Pretrain/Step": 15517, "Pretrain/Step Time": 8.484058950096369} +{"Pretrain/Learning Rate": 4.418449487073753e-06, "Pretrain/Loss": 1.971767544746399, "Pretrain/Loss (Raw)": 2.051744222640991, "Pretrain/Step": 15518, "Pretrain/Step Time": 8.485274501144886} +{"Pretrain/Learning Rate": 4.4160399662574515e-06, "Pretrain/Loss": 1.971897840499878, "Pretrain/Loss (Raw)": 1.9225472211837769, "Pretrain/Step": 15519, "Pretrain/Step Time": 8.489026801660657} +{"Pretrain/Learning Rate": 4.413631038965122e-06, "Pretrain/Loss": 1.9723191261291504, "Pretrain/Loss (Raw)": 1.9803287982940674, "Pretrain/Step": 15520, "Pretrain/Step Time": 8.488614713773131} +{"Pretrain/Learning Rate": 4.4112227052662325e-06, "Pretrain/Loss": 1.9697260856628418, "Pretrain/Loss (Raw)": 1.9494779109954834, "Pretrain/Step": 15521, "Pretrain/Step Time": 8.483551090583205} +{"Pretrain/Learning Rate": 4.408814965230218e-06, "Pretrain/Loss": 1.9725379943847656, "Pretrain/Loss (Raw)": 2.035231828689575, "Pretrain/Step": 15522, "Pretrain/Step Time": 8.488034987822175} +{"Pretrain/Learning Rate": 4.406407818926514e-06, "Pretrain/Loss": 1.9720485210418701, "Pretrain/Loss (Raw)": 1.9501011371612549, "Pretrain/Step": 15523, "Pretrain/Step Time": 8.48523666895926} +{"Pretrain/Learning Rate": 4.404001266424523e-06, "Pretrain/Loss": 1.967807650566101, "Pretrain/Loss (Raw)": 1.8761268854141235, "Pretrain/Step": 15524, "Pretrain/Step Time": 8.483666565269232} +{"Pretrain/Learning Rate": 4.401595307793632e-06, "Pretrain/Loss": 1.9680171012878418, "Pretrain/Loss (Raw)": 1.968276858329773, "Pretrain/Step": 15525, "Pretrain/Step Time": 8.489748915657401} +{"Pretrain/Learning Rate": 4.399189943103224e-06, "Pretrain/Loss": 1.9675660133361816, "Pretrain/Loss (Raw)": 2.0534403324127197, "Pretrain/Step": 15526, "Pretrain/Step Time": 8.489115037024021} +{"Pretrain/Learning Rate": 4.396785172422646e-06, "Pretrain/Loss": 1.9672784805297852, "Pretrain/Loss (Raw)": 1.9432176351547241, "Pretrain/Step": 15527, "Pretrain/Step Time": 8.488964460790157} +{"Pretrain/Learning Rate": 4.394380995821248e-06, "Pretrain/Loss": 1.9678162336349487, "Pretrain/Loss (Raw)": 1.9782658815383911, "Pretrain/Step": 15528, "Pretrain/Step Time": 8.490296579897404} +{"Pretrain/Learning Rate": 4.391977413368348e-06, "Pretrain/Loss": 1.9689780473709106, "Pretrain/Loss (Raw)": 1.9377232789993286, "Pretrain/Step": 15529, "Pretrain/Step Time": 8.489678721874952} +{"Pretrain/Learning Rate": 4.389574425133247e-06, "Pretrain/Loss": 1.9662723541259766, "Pretrain/Loss (Raw)": 1.6402627229690552, "Pretrain/Step": 15530, "Pretrain/Step Time": 8.492209408432245} +{"Pretrain/Learning Rate": 4.387172031185241e-06, "Pretrain/Loss": 1.9660335779190063, "Pretrain/Loss (Raw)": 2.0653929710388184, "Pretrain/Step": 15531, "Pretrain/Step Time": 8.488393671810627} +{"Pretrain/Learning Rate": 4.3847702315935965e-06, "Pretrain/Loss": 1.9688855409622192, "Pretrain/Loss (Raw)": 1.9835619926452637, "Pretrain/Step": 15532, "Pretrain/Step Time": 8.492808876559138} +{"Pretrain/Learning Rate": 4.3823690264275744e-06, "Pretrain/Loss": 1.9669125080108643, "Pretrain/Loss (Raw)": 1.750672698020935, "Pretrain/Step": 15533, "Pretrain/Step Time": 8.493700018152595} +{"Pretrain/Learning Rate": 4.379968415756405e-06, "Pretrain/Loss": 1.9667298793792725, "Pretrain/Loss (Raw)": 2.107799530029297, "Pretrain/Step": 15534, "Pretrain/Step Time": 8.489208605140448} +{"Pretrain/Learning Rate": 4.377568399649304e-06, "Pretrain/Loss": 1.9624269008636475, "Pretrain/Loss (Raw)": 1.5677776336669922, "Pretrain/Step": 15535, "Pretrain/Step Time": 8.492078099399805} +{"Pretrain/Learning Rate": 4.37516897817549e-06, "Pretrain/Loss": 1.9639188051223755, "Pretrain/Loss (Raw)": 1.8851591348648071, "Pretrain/Step": 15536, "Pretrain/Step Time": 8.493097165599465} +{"Pretrain/Learning Rate": 4.372770151404129e-06, "Pretrain/Loss": 1.9647809267044067, "Pretrain/Loss (Raw)": 2.051088333129883, "Pretrain/Step": 15537, "Pretrain/Step Time": 8.492836061865091} +{"Pretrain/Learning Rate": 4.3703719194044066e-06, "Pretrain/Loss": 1.9634736776351929, "Pretrain/Loss (Raw)": 1.9882690906524658, "Pretrain/Step": 15538, "Pretrain/Step Time": 8.496359471231699} +{"Pretrain/Learning Rate": 4.3679742822454685e-06, "Pretrain/Loss": 1.9665074348449707, "Pretrain/Loss (Raw)": 2.3460018634796143, "Pretrain/Step": 15539, "Pretrain/Step Time": 8.495214652270079} +{"Pretrain/Learning Rate": 4.3655772399964405e-06, "Pretrain/Loss": 1.968048095703125, "Pretrain/Loss (Raw)": 2.080098867416382, "Pretrain/Step": 15540, "Pretrain/Step Time": 8.496963052079082} +{"Pretrain/Learning Rate": 4.363180792726451e-06, "Pretrain/Loss": 1.967960000038147, "Pretrain/Loss (Raw)": 2.0062437057495117, "Pretrain/Step": 15541, "Pretrain/Step Time": 8.493274757638574} +{"Pretrain/Learning Rate": 4.360784940504592e-06, "Pretrain/Loss": 1.9670437574386597, "Pretrain/Loss (Raw)": 1.9832406044006348, "Pretrain/Step": 15542, "Pretrain/Step Time": 8.492965642362833} +{"Pretrain/Learning Rate": 4.358389683399955e-06, "Pretrain/Loss": 1.9670636653900146, "Pretrain/Loss (Raw)": 2.116816282272339, "Pretrain/Step": 15543, "Pretrain/Step Time": 8.497635746374726} +{"Pretrain/Learning Rate": 4.355995021481598e-06, "Pretrain/Loss": 1.9645823240280151, "Pretrain/Loss (Raw)": 1.7507678270339966, "Pretrain/Step": 15544, "Pretrain/Step Time": 8.498333832249045} +{"Pretrain/Learning Rate": 4.353600954818568e-06, "Pretrain/Loss": 1.9628229141235352, "Pretrain/Loss (Raw)": 1.815932273864746, "Pretrain/Step": 15545, "Pretrain/Step Time": 8.497943136841059} +{"Pretrain/Learning Rate": 4.351207483479902e-06, "Pretrain/Loss": 1.9634709358215332, "Pretrain/Loss (Raw)": 2.031045913696289, "Pretrain/Step": 15546, "Pretrain/Step Time": 8.496249198913574} +{"Pretrain/Learning Rate": 4.34881460753461e-06, "Pretrain/Loss": 1.9647233486175537, "Pretrain/Loss (Raw)": 2.087170124053955, "Pretrain/Step": 15547, "Pretrain/Step Time": 8.493918038904667} +{"Pretrain/Learning Rate": 4.346422327051694e-06, "Pretrain/Loss": 1.9624812602996826, "Pretrain/Loss (Raw)": 1.7435129880905151, "Pretrain/Step": 15548, "Pretrain/Step Time": 8.500345235690475} +{"Pretrain/Learning Rate": 4.344030642100133e-06, "Pretrain/Loss": 1.9579212665557861, "Pretrain/Loss (Raw)": 1.9975945949554443, "Pretrain/Step": 15549, "Pretrain/Step Time": 8.501077910885215} +{"Pretrain/Learning Rate": 4.3416395527488775e-06, "Pretrain/Loss": 1.955224633216858, "Pretrain/Loss (Raw)": 1.8455206155776978, "Pretrain/Step": 15550, "Pretrain/Step Time": 8.497352933511138} +{"Pretrain/Learning Rate": 4.339249059066891e-06, "Pretrain/Loss": 1.9600282907485962, "Pretrain/Loss (Raw)": 2.252959966659546, "Pretrain/Step": 15551, "Pretrain/Step Time": 8.495657604187727} +{"Pretrain/Learning Rate": 4.336859161123086e-06, "Pretrain/Loss": 1.960683822631836, "Pretrain/Loss (Raw)": 2.1070504188537598, "Pretrain/Step": 15552, "Pretrain/Step Time": 8.499482786282897} +{"Pretrain/Learning Rate": 4.334469858986387e-06, "Pretrain/Loss": 1.9615193605422974, "Pretrain/Loss (Raw)": 2.05702543258667, "Pretrain/Step": 15553, "Pretrain/Step Time": 8.499815188348293} +{"Pretrain/Learning Rate": 4.332081152725681e-06, "Pretrain/Loss": 1.9600989818572998, "Pretrain/Loss (Raw)": 1.7808494567871094, "Pretrain/Step": 15554, "Pretrain/Step Time": 8.495567260310054} +{"Pretrain/Learning Rate": 4.329693042409838e-06, "Pretrain/Loss": 1.9587531089782715, "Pretrain/Loss (Raw)": 1.9327055215835571, "Pretrain/Step": 15555, "Pretrain/Step Time": 8.497420696541667} +{"Pretrain/Learning Rate": 4.3273055281077305e-06, "Pretrain/Loss": 1.9572917222976685, "Pretrain/Loss (Raw)": 1.8479968309402466, "Pretrain/Step": 15556, "Pretrain/Step Time": 8.49428067728877} +{"Pretrain/Learning Rate": 4.32491860988819e-06, "Pretrain/Loss": 1.9575350284576416, "Pretrain/Loss (Raw)": 2.1376588344573975, "Pretrain/Step": 15557, "Pretrain/Step Time": 8.494667744264007} +{"Pretrain/Learning Rate": 4.322532287820053e-06, "Pretrain/Loss": 1.9574077129364014, "Pretrain/Loss (Raw)": 1.924615740776062, "Pretrain/Step": 15558, "Pretrain/Step Time": 8.493978260084987} +{"Pretrain/Learning Rate": 4.320146561972121e-06, "Pretrain/Loss": 1.9602880477905273, "Pretrain/Loss (Raw)": 2.134723424911499, "Pretrain/Step": 15559, "Pretrain/Step Time": 8.496952714398503} +{"Pretrain/Learning Rate": 4.317761432413178e-06, "Pretrain/Loss": 1.9600262641906738, "Pretrain/Loss (Raw)": 1.9909688234329224, "Pretrain/Step": 15560, "Pretrain/Step Time": 8.492183173075318} +{"Pretrain/Learning Rate": 4.315376899212009e-06, "Pretrain/Loss": 1.959150791168213, "Pretrain/Loss (Raw)": 2.0478508472442627, "Pretrain/Step": 15561, "Pretrain/Step Time": 8.494300410151482} +{"Pretrain/Learning Rate": 4.312992962437359e-06, "Pretrain/Loss": 1.959299087524414, "Pretrain/Loss (Raw)": 1.9703922271728516, "Pretrain/Step": 15562, "Pretrain/Step Time": 8.495090389624238} +{"Pretrain/Learning Rate": 4.310609622157982e-06, "Pretrain/Loss": 1.9602651596069336, "Pretrain/Loss (Raw)": 1.7740999460220337, "Pretrain/Step": 15563, "Pretrain/Step Time": 8.488617826253176} +{"Pretrain/Learning Rate": 4.308226878442589e-06, "Pretrain/Loss": 1.9594111442565918, "Pretrain/Loss (Raw)": 1.6243667602539062, "Pretrain/Step": 15564, "Pretrain/Step Time": 8.48819649964571} +{"Pretrain/Learning Rate": 4.3058447313598815e-06, "Pretrain/Loss": 1.9578988552093506, "Pretrain/Loss (Raw)": 2.019012212753296, "Pretrain/Step": 15565, "Pretrain/Step Time": 8.484953671693802} +{"Pretrain/Learning Rate": 4.303463180978562e-06, "Pretrain/Loss": 1.9601998329162598, "Pretrain/Loss (Raw)": 1.8684210777282715, "Pretrain/Step": 15566, "Pretrain/Step Time": 8.48978647775948} +{"Pretrain/Learning Rate": 4.301082227367281e-06, "Pretrain/Loss": 1.9618115425109863, "Pretrain/Loss (Raw)": 2.1189706325531006, "Pretrain/Step": 15567, "Pretrain/Step Time": 8.490378534421325} +{"Pretrain/Learning Rate": 4.298701870594712e-06, "Pretrain/Loss": 1.962099313735962, "Pretrain/Loss (Raw)": 2.0492639541625977, "Pretrain/Step": 15568, "Pretrain/Step Time": 8.493826923891902} +{"Pretrain/Learning Rate": 4.296322110729478e-06, "Pretrain/Loss": 1.9606703519821167, "Pretrain/Loss (Raw)": 1.74061119556427, "Pretrain/Step": 15569, "Pretrain/Step Time": 8.493919668719172} +{"Pretrain/Learning Rate": 4.293942947840196e-06, "Pretrain/Loss": 1.9619311094284058, "Pretrain/Loss (Raw)": 2.2170488834381104, "Pretrain/Step": 15570, "Pretrain/Step Time": 8.497499844059348} +{"Pretrain/Learning Rate": 4.2915643819954805e-06, "Pretrain/Loss": 1.9634743928909302, "Pretrain/Loss (Raw)": 2.0399327278137207, "Pretrain/Step": 15571, "Pretrain/Step Time": 8.49250902235508} +{"Pretrain/Learning Rate": 4.289186413263898e-06, "Pretrain/Loss": 1.9627496004104614, "Pretrain/Loss (Raw)": 1.970616102218628, "Pretrain/Step": 15572, "Pretrain/Step Time": 8.49243296124041} +{"Pretrain/Learning Rate": 4.286809041714035e-06, "Pretrain/Loss": 1.9638748168945312, "Pretrain/Loss (Raw)": 1.9394447803497314, "Pretrain/Step": 15573, "Pretrain/Step Time": 8.490071453154087} +{"Pretrain/Learning Rate": 4.284432267414429e-06, "Pretrain/Loss": 1.962761640548706, "Pretrain/Loss (Raw)": 1.794404149055481, "Pretrain/Step": 15574, "Pretrain/Step Time": 8.490375827997923} +{"Pretrain/Learning Rate": 4.282056090433609e-06, "Pretrain/Loss": 1.9635266065597534, "Pretrain/Loss (Raw)": 2.0520689487457275, "Pretrain/Step": 15575, "Pretrain/Step Time": 8.491294221952558} +{"Pretrain/Learning Rate": 4.279680510840103e-06, "Pretrain/Loss": 1.9629735946655273, "Pretrain/Loss (Raw)": 2.0041985511779785, "Pretrain/Step": 15576, "Pretrain/Step Time": 8.495801789686084} +{"Pretrain/Learning Rate": 4.277305528702394e-06, "Pretrain/Loss": 1.9623147249221802, "Pretrain/Loss (Raw)": 1.9495511054992676, "Pretrain/Step": 15577, "Pretrain/Step Time": 8.501337856054306} +{"Pretrain/Learning Rate": 4.2749311440889815e-06, "Pretrain/Loss": 1.961665391921997, "Pretrain/Loss (Raw)": 1.8883932828903198, "Pretrain/Step": 15578, "Pretrain/Step Time": 8.499797923490405} +{"Pretrain/Learning Rate": 4.272557357068319e-06, "Pretrain/Loss": 1.9628431797027588, "Pretrain/Loss (Raw)": 2.158846139907837, "Pretrain/Step": 15579, "Pretrain/Step Time": 8.496764525771141} +{"Pretrain/Learning Rate": 4.270184167708843e-06, "Pretrain/Loss": 1.9606659412384033, "Pretrain/Loss (Raw)": 2.104462146759033, "Pretrain/Step": 15580, "Pretrain/Step Time": 8.499132685363293} +{"Pretrain/Learning Rate": 4.267811576079003e-06, "Pretrain/Loss": 1.9586845636367798, "Pretrain/Loss (Raw)": 2.1141438484191895, "Pretrain/Step": 15581, "Pretrain/Step Time": 8.49600343592465} +{"Pretrain/Learning Rate": 4.2654395822471935e-06, "Pretrain/Loss": 1.9579944610595703, "Pretrain/Loss (Raw)": 1.8373316526412964, "Pretrain/Step": 15582, "Pretrain/Step Time": 8.499171933159232} +{"Pretrain/Learning Rate": 4.263068186281824e-06, "Pretrain/Loss": 1.9590989351272583, "Pretrain/Loss (Raw)": 2.051222801208496, "Pretrain/Step": 15583, "Pretrain/Step Time": 8.499713288620114} +{"Pretrain/Learning Rate": 4.260697388251264e-06, "Pretrain/Loss": 1.959557056427002, "Pretrain/Loss (Raw)": 1.9934511184692383, "Pretrain/Step": 15584, "Pretrain/Step Time": 8.49609274417162} +{"Pretrain/Learning Rate": 4.258327188223874e-06, "Pretrain/Loss": 1.9608064889907837, "Pretrain/Loss (Raw)": 2.0473899841308594, "Pretrain/Step": 15585, "Pretrain/Step Time": 8.495866337791085} +{"Pretrain/Learning Rate": 4.2559575862679916e-06, "Pretrain/Loss": 1.9613513946533203, "Pretrain/Loss (Raw)": 2.056062698364258, "Pretrain/Step": 15586, "Pretrain/Step Time": 8.494388442486525} +{"Pretrain/Learning Rate": 4.253588582451954e-06, "Pretrain/Loss": 1.9591429233551025, "Pretrain/Loss (Raw)": 1.811021327972412, "Pretrain/Step": 15587, "Pretrain/Step Time": 8.50079095363617} +{"Pretrain/Learning Rate": 4.2512201768440645e-06, "Pretrain/Loss": 1.95986807346344, "Pretrain/Loss (Raw)": 2.0392401218414307, "Pretrain/Step": 15588, "Pretrain/Step Time": 8.496683245524764} +{"Pretrain/Learning Rate": 4.2488523695126095e-06, "Pretrain/Loss": 1.9622361660003662, "Pretrain/Loss (Raw)": 2.31019926071167, "Pretrain/Step": 15589, "Pretrain/Step Time": 8.493507985025644} +{"Pretrain/Learning Rate": 4.246485160525873e-06, "Pretrain/Loss": 1.965300440788269, "Pretrain/Loss (Raw)": 2.0579123497009277, "Pretrain/Step": 15590, "Pretrain/Step Time": 8.491140585392714} +{"Pretrain/Learning Rate": 4.244118549952103e-06, "Pretrain/Loss": 1.967128038406372, "Pretrain/Loss (Raw)": 2.103438377380371, "Pretrain/Step": 15591, "Pretrain/Step Time": 8.491241447627544} +{"Pretrain/Learning Rate": 4.241752537859548e-06, "Pretrain/Loss": 1.96537184715271, "Pretrain/Loss (Raw)": 1.9295705556869507, "Pretrain/Step": 15592, "Pretrain/Step Time": 8.495756523683667} +{"Pretrain/Learning Rate": 4.239387124316421e-06, "Pretrain/Loss": 1.9652174711227417, "Pretrain/Loss (Raw)": 1.9425311088562012, "Pretrain/Step": 15593, "Pretrain/Step Time": 8.492892088368535} +{"Pretrain/Learning Rate": 4.237022309390928e-06, "Pretrain/Loss": 1.966403841972351, "Pretrain/Loss (Raw)": 2.004359006881714, "Pretrain/Step": 15594, "Pretrain/Step Time": 8.495919793844223} +{"Pretrain/Learning Rate": 4.234658093151267e-06, "Pretrain/Loss": 1.9677422046661377, "Pretrain/Loss (Raw)": 2.0448403358459473, "Pretrain/Step": 15595, "Pretrain/Step Time": 8.49740232899785} +{"Pretrain/Learning Rate": 4.232294475665594e-06, "Pretrain/Loss": 1.9649666547775269, "Pretrain/Loss (Raw)": 1.788223147392273, "Pretrain/Step": 15596, "Pretrain/Step Time": 8.494444197043777} +{"Pretrain/Learning Rate": 4.2299314570020736e-06, "Pretrain/Loss": 1.9628615379333496, "Pretrain/Loss (Raw)": 1.8112273216247559, "Pretrain/Step": 15597, "Pretrain/Step Time": 8.500879464671016} +{"Pretrain/Learning Rate": 4.22756903722884e-06, "Pretrain/Loss": 1.9648621082305908, "Pretrain/Loss (Raw)": 2.1705336570739746, "Pretrain/Step": 15598, "Pretrain/Step Time": 8.501369459554553} +{"Pretrain/Learning Rate": 4.225207216414004e-06, "Pretrain/Loss": 1.965573787689209, "Pretrain/Loss (Raw)": 2.0927088260650635, "Pretrain/Step": 15599, "Pretrain/Step Time": 8.500645361840725} +{"Pretrain/Learning Rate": 4.222845994625676e-06, "Pretrain/Loss": 1.9645521640777588, "Pretrain/Loss (Raw)": 1.9229340553283691, "Pretrain/Step": 15600, "Pretrain/Step Time": 8.502156192436814} +{"Pretrain/Learning Rate": 4.220485371931931e-06, "Pretrain/Loss": 1.964388370513916, "Pretrain/Loss (Raw)": 1.9627225399017334, "Pretrain/Step": 15601, "Pretrain/Step Time": 8.49579044058919} +{"Pretrain/Learning Rate": 4.21812534840085e-06, "Pretrain/Loss": 1.9602073431015015, "Pretrain/Loss (Raw)": 1.722582459449768, "Pretrain/Step": 15602, "Pretrain/Step Time": 8.502110656350851} +{"Pretrain/Learning Rate": 4.215765924100473e-06, "Pretrain/Loss": 1.9576616287231445, "Pretrain/Loss (Raw)": 1.7752749919891357, "Pretrain/Step": 15603, "Pretrain/Step Time": 8.499651066958904} +{"Pretrain/Learning Rate": 4.213407099098829e-06, "Pretrain/Loss": 1.9560556411743164, "Pretrain/Loss (Raw)": 1.9022784233093262, "Pretrain/Step": 15604, "Pretrain/Step Time": 8.499006517231464} +{"Pretrain/Learning Rate": 4.211048873463943e-06, "Pretrain/Loss": 1.9551098346710205, "Pretrain/Loss (Raw)": 1.8717690706253052, "Pretrain/Step": 15605, "Pretrain/Step Time": 8.500090975314379} +{"Pretrain/Learning Rate": 4.208691247263802e-06, "Pretrain/Loss": 1.9544779062271118, "Pretrain/Loss (Raw)": 1.9123016595840454, "Pretrain/Step": 15606, "Pretrain/Step Time": 8.494823660701513} +{"Pretrain/Learning Rate": 4.2063342205663964e-06, "Pretrain/Loss": 1.9566435813903809, "Pretrain/Loss (Raw)": 2.278052568435669, "Pretrain/Step": 15607, "Pretrain/Step Time": 8.498941266909242} +{"Pretrain/Learning Rate": 4.2039777934396865e-06, "Pretrain/Loss": 1.9574835300445557, "Pretrain/Loss (Raw)": 1.9143445491790771, "Pretrain/Step": 15608, "Pretrain/Step Time": 8.493355862796307} +{"Pretrain/Learning Rate": 4.201621965951611e-06, "Pretrain/Loss": 1.9581513404846191, "Pretrain/Loss (Raw)": 2.114100217819214, "Pretrain/Step": 15609, "Pretrain/Step Time": 8.495570240542293} +{"Pretrain/Learning Rate": 4.199266738170107e-06, "Pretrain/Loss": 1.9588463306427002, "Pretrain/Loss (Raw)": 1.9842281341552734, "Pretrain/Step": 15610, "Pretrain/Step Time": 8.492031998932362} +{"Pretrain/Learning Rate": 4.1969121101630815e-06, "Pretrain/Loss": 1.9616937637329102, "Pretrain/Loss (Raw)": 2.252563953399658, "Pretrain/Step": 15611, "Pretrain/Step Time": 8.491382036358118} +{"Pretrain/Learning Rate": 4.1945580819984345e-06, "Pretrain/Loss": 1.9612175226211548, "Pretrain/Loss (Raw)": 1.9092113971710205, "Pretrain/Step": 15612, "Pretrain/Step Time": 8.49052968248725} +{"Pretrain/Learning Rate": 4.192204653744036e-06, "Pretrain/Loss": 1.9607276916503906, "Pretrain/Loss (Raw)": 1.9492114782333374, "Pretrain/Step": 15613, "Pretrain/Step Time": 8.493254378437996} +{"Pretrain/Learning Rate": 4.189851825467745e-06, "Pretrain/Loss": 1.9618011713027954, "Pretrain/Loss (Raw)": 2.0444676876068115, "Pretrain/Step": 15614, "Pretrain/Step Time": 8.491599798202515} +{"Pretrain/Learning Rate": 4.18749959723741e-06, "Pretrain/Loss": 1.960202932357788, "Pretrain/Loss (Raw)": 1.6438758373260498, "Pretrain/Step": 15615, "Pretrain/Step Time": 8.49229734390974} +{"Pretrain/Learning Rate": 4.185147969120848e-06, "Pretrain/Loss": 1.9600846767425537, "Pretrain/Loss (Raw)": 1.8668535947799683, "Pretrain/Step": 15616, "Pretrain/Step Time": 8.490698046982288} +{"Pretrain/Learning Rate": 4.182796941185876e-06, "Pretrain/Loss": 1.9599933624267578, "Pretrain/Loss (Raw)": 1.9747674465179443, "Pretrain/Step": 15617, "Pretrain/Step Time": 8.492362616583705} +{"Pretrain/Learning Rate": 4.1804465135002774e-06, "Pretrain/Loss": 1.9604113101959229, "Pretrain/Loss (Raw)": 1.9741624593734741, "Pretrain/Step": 15618, "Pretrain/Step Time": 8.491302449256182} +{"Pretrain/Learning Rate": 4.1780966861318245e-06, "Pretrain/Loss": 1.9615448713302612, "Pretrain/Loss (Raw)": 2.053600549697876, "Pretrain/Step": 15619, "Pretrain/Step Time": 8.492810359224677} +{"Pretrain/Learning Rate": 4.175747459148277e-06, "Pretrain/Loss": 1.9618892669677734, "Pretrain/Loss (Raw)": 1.9211201667785645, "Pretrain/Step": 15620, "Pretrain/Step Time": 8.491307757794857} +{"Pretrain/Learning Rate": 4.173398832617367e-06, "Pretrain/Loss": 1.962639331817627, "Pretrain/Loss (Raw)": 2.047281503677368, "Pretrain/Step": 15621, "Pretrain/Step Time": 8.495506908744574} +{"Pretrain/Learning Rate": 4.171050806606827e-06, "Pretrain/Loss": 1.9622002840042114, "Pretrain/Loss (Raw)": 2.0911505222320557, "Pretrain/Step": 15622, "Pretrain/Step Time": 8.49120612628758} +{"Pretrain/Learning Rate": 4.168703381184355e-06, "Pretrain/Loss": 1.9634461402893066, "Pretrain/Loss (Raw)": 1.9995299577713013, "Pretrain/Step": 15623, "Pretrain/Step Time": 8.493049293756485} +{"Pretrain/Learning Rate": 4.166356556417628e-06, "Pretrain/Loss": 1.9645925760269165, "Pretrain/Loss (Raw)": 2.1028101444244385, "Pretrain/Step": 15624, "Pretrain/Step Time": 8.496005151420832} +{"Pretrain/Learning Rate": 4.164010332374327e-06, "Pretrain/Loss": 1.9622697830200195, "Pretrain/Loss (Raw)": 1.7703617811203003, "Pretrain/Step": 15625, "Pretrain/Step Time": 8.4930132124573} +{"Pretrain/Learning Rate": 4.161664709122096e-06, "Pretrain/Loss": 1.9637267589569092, "Pretrain/Loss (Raw)": 2.047579526901245, "Pretrain/Step": 15626, "Pretrain/Step Time": 8.499183293431997} +{"Pretrain/Learning Rate": 4.15931968672858e-06, "Pretrain/Loss": 1.9637001752853394, "Pretrain/Loss (Raw)": 1.8143818378448486, "Pretrain/Step": 15627, "Pretrain/Step Time": 8.49556890130043} +{"Pretrain/Learning Rate": 4.156975265261387e-06, "Pretrain/Loss": 1.9627156257629395, "Pretrain/Loss (Raw)": 1.9035322666168213, "Pretrain/Step": 15628, "Pretrain/Step Time": 8.4946242980659} +{"Pretrain/Learning Rate": 4.154631444788113e-06, "Pretrain/Loss": 1.9635872840881348, "Pretrain/Loss (Raw)": 2.106973171234131, "Pretrain/Step": 15629, "Pretrain/Step Time": 8.499589145183563} +{"Pretrain/Learning Rate": 4.152288225376352e-06, "Pretrain/Loss": 1.9621613025665283, "Pretrain/Loss (Raw)": 1.9023748636245728, "Pretrain/Step": 15630, "Pretrain/Step Time": 8.50038848258555} +{"Pretrain/Learning Rate": 4.149945607093658e-06, "Pretrain/Loss": 1.965010643005371, "Pretrain/Loss (Raw)": 2.1827330589294434, "Pretrain/Step": 15631, "Pretrain/Step Time": 8.4997205901891} +{"Pretrain/Learning Rate": 4.14760359000759e-06, "Pretrain/Loss": 1.9651800394058228, "Pretrain/Loss (Raw)": 1.8602393865585327, "Pretrain/Step": 15632, "Pretrain/Step Time": 8.50592852011323} +{"Pretrain/Learning Rate": 4.145262174185674e-06, "Pretrain/Loss": 1.9647401571273804, "Pretrain/Loss (Raw)": 1.87196683883667, "Pretrain/Step": 15633, "Pretrain/Step Time": 8.505906268954277} +{"Pretrain/Learning Rate": 4.142921359695415e-06, "Pretrain/Loss": 1.9666544198989868, "Pretrain/Loss (Raw)": 2.1692981719970703, "Pretrain/Step": 15634, "Pretrain/Step Time": 8.506172187626362} +{"Pretrain/Learning Rate": 4.14058114660432e-06, "Pretrain/Loss": 1.9660686254501343, "Pretrain/Loss (Raw)": 1.7653816938400269, "Pretrain/Step": 15635, "Pretrain/Step Time": 8.503102127462626} +{"Pretrain/Learning Rate": 4.138241534979856e-06, "Pretrain/Loss": 1.9673991203308105, "Pretrain/Loss (Raw)": 2.015260696411133, "Pretrain/Step": 15636, "Pretrain/Step Time": 8.50111997127533} +{"Pretrain/Learning Rate": 4.135902524889498e-06, "Pretrain/Loss": 1.9686161279678345, "Pretrain/Loss (Raw)": 2.195274591445923, "Pretrain/Step": 15637, "Pretrain/Step Time": 8.500918980687857} +{"Pretrain/Learning Rate": 4.133564116400684e-06, "Pretrain/Loss": 1.9667975902557373, "Pretrain/Loss (Raw)": 1.8601877689361572, "Pretrain/Step": 15638, "Pretrain/Step Time": 8.506199210882187} +{"Pretrain/Learning Rate": 4.13122630958083e-06, "Pretrain/Loss": 1.967268466949463, "Pretrain/Loss (Raw)": 1.9545555114746094, "Pretrain/Step": 15639, "Pretrain/Step Time": 8.506038775667548} +{"Pretrain/Learning Rate": 4.128889104497363e-06, "Pretrain/Loss": 1.9686522483825684, "Pretrain/Loss (Raw)": 2.0231564044952393, "Pretrain/Step": 15640, "Pretrain/Step Time": 8.505184723064303} +{"Pretrain/Learning Rate": 4.126552501217656e-06, "Pretrain/Loss": 1.9706497192382812, "Pretrain/Loss (Raw)": 1.92881441116333, "Pretrain/Step": 15641, "Pretrain/Step Time": 8.501389414072037} +{"Pretrain/Learning Rate": 4.124216499809103e-06, "Pretrain/Loss": 1.9745502471923828, "Pretrain/Loss (Raw)": 1.9655758142471313, "Pretrain/Step": 15642, "Pretrain/Step Time": 8.509272925555706} +{"Pretrain/Learning Rate": 4.121881100339048e-06, "Pretrain/Loss": 1.973343014717102, "Pretrain/Loss (Raw)": 1.9787304401397705, "Pretrain/Step": 15643, "Pretrain/Step Time": 8.508938012644649} +{"Pretrain/Learning Rate": 4.119546302874827e-06, "Pretrain/Loss": 1.973587989807129, "Pretrain/Loss (Raw)": 1.9348487854003906, "Pretrain/Step": 15644, "Pretrain/Step Time": 8.508106283843517} +{"Pretrain/Learning Rate": 4.117212107483775e-06, "Pretrain/Loss": 1.973002314567566, "Pretrain/Loss (Raw)": 1.9075469970703125, "Pretrain/Step": 15645, "Pretrain/Step Time": 8.51395033672452} +{"Pretrain/Learning Rate": 4.114878514233184e-06, "Pretrain/Loss": 1.9711881875991821, "Pretrain/Loss (Raw)": 1.8195345401763916, "Pretrain/Step": 15646, "Pretrain/Step Time": 8.513516828417778} +{"Pretrain/Learning Rate": 4.1125455231903555e-06, "Pretrain/Loss": 1.9709069728851318, "Pretrain/Loss (Raw)": 1.8865447044372559, "Pretrain/Step": 15647, "Pretrain/Step Time": 8.508358905091882} +{"Pretrain/Learning Rate": 4.1102131344225446e-06, "Pretrain/Loss": 1.970874309539795, "Pretrain/Loss (Raw)": 1.9761419296264648, "Pretrain/Step": 15648, "Pretrain/Step Time": 8.51104954816401} +{"Pretrain/Learning Rate": 4.10788134799702e-06, "Pretrain/Loss": 1.9720869064331055, "Pretrain/Loss (Raw)": 2.1047072410583496, "Pretrain/Step": 15649, "Pretrain/Step Time": 8.512072514742613} +{"Pretrain/Learning Rate": 4.105550163981006e-06, "Pretrain/Loss": 1.968662977218628, "Pretrain/Loss (Raw)": 1.596972942352295, "Pretrain/Step": 15650, "Pretrain/Step Time": 8.51049175299704} +{"Pretrain/Learning Rate": 4.103219582441719e-06, "Pretrain/Loss": 1.9676294326782227, "Pretrain/Loss (Raw)": 1.8177988529205322, "Pretrain/Step": 15651, "Pretrain/Step Time": 8.51259358972311} +{"Pretrain/Learning Rate": 4.10088960344637e-06, "Pretrain/Loss": 1.9708940982818604, "Pretrain/Loss (Raw)": 2.2939915657043457, "Pretrain/Step": 15652, "Pretrain/Step Time": 8.513095639646053} +{"Pretrain/Learning Rate": 4.098560227062129e-06, "Pretrain/Loss": 1.9718976020812988, "Pretrain/Loss (Raw)": 2.09674072265625, "Pretrain/Step": 15653, "Pretrain/Step Time": 8.509815344586968} +{"Pretrain/Learning Rate": 4.096231453356178e-06, "Pretrain/Loss": 1.973839282989502, "Pretrain/Loss (Raw)": 2.3019819259643555, "Pretrain/Step": 15654, "Pretrain/Step Time": 8.506494285538793} +{"Pretrain/Learning Rate": 4.093903282395656e-06, "Pretrain/Loss": 1.9732235670089722, "Pretrain/Loss (Raw)": 1.8643910884857178, "Pretrain/Step": 15655, "Pretrain/Step Time": 8.504420071840286} +{"Pretrain/Learning Rate": 4.0915757142476865e-06, "Pretrain/Loss": 1.9718421697616577, "Pretrain/Loss (Raw)": 1.8014477491378784, "Pretrain/Step": 15656, "Pretrain/Step Time": 8.504680451005697} +{"Pretrain/Learning Rate": 4.089248748979399e-06, "Pretrain/Loss": 1.9725295305252075, "Pretrain/Loss (Raw)": 2.0257115364074707, "Pretrain/Step": 15657, "Pretrain/Step Time": 8.501436989754438} +{"Pretrain/Learning Rate": 4.086922386657879e-06, "Pretrain/Loss": 1.9752434492111206, "Pretrain/Loss (Raw)": 1.9876445531845093, "Pretrain/Step": 15658, "Pretrain/Step Time": 8.501779600977898} +{"Pretrain/Learning Rate": 4.084596627350212e-06, "Pretrain/Loss": 1.9759459495544434, "Pretrain/Loss (Raw)": 2.15531063079834, "Pretrain/Step": 15659, "Pretrain/Step Time": 8.500780306756496} +{"Pretrain/Learning Rate": 4.082271471123459e-06, "Pretrain/Loss": 1.9774577617645264, "Pretrain/Loss (Raw)": 2.177072525024414, "Pretrain/Step": 15660, "Pretrain/Step Time": 8.494152773171663} +{"Pretrain/Learning Rate": 4.079946918044655e-06, "Pretrain/Loss": 1.9799728393554688, "Pretrain/Loss (Raw)": 2.0726020336151123, "Pretrain/Step": 15661, "Pretrain/Step Time": 8.496998064219952} +{"Pretrain/Learning Rate": 4.0776229681808416e-06, "Pretrain/Loss": 1.9772417545318604, "Pretrain/Loss (Raw)": 1.758230209350586, "Pretrain/Step": 15662, "Pretrain/Step Time": 8.499989546835423} +{"Pretrain/Learning Rate": 4.075299621599013e-06, "Pretrain/Loss": 1.9800403118133545, "Pretrain/Loss (Raw)": 1.9259779453277588, "Pretrain/Step": 15663, "Pretrain/Step Time": 8.499138217419386} +{"Pretrain/Learning Rate": 4.072976878366175e-06, "Pretrain/Loss": 1.9799246788024902, "Pretrain/Loss (Raw)": 1.8703583478927612, "Pretrain/Step": 15664, "Pretrain/Step Time": 8.499434551224113} +{"Pretrain/Learning Rate": 4.070654738549298e-06, "Pretrain/Loss": 1.9795432090759277, "Pretrain/Loss (Raw)": 2.0022661685943604, "Pretrain/Step": 15665, "Pretrain/Step Time": 8.499226162210107} +{"Pretrain/Learning Rate": 4.06833320221533e-06, "Pretrain/Loss": 1.9790775775909424, "Pretrain/Loss (Raw)": 1.9286826848983765, "Pretrain/Step": 15666, "Pretrain/Step Time": 8.490315921604633} +{"Pretrain/Learning Rate": 4.0660122694312245e-06, "Pretrain/Loss": 1.9793777465820312, "Pretrain/Loss (Raw)": 2.3844170570373535, "Pretrain/Step": 15667, "Pretrain/Step Time": 8.492193082347512} +{"Pretrain/Learning Rate": 4.063691940263897e-06, "Pretrain/Loss": 1.9779047966003418, "Pretrain/Loss (Raw)": 1.8915581703186035, "Pretrain/Step": 15668, "Pretrain/Step Time": 8.48988382332027} +{"Pretrain/Learning Rate": 4.061372214780251e-06, "Pretrain/Loss": 1.9770703315734863, "Pretrain/Loss (Raw)": 1.899430274963379, "Pretrain/Step": 15669, "Pretrain/Step Time": 8.49233309365809} +{"Pretrain/Learning Rate": 4.0590530930471745e-06, "Pretrain/Loss": 1.9786968231201172, "Pretrain/Loss (Raw)": 2.1914336681365967, "Pretrain/Step": 15670, "Pretrain/Step Time": 8.49760852754116} +{"Pretrain/Learning Rate": 4.056734575131544e-06, "Pretrain/Loss": 1.9786467552185059, "Pretrain/Loss (Raw)": 2.1103920936584473, "Pretrain/Step": 15671, "Pretrain/Step Time": 8.499289076775312} +{"Pretrain/Learning Rate": 4.054416661100208e-06, "Pretrain/Loss": 1.9806690216064453, "Pretrain/Loss (Raw)": 2.0096137523651123, "Pretrain/Step": 15672, "Pretrain/Step Time": 8.501036925241351} +{"Pretrain/Learning Rate": 4.052099351019997e-06, "Pretrain/Loss": 1.9803211688995361, "Pretrain/Loss (Raw)": 1.7714239358901978, "Pretrain/Step": 15673, "Pretrain/Step Time": 8.500494461506605} +{"Pretrain/Learning Rate": 4.049782644957739e-06, "Pretrain/Loss": 1.9802889823913574, "Pretrain/Loss (Raw)": 2.026930570602417, "Pretrain/Step": 15674, "Pretrain/Step Time": 8.500529514625669} +{"Pretrain/Learning Rate": 4.047466542980224e-06, "Pretrain/Loss": 1.9817988872528076, "Pretrain/Loss (Raw)": 2.28043532371521, "Pretrain/Step": 15675, "Pretrain/Step Time": 8.501168236136436} +{"Pretrain/Learning Rate": 4.045151045154246e-06, "Pretrain/Loss": 1.982041358947754, "Pretrain/Loss (Raw)": 1.7745376825332642, "Pretrain/Step": 15676, "Pretrain/Step Time": 8.503056403249502} +{"Pretrain/Learning Rate": 4.042836151546564e-06, "Pretrain/Loss": 1.9812843799591064, "Pretrain/Loss (Raw)": 1.9006969928741455, "Pretrain/Step": 15677, "Pretrain/Step Time": 8.50508589297533} +{"Pretrain/Learning Rate": 4.0405218622239254e-06, "Pretrain/Loss": 1.9855459928512573, "Pretrain/Loss (Raw)": 2.3910164833068848, "Pretrain/Step": 15678, "Pretrain/Step Time": 8.502484910190105} +{"Pretrain/Learning Rate": 4.038208177253066e-06, "Pretrain/Loss": 1.982527256011963, "Pretrain/Loss (Raw)": 1.8665660619735718, "Pretrain/Step": 15679, "Pretrain/Step Time": 8.507695969194174} +{"Pretrain/Learning Rate": 4.0358950967006925e-06, "Pretrain/Loss": 1.979489803314209, "Pretrain/Loss (Raw)": 1.7182481288909912, "Pretrain/Step": 15680, "Pretrain/Step Time": 8.509160675108433} +{"Pretrain/Learning Rate": 4.033582620633511e-06, "Pretrain/Loss": 1.979181170463562, "Pretrain/Loss (Raw)": 2.0175328254699707, "Pretrain/Step": 15681, "Pretrain/Step Time": 8.509116871282458} +{"Pretrain/Learning Rate": 4.031270749118194e-06, "Pretrain/Loss": 1.9809762239456177, "Pretrain/Loss (Raw)": 2.0106146335601807, "Pretrain/Step": 15682, "Pretrain/Step Time": 8.510860757902265} +{"Pretrain/Learning Rate": 4.0289594822213975e-06, "Pretrain/Loss": 1.9807170629501343, "Pretrain/Loss (Raw)": 1.8995273113250732, "Pretrain/Step": 15683, "Pretrain/Step Time": 8.50786468014121} +{"Pretrain/Learning Rate": 4.026648820009777e-06, "Pretrain/Loss": 1.981286644935608, "Pretrain/Loss (Raw)": 1.920906901359558, "Pretrain/Step": 15684, "Pretrain/Step Time": 8.511154022067785} +{"Pretrain/Learning Rate": 4.024338762549945e-06, "Pretrain/Loss": 1.9808549880981445, "Pretrain/Loss (Raw)": 2.0823936462402344, "Pretrain/Step": 15685, "Pretrain/Step Time": 8.510349778458476} +{"Pretrain/Learning Rate": 4.022029309908523e-06, "Pretrain/Loss": 1.9821906089782715, "Pretrain/Loss (Raw)": 2.095590114593506, "Pretrain/Step": 15686, "Pretrain/Step Time": 8.511997103691101} +{"Pretrain/Learning Rate": 4.019720462152101e-06, "Pretrain/Loss": 1.9776761531829834, "Pretrain/Loss (Raw)": 1.5568764209747314, "Pretrain/Step": 15687, "Pretrain/Step Time": 8.511275732889771} +{"Pretrain/Learning Rate": 4.017412219347241e-06, "Pretrain/Loss": 1.9780316352844238, "Pretrain/Loss (Raw)": 2.036449670791626, "Pretrain/Step": 15688, "Pretrain/Step Time": 8.511969087645411} +{"Pretrain/Learning Rate": 4.015104581560513e-06, "Pretrain/Loss": 1.9769527912139893, "Pretrain/Loss (Raw)": 1.9097638130187988, "Pretrain/Step": 15689, "Pretrain/Step Time": 8.510336451232433} +{"Pretrain/Learning Rate": 4.012797548858447e-06, "Pretrain/Loss": 1.9764933586120605, "Pretrain/Loss (Raw)": 1.911599040031433, "Pretrain/Step": 15690, "Pretrain/Step Time": 8.507332807406783} +{"Pretrain/Learning Rate": 4.010491121307575e-06, "Pretrain/Loss": 1.9781816005706787, "Pretrain/Loss (Raw)": 1.9901834726333618, "Pretrain/Step": 15691, "Pretrain/Step Time": 8.509432680904865} +{"Pretrain/Learning Rate": 4.008185298974393e-06, "Pretrain/Loss": 1.9804556369781494, "Pretrain/Loss (Raw)": 1.9154562950134277, "Pretrain/Step": 15692, "Pretrain/Step Time": 8.509832041338086} +{"Pretrain/Learning Rate": 4.005880081925384e-06, "Pretrain/Loss": 1.9798095226287842, "Pretrain/Loss (Raw)": 1.936312198638916, "Pretrain/Step": 15693, "Pretrain/Step Time": 8.514578059315681} +{"Pretrain/Learning Rate": 4.0035754702270305e-06, "Pretrain/Loss": 1.982925534248352, "Pretrain/Loss (Raw)": 2.2672595977783203, "Pretrain/Step": 15694, "Pretrain/Step Time": 8.50629299506545} +{"Pretrain/Learning Rate": 4.001271463945769e-06, "Pretrain/Loss": 1.9813055992126465, "Pretrain/Loss (Raw)": 1.9116164445877075, "Pretrain/Step": 15695, "Pretrain/Step Time": 8.508982358500361} +{"Pretrain/Learning Rate": 3.998968063148048e-06, "Pretrain/Loss": 1.9808001518249512, "Pretrain/Loss (Raw)": 1.9845679998397827, "Pretrain/Step": 15696, "Pretrain/Step Time": 8.507132539525628} +{"Pretrain/Learning Rate": 3.996665267900279e-06, "Pretrain/Loss": 1.984527587890625, "Pretrain/Loss (Raw)": 2.2177343368530273, "Pretrain/Step": 15697, "Pretrain/Step Time": 8.508637186139822} +{"Pretrain/Learning Rate": 3.994363078268856e-06, "Pretrain/Loss": 1.9815970659255981, "Pretrain/Loss (Raw)": 1.8419263362884521, "Pretrain/Step": 15698, "Pretrain/Step Time": 8.507412750273943} +{"Pretrain/Learning Rate": 3.992061494320168e-06, "Pretrain/Loss": 1.9840537309646606, "Pretrain/Loss (Raw)": 2.354386806488037, "Pretrain/Step": 15699, "Pretrain/Step Time": 8.507499678060412} +{"Pretrain/Learning Rate": 3.989760516120575e-06, "Pretrain/Loss": 1.9836509227752686, "Pretrain/Loss (Raw)": 1.9190664291381836, "Pretrain/Step": 15700, "Pretrain/Step Time": 8.509459514170885} +{"Pretrain/Learning Rate": 3.987460143736429e-06, "Pretrain/Loss": 1.984224557876587, "Pretrain/Loss (Raw)": 2.01287579536438, "Pretrain/Step": 15701, "Pretrain/Step Time": 8.504988415166736} +{"Pretrain/Learning Rate": 3.98516037723406e-06, "Pretrain/Loss": 1.987861156463623, "Pretrain/Loss (Raw)": 2.259881019592285, "Pretrain/Step": 15702, "Pretrain/Step Time": 8.505383975803852} +{"Pretrain/Learning Rate": 3.982861216679767e-06, "Pretrain/Loss": 1.988410472869873, "Pretrain/Loss (Raw)": 2.122378349304199, "Pretrain/Step": 15703, "Pretrain/Step Time": 8.50684555247426} +{"Pretrain/Learning Rate": 3.980562662139864e-06, "Pretrain/Loss": 1.9889756441116333, "Pretrain/Loss (Raw)": 2.0765457153320312, "Pretrain/Step": 15704, "Pretrain/Step Time": 8.508049763739109} +{"Pretrain/Learning Rate": 3.978264713680613e-06, "Pretrain/Loss": 1.988922119140625, "Pretrain/Loss (Raw)": 1.942702293395996, "Pretrain/Step": 15705, "Pretrain/Step Time": 8.501938795670867} +{"Pretrain/Learning Rate": 3.975967371368283e-06, "Pretrain/Loss": 1.9909775257110596, "Pretrain/Loss (Raw)": 2.151470899581909, "Pretrain/Step": 15706, "Pretrain/Step Time": 8.502606162801385} +{"Pretrain/Learning Rate": 3.973670635269114e-06, "Pretrain/Loss": 1.9890961647033691, "Pretrain/Loss (Raw)": 1.9180316925048828, "Pretrain/Step": 15707, "Pretrain/Step Time": 8.500216830521822} +{"Pretrain/Learning Rate": 3.971374505449324e-06, "Pretrain/Loss": 1.9877405166625977, "Pretrain/Loss (Raw)": 1.9309484958648682, "Pretrain/Step": 15708, "Pretrain/Step Time": 8.501870578154922} +{"Pretrain/Learning Rate": 3.969078981975133e-06, "Pretrain/Loss": 1.9873230457305908, "Pretrain/Loss (Raw)": 2.0607147216796875, "Pretrain/Step": 15709, "Pretrain/Step Time": 8.502189429476857} +{"Pretrain/Learning Rate": 3.966784064912718e-06, "Pretrain/Loss": 1.9875423908233643, "Pretrain/Loss (Raw)": 1.86539626121521, "Pretrain/Step": 15710, "Pretrain/Step Time": 8.503375519067049} +{"Pretrain/Learning Rate": 3.96448975432826e-06, "Pretrain/Loss": 1.989701271057129, "Pretrain/Loss (Raw)": 2.3275554180145264, "Pretrain/Step": 15711, "Pretrain/Step Time": 8.505912570282817} +{"Pretrain/Learning Rate": 3.962196050287914e-06, "Pretrain/Loss": 1.987932562828064, "Pretrain/Loss (Raw)": 1.7670695781707764, "Pretrain/Step": 15712, "Pretrain/Step Time": 8.507853278890252} +{"Pretrain/Learning Rate": 3.959902952857805e-06, "Pretrain/Loss": 1.9874422550201416, "Pretrain/Loss (Raw)": 1.9846382141113281, "Pretrain/Step": 15713, "Pretrain/Step Time": 8.508618293330073} +{"Pretrain/Learning Rate": 3.9576104621040725e-06, "Pretrain/Loss": 1.986841082572937, "Pretrain/Loss (Raw)": 1.9790946245193481, "Pretrain/Step": 15714, "Pretrain/Step Time": 8.50940353050828} +{"Pretrain/Learning Rate": 3.955318578092798e-06, "Pretrain/Loss": 1.9882557392120361, "Pretrain/Loss (Raw)": 1.992102861404419, "Pretrain/Step": 15715, "Pretrain/Step Time": 8.505570584908128} +{"Pretrain/Learning Rate": 3.9530273008900855e-06, "Pretrain/Loss": 1.9883674383163452, "Pretrain/Loss (Raw)": 2.053542137145996, "Pretrain/Step": 15716, "Pretrain/Step Time": 8.505418689921498} +{"Pretrain/Learning Rate": 3.9507366305619854e-06, "Pretrain/Loss": 1.987457036972046, "Pretrain/Loss (Raw)": 2.1936633586883545, "Pretrain/Step": 15717, "Pretrain/Step Time": 8.508506009355187} +{"Pretrain/Learning Rate": 3.948446567174563e-06, "Pretrain/Loss": 1.9872053861618042, "Pretrain/Loss (Raw)": 2.0257065296173096, "Pretrain/Step": 15718, "Pretrain/Step Time": 8.505834205076098} +{"Pretrain/Learning Rate": 3.946157110793844e-06, "Pretrain/Loss": 1.9864258766174316, "Pretrain/Loss (Raw)": 2.0036609172821045, "Pretrain/Step": 15719, "Pretrain/Step Time": 8.512008417397738} +{"Pretrain/Learning Rate": 3.9438682614858365e-06, "Pretrain/Loss": 1.9878920316696167, "Pretrain/Loss (Raw)": 2.117234945297241, "Pretrain/Step": 15720, "Pretrain/Step Time": 8.510018322616816} +{"Pretrain/Learning Rate": 3.941580019316552e-06, "Pretrain/Loss": 1.9907104969024658, "Pretrain/Loss (Raw)": 2.3032915592193604, "Pretrain/Step": 15721, "Pretrain/Step Time": 8.5131114423275} +{"Pretrain/Learning Rate": 3.939292384351953e-06, "Pretrain/Loss": 1.9912807941436768, "Pretrain/Loss (Raw)": 2.0773463249206543, "Pretrain/Step": 15722, "Pretrain/Step Time": 8.507785284891725} +{"Pretrain/Learning Rate": 3.937005356658019e-06, "Pretrain/Loss": 1.9892387390136719, "Pretrain/Loss (Raw)": 1.7834765911102295, "Pretrain/Step": 15723, "Pretrain/Step Time": 8.504201754927635} +{"Pretrain/Learning Rate": 3.9347189363006855e-06, "Pretrain/Loss": 1.9913954734802246, "Pretrain/Loss (Raw)": 2.0642848014831543, "Pretrain/Step": 15724, "Pretrain/Step Time": 8.508225332945585} +{"Pretrain/Learning Rate": 3.932433123345877e-06, "Pretrain/Loss": 1.9928301572799683, "Pretrain/Loss (Raw)": 1.9948556423187256, "Pretrain/Step": 15725, "Pretrain/Step Time": 8.500613622367382} +{"Pretrain/Learning Rate": 3.930147917859514e-06, "Pretrain/Loss": 1.992537021636963, "Pretrain/Loss (Raw)": 2.1330175399780273, "Pretrain/Step": 15726, "Pretrain/Step Time": 8.502525985240936} +{"Pretrain/Learning Rate": 3.927863319907477e-06, "Pretrain/Loss": 1.991351842880249, "Pretrain/Loss (Raw)": 1.9410037994384766, "Pretrain/Step": 15727, "Pretrain/Step Time": 8.508634865283966} +{"Pretrain/Learning Rate": 3.925579329555651e-06, "Pretrain/Loss": 1.9916919469833374, "Pretrain/Loss (Raw)": 1.9664689302444458, "Pretrain/Step": 15728, "Pretrain/Step Time": 8.506110344082117} +{"Pretrain/Learning Rate": 3.923295946869887e-06, "Pretrain/Loss": 1.9916046857833862, "Pretrain/Loss (Raw)": 1.9515600204467773, "Pretrain/Step": 15729, "Pretrain/Step Time": 8.511127717792988} +{"Pretrain/Learning Rate": 3.9210131719160245e-06, "Pretrain/Loss": 1.9915980100631714, "Pretrain/Loss (Raw)": 1.7217170000076294, "Pretrain/Step": 15730, "Pretrain/Step Time": 8.505559019744396} +{"Pretrain/Learning Rate": 3.91873100475989e-06, "Pretrain/Loss": 1.9937111139297485, "Pretrain/Loss (Raw)": 2.0457682609558105, "Pretrain/Step": 15731, "Pretrain/Step Time": 8.509879302233458} +{"Pretrain/Learning Rate": 3.916449445467279e-06, "Pretrain/Loss": 1.9945183992385864, "Pretrain/Loss (Raw)": 2.00559401512146, "Pretrain/Step": 15732, "Pretrain/Step Time": 8.510010765865445} +{"Pretrain/Learning Rate": 3.914168494103995e-06, "Pretrain/Loss": 1.9963016510009766, "Pretrain/Loss (Raw)": 2.100023031234741, "Pretrain/Step": 15733, "Pretrain/Step Time": 8.50722580589354} +{"Pretrain/Learning Rate": 3.911888150735796e-06, "Pretrain/Loss": 1.9968130588531494, "Pretrain/Loss (Raw)": 1.9777748584747314, "Pretrain/Step": 15734, "Pretrain/Step Time": 8.506312634795904} +{"Pretrain/Learning Rate": 3.909608415428429e-06, "Pretrain/Loss": 1.9948217868804932, "Pretrain/Loss (Raw)": 2.0231568813323975, "Pretrain/Step": 15735, "Pretrain/Step Time": 8.504058493301272} +{"Pretrain/Learning Rate": 3.907329288247644e-06, "Pretrain/Loss": 1.995723009109497, "Pretrain/Loss (Raw)": 2.0297040939331055, "Pretrain/Step": 15736, "Pretrain/Step Time": 8.506299724802375} +{"Pretrain/Learning Rate": 3.905050769259142e-06, "Pretrain/Loss": 1.9951218366622925, "Pretrain/Loss (Raw)": 2.0371577739715576, "Pretrain/Step": 15737, "Pretrain/Step Time": 8.501317353919148} +{"Pretrain/Learning Rate": 3.902772858528636e-06, "Pretrain/Loss": 1.996334195137024, "Pretrain/Loss (Raw)": 2.139414072036743, "Pretrain/Step": 15738, "Pretrain/Step Time": 8.502498008310795} +{"Pretrain/Learning Rate": 3.900495556121802e-06, "Pretrain/Loss": 1.9953420162200928, "Pretrain/Loss (Raw)": 2.1255548000335693, "Pretrain/Step": 15739, "Pretrain/Step Time": 8.500644156709313} +{"Pretrain/Learning Rate": 3.8982188621043e-06, "Pretrain/Loss": 1.994567632675171, "Pretrain/Loss (Raw)": 1.810105323791504, "Pretrain/Step": 15740, "Pretrain/Step Time": 8.497935637831688} +{"Pretrain/Learning Rate": 3.895942776541783e-06, "Pretrain/Loss": 1.9941232204437256, "Pretrain/Loss (Raw)": 1.8923060894012451, "Pretrain/Step": 15741, "Pretrain/Step Time": 8.498232167214155} +{"Pretrain/Learning Rate": 3.893667299499879e-06, "Pretrain/Loss": 1.994065523147583, "Pretrain/Loss (Raw)": 2.0370917320251465, "Pretrain/Step": 15742, "Pretrain/Step Time": 8.49937635473907} +{"Pretrain/Learning Rate": 3.8913924310442e-06, "Pretrain/Loss": 1.9952081441879272, "Pretrain/Loss (Raw)": 1.7901180982589722, "Pretrain/Step": 15743, "Pretrain/Step Time": 8.497760409489274} +{"Pretrain/Learning Rate": 3.889118171240341e-06, "Pretrain/Loss": 1.9964816570281982, "Pretrain/Loss (Raw)": 2.0298686027526855, "Pretrain/Step": 15744, "Pretrain/Step Time": 8.499825054779649} +{"Pretrain/Learning Rate": 3.886844520153873e-06, "Pretrain/Loss": 1.9966609477996826, "Pretrain/Loss (Raw)": 1.9977294206619263, "Pretrain/Step": 15745, "Pretrain/Step Time": 8.499109923839569} +{"Pretrain/Learning Rate": 3.884571477850366e-06, "Pretrain/Loss": 1.995866298675537, "Pretrain/Loss (Raw)": 1.8724403381347656, "Pretrain/Step": 15746, "Pretrain/Step Time": 8.499920247122645} +{"Pretrain/Learning Rate": 3.882299044395346e-06, "Pretrain/Loss": 1.9967230558395386, "Pretrain/Loss (Raw)": 2.163278102874756, "Pretrain/Step": 15747, "Pretrain/Step Time": 8.49803126975894} +{"Pretrain/Learning Rate": 3.880027219854354e-06, "Pretrain/Loss": 1.99722158908844, "Pretrain/Loss (Raw)": 1.984911561012268, "Pretrain/Step": 15748, "Pretrain/Step Time": 8.497984612360597} +{"Pretrain/Learning Rate": 3.87775600429289e-06, "Pretrain/Loss": 1.9948885440826416, "Pretrain/Loss (Raw)": 1.7486501932144165, "Pretrain/Step": 15749, "Pretrain/Step Time": 8.493223233148456} +{"Pretrain/Learning Rate": 3.875485397776432e-06, "Pretrain/Loss": 1.9926236867904663, "Pretrain/Loss (Raw)": 1.8012661933898926, "Pretrain/Step": 15750, "Pretrain/Step Time": 8.496240882202983} +{"Pretrain/Learning Rate": 3.87321540037047e-06, "Pretrain/Loss": 1.9943575859069824, "Pretrain/Loss (Raw)": 2.2214643955230713, "Pretrain/Step": 15751, "Pretrain/Step Time": 8.49758462794125} +{"Pretrain/Learning Rate": 3.8709460121404475e-06, "Pretrain/Loss": 1.9941760301589966, "Pretrain/Loss (Raw)": 2.0795633792877197, "Pretrain/Step": 15752, "Pretrain/Step Time": 8.493823654949665} +{"Pretrain/Learning Rate": 3.868677233151802e-06, "Pretrain/Loss": 1.9939343929290771, "Pretrain/Loss (Raw)": 1.7394497394561768, "Pretrain/Step": 15753, "Pretrain/Step Time": 8.49395670183003} +{"Pretrain/Learning Rate": 3.866409063469944e-06, "Pretrain/Loss": 1.993422031402588, "Pretrain/Loss (Raw)": 1.981993556022644, "Pretrain/Step": 15754, "Pretrain/Step Time": 8.490650035440922} +{"Pretrain/Learning Rate": 3.86414150316029e-06, "Pretrain/Loss": 1.9940462112426758, "Pretrain/Loss (Raw)": 1.8942617177963257, "Pretrain/Step": 15755, "Pretrain/Step Time": 8.49557258747518} +{"Pretrain/Learning Rate": 3.861874552288214e-06, "Pretrain/Loss": 1.995071291923523, "Pretrain/Loss (Raw)": 2.034764289855957, "Pretrain/Step": 15756, "Pretrain/Step Time": 8.490428116172552} +{"Pretrain/Learning Rate": 3.85960821091908e-06, "Pretrain/Loss": 1.9947928190231323, "Pretrain/Loss (Raw)": 2.071321487426758, "Pretrain/Step": 15757, "Pretrain/Step Time": 8.48895108513534} +{"Pretrain/Learning Rate": 3.857342479118245e-06, "Pretrain/Loss": 1.993356466293335, "Pretrain/Loss (Raw)": 1.718515157699585, "Pretrain/Step": 15758, "Pretrain/Step Time": 8.486332153901458} +{"Pretrain/Learning Rate": 3.855077356951031e-06, "Pretrain/Loss": 1.9898611307144165, "Pretrain/Loss (Raw)": 1.7353219985961914, "Pretrain/Step": 15759, "Pretrain/Step Time": 8.490635462105274} +{"Pretrain/Learning Rate": 3.852812844482759e-06, "Pretrain/Loss": 1.9908431768417358, "Pretrain/Loss (Raw)": 1.9859579801559448, "Pretrain/Step": 15760, "Pretrain/Step Time": 8.488372255116701} +{"Pretrain/Learning Rate": 3.8505489417787225e-06, "Pretrain/Loss": 1.9912657737731934, "Pretrain/Loss (Raw)": 1.9260588884353638, "Pretrain/Step": 15761, "Pretrain/Step Time": 8.490460634231567} +{"Pretrain/Learning Rate": 3.84828564890419e-06, "Pretrain/Loss": 1.99102783203125, "Pretrain/Loss (Raw)": 2.1388490200042725, "Pretrain/Step": 15762, "Pretrain/Step Time": 8.494260646402836} +{"Pretrain/Learning Rate": 3.846022965924437e-06, "Pretrain/Loss": 1.9933652877807617, "Pretrain/Loss (Raw)": 2.0645647048950195, "Pretrain/Step": 15763, "Pretrain/Step Time": 8.491078313440084} +{"Pretrain/Learning Rate": 3.843760892904693e-06, "Pretrain/Loss": 1.9918859004974365, "Pretrain/Loss (Raw)": 1.825890302658081, "Pretrain/Step": 15764, "Pretrain/Step Time": 8.490612568333745} +{"Pretrain/Learning Rate": 3.841499429910198e-06, "Pretrain/Loss": 1.9895515441894531, "Pretrain/Loss (Raw)": 1.8964709043502808, "Pretrain/Step": 15765, "Pretrain/Step Time": 8.489988507702947} +{"Pretrain/Learning Rate": 3.839238577006146e-06, "Pretrain/Loss": 1.9905104637145996, "Pretrain/Loss (Raw)": 1.9829461574554443, "Pretrain/Step": 15766, "Pretrain/Step Time": 8.48992246389389} +{"Pretrain/Learning Rate": 3.8369783342577295e-06, "Pretrain/Loss": 1.9912705421447754, "Pretrain/Loss (Raw)": 2.0518314838409424, "Pretrain/Step": 15767, "Pretrain/Step Time": 8.49254783987999} +{"Pretrain/Learning Rate": 3.83471870173013e-06, "Pretrain/Loss": 1.9897063970565796, "Pretrain/Loss (Raw)": 1.8229526281356812, "Pretrain/Step": 15768, "Pretrain/Step Time": 8.49124096147716} +{"Pretrain/Learning Rate": 3.83245967948849e-06, "Pretrain/Loss": 1.9936614036560059, "Pretrain/Loss (Raw)": 2.435075283050537, "Pretrain/Step": 15769, "Pretrain/Step Time": 8.492682989686728} +{"Pretrain/Learning Rate": 3.830201267597958e-06, "Pretrain/Loss": 1.9933440685272217, "Pretrain/Loss (Raw)": 1.9249331951141357, "Pretrain/Step": 15770, "Pretrain/Step Time": 8.491007693111897} +{"Pretrain/Learning Rate": 3.827943466123652e-06, "Pretrain/Loss": 1.99385404586792, "Pretrain/Loss (Raw)": 2.044022798538208, "Pretrain/Step": 15771, "Pretrain/Step Time": 8.492557091638446} +{"Pretrain/Learning Rate": 3.825686275130661e-06, "Pretrain/Loss": 1.9953569173812866, "Pretrain/Loss (Raw)": 2.12722110748291, "Pretrain/Step": 15772, "Pretrain/Step Time": 8.492343982681632} +{"Pretrain/Learning Rate": 3.823429694684086e-06, "Pretrain/Loss": 1.9962854385375977, "Pretrain/Loss (Raw)": 2.026379108428955, "Pretrain/Step": 15773, "Pretrain/Step Time": 8.48861202225089} +{"Pretrain/Learning Rate": 3.821173724848981e-06, "Pretrain/Loss": 1.9965204000473022, "Pretrain/Loss (Raw)": 1.8496066331863403, "Pretrain/Step": 15774, "Pretrain/Step Time": 8.48960879817605} +{"Pretrain/Learning Rate": 3.818918365690408e-06, "Pretrain/Loss": 1.9964855909347534, "Pretrain/Loss (Raw)": 1.8821024894714355, "Pretrain/Step": 15775, "Pretrain/Step Time": 8.491351129487157} +{"Pretrain/Learning Rate": 3.816663617273394e-06, "Pretrain/Loss": 1.9970332384109497, "Pretrain/Loss (Raw)": 2.04624080657959, "Pretrain/Step": 15776, "Pretrain/Step Time": 8.48959513567388} +{"Pretrain/Learning Rate": 3.8144094796629422e-06, "Pretrain/Loss": 1.995314598083496, "Pretrain/Loss (Raw)": 1.8847177028656006, "Pretrain/Step": 15777, "Pretrain/Step Time": 8.49148871935904} +{"Pretrain/Learning Rate": 3.812155952924068e-06, "Pretrain/Loss": 1.9982389211654663, "Pretrain/Loss (Raw)": 1.9712802171707153, "Pretrain/Step": 15778, "Pretrain/Step Time": 8.495022937655449} +{"Pretrain/Learning Rate": 3.8099030371217314e-06, "Pretrain/Loss": 1.999771237373352, "Pretrain/Loss (Raw)": 2.013942003250122, "Pretrain/Step": 15779, "Pretrain/Step Time": 8.492862032726407} +{"Pretrain/Learning Rate": 3.807650732320908e-06, "Pretrain/Loss": 1.9968129396438599, "Pretrain/Loss (Raw)": 1.9153307676315308, "Pretrain/Step": 15780, "Pretrain/Step Time": 8.496569650247693} +{"Pretrain/Learning Rate": 3.8053990385865323e-06, "Pretrain/Loss": 1.993880271911621, "Pretrain/Loss (Raw)": 1.7213680744171143, "Pretrain/Step": 15781, "Pretrain/Step Time": 8.49360173754394} +{"Pretrain/Learning Rate": 3.803147955983541e-06, "Pretrain/Loss": 1.9908721446990967, "Pretrain/Loss (Raw)": 1.9169219732284546, "Pretrain/Step": 15782, "Pretrain/Step Time": 8.497949291020632} +{"Pretrain/Learning Rate": 3.8008974845768346e-06, "Pretrain/Loss": 1.9902138710021973, "Pretrain/Loss (Raw)": 1.7801313400268555, "Pretrain/Step": 15783, "Pretrain/Step Time": 8.498262636363506} +{"Pretrain/Learning Rate": 3.798647624431298e-06, "Pretrain/Loss": 1.992107629776001, "Pretrain/Loss (Raw)": 2.043856620788574, "Pretrain/Step": 15784, "Pretrain/Step Time": 8.495887733995914} +{"Pretrain/Learning Rate": 3.7963983756118177e-06, "Pretrain/Loss": 1.9928982257843018, "Pretrain/Loss (Raw)": 2.126918315887451, "Pretrain/Step": 15785, "Pretrain/Step Time": 8.49856811016798} +{"Pretrain/Learning Rate": 3.7941497381832365e-06, "Pretrain/Loss": 1.9951589107513428, "Pretrain/Loss (Raw)": 2.2770016193389893, "Pretrain/Step": 15786, "Pretrain/Step Time": 8.494753642007709} +{"Pretrain/Learning Rate": 3.791901712210405e-06, "Pretrain/Loss": 1.9943351745605469, "Pretrain/Loss (Raw)": 2.0498745441436768, "Pretrain/Step": 15787, "Pretrain/Step Time": 8.495313681662083} +{"Pretrain/Learning Rate": 3.7896542977581356e-06, "Pretrain/Loss": 1.9929800033569336, "Pretrain/Loss (Raw)": 2.0036203861236572, "Pretrain/Step": 15788, "Pretrain/Step Time": 8.495986085385084} +{"Pretrain/Learning Rate": 3.7874074948912263e-06, "Pretrain/Loss": 1.9925668239593506, "Pretrain/Loss (Raw)": 2.01969051361084, "Pretrain/Step": 15789, "Pretrain/Step Time": 8.498063700273633} +{"Pretrain/Learning Rate": 3.7851613036744755e-06, "Pretrain/Loss": 1.9951541423797607, "Pretrain/Loss (Raw)": 2.0894227027893066, "Pretrain/Step": 15790, "Pretrain/Step Time": 8.496761053800583} +{"Pretrain/Learning Rate": 3.7829157241726364e-06, "Pretrain/Loss": 1.9940153360366821, "Pretrain/Loss (Raw)": 1.780211091041565, "Pretrain/Step": 15791, "Pretrain/Step Time": 8.498207358643413} +{"Pretrain/Learning Rate": 3.780670756450472e-06, "Pretrain/Loss": 1.9941052198410034, "Pretrain/Loss (Raw)": 1.881859540939331, "Pretrain/Step": 15792, "Pretrain/Step Time": 8.499409019947052} +{"Pretrain/Learning Rate": 3.7784264005727045e-06, "Pretrain/Loss": 1.9946855306625366, "Pretrain/Loss (Raw)": 2.076552391052246, "Pretrain/Step": 15793, "Pretrain/Step Time": 8.499566618353128} +{"Pretrain/Learning Rate": 3.7761826566040494e-06, "Pretrain/Loss": 1.9951708316802979, "Pretrain/Loss (Raw)": 1.9908015727996826, "Pretrain/Step": 15794, "Pretrain/Step Time": 8.50348742492497} +{"Pretrain/Learning Rate": 3.77393952460921e-06, "Pretrain/Loss": 1.9907234907150269, "Pretrain/Loss (Raw)": 1.8151497840881348, "Pretrain/Step": 15795, "Pretrain/Step Time": 8.502512538805604} +{"Pretrain/Learning Rate": 3.771697004652855e-06, "Pretrain/Loss": 1.992983341217041, "Pretrain/Loss (Raw)": 2.1808207035064697, "Pretrain/Step": 15796, "Pretrain/Step Time": 8.504971975460649} +{"Pretrain/Learning Rate": 3.7694550967996565e-06, "Pretrain/Loss": 1.9916236400604248, "Pretrain/Loss (Raw)": 1.7253791093826294, "Pretrain/Step": 15797, "Pretrain/Step Time": 8.507385920733213} +{"Pretrain/Learning Rate": 3.7672138011142555e-06, "Pretrain/Loss": 1.9890737533569336, "Pretrain/Loss (Raw)": 1.8650648593902588, "Pretrain/Step": 15798, "Pretrain/Step Time": 8.50164095684886} +{"Pretrain/Learning Rate": 3.764973117661272e-06, "Pretrain/Loss": 1.9875967502593994, "Pretrain/Loss (Raw)": 1.9213241338729858, "Pretrain/Step": 15799, "Pretrain/Step Time": 8.497255839407444} +{"Pretrain/Learning Rate": 3.7627330465053236e-06, "Pretrain/Loss": 1.9846699237823486, "Pretrain/Loss (Raw)": 1.6349859237670898, "Pretrain/Step": 15800, "Pretrain/Step Time": 8.496644610539079} +{"Pretrain/Learning Rate": 3.7604935877109893e-06, "Pretrain/Loss": 1.9852651357650757, "Pretrain/Loss (Raw)": 1.8476104736328125, "Pretrain/Step": 15801, "Pretrain/Step Time": 8.495801420882344} +{"Pretrain/Learning Rate": 3.7582547413428566e-06, "Pretrain/Loss": 1.9822620153427124, "Pretrain/Loss (Raw)": 1.6425362825393677, "Pretrain/Step": 15802, "Pretrain/Step Time": 8.495801927521825} +{"Pretrain/Learning Rate": 3.7560165074654734e-06, "Pretrain/Loss": 1.9811785221099854, "Pretrain/Loss (Raw)": 2.141752004623413, "Pretrain/Step": 15803, "Pretrain/Step Time": 8.496049739420414} +{"Pretrain/Learning Rate": 3.753778886143372e-06, "Pretrain/Loss": 1.9822914600372314, "Pretrain/Loss (Raw)": 1.9169882535934448, "Pretrain/Step": 15804, "Pretrain/Step Time": 8.486854678019881} +{"Pretrain/Learning Rate": 3.7515418774410837e-06, "Pretrain/Loss": 1.9819058179855347, "Pretrain/Loss (Raw)": 1.8513264656066895, "Pretrain/Step": 15805, "Pretrain/Step Time": 8.483578430488706} +{"Pretrain/Learning Rate": 3.7493054814231016e-06, "Pretrain/Loss": 1.9779728651046753, "Pretrain/Loss (Raw)": 1.8876041173934937, "Pretrain/Step": 15806, "Pretrain/Step Time": 8.493347091600299} +{"Pretrain/Learning Rate": 3.747069698153921e-06, "Pretrain/Loss": 1.9779868125915527, "Pretrain/Loss (Raw)": 1.8683395385742188, "Pretrain/Step": 15807, "Pretrain/Step Time": 8.490781053900719} +{"Pretrain/Learning Rate": 3.7448345276980044e-06, "Pretrain/Loss": 1.9800682067871094, "Pretrain/Loss (Raw)": 1.984681248664856, "Pretrain/Step": 15808, "Pretrain/Step Time": 8.483827328309417} +{"Pretrain/Learning Rate": 3.742599970119795e-06, "Pretrain/Loss": 1.97903311252594, "Pretrain/Loss (Raw)": 1.8850500583648682, "Pretrain/Step": 15809, "Pretrain/Step Time": 8.486434187740088} +{"Pretrain/Learning Rate": 3.7403660254837326e-06, "Pretrain/Loss": 1.9784942865371704, "Pretrain/Loss (Raw)": 1.9416344165802002, "Pretrain/Step": 15810, "Pretrain/Step Time": 8.48529551923275} +{"Pretrain/Learning Rate": 3.7381326938542265e-06, "Pretrain/Loss": 1.978794813156128, "Pretrain/Loss (Raw)": 1.9379947185516357, "Pretrain/Step": 15811, "Pretrain/Step Time": 8.489181689918041} +{"Pretrain/Learning Rate": 3.7358999752956786e-06, "Pretrain/Loss": 1.9813849925994873, "Pretrain/Loss (Raw)": 2.252450704574585, "Pretrain/Step": 15812, "Pretrain/Step Time": 8.488664921373129} +{"Pretrain/Learning Rate": 3.7336678698724674e-06, "Pretrain/Loss": 1.9802130460739136, "Pretrain/Loss (Raw)": 1.9323745965957642, "Pretrain/Step": 15813, "Pretrain/Step Time": 8.491745991632342} +{"Pretrain/Learning Rate": 3.731436377648942e-06, "Pretrain/Loss": 1.9773046970367432, "Pretrain/Loss (Raw)": 1.7233318090438843, "Pretrain/Step": 15814, "Pretrain/Step Time": 8.491686522960663} +{"Pretrain/Learning Rate": 3.729205498689464e-06, "Pretrain/Loss": 1.9783587455749512, "Pretrain/Loss (Raw)": 1.6917818784713745, "Pretrain/Step": 15815, "Pretrain/Step Time": 8.495321510359645} +{"Pretrain/Learning Rate": 3.726975233058344e-06, "Pretrain/Loss": 1.9775495529174805, "Pretrain/Loss (Raw)": 1.9328758716583252, "Pretrain/Step": 15816, "Pretrain/Step Time": 8.494147535413504} +{"Pretrain/Learning Rate": 3.7247455808199023e-06, "Pretrain/Loss": 1.9793154001235962, "Pretrain/Loss (Raw)": 2.1357948780059814, "Pretrain/Step": 15817, "Pretrain/Step Time": 8.495986212044954} +{"Pretrain/Learning Rate": 3.7225165420384235e-06, "Pretrain/Loss": 1.9805394411087036, "Pretrain/Loss (Raw)": 2.0682756900787354, "Pretrain/Step": 15818, "Pretrain/Step Time": 8.497013978660107} +{"Pretrain/Learning Rate": 3.7202881167781754e-06, "Pretrain/Loss": 1.98188316822052, "Pretrain/Loss (Raw)": 2.1621832847595215, "Pretrain/Step": 15819, "Pretrain/Step Time": 8.49314377270639} +{"Pretrain/Learning Rate": 3.718060305103424e-06, "Pretrain/Loss": 1.9828095436096191, "Pretrain/Loss (Raw)": 2.034041404724121, "Pretrain/Step": 15820, "Pretrain/Step Time": 8.495447108522058} +{"Pretrain/Learning Rate": 3.7158331070783925e-06, "Pretrain/Loss": 1.982082724571228, "Pretrain/Loss (Raw)": 1.8432667255401611, "Pretrain/Step": 15821, "Pretrain/Step Time": 8.493340112268925} +{"Pretrain/Learning Rate": 3.7136065227673183e-06, "Pretrain/Loss": 1.9780508279800415, "Pretrain/Loss (Raw)": 1.751187801361084, "Pretrain/Step": 15822, "Pretrain/Step Time": 8.498694958165288} +{"Pretrain/Learning Rate": 3.711380552234392e-06, "Pretrain/Loss": 1.9784867763519287, "Pretrain/Loss (Raw)": 1.9673991203308105, "Pretrain/Step": 15823, "Pretrain/Step Time": 8.496977631002665} +{"Pretrain/Learning Rate": 3.7091551955437954e-06, "Pretrain/Loss": 1.9773318767547607, "Pretrain/Loss (Raw)": 1.8367388248443604, "Pretrain/Step": 15824, "Pretrain/Step Time": 8.496508918702602} +{"Pretrain/Learning Rate": 3.7069304527597047e-06, "Pretrain/Loss": 1.9755747318267822, "Pretrain/Loss (Raw)": 1.9928313493728638, "Pretrain/Step": 15825, "Pretrain/Step Time": 8.495148235931993} +{"Pretrain/Learning Rate": 3.7047063239462582e-06, "Pretrain/Loss": 1.9756267070770264, "Pretrain/Loss (Raw)": 1.848591685295105, "Pretrain/Step": 15826, "Pretrain/Step Time": 8.500007301568985} +{"Pretrain/Learning Rate": 3.7024828091675985e-06, "Pretrain/Loss": 1.9726979732513428, "Pretrain/Loss (Raw)": 1.9794840812683105, "Pretrain/Step": 15827, "Pretrain/Step Time": 8.499233672395349} +{"Pretrain/Learning Rate": 3.7002599084878327e-06, "Pretrain/Loss": 1.9744186401367188, "Pretrain/Loss (Raw)": 2.1393227577209473, "Pretrain/Step": 15828, "Pretrain/Step Time": 8.500422738492489} +{"Pretrain/Learning Rate": 3.698037621971054e-06, "Pretrain/Loss": 1.9753344058990479, "Pretrain/Loss (Raw)": 2.1300976276397705, "Pretrain/Step": 15829, "Pretrain/Step Time": 8.5023881085217} +{"Pretrain/Learning Rate": 3.695815949681347e-06, "Pretrain/Loss": 1.972466230392456, "Pretrain/Loss (Raw)": 1.8927631378173828, "Pretrain/Step": 15830, "Pretrain/Step Time": 8.506985325366259} +{"Pretrain/Learning Rate": 3.6935948916827614e-06, "Pretrain/Loss": 1.9715394973754883, "Pretrain/Loss (Raw)": 2.003753423690796, "Pretrain/Step": 15831, "Pretrain/Step Time": 8.505893994122744} +{"Pretrain/Learning Rate": 3.6913744480393557e-06, "Pretrain/Loss": 1.9714633226394653, "Pretrain/Loss (Raw)": 2.0667884349823, "Pretrain/Step": 15832, "Pretrain/Step Time": 8.506828175857663} +{"Pretrain/Learning Rate": 3.689154618815144e-06, "Pretrain/Loss": 1.970798134803772, "Pretrain/Loss (Raw)": 1.857556700706482, "Pretrain/Step": 15833, "Pretrain/Step Time": 8.504054296761751} +{"Pretrain/Learning Rate": 3.6869354040741322e-06, "Pretrain/Loss": 1.9697036743164062, "Pretrain/Loss (Raw)": 2.0113773345947266, "Pretrain/Step": 15834, "Pretrain/Step Time": 8.501211510971189} +{"Pretrain/Learning Rate": 3.6847168038803172e-06, "Pretrain/Loss": 1.9707114696502686, "Pretrain/Loss (Raw)": 2.047027587890625, "Pretrain/Step": 15835, "Pretrain/Step Time": 8.504439236596227} +{"Pretrain/Learning Rate": 3.6824988182976695e-06, "Pretrain/Loss": 1.9718480110168457, "Pretrain/Loss (Raw)": 2.07643461227417, "Pretrain/Step": 15836, "Pretrain/Step Time": 8.498030561953783} +{"Pretrain/Learning Rate": 3.680281447390138e-06, "Pretrain/Loss": 1.9747403860092163, "Pretrain/Loss (Raw)": 2.430925130844116, "Pretrain/Step": 15837, "Pretrain/Step Time": 8.502334550023079} +{"Pretrain/Learning Rate": 3.6780646912216553e-06, "Pretrain/Loss": 1.9754812717437744, "Pretrain/Loss (Raw)": 1.960248589515686, "Pretrain/Step": 15838, "Pretrain/Step Time": 8.503779787570238} +{"Pretrain/Learning Rate": 3.6758485498561536e-06, "Pretrain/Loss": 1.9739570617675781, "Pretrain/Loss (Raw)": 2.1324551105499268, "Pretrain/Step": 15839, "Pretrain/Step Time": 8.501619102433324} +{"Pretrain/Learning Rate": 3.6736330233575257e-06, "Pretrain/Loss": 1.9760849475860596, "Pretrain/Loss (Raw)": 2.0394320487976074, "Pretrain/Step": 15840, "Pretrain/Step Time": 8.499317113310099} +{"Pretrain/Learning Rate": 3.6714181117896514e-06, "Pretrain/Loss": 1.974928379058838, "Pretrain/Loss (Raw)": 1.83660089969635, "Pretrain/Step": 15841, "Pretrain/Step Time": 8.499134698882699} +{"Pretrain/Learning Rate": 3.669203815216404e-06, "Pretrain/Loss": 1.9739718437194824, "Pretrain/Loss (Raw)": 1.8566477298736572, "Pretrain/Step": 15842, "Pretrain/Step Time": 8.505306046456099} +{"Pretrain/Learning Rate": 3.6669901337016197e-06, "Pretrain/Loss": 1.9742543697357178, "Pretrain/Loss (Raw)": 2.0282645225524902, "Pretrain/Step": 15843, "Pretrain/Step Time": 8.504920521751046} +{"Pretrain/Learning Rate": 3.664777067309147e-06, "Pretrain/Loss": 1.9737316370010376, "Pretrain/Loss (Raw)": 1.9866455793380737, "Pretrain/Step": 15844, "Pretrain/Step Time": 8.507282132282853} +{"Pretrain/Learning Rate": 3.662564616102779e-06, "Pretrain/Loss": 1.972254753112793, "Pretrain/Loss (Raw)": 2.0046029090881348, "Pretrain/Step": 15845, "Pretrain/Step Time": 8.501401735469699} +{"Pretrain/Learning Rate": 3.6603527801463228e-06, "Pretrain/Loss": 1.972344160079956, "Pretrain/Loss (Raw)": 2.037168502807617, "Pretrain/Step": 15846, "Pretrain/Step Time": 8.505955215543509} +{"Pretrain/Learning Rate": 3.65814155950355e-06, "Pretrain/Loss": 1.971846342086792, "Pretrain/Loss (Raw)": 1.9399330615997314, "Pretrain/Step": 15847, "Pretrain/Step Time": 8.501955086365342} +{"Pretrain/Learning Rate": 3.655930954238218e-06, "Pretrain/Loss": 1.9703259468078613, "Pretrain/Loss (Raw)": 1.922635555267334, "Pretrain/Step": 15848, "Pretrain/Step Time": 8.505030503496528} +{"Pretrain/Learning Rate": 3.653720964414073e-06, "Pretrain/Loss": 1.9689807891845703, "Pretrain/Loss (Raw)": 2.131091356277466, "Pretrain/Step": 15849, "Pretrain/Step Time": 8.501236587762833} +{"Pretrain/Learning Rate": 3.6515115900948334e-06, "Pretrain/Loss": 1.9674274921417236, "Pretrain/Loss (Raw)": 1.8785408735275269, "Pretrain/Step": 15850, "Pretrain/Step Time": 8.50374760478735} +{"Pretrain/Learning Rate": 3.649302831344212e-06, "Pretrain/Loss": 1.9697155952453613, "Pretrain/Loss (Raw)": 2.076354742050171, "Pretrain/Step": 15851, "Pretrain/Step Time": 8.501581244170666} +{"Pretrain/Learning Rate": 3.647094688225891e-06, "Pretrain/Loss": 1.9680486917495728, "Pretrain/Loss (Raw)": 1.8509098291397095, "Pretrain/Step": 15852, "Pretrain/Step Time": 8.501045318320394} +{"Pretrain/Learning Rate": 3.6448871608035366e-06, "Pretrain/Loss": 1.967247486114502, "Pretrain/Loss (Raw)": 1.8923015594482422, "Pretrain/Step": 15853, "Pretrain/Step Time": 8.501363717019558} +{"Pretrain/Learning Rate": 3.6426802491408117e-06, "Pretrain/Loss": 1.965013861656189, "Pretrain/Loss (Raw)": 1.847120761871338, "Pretrain/Step": 15854, "Pretrain/Step Time": 8.502792358398438} +{"Pretrain/Learning Rate": 3.6404739533013404e-06, "Pretrain/Loss": 1.9665944576263428, "Pretrain/Loss (Raw)": 2.1433260440826416, "Pretrain/Step": 15855, "Pretrain/Step Time": 8.496639659628272} +{"Pretrain/Learning Rate": 3.6382682733487522e-06, "Pretrain/Loss": 1.9671612977981567, "Pretrain/Loss (Raw)": 2.0390231609344482, "Pretrain/Step": 15856, "Pretrain/Step Time": 8.497275095432997} +{"Pretrain/Learning Rate": 3.6360632093466377e-06, "Pretrain/Loss": 1.9669408798217773, "Pretrain/Loss (Raw)": 1.9233404397964478, "Pretrain/Step": 15857, "Pretrain/Step Time": 8.49573309160769} +{"Pretrain/Learning Rate": 3.6338587613585743e-06, "Pretrain/Loss": 1.9695124626159668, "Pretrain/Loss (Raw)": 2.0508856773376465, "Pretrain/Step": 15858, "Pretrain/Step Time": 8.502071730792522} +{"Pretrain/Learning Rate": 3.631654929448139e-06, "Pretrain/Loss": 1.9696842432022095, "Pretrain/Loss (Raw)": 2.067748785018921, "Pretrain/Step": 15859, "Pretrain/Step Time": 8.50095972046256} +{"Pretrain/Learning Rate": 3.6294517136788637e-06, "Pretrain/Loss": 1.9687509536743164, "Pretrain/Loss (Raw)": 1.8861347436904907, "Pretrain/Step": 15860, "Pretrain/Step Time": 8.497573839500546} +{"Pretrain/Learning Rate": 3.6272491141142866e-06, "Pretrain/Loss": 1.968125820159912, "Pretrain/Loss (Raw)": 2.019991397857666, "Pretrain/Step": 15861, "Pretrain/Step Time": 8.50168595276773} +{"Pretrain/Learning Rate": 3.625047130817916e-06, "Pretrain/Loss": 1.967698097229004, "Pretrain/Loss (Raw)": 1.9230389595031738, "Pretrain/Step": 15862, "Pretrain/Step Time": 8.500656569376588} +{"Pretrain/Learning Rate": 3.6228457638532387e-06, "Pretrain/Loss": 1.9633848667144775, "Pretrain/Loss (Raw)": 1.471069574356079, "Pretrain/Step": 15863, "Pretrain/Step Time": 8.502480033785105} +{"Pretrain/Learning Rate": 3.6206450132837385e-06, "Pretrain/Loss": 1.9622857570648193, "Pretrain/Loss (Raw)": 1.888999581336975, "Pretrain/Step": 15864, "Pretrain/Step Time": 8.50561860576272} +{"Pretrain/Learning Rate": 3.618444879172861e-06, "Pretrain/Loss": 1.9594576358795166, "Pretrain/Loss (Raw)": 1.6751644611358643, "Pretrain/Step": 15865, "Pretrain/Step Time": 8.51041278988123} +{"Pretrain/Learning Rate": 3.6162453615840588e-06, "Pretrain/Loss": 1.9571505784988403, "Pretrain/Loss (Raw)": 1.8441141843795776, "Pretrain/Step": 15866, "Pretrain/Step Time": 8.503997649997473} +{"Pretrain/Learning Rate": 3.6140464605807474e-06, "Pretrain/Loss": 1.9552980661392212, "Pretrain/Loss (Raw)": 1.888426423072815, "Pretrain/Step": 15867, "Pretrain/Step Time": 8.50527129881084} +{"Pretrain/Learning Rate": 3.6118481762263235e-06, "Pretrain/Loss": 1.9562783241271973, "Pretrain/Loss (Raw)": 1.9355977773666382, "Pretrain/Step": 15868, "Pretrain/Step Time": 8.503791559487581} +{"Pretrain/Learning Rate": 3.6096505085841863e-06, "Pretrain/Loss": 1.9566729068756104, "Pretrain/Loss (Raw)": 1.9428046941757202, "Pretrain/Step": 15869, "Pretrain/Step Time": 8.504311263561249} +{"Pretrain/Learning Rate": 3.607453457717694e-06, "Pretrain/Loss": 1.9563030004501343, "Pretrain/Loss (Raw)": 1.9897412061691284, "Pretrain/Step": 15870, "Pretrain/Step Time": 8.503485981374979} +{"Pretrain/Learning Rate": 3.605257023690203e-06, "Pretrain/Loss": 1.9584128856658936, "Pretrain/Loss (Raw)": 2.0601887702941895, "Pretrain/Step": 15871, "Pretrain/Step Time": 8.504133878275752} +{"Pretrain/Learning Rate": 3.603061206565045e-06, "Pretrain/Loss": 1.9578239917755127, "Pretrain/Loss (Raw)": 1.9544931650161743, "Pretrain/Step": 15872, "Pretrain/Step Time": 8.500064605847001} +{"Pretrain/Learning Rate": 3.600866006405526e-06, "Pretrain/Loss": 1.9546830654144287, "Pretrain/Loss (Raw)": 1.5956918001174927, "Pretrain/Step": 15873, "Pretrain/Step Time": 8.497075766324997} +{"Pretrain/Learning Rate": 3.5986714232749576e-06, "Pretrain/Loss": 1.9552865028381348, "Pretrain/Loss (Raw)": 1.949673056602478, "Pretrain/Step": 15874, "Pretrain/Step Time": 8.502152390778065} +{"Pretrain/Learning Rate": 3.596477457236605e-06, "Pretrain/Loss": 1.9552444219589233, "Pretrain/Loss (Raw)": 2.1578867435455322, "Pretrain/Step": 15875, "Pretrain/Step Time": 8.501838881522417} +{"Pretrain/Learning Rate": 3.594284108353743e-06, "Pretrain/Loss": 1.9564664363861084, "Pretrain/Loss (Raw)": 2.141340970993042, "Pretrain/Step": 15876, "Pretrain/Step Time": 8.502510918304324} +{"Pretrain/Learning Rate": 3.5920913766896076e-06, "Pretrain/Loss": 1.9577293395996094, "Pretrain/Loss (Raw)": 1.9102909564971924, "Pretrain/Step": 15877, "Pretrain/Step Time": 8.50376408919692} +{"Pretrain/Learning Rate": 3.5898992623074224e-06, "Pretrain/Loss": 1.9578214883804321, "Pretrain/Loss (Raw)": 1.8130601644515991, "Pretrain/Step": 15878, "Pretrain/Step Time": 8.500165266916156} +{"Pretrain/Learning Rate": 3.587707765270404e-06, "Pretrain/Loss": 1.9531757831573486, "Pretrain/Loss (Raw)": 1.6268222332000732, "Pretrain/Step": 15879, "Pretrain/Step Time": 8.503548815846443} +{"Pretrain/Learning Rate": 3.585516885641729e-06, "Pretrain/Loss": 1.9511079788208008, "Pretrain/Loss (Raw)": 1.8148740530014038, "Pretrain/Step": 15880, "Pretrain/Step Time": 8.508614225313067} +{"Pretrain/Learning Rate": 3.583326623484587e-06, "Pretrain/Loss": 1.9528815746307373, "Pretrain/Loss (Raw)": 1.96647310256958, "Pretrain/Step": 15881, "Pretrain/Step Time": 8.507558714598417} +{"Pretrain/Learning Rate": 3.5811369788621237e-06, "Pretrain/Loss": 1.9523966312408447, "Pretrain/Loss (Raw)": 1.9199141263961792, "Pretrain/Step": 15882, "Pretrain/Step Time": 8.505403563380241} +{"Pretrain/Learning Rate": 3.5789479518374692e-06, "Pretrain/Loss": 1.953436017036438, "Pretrain/Loss (Raw)": 2.0273079872131348, "Pretrain/Step": 15883, "Pretrain/Step Time": 8.502538047730923} +{"Pretrain/Learning Rate": 3.5767595424737538e-06, "Pretrain/Loss": 1.952040195465088, "Pretrain/Loss (Raw)": 1.85610830783844, "Pretrain/Step": 15884, "Pretrain/Step Time": 8.506392996758223} +{"Pretrain/Learning Rate": 3.5745717508340715e-06, "Pretrain/Loss": 1.9506161212921143, "Pretrain/Loss (Raw)": 1.8890249729156494, "Pretrain/Step": 15885, "Pretrain/Step Time": 8.503979934379458} +{"Pretrain/Learning Rate": 3.572384576981516e-06, "Pretrain/Loss": 1.9527087211608887, "Pretrain/Loss (Raw)": 1.9863821268081665, "Pretrain/Step": 15886, "Pretrain/Step Time": 8.505781257525086} +{"Pretrain/Learning Rate": 3.570198020979143e-06, "Pretrain/Loss": 1.9542994499206543, "Pretrain/Loss (Raw)": 1.9389170408248901, "Pretrain/Step": 15887, "Pretrain/Step Time": 8.505953768268228} +{"Pretrain/Learning Rate": 3.5680120828899987e-06, "Pretrain/Loss": 1.9554831981658936, "Pretrain/Loss (Raw)": 2.1374847888946533, "Pretrain/Step": 15888, "Pretrain/Step Time": 8.505533300340176} +{"Pretrain/Learning Rate": 3.565826762777122e-06, "Pretrain/Loss": 1.9555392265319824, "Pretrain/Loss (Raw)": 1.9332388639450073, "Pretrain/Step": 15889, "Pretrain/Step Time": 8.507633535191417} +{"Pretrain/Learning Rate": 3.563642060703515e-06, "Pretrain/Loss": 1.9543466567993164, "Pretrain/Loss (Raw)": 1.9862079620361328, "Pretrain/Step": 15890, "Pretrain/Step Time": 8.503973253071308} +{"Pretrain/Learning Rate": 3.5614579767321856e-06, "Pretrain/Loss": 1.9517818689346313, "Pretrain/Loss (Raw)": 1.7362561225891113, "Pretrain/Step": 15891, "Pretrain/Step Time": 8.510469065979123} +{"Pretrain/Learning Rate": 3.5592745109261e-06, "Pretrain/Loss": 1.9542269706726074, "Pretrain/Loss (Raw)": 2.138869285583496, "Pretrain/Step": 15892, "Pretrain/Step Time": 8.51158644258976} +{"Pretrain/Learning Rate": 3.5570916633482137e-06, "Pretrain/Loss": 1.9553427696228027, "Pretrain/Loss (Raw)": 2.039293050765991, "Pretrain/Step": 15893, "Pretrain/Step Time": 8.510280042886734} +{"Pretrain/Learning Rate": 3.554909434061479e-06, "Pretrain/Loss": 1.9540599584579468, "Pretrain/Loss (Raw)": 1.8187370300292969, "Pretrain/Step": 15894, "Pretrain/Step Time": 8.506241824477911} +{"Pretrain/Learning Rate": 3.5527278231288067e-06, "Pretrain/Loss": 1.952709674835205, "Pretrain/Loss (Raw)": 1.8790169954299927, "Pretrain/Step": 15895, "Pretrain/Step Time": 8.50488356500864} +{"Pretrain/Learning Rate": 3.5505468306131133e-06, "Pretrain/Loss": 1.9517253637313843, "Pretrain/Loss (Raw)": 1.6969448328018188, "Pretrain/Step": 15896, "Pretrain/Step Time": 8.509686131030321} +{"Pretrain/Learning Rate": 3.548366456577282e-06, "Pretrain/Loss": 1.94968581199646, "Pretrain/Loss (Raw)": 2.1740219593048096, "Pretrain/Step": 15897, "Pretrain/Step Time": 8.510280733928084} +{"Pretrain/Learning Rate": 3.546186701084178e-06, "Pretrain/Loss": 1.9508260488510132, "Pretrain/Loss (Raw)": 2.0708744525909424, "Pretrain/Step": 15898, "Pretrain/Step Time": 8.506644383072853} +{"Pretrain/Learning Rate": 3.544007564196658e-06, "Pretrain/Loss": 1.950016736984253, "Pretrain/Loss (Raw)": 1.9404401779174805, "Pretrain/Step": 15899, "Pretrain/Step Time": 8.504278905689716} +{"Pretrain/Learning Rate": 3.5418290459775518e-06, "Pretrain/Loss": 1.9506206512451172, "Pretrain/Loss (Raw)": 2.2045235633850098, "Pretrain/Step": 15900, "Pretrain/Step Time": 8.501211278140545} +{"Pretrain/Learning Rate": 3.5396511464896835e-06, "Pretrain/Loss": 1.9503921270370483, "Pretrain/Loss (Raw)": 1.9971158504486084, "Pretrain/Step": 15901, "Pretrain/Step Time": 8.503930035978556} +{"Pretrain/Learning Rate": 3.5374738657958454e-06, "Pretrain/Loss": 1.9527909755706787, "Pretrain/Loss (Raw)": 2.156665563583374, "Pretrain/Step": 15902, "Pretrain/Step Time": 8.502424146980047} +{"Pretrain/Learning Rate": 3.535297203958812e-06, "Pretrain/Loss": 1.9527164697647095, "Pretrain/Loss (Raw)": 1.8725610971450806, "Pretrain/Step": 15903, "Pretrain/Step Time": 8.507773905992508} +{"Pretrain/Learning Rate": 3.533121161041358e-06, "Pretrain/Loss": 1.9536170959472656, "Pretrain/Loss (Raw)": 2.161513566970825, "Pretrain/Step": 15904, "Pretrain/Step Time": 8.509143892675638} +{"Pretrain/Learning Rate": 3.5309457371062172e-06, "Pretrain/Loss": 1.9561281204223633, "Pretrain/Loss (Raw)": 2.206139326095581, "Pretrain/Step": 15905, "Pretrain/Step Time": 8.51086506061256} +{"Pretrain/Learning Rate": 3.5287709322161272e-06, "Pretrain/Loss": 1.9563231468200684, "Pretrain/Loss (Raw)": 1.996252179145813, "Pretrain/Step": 15906, "Pretrain/Step Time": 8.504780476912856} +{"Pretrain/Learning Rate": 3.526596746433791e-06, "Pretrain/Loss": 1.955702543258667, "Pretrain/Loss (Raw)": 1.934496521949768, "Pretrain/Step": 15907, "Pretrain/Step Time": 8.507370682433248} +{"Pretrain/Learning Rate": 3.5244231798218926e-06, "Pretrain/Loss": 1.9545509815216064, "Pretrain/Loss (Raw)": 1.7679246664047241, "Pretrain/Step": 15908, "Pretrain/Step Time": 8.50595142133534} +{"Pretrain/Learning Rate": 3.5222502324431194e-06, "Pretrain/Loss": 1.9580740928649902, "Pretrain/Loss (Raw)": 2.172327995300293, "Pretrain/Step": 15909, "Pretrain/Step Time": 8.509783433750272} +{"Pretrain/Learning Rate": 3.520077904360114e-06, "Pretrain/Loss": 1.9579018354415894, "Pretrain/Loss (Raw)": 1.8948780298233032, "Pretrain/Step": 15910, "Pretrain/Step Time": 8.50834335386753} +{"Pretrain/Learning Rate": 3.517906195635526e-06, "Pretrain/Loss": 1.9610576629638672, "Pretrain/Loss (Raw)": 2.184083938598633, "Pretrain/Step": 15911, "Pretrain/Step Time": 8.512538559734821} +{"Pretrain/Learning Rate": 3.515735106331969e-06, "Pretrain/Loss": 1.9604134559631348, "Pretrain/Loss (Raw)": 1.9613993167877197, "Pretrain/Step": 15912, "Pretrain/Step Time": 8.512772677466273} +{"Pretrain/Learning Rate": 3.51356463651204e-06, "Pretrain/Loss": 1.9609193801879883, "Pretrain/Loss (Raw)": 2.1916723251342773, "Pretrain/Step": 15913, "Pretrain/Step Time": 8.512744085863233} +{"Pretrain/Learning Rate": 3.5113947862383312e-06, "Pretrain/Loss": 1.9597270488739014, "Pretrain/Loss (Raw)": 2.1243789196014404, "Pretrain/Step": 15914, "Pretrain/Step Time": 8.515990560874343} +{"Pretrain/Learning Rate": 3.5092255555734005e-06, "Pretrain/Loss": 1.9585301876068115, "Pretrain/Loss (Raw)": 1.89667546749115, "Pretrain/Step": 15915, "Pretrain/Step Time": 8.515764208510518} +{"Pretrain/Learning Rate": 3.5070569445798092e-06, "Pretrain/Loss": 1.9598050117492676, "Pretrain/Loss (Raw)": 2.166808605194092, "Pretrain/Step": 15916, "Pretrain/Step Time": 8.514682663604617} +{"Pretrain/Learning Rate": 3.5048889533200706e-06, "Pretrain/Loss": 1.9596316814422607, "Pretrain/Loss (Raw)": 1.9974862337112427, "Pretrain/Step": 15917, "Pretrain/Step Time": 8.511285176500678} +{"Pretrain/Learning Rate": 3.5027215818567105e-06, "Pretrain/Loss": 1.9585480690002441, "Pretrain/Loss (Raw)": 1.9507415294647217, "Pretrain/Step": 15918, "Pretrain/Step Time": 8.514214973896742} +{"Pretrain/Learning Rate": 3.500554830252223e-06, "Pretrain/Loss": 1.9600419998168945, "Pretrain/Loss (Raw)": 1.9714105129241943, "Pretrain/Step": 15919, "Pretrain/Step Time": 8.515058182179928} +{"Pretrain/Learning Rate": 3.498388698569077e-06, "Pretrain/Loss": 1.9589228630065918, "Pretrain/Loss (Raw)": 1.7386081218719482, "Pretrain/Step": 15920, "Pretrain/Step Time": 8.513855194672942} +{"Pretrain/Learning Rate": 3.496223186869738e-06, "Pretrain/Loss": 1.9559152126312256, "Pretrain/Loss (Raw)": 1.6915961503982544, "Pretrain/Step": 15921, "Pretrain/Step Time": 8.521440515294671} +{"Pretrain/Learning Rate": 3.4940582952166373e-06, "Pretrain/Loss": 1.955269455909729, "Pretrain/Loss (Raw)": 1.9081404209136963, "Pretrain/Step": 15922, "Pretrain/Step Time": 8.520256159827113} +{"Pretrain/Learning Rate": 3.4918940236722096e-06, "Pretrain/Loss": 1.9573090076446533, "Pretrain/Loss (Raw)": 2.0762131214141846, "Pretrain/Step": 15923, "Pretrain/Step Time": 8.523692036047578} +{"Pretrain/Learning Rate": 3.489730372298852e-06, "Pretrain/Loss": 1.9565842151641846, "Pretrain/Loss (Raw)": 2.088029623031616, "Pretrain/Step": 15924, "Pretrain/Step Time": 8.521515507251024} +{"Pretrain/Learning Rate": 3.487567341158959e-06, "Pretrain/Loss": 1.9596420526504517, "Pretrain/Loss (Raw)": 2.1167917251586914, "Pretrain/Step": 15925, "Pretrain/Step Time": 8.51548189483583} +{"Pretrain/Learning Rate": 3.4854049303148976e-06, "Pretrain/Loss": 1.9620393514633179, "Pretrain/Loss (Raw)": 2.171926259994507, "Pretrain/Step": 15926, "Pretrain/Step Time": 8.514928238466382} +{"Pretrain/Learning Rate": 3.483243139829015e-06, "Pretrain/Loss": 1.9641406536102295, "Pretrain/Loss (Raw)": 2.1902832984924316, "Pretrain/Step": 15927, "Pretrain/Step Time": 8.51809199154377} +{"Pretrain/Learning Rate": 3.48108196976365e-06, "Pretrain/Loss": 1.9677793979644775, "Pretrain/Loss (Raw)": 2.1007375717163086, "Pretrain/Step": 15928, "Pretrain/Step Time": 8.518083455041051} +{"Pretrain/Learning Rate": 3.478921420181114e-06, "Pretrain/Loss": 1.9668010473251343, "Pretrain/Loss (Raw)": 1.7223974466323853, "Pretrain/Step": 15929, "Pretrain/Step Time": 8.520092418417335} +{"Pretrain/Learning Rate": 3.47676149114371e-06, "Pretrain/Loss": 1.9694188833236694, "Pretrain/Loss (Raw)": 1.9776148796081543, "Pretrain/Step": 15930, "Pretrain/Step Time": 8.520104443654418} +{"Pretrain/Learning Rate": 3.4746021827137182e-06, "Pretrain/Loss": 1.9683820009231567, "Pretrain/Loss (Raw)": 2.009028911590576, "Pretrain/Step": 15931, "Pretrain/Step Time": 8.521013176068664} +{"Pretrain/Learning Rate": 3.47244349495339e-06, "Pretrain/Loss": 1.9704302549362183, "Pretrain/Loss (Raw)": 2.1791698932647705, "Pretrain/Step": 15932, "Pretrain/Step Time": 8.519051754847169} +{"Pretrain/Learning Rate": 3.470285427924985e-06, "Pretrain/Loss": 1.9709898233413696, "Pretrain/Loss (Raw)": 1.9229533672332764, "Pretrain/Step": 15933, "Pretrain/Step Time": 8.521011911332607} +{"Pretrain/Learning Rate": 3.4681279816907165e-06, "Pretrain/Loss": 1.9708633422851562, "Pretrain/Loss (Raw)": 1.8714152574539185, "Pretrain/Step": 15934, "Pretrain/Step Time": 8.516565067693591} +{"Pretrain/Learning Rate": 3.465971156312803e-06, "Pretrain/Loss": 1.9733750820159912, "Pretrain/Loss (Raw)": 2.1898343563079834, "Pretrain/Step": 15935, "Pretrain/Step Time": 8.51798147521913} +{"Pretrain/Learning Rate": 3.463814951853431e-06, "Pretrain/Loss": 1.973791241645813, "Pretrain/Loss (Raw)": 2.037951707839966, "Pretrain/Step": 15936, "Pretrain/Step Time": 8.519336469471455} +{"Pretrain/Learning Rate": 3.4616593683747674e-06, "Pretrain/Loss": 1.9763469696044922, "Pretrain/Loss (Raw)": 2.212193250656128, "Pretrain/Step": 15937, "Pretrain/Step Time": 8.52113133855164} +{"Pretrain/Learning Rate": 3.459504405938979e-06, "Pretrain/Loss": 1.9763755798339844, "Pretrain/Loss (Raw)": 1.9452944993972778, "Pretrain/Step": 15938, "Pretrain/Step Time": 8.522677572444081} +{"Pretrain/Learning Rate": 3.457350064608189e-06, "Pretrain/Loss": 1.9773964881896973, "Pretrain/Loss (Raw)": 2.0686728954315186, "Pretrain/Step": 15939, "Pretrain/Step Time": 8.51893913000822} +{"Pretrain/Learning Rate": 3.4551963444445308e-06, "Pretrain/Loss": 1.9762954711914062, "Pretrain/Loss (Raw)": 2.111506938934326, "Pretrain/Step": 15940, "Pretrain/Step Time": 8.51639560982585} +{"Pretrain/Learning Rate": 3.4530432455100988e-06, "Pretrain/Loss": 1.9777889251708984, "Pretrain/Loss (Raw)": 2.1235454082489014, "Pretrain/Step": 15941, "Pretrain/Step Time": 8.515907214954495} +{"Pretrain/Learning Rate": 3.4508907678669657e-06, "Pretrain/Loss": 1.9801439046859741, "Pretrain/Loss (Raw)": 2.0247745513916016, "Pretrain/Step": 15942, "Pretrain/Step Time": 8.513323042541742} +{"Pretrain/Learning Rate": 3.448738911577215e-06, "Pretrain/Loss": 1.9816532135009766, "Pretrain/Loss (Raw)": 1.8849692344665527, "Pretrain/Step": 15943, "Pretrain/Step Time": 8.51025796122849} +{"Pretrain/Learning Rate": 3.446587676702878e-06, "Pretrain/Loss": 1.9820749759674072, "Pretrain/Loss (Raw)": 1.986852765083313, "Pretrain/Step": 15944, "Pretrain/Step Time": 8.508895704522729} +{"Pretrain/Learning Rate": 3.444437063305997e-06, "Pretrain/Loss": 1.9804210662841797, "Pretrain/Loss (Raw)": 1.9241009950637817, "Pretrain/Step": 15945, "Pretrain/Step Time": 8.510833429172635} +{"Pretrain/Learning Rate": 3.442287071448577e-06, "Pretrain/Loss": 1.9823700189590454, "Pretrain/Loss (Raw)": 2.317728042602539, "Pretrain/Step": 15946, "Pretrain/Step Time": 8.516063192859292} +{"Pretrain/Learning Rate": 3.4401377011926083e-06, "Pretrain/Loss": 1.9813607931137085, "Pretrain/Loss (Raw)": 2.0330214500427246, "Pretrain/Step": 15947, "Pretrain/Step Time": 8.51988167874515} +{"Pretrain/Learning Rate": 3.4379889526000742e-06, "Pretrain/Loss": 1.9802815914154053, "Pretrain/Loss (Raw)": 1.895887017250061, "Pretrain/Step": 15948, "Pretrain/Step Time": 8.515464717522264} +{"Pretrain/Learning Rate": 3.4358408257329223e-06, "Pretrain/Loss": 1.981889247894287, "Pretrain/Loss (Raw)": 2.0490570068359375, "Pretrain/Step": 15949, "Pretrain/Step Time": 8.517361879348755} +{"Pretrain/Learning Rate": 3.4336933206531058e-06, "Pretrain/Loss": 1.9820773601531982, "Pretrain/Loss (Raw)": 1.7752748727798462, "Pretrain/Step": 15950, "Pretrain/Step Time": 8.512669766321778} +{"Pretrain/Learning Rate": 3.4315464374225393e-06, "Pretrain/Loss": 1.9824647903442383, "Pretrain/Loss (Raw)": 2.016977310180664, "Pretrain/Step": 15951, "Pretrain/Step Time": 8.51127227768302} +{"Pretrain/Learning Rate": 3.4294001761031203e-06, "Pretrain/Loss": 1.984739899635315, "Pretrain/Loss (Raw)": 2.127958297729492, "Pretrain/Step": 15952, "Pretrain/Step Time": 8.513649858534336} +{"Pretrain/Learning Rate": 3.4272545367567465e-06, "Pretrain/Loss": 1.984067440032959, "Pretrain/Loss (Raw)": 1.9067622423171997, "Pretrain/Step": 15953, "Pretrain/Step Time": 8.514766562730074} +{"Pretrain/Learning Rate": 3.425109519445274e-06, "Pretrain/Loss": 1.9839041233062744, "Pretrain/Loss (Raw)": 1.827691912651062, "Pretrain/Step": 15954, "Pretrain/Step Time": 8.507709361612797} +{"Pretrain/Learning Rate": 3.422965124230565e-06, "Pretrain/Loss": 1.9848551750183105, "Pretrain/Loss (Raw)": 2.101210355758667, "Pretrain/Step": 15955, "Pretrain/Step Time": 8.511618403717875} +{"Pretrain/Learning Rate": 3.420821351174447e-06, "Pretrain/Loss": 1.9824501276016235, "Pretrain/Loss (Raw)": 1.8314716815948486, "Pretrain/Step": 15956, "Pretrain/Step Time": 8.511246295645833} +{"Pretrain/Learning Rate": 3.4186782003387265e-06, "Pretrain/Loss": 1.9818356037139893, "Pretrain/Loss (Raw)": 2.051435708999634, "Pretrain/Step": 15957, "Pretrain/Step Time": 8.509255738928914} +{"Pretrain/Learning Rate": 3.416535671785212e-06, "Pretrain/Loss": 1.9828863143920898, "Pretrain/Loss (Raw)": 2.027275562286377, "Pretrain/Step": 15958, "Pretrain/Step Time": 8.508141016587615} +{"Pretrain/Learning Rate": 3.4143937655756716e-06, "Pretrain/Loss": 1.98362398147583, "Pretrain/Loss (Raw)": 2.0981462001800537, "Pretrain/Step": 15959, "Pretrain/Step Time": 8.50923283584416} +{"Pretrain/Learning Rate": 3.4122524817718743e-06, "Pretrain/Loss": 1.9814090728759766, "Pretrain/Loss (Raw)": 1.7832916975021362, "Pretrain/Step": 15960, "Pretrain/Step Time": 8.504795514047146} +{"Pretrain/Learning Rate": 3.4101118204355578e-06, "Pretrain/Loss": 1.9829528331756592, "Pretrain/Loss (Raw)": 2.0551583766937256, "Pretrain/Step": 15961, "Pretrain/Step Time": 8.504218684509397} +{"Pretrain/Learning Rate": 3.407971781628444e-06, "Pretrain/Loss": 1.9815670251846313, "Pretrain/Loss (Raw)": 1.8339818716049194, "Pretrain/Step": 15962, "Pretrain/Step Time": 8.507135896012187} +{"Pretrain/Learning Rate": 3.4058323654122455e-06, "Pretrain/Loss": 1.9796571731567383, "Pretrain/Loss (Raw)": 1.8025819063186646, "Pretrain/Step": 15963, "Pretrain/Step Time": 8.506821736693382} +{"Pretrain/Learning Rate": 3.403693571848643e-06, "Pretrain/Loss": 1.978137493133545, "Pretrain/Loss (Raw)": 1.8819036483764648, "Pretrain/Step": 15964, "Pretrain/Step Time": 8.509008578956127} +{"Pretrain/Learning Rate": 3.4015554009993178e-06, "Pretrain/Loss": 1.9760444164276123, "Pretrain/Loss (Raw)": 2.163013458251953, "Pretrain/Step": 15965, "Pretrain/Step Time": 8.507750544697046} +{"Pretrain/Learning Rate": 3.399417852925918e-06, "Pretrain/Loss": 1.9748761653900146, "Pretrain/Loss (Raw)": 1.810721516609192, "Pretrain/Step": 15966, "Pretrain/Step Time": 8.50165406242013} +{"Pretrain/Learning Rate": 3.3972809276900693e-06, "Pretrain/Loss": 1.9744471311569214, "Pretrain/Loss (Raw)": 2.0775413513183594, "Pretrain/Step": 15967, "Pretrain/Step Time": 8.505812972784042} +{"Pretrain/Learning Rate": 3.3951446253534024e-06, "Pretrain/Loss": 1.9736908674240112, "Pretrain/Loss (Raw)": 1.9426244497299194, "Pretrain/Step": 15968, "Pretrain/Step Time": 8.506735671311617} +{"Pretrain/Learning Rate": 3.393008945977505e-06, "Pretrain/Loss": 1.9755797386169434, "Pretrain/Loss (Raw)": 2.078381299972534, "Pretrain/Step": 15969, "Pretrain/Step Time": 8.507921658456326} +{"Pretrain/Learning Rate": 3.390873889623966e-06, "Pretrain/Loss": 1.977616310119629, "Pretrain/Loss (Raw)": 2.1173276901245117, "Pretrain/Step": 15970, "Pretrain/Step Time": 8.504657723009586} +{"Pretrain/Learning Rate": 3.388739456354348e-06, "Pretrain/Loss": 1.9782445430755615, "Pretrain/Loss (Raw)": 2.1086761951446533, "Pretrain/Step": 15971, "Pretrain/Step Time": 8.505305655300617} +{"Pretrain/Learning Rate": 3.3866056462301844e-06, "Pretrain/Loss": 1.98061203956604, "Pretrain/Loss (Raw)": 2.2896883487701416, "Pretrain/Step": 15972, "Pretrain/Step Time": 8.510170379653573} +{"Pretrain/Learning Rate": 3.3844724593130177e-06, "Pretrain/Loss": 1.9821829795837402, "Pretrain/Loss (Raw)": 2.2056772708892822, "Pretrain/Step": 15973, "Pretrain/Step Time": 8.514391120523214} +{"Pretrain/Learning Rate": 3.3823398956643463e-06, "Pretrain/Loss": 1.9820258617401123, "Pretrain/Loss (Raw)": 2.0170655250549316, "Pretrain/Step": 15974, "Pretrain/Step Time": 8.511932745575905} +{"Pretrain/Learning Rate": 3.3802079553456657e-06, "Pretrain/Loss": 1.9796571731567383, "Pretrain/Loss (Raw)": 1.6367266178131104, "Pretrain/Step": 15975, "Pretrain/Step Time": 8.509079148992896} +{"Pretrain/Learning Rate": 3.378076638418451e-06, "Pretrain/Loss": 1.9783636331558228, "Pretrain/Loss (Raw)": 1.7570689916610718, "Pretrain/Step": 15976, "Pretrain/Step Time": 8.506767300888896} +{"Pretrain/Learning Rate": 3.3759459449441478e-06, "Pretrain/Loss": 1.9769889116287231, "Pretrain/Loss (Raw)": 1.9551290273666382, "Pretrain/Step": 15977, "Pretrain/Step Time": 8.506891645491123} +{"Pretrain/Learning Rate": 3.373815874984204e-06, "Pretrain/Loss": 1.9772504568099976, "Pretrain/Loss (Raw)": 1.9120151996612549, "Pretrain/Step": 15978, "Pretrain/Step Time": 8.508188616484404} +{"Pretrain/Learning Rate": 3.3716864286000294e-06, "Pretrain/Loss": 1.9766764640808105, "Pretrain/Loss (Raw)": 2.002887725830078, "Pretrain/Step": 15979, "Pretrain/Step Time": 8.515184143558145} +{"Pretrain/Learning Rate": 3.369557605853035e-06, "Pretrain/Loss": 1.9768729209899902, "Pretrain/Loss (Raw)": 1.8760591745376587, "Pretrain/Step": 15980, "Pretrain/Step Time": 8.514074863865972} +{"Pretrain/Learning Rate": 3.3674294068045927e-06, "Pretrain/Loss": 1.97797429561615, "Pretrain/Loss (Raw)": 2.033276319503784, "Pretrain/Step": 15981, "Pretrain/Step Time": 8.514487251639366} +{"Pretrain/Learning Rate": 3.3653018315160796e-06, "Pretrain/Loss": 1.976062536239624, "Pretrain/Loss (Raw)": 1.6024181842803955, "Pretrain/Step": 15982, "Pretrain/Step Time": 8.514021081849933} +{"Pretrain/Learning Rate": 3.363174880048836e-06, "Pretrain/Loss": 1.9731537103652954, "Pretrain/Loss (Raw)": 1.7709877490997314, "Pretrain/Step": 15983, "Pretrain/Step Time": 8.515980418771505} +{"Pretrain/Learning Rate": 3.3610485524641855e-06, "Pretrain/Loss": 1.9750536680221558, "Pretrain/Loss (Raw)": 2.2822234630584717, "Pretrain/Step": 15984, "Pretrain/Step Time": 8.518760001286864} +{"Pretrain/Learning Rate": 3.3589228488234507e-06, "Pretrain/Loss": 1.9767072200775146, "Pretrain/Loss (Raw)": 2.1350038051605225, "Pretrain/Step": 15985, "Pretrain/Step Time": 8.517822690308094} +{"Pretrain/Learning Rate": 3.3567977691879164e-06, "Pretrain/Loss": 1.9743545055389404, "Pretrain/Loss (Raw)": 1.7497254610061646, "Pretrain/Step": 15986, "Pretrain/Step Time": 8.512866899371147} +{"Pretrain/Learning Rate": 3.354673313618864e-06, "Pretrain/Loss": 1.972959280014038, "Pretrain/Loss (Raw)": 1.8891634941101074, "Pretrain/Step": 15987, "Pretrain/Step Time": 8.51054697111249} +{"Pretrain/Learning Rate": 3.3525494821775498e-06, "Pretrain/Loss": 1.973038911819458, "Pretrain/Loss (Raw)": 1.8963338136672974, "Pretrain/Step": 15988, "Pretrain/Step Time": 8.513584746047854} +{"Pretrain/Learning Rate": 3.3504262749252056e-06, "Pretrain/Loss": 1.9736766815185547, "Pretrain/Loss (Raw)": 2.10162091255188, "Pretrain/Step": 15989, "Pretrain/Step Time": 8.514393141493201} +{"Pretrain/Learning Rate": 3.348303691923063e-06, "Pretrain/Loss": 1.9729506969451904, "Pretrain/Loss (Raw)": 1.8301043510437012, "Pretrain/Step": 15990, "Pretrain/Step Time": 8.51747122220695} +{"Pretrain/Learning Rate": 3.346181733232312e-06, "Pretrain/Loss": 1.976957082748413, "Pretrain/Loss (Raw)": 1.9839003086090088, "Pretrain/Step": 15991, "Pretrain/Step Time": 8.512266531586647} +{"Pretrain/Learning Rate": 3.3440603989141535e-06, "Pretrain/Loss": 1.9770746231079102, "Pretrain/Loss (Raw)": 1.9040385484695435, "Pretrain/Step": 15992, "Pretrain/Step Time": 8.509181657806039} +{"Pretrain/Learning Rate": 3.3419396890297465e-06, "Pretrain/Loss": 1.9802477359771729, "Pretrain/Loss (Raw)": 2.081331253051758, "Pretrain/Step": 15993, "Pretrain/Step Time": 8.505565453320742} +{"Pretrain/Learning Rate": 3.3398196036402348e-06, "Pretrain/Loss": 1.9814643859863281, "Pretrain/Loss (Raw)": 1.9998345375061035, "Pretrain/Step": 15994, "Pretrain/Step Time": 8.510691026225686} +{"Pretrain/Learning Rate": 3.3377001428067626e-06, "Pretrain/Loss": 1.9820970296859741, "Pretrain/Loss (Raw)": 1.969402551651001, "Pretrain/Step": 15995, "Pretrain/Step Time": 8.513494359329343} +{"Pretrain/Learning Rate": 3.3355813065904294e-06, "Pretrain/Loss": 1.9824986457824707, "Pretrain/Loss (Raw)": 1.986998200416565, "Pretrain/Step": 15996, "Pretrain/Step Time": 8.517296571284533} +{"Pretrain/Learning Rate": 3.3334630950523416e-06, "Pretrain/Loss": 1.9823412895202637, "Pretrain/Loss (Raw)": 1.9226720333099365, "Pretrain/Step": 15997, "Pretrain/Step Time": 8.518271766602993} +{"Pretrain/Learning Rate": 3.331345508253572e-06, "Pretrain/Loss": 1.9824329614639282, "Pretrain/Loss (Raw)": 2.0014736652374268, "Pretrain/Step": 15998, "Pretrain/Step Time": 8.51871900074184} +{"Pretrain/Learning Rate": 3.3292285462551727e-06, "Pretrain/Loss": 1.9815666675567627, "Pretrain/Loss (Raw)": 1.9492920637130737, "Pretrain/Step": 15999, "Pretrain/Step Time": 8.517458248883486} +{"Pretrain/Learning Rate": 3.3271122091181992e-06, "Pretrain/Loss": 1.9815802574157715, "Pretrain/Loss (Raw)": 1.9562395811080933, "Pretrain/Step": 16000, "Pretrain/Step Time": 8.520316729322076} +{"Pretrain/Learning Rate": 3.3249964969036596e-06, "Pretrain/Loss": 1.984025001525879, "Pretrain/Loss (Raw)": 1.9086297750473022, "Pretrain/Step": 16001, "Pretrain/Step Time": 8.526287332177162} +{"Pretrain/Learning Rate": 3.3228814096725706e-06, "Pretrain/Loss": 1.984964370727539, "Pretrain/Loss (Raw)": 2.0699095726013184, "Pretrain/Step": 16002, "Pretrain/Step Time": 8.519957795739174} +{"Pretrain/Learning Rate": 3.3207669474859175e-06, "Pretrain/Loss": 1.9873251914978027, "Pretrain/Loss (Raw)": 2.460057020187378, "Pretrain/Step": 16003, "Pretrain/Step Time": 8.519125247374177} +{"Pretrain/Learning Rate": 3.3186531104046654e-06, "Pretrain/Loss": 1.9870471954345703, "Pretrain/Loss (Raw)": 2.105764865875244, "Pretrain/Step": 16004, "Pretrain/Step Time": 8.518684022128582} +{"Pretrain/Learning Rate": 3.3165398984897676e-06, "Pretrain/Loss": 1.9887092113494873, "Pretrain/Loss (Raw)": 2.1230318546295166, "Pretrain/Step": 16005, "Pretrain/Step Time": 8.519836612045765} +{"Pretrain/Learning Rate": 3.3144273118021483e-06, "Pretrain/Loss": 1.9899078607559204, "Pretrain/Loss (Raw)": 1.9664748907089233, "Pretrain/Step": 16006, "Pretrain/Step Time": 8.5233569201082} +{"Pretrain/Learning Rate": 3.3123153504027367e-06, "Pretrain/Loss": 1.992178201675415, "Pretrain/Loss (Raw)": 1.9174288511276245, "Pretrain/Step": 16007, "Pretrain/Step Time": 8.519110227003694} +{"Pretrain/Learning Rate": 3.3102040143524166e-06, "Pretrain/Loss": 1.9933323860168457, "Pretrain/Loss (Raw)": 1.9626233577728271, "Pretrain/Step": 16008, "Pretrain/Step Time": 8.515971329063177} +{"Pretrain/Learning Rate": 3.3080933037120816e-06, "Pretrain/Loss": 1.9972116947174072, "Pretrain/Loss (Raw)": 2.4630274772644043, "Pretrain/Step": 16009, "Pretrain/Step Time": 8.515773601830006} +{"Pretrain/Learning Rate": 3.3059832185425827e-06, "Pretrain/Loss": 1.9985920190811157, "Pretrain/Loss (Raw)": 2.096587657928467, "Pretrain/Step": 16010, "Pretrain/Step Time": 8.514572903513908} +{"Pretrain/Learning Rate": 3.3038737589047575e-06, "Pretrain/Loss": 1.9969666004180908, "Pretrain/Loss (Raw)": 1.8192514181137085, "Pretrain/Step": 16011, "Pretrain/Step Time": 8.517044711858034} +{"Pretrain/Learning Rate": 3.3017649248594463e-06, "Pretrain/Loss": 1.9964978694915771, "Pretrain/Loss (Raw)": 1.7961145639419556, "Pretrain/Step": 16012, "Pretrain/Step Time": 8.514673072844744} +{"Pretrain/Learning Rate": 3.299656716467439e-06, "Pretrain/Loss": 1.9970041513442993, "Pretrain/Loss (Raw)": 1.9538284540176392, "Pretrain/Step": 16013, "Pretrain/Step Time": 8.520373806357384} +{"Pretrain/Learning Rate": 3.29754913378954e-06, "Pretrain/Loss": 1.9973853826522827, "Pretrain/Loss (Raw)": 2.0351722240448, "Pretrain/Step": 16014, "Pretrain/Step Time": 8.518634278327227} +{"Pretrain/Learning Rate": 3.2954421768865122e-06, "Pretrain/Loss": 1.9978525638580322, "Pretrain/Loss (Raw)": 1.9987220764160156, "Pretrain/Step": 16015, "Pretrain/Step Time": 8.515349432826042} +{"Pretrain/Learning Rate": 3.293335845819101e-06, "Pretrain/Loss": 1.9963805675506592, "Pretrain/Loss (Raw)": 1.9490684270858765, "Pretrain/Step": 16016, "Pretrain/Step Time": 8.51745867729187} +{"Pretrain/Learning Rate": 3.291230140648055e-06, "Pretrain/Loss": 1.997363567352295, "Pretrain/Loss (Raw)": 2.0590696334838867, "Pretrain/Step": 16017, "Pretrain/Step Time": 8.513295106589794} +{"Pretrain/Learning Rate": 3.2891250614340812e-06, "Pretrain/Loss": 1.997428297996521, "Pretrain/Loss (Raw)": 1.9944854974746704, "Pretrain/Step": 16018, "Pretrain/Step Time": 8.515204574912786} +{"Pretrain/Learning Rate": 3.287020608237884e-06, "Pretrain/Loss": 1.999290943145752, "Pretrain/Loss (Raw)": 1.974680781364441, "Pretrain/Step": 16019, "Pretrain/Step Time": 8.508808424696326} +{"Pretrain/Learning Rate": 3.2849167811201426e-06, "Pretrain/Loss": 1.9975618124008179, "Pretrain/Loss (Raw)": 1.9175299406051636, "Pretrain/Step": 16020, "Pretrain/Step Time": 8.510275995358825} +{"Pretrain/Learning Rate": 3.282813580141511e-06, "Pretrain/Loss": 1.996666431427002, "Pretrain/Loss (Raw)": 1.9246865510940552, "Pretrain/Step": 16021, "Pretrain/Step Time": 8.515270907431841} +{"Pretrain/Learning Rate": 3.280711005362644e-06, "Pretrain/Loss": 1.9973191022872925, "Pretrain/Loss (Raw)": 1.9022773504257202, "Pretrain/Step": 16022, "Pretrain/Step Time": 8.515194352716208} +{"Pretrain/Learning Rate": 3.278609056844162e-06, "Pretrain/Loss": 1.998125433921814, "Pretrain/Loss (Raw)": 1.982232689857483, "Pretrain/Step": 16023, "Pretrain/Step Time": 8.511981684714556} +{"Pretrain/Learning Rate": 3.2765077346466777e-06, "Pretrain/Loss": 1.9995654821395874, "Pretrain/Loss (Raw)": 1.8812769651412964, "Pretrain/Step": 16024, "Pretrain/Step Time": 8.508508261293173} +{"Pretrain/Learning Rate": 3.2744070388307816e-06, "Pretrain/Loss": 1.9965871572494507, "Pretrain/Loss (Raw)": 1.7927963733673096, "Pretrain/Step": 16025, "Pretrain/Step Time": 8.507201412692666} +{"Pretrain/Learning Rate": 3.2723069694570367e-06, "Pretrain/Loss": 1.9968183040618896, "Pretrain/Loss (Raw)": 2.100464105606079, "Pretrain/Step": 16026, "Pretrain/Step Time": 8.504952205345035} +{"Pretrain/Learning Rate": 3.2702075265860083e-06, "Pretrain/Loss": 1.996639609336853, "Pretrain/Loss (Raw)": 1.9175642728805542, "Pretrain/Step": 16027, "Pretrain/Step Time": 8.50754801928997} +{"Pretrain/Learning Rate": 3.26810871027822e-06, "Pretrain/Loss": 1.9945701360702515, "Pretrain/Loss (Raw)": 1.9396271705627441, "Pretrain/Step": 16028, "Pretrain/Step Time": 8.51301434636116} +{"Pretrain/Learning Rate": 3.2660105205942065e-06, "Pretrain/Loss": 1.9941351413726807, "Pretrain/Loss (Raw)": 1.9414329528808594, "Pretrain/Step": 16029, "Pretrain/Step Time": 8.510030252858996} +{"Pretrain/Learning Rate": 3.263912957594456e-06, "Pretrain/Loss": 1.993096947669983, "Pretrain/Loss (Raw)": 2.023771286010742, "Pretrain/Step": 16030, "Pretrain/Step Time": 8.508522985503078} +{"Pretrain/Learning Rate": 3.261816021339445e-06, "Pretrain/Loss": 1.9929075241088867, "Pretrain/Loss (Raw)": 1.8483233451843262, "Pretrain/Step": 16031, "Pretrain/Step Time": 8.501164849847555} +{"Pretrain/Learning Rate": 3.2597197118896526e-06, "Pretrain/Loss": 1.9912692308425903, "Pretrain/Loss (Raw)": 1.9518076181411743, "Pretrain/Step": 16032, "Pretrain/Step Time": 8.506123576313257} +{"Pretrain/Learning Rate": 3.2576240293055114e-06, "Pretrain/Loss": 1.9904230833053589, "Pretrain/Loss (Raw)": 2.0978386402130127, "Pretrain/Step": 16033, "Pretrain/Step Time": 8.50594624876976} +{"Pretrain/Learning Rate": 3.2555289736474592e-06, "Pretrain/Loss": 1.9885177612304688, "Pretrain/Loss (Raw)": 1.7523715496063232, "Pretrain/Step": 16034, "Pretrain/Step Time": 8.506280234083533} +{"Pretrain/Learning Rate": 3.2534345449758976e-06, "Pretrain/Loss": 1.9909673929214478, "Pretrain/Loss (Raw)": 2.248048782348633, "Pretrain/Step": 16035, "Pretrain/Step Time": 8.502047549933195} +{"Pretrain/Learning Rate": 3.2513407433512194e-06, "Pretrain/Loss": 1.9910154342651367, "Pretrain/Loss (Raw)": 1.7740726470947266, "Pretrain/Step": 16036, "Pretrain/Step Time": 8.502526182681322} +{"Pretrain/Learning Rate": 3.249247568833802e-06, "Pretrain/Loss": 1.9911668300628662, "Pretrain/Loss (Raw)": 2.1917049884796143, "Pretrain/Step": 16037, "Pretrain/Step Time": 8.501813691109419} +{"Pretrain/Learning Rate": 3.2471550214839915e-06, "Pretrain/Loss": 1.9930921792984009, "Pretrain/Loss (Raw)": 2.141329288482666, "Pretrain/Step": 16038, "Pretrain/Step Time": 8.506416786462069} +{"Pretrain/Learning Rate": 3.245063101362136e-06, "Pretrain/Loss": 1.9888041019439697, "Pretrain/Loss (Raw)": 1.6352125406265259, "Pretrain/Step": 16039, "Pretrain/Step Time": 8.497523499652743} +{"Pretrain/Learning Rate": 3.2429718085285527e-06, "Pretrain/Loss": 1.989750862121582, "Pretrain/Loss (Raw)": 2.0825798511505127, "Pretrain/Step": 16040, "Pretrain/Step Time": 8.497380211949348} +{"Pretrain/Learning Rate": 3.2408811430435337e-06, "Pretrain/Loss": 1.989060401916504, "Pretrain/Loss (Raw)": 2.103292942047119, "Pretrain/Step": 16041, "Pretrain/Step Time": 8.493616810068488} +{"Pretrain/Learning Rate": 3.2387911049673702e-06, "Pretrain/Loss": 1.987271785736084, "Pretrain/Loss (Raw)": 1.8954485654830933, "Pretrain/Step": 16042, "Pretrain/Step Time": 8.49296024814248} +{"Pretrain/Learning Rate": 3.236701694360322e-06, "Pretrain/Loss": 1.9872995615005493, "Pretrain/Loss (Raw)": 1.9002293348312378, "Pretrain/Step": 16043, "Pretrain/Step Time": 8.494775427505374} +{"Pretrain/Learning Rate": 3.2346129112826446e-06, "Pretrain/Loss": 1.9850269556045532, "Pretrain/Loss (Raw)": 1.8758995532989502, "Pretrain/Step": 16044, "Pretrain/Step Time": 8.49653010815382} +{"Pretrain/Learning Rate": 3.2325247557945526e-06, "Pretrain/Loss": 1.9859070777893066, "Pretrain/Loss (Raw)": 2.110133647918701, "Pretrain/Step": 16045, "Pretrain/Step Time": 8.502617251127958} +{"Pretrain/Learning Rate": 3.2304372279562706e-06, "Pretrain/Loss": 1.986100196838379, "Pretrain/Loss (Raw)": 1.9754772186279297, "Pretrain/Step": 16046, "Pretrain/Step Time": 8.498679213225842} +{"Pretrain/Learning Rate": 3.228350327827984e-06, "Pretrain/Loss": 1.986072301864624, "Pretrain/Loss (Raw)": 1.9678360223770142, "Pretrain/Step": 16047, "Pretrain/Step Time": 8.49772678129375} +{"Pretrain/Learning Rate": 3.2262640554698632e-06, "Pretrain/Loss": 1.987310767173767, "Pretrain/Loss (Raw)": 1.897141933441162, "Pretrain/Step": 16048, "Pretrain/Step Time": 8.500854859128594} +{"Pretrain/Learning Rate": 3.224178410942072e-06, "Pretrain/Loss": 1.988585352897644, "Pretrain/Loss (Raw)": 1.8547347784042358, "Pretrain/Step": 16049, "Pretrain/Step Time": 8.499302703887224} +{"Pretrain/Learning Rate": 3.2220933943047425e-06, "Pretrain/Loss": 1.9899846315383911, "Pretrain/Loss (Raw)": 2.087249279022217, "Pretrain/Step": 16050, "Pretrain/Step Time": 8.496338292956352} +{"Pretrain/Learning Rate": 3.220009005618002e-06, "Pretrain/Loss": 1.9895248413085938, "Pretrain/Loss (Raw)": 2.0173611640930176, "Pretrain/Step": 16051, "Pretrain/Step Time": 8.492348602041602} +{"Pretrain/Learning Rate": 3.2179252449419466e-06, "Pretrain/Loss": 1.9888570308685303, "Pretrain/Loss (Raw)": 2.002549409866333, "Pretrain/Step": 16052, "Pretrain/Step Time": 8.495827049016953} +{"Pretrain/Learning Rate": 3.215842112336659e-06, "Pretrain/Loss": 1.9847056865692139, "Pretrain/Loss (Raw)": 1.585425615310669, "Pretrain/Step": 16053, "Pretrain/Step Time": 8.496109465137124} +{"Pretrain/Learning Rate": 3.2137596078622102e-06, "Pretrain/Loss": 1.9812335968017578, "Pretrain/Loss (Raw)": 1.7274903059005737, "Pretrain/Step": 16054, "Pretrain/Step Time": 8.500881539657712} +{"Pretrain/Learning Rate": 3.211677731578641e-06, "Pretrain/Loss": 1.980534553527832, "Pretrain/Loss (Raw)": 2.100790500640869, "Pretrain/Step": 16055, "Pretrain/Step Time": 8.497155651450157} +{"Pretrain/Learning Rate": 3.20959648354599e-06, "Pretrain/Loss": 1.9790862798690796, "Pretrain/Loss (Raw)": 1.9153764247894287, "Pretrain/Step": 16056, "Pretrain/Step Time": 8.497956980019808} +{"Pretrain/Learning Rate": 3.207515863824262e-06, "Pretrain/Loss": 1.980742335319519, "Pretrain/Loss (Raw)": 1.9343606233596802, "Pretrain/Step": 16057, "Pretrain/Step Time": 8.493578538298607} +{"Pretrain/Learning Rate": 3.2054358724734473e-06, "Pretrain/Loss": 1.979663610458374, "Pretrain/Loss (Raw)": 1.839550495147705, "Pretrain/Step": 16058, "Pretrain/Step Time": 8.496073562651873} +{"Pretrain/Learning Rate": 3.203356509553529e-06, "Pretrain/Loss": 1.9784075021743774, "Pretrain/Loss (Raw)": 1.84824538230896, "Pretrain/Step": 16059, "Pretrain/Step Time": 8.494449768215418} +{"Pretrain/Learning Rate": 3.201277775124456e-06, "Pretrain/Loss": 1.97593092918396, "Pretrain/Loss (Raw)": 1.8621599674224854, "Pretrain/Step": 16060, "Pretrain/Step Time": 8.494272787123919} +{"Pretrain/Learning Rate": 3.199199669246175e-06, "Pretrain/Loss": 1.9727096557617188, "Pretrain/Loss (Raw)": 1.5106351375579834, "Pretrain/Step": 16061, "Pretrain/Step Time": 8.497763451188803} +{"Pretrain/Learning Rate": 3.1971221919786047e-06, "Pretrain/Loss": 1.9723615646362305, "Pretrain/Loss (Raw)": 1.8268569707870483, "Pretrain/Step": 16062, "Pretrain/Step Time": 8.497548187151551} +{"Pretrain/Learning Rate": 3.195045343381639e-06, "Pretrain/Loss": 1.9722520112991333, "Pretrain/Loss (Raw)": 2.1758153438568115, "Pretrain/Step": 16063, "Pretrain/Step Time": 8.49358276836574} +{"Pretrain/Learning Rate": 3.192969123515177e-06, "Pretrain/Loss": 1.9719616174697876, "Pretrain/Loss (Raw)": 2.0007941722869873, "Pretrain/Step": 16064, "Pretrain/Step Time": 8.49490013718605} +{"Pretrain/Learning Rate": 3.190893532439071e-06, "Pretrain/Loss": 1.9709985256195068, "Pretrain/Loss (Raw)": 2.0889053344726562, "Pretrain/Step": 16065, "Pretrain/Step Time": 8.492041639983654} +{"Pretrain/Learning Rate": 3.1888185702131784e-06, "Pretrain/Loss": 1.9719984531402588, "Pretrain/Loss (Raw)": 2.073293924331665, "Pretrain/Step": 16066, "Pretrain/Step Time": 8.490329841151834} +{"Pretrain/Learning Rate": 3.186744236897329e-06, "Pretrain/Loss": 1.9723972082138062, "Pretrain/Loss (Raw)": 2.1197028160095215, "Pretrain/Step": 16067, "Pretrain/Step Time": 8.492784885689616} +{"Pretrain/Learning Rate": 3.1846705325513287e-06, "Pretrain/Loss": 1.9732170104980469, "Pretrain/Loss (Raw)": 2.2164390087127686, "Pretrain/Step": 16068, "Pretrain/Step Time": 8.49015524238348} +{"Pretrain/Learning Rate": 3.182597457234976e-06, "Pretrain/Loss": 1.973423957824707, "Pretrain/Loss (Raw)": 2.1500356197357178, "Pretrain/Step": 16069, "Pretrain/Step Time": 8.492236716672778} +{"Pretrain/Learning Rate": 3.1805250110080427e-06, "Pretrain/Loss": 1.9743417501449585, "Pretrain/Loss (Raw)": 2.1422550678253174, "Pretrain/Step": 16070, "Pretrain/Step Time": 8.497364275157452} +{"Pretrain/Learning Rate": 3.1784531939302947e-06, "Pretrain/Loss": 1.9761936664581299, "Pretrain/Loss (Raw)": 2.1220006942749023, "Pretrain/Step": 16071, "Pretrain/Step Time": 8.495022462680936} +{"Pretrain/Learning Rate": 3.1763820060614623e-06, "Pretrain/Loss": 1.9764840602874756, "Pretrain/Loss (Raw)": 2.024048328399658, "Pretrain/Step": 16072, "Pretrain/Step Time": 8.493950463831425} +{"Pretrain/Learning Rate": 3.1743114474612674e-06, "Pretrain/Loss": 1.9779834747314453, "Pretrain/Loss (Raw)": 2.116018295288086, "Pretrain/Step": 16073, "Pretrain/Step Time": 8.49495537392795} +{"Pretrain/Learning Rate": 3.1722415181894228e-06, "Pretrain/Loss": 1.9747520685195923, "Pretrain/Loss (Raw)": 1.904113531112671, "Pretrain/Step": 16074, "Pretrain/Step Time": 8.486838050186634} +{"Pretrain/Learning Rate": 3.1701722183055976e-06, "Pretrain/Loss": 1.976491093635559, "Pretrain/Loss (Raw)": 2.255592107772827, "Pretrain/Step": 16075, "Pretrain/Step Time": 8.489589905366302} +{"Pretrain/Learning Rate": 3.1681035478694747e-06, "Pretrain/Loss": 1.97702956199646, "Pretrain/Loss (Raw)": 1.9648189544677734, "Pretrain/Step": 16076, "Pretrain/Step Time": 8.491225514560938} +{"Pretrain/Learning Rate": 3.1660355069406954e-06, "Pretrain/Loss": 1.977673053741455, "Pretrain/Loss (Raw)": 2.13143253326416, "Pretrain/Step": 16077, "Pretrain/Step Time": 8.488452212885022} +{"Pretrain/Learning Rate": 3.163968095578884e-06, "Pretrain/Loss": 1.9807798862457275, "Pretrain/Loss (Raw)": 2.1729416847229004, "Pretrain/Step": 16078, "Pretrain/Step Time": 8.492369167506695} +{"Pretrain/Learning Rate": 3.1619013138436653e-06, "Pretrain/Loss": 1.9817880392074585, "Pretrain/Loss (Raw)": 2.146007537841797, "Pretrain/Step": 16079, "Pretrain/Step Time": 8.49149420298636} +{"Pretrain/Learning Rate": 3.159835161794622e-06, "Pretrain/Loss": 1.9816960096359253, "Pretrain/Loss (Raw)": 2.1161906719207764, "Pretrain/Step": 16080, "Pretrain/Step Time": 8.49233964830637} +{"Pretrain/Learning Rate": 3.1577696394913424e-06, "Pretrain/Loss": 1.9797711372375488, "Pretrain/Loss (Raw)": 1.6603984832763672, "Pretrain/Step": 16081, "Pretrain/Step Time": 8.493637029081583} +{"Pretrain/Learning Rate": 3.1557047469933763e-06, "Pretrain/Loss": 1.9807846546173096, "Pretrain/Loss (Raw)": 1.9573973417282104, "Pretrain/Step": 16082, "Pretrain/Step Time": 8.49358125217259} +{"Pretrain/Learning Rate": 3.1536404843602567e-06, "Pretrain/Loss": 1.979601502418518, "Pretrain/Loss (Raw)": 1.949763536453247, "Pretrain/Step": 16083, "Pretrain/Step Time": 8.490909034386277} +{"Pretrain/Learning Rate": 3.151576851651522e-06, "Pretrain/Loss": 1.9797844886779785, "Pretrain/Loss (Raw)": 1.854897379875183, "Pretrain/Step": 16084, "Pretrain/Step Time": 8.489809473976493} +{"Pretrain/Learning Rate": 3.1495138489266607e-06, "Pretrain/Loss": 1.980752944946289, "Pretrain/Loss (Raw)": 2.175417900085449, "Pretrain/Step": 16085, "Pretrain/Step Time": 8.491247091442347} +{"Pretrain/Learning Rate": 3.1474514762451666e-06, "Pretrain/Loss": 1.9801338911056519, "Pretrain/Loss (Raw)": 1.9480355978012085, "Pretrain/Step": 16086, "Pretrain/Step Time": 8.490572916343808} +{"Pretrain/Learning Rate": 3.145389733666507e-06, "Pretrain/Loss": 1.9799070358276367, "Pretrain/Loss (Raw)": 2.0691044330596924, "Pretrain/Step": 16087, "Pretrain/Step Time": 8.486848711967468} +{"Pretrain/Learning Rate": 3.143328621250127e-06, "Pretrain/Loss": 1.9788224697113037, "Pretrain/Loss (Raw)": 1.6444530487060547, "Pretrain/Step": 16088, "Pretrain/Step Time": 8.490417307242751} +{"Pretrain/Learning Rate": 3.1412681390554587e-06, "Pretrain/Loss": 1.9790470600128174, "Pretrain/Loss (Raw)": 2.0839250087738037, "Pretrain/Step": 16089, "Pretrain/Step Time": 8.493516908958554} +{"Pretrain/Learning Rate": 3.1392082871419094e-06, "Pretrain/Loss": 1.9816570281982422, "Pretrain/Loss (Raw)": 2.168062925338745, "Pretrain/Step": 16090, "Pretrain/Step Time": 8.49221914447844} +{"Pretrain/Learning Rate": 3.1371490655688813e-06, "Pretrain/Loss": 1.9848757982254028, "Pretrain/Loss (Raw)": 2.214560031890869, "Pretrain/Step": 16091, "Pretrain/Step Time": 8.492987776175141} +{"Pretrain/Learning Rate": 3.1350904743957438e-06, "Pretrain/Loss": 1.985661506652832, "Pretrain/Loss (Raw)": 1.9824947118759155, "Pretrain/Step": 16092, "Pretrain/Step Time": 8.494061982259154} +{"Pretrain/Learning Rate": 3.1330325136818632e-06, "Pretrain/Loss": 1.9840822219848633, "Pretrain/Loss (Raw)": 1.9608538150787354, "Pretrain/Step": 16093, "Pretrain/Step Time": 8.491038484498858} +{"Pretrain/Learning Rate": 3.130975183486576e-06, "Pretrain/Loss": 1.9855396747589111, "Pretrain/Loss (Raw)": 1.9972796440124512, "Pretrain/Step": 16094, "Pretrain/Step Time": 8.493956403806806} +{"Pretrain/Learning Rate": 3.1289184838691977e-06, "Pretrain/Loss": 1.9849295616149902, "Pretrain/Loss (Raw)": 1.9994194507598877, "Pretrain/Step": 16095, "Pretrain/Step Time": 8.494076268747449} +{"Pretrain/Learning Rate": 3.1268624148890423e-06, "Pretrain/Loss": 1.985985517501831, "Pretrain/Loss (Raw)": 2.07780385017395, "Pretrain/Step": 16096, "Pretrain/Step Time": 8.491773949936032} +{"Pretrain/Learning Rate": 3.124806976605382e-06, "Pretrain/Loss": 1.9852505922317505, "Pretrain/Loss (Raw)": 1.9843261241912842, "Pretrain/Step": 16097, "Pretrain/Step Time": 8.490510614588857} +{"Pretrain/Learning Rate": 3.1227521690775e-06, "Pretrain/Loss": 1.9835823774337769, "Pretrain/Loss (Raw)": 1.903778076171875, "Pretrain/Step": 16098, "Pretrain/Step Time": 8.488560188561678} +{"Pretrain/Learning Rate": 3.120697992364635e-06, "Pretrain/Loss": 1.98183274269104, "Pretrain/Loss (Raw)": 1.8847236633300781, "Pretrain/Step": 16099, "Pretrain/Step Time": 8.491459712386131} +{"Pretrain/Learning Rate": 3.1186444465260144e-06, "Pretrain/Loss": 1.979854941368103, "Pretrain/Loss (Raw)": 2.036536455154419, "Pretrain/Step": 16100, "Pretrain/Step Time": 8.485185598954558} +{"Pretrain/Learning Rate": 3.1165915316208606e-06, "Pretrain/Loss": 1.9786434173583984, "Pretrain/Loss (Raw)": 2.05059814453125, "Pretrain/Step": 16101, "Pretrain/Step Time": 8.482887776568532} +{"Pretrain/Learning Rate": 3.1145392477083565e-06, "Pretrain/Loss": 1.9793850183486938, "Pretrain/Loss (Raw)": 2.1120052337646484, "Pretrain/Step": 16102, "Pretrain/Step Time": 8.484044842422009} +{"Pretrain/Learning Rate": 3.112487594847693e-06, "Pretrain/Loss": 1.9798619747161865, "Pretrain/Loss (Raw)": 1.6977589130401611, "Pretrain/Step": 16103, "Pretrain/Step Time": 8.487172016873956} +{"Pretrain/Learning Rate": 3.110436573098019e-06, "Pretrain/Loss": 1.9821635484695435, "Pretrain/Loss (Raw)": 2.051679849624634, "Pretrain/Step": 16104, "Pretrain/Step Time": 8.488250376656651} +{"Pretrain/Learning Rate": 3.108386182518469e-06, "Pretrain/Loss": 1.9826500415802002, "Pretrain/Loss (Raw)": 2.0173988342285156, "Pretrain/Step": 16105, "Pretrain/Step Time": 8.488871907815337} +{"Pretrain/Learning Rate": 3.1063364231681796e-06, "Pretrain/Loss": 1.9832319021224976, "Pretrain/Loss (Raw)": 1.9865026473999023, "Pretrain/Step": 16106, "Pretrain/Step Time": 8.488514570519328} +{"Pretrain/Learning Rate": 3.104287295106237e-06, "Pretrain/Loss": 1.9832929372787476, "Pretrain/Loss (Raw)": 2.0106968879699707, "Pretrain/Step": 16107, "Pretrain/Step Time": 8.48560306057334} +{"Pretrain/Learning Rate": 3.1022387983917405e-06, "Pretrain/Loss": 1.9821596145629883, "Pretrain/Loss (Raw)": 1.7310062646865845, "Pretrain/Step": 16108, "Pretrain/Step Time": 8.485429380089045} +{"Pretrain/Learning Rate": 3.100190933083752e-06, "Pretrain/Loss": 1.9801139831542969, "Pretrain/Loss (Raw)": 1.7714285850524902, "Pretrain/Step": 16109, "Pretrain/Step Time": 8.485043838620186} +{"Pretrain/Learning Rate": 3.0981436992413128e-06, "Pretrain/Loss": 1.9829720258712769, "Pretrain/Loss (Raw)": 1.9682350158691406, "Pretrain/Step": 16110, "Pretrain/Step Time": 8.485126163810492} +{"Pretrain/Learning Rate": 3.096097096923467e-06, "Pretrain/Loss": 1.9845917224884033, "Pretrain/Loss (Raw)": 1.9783244132995605, "Pretrain/Step": 16111, "Pretrain/Step Time": 8.484462914988399} +{"Pretrain/Learning Rate": 3.0940511261892154e-06, "Pretrain/Loss": 1.9805448055267334, "Pretrain/Loss (Raw)": 1.7642072439193726, "Pretrain/Step": 16112, "Pretrain/Step Time": 8.482626158744097} +{"Pretrain/Learning Rate": 3.0920057870975627e-06, "Pretrain/Loss": 1.9797451496124268, "Pretrain/Loss (Raw)": 2.0326521396636963, "Pretrain/Step": 16113, "Pretrain/Step Time": 8.481625959277153} +{"Pretrain/Learning Rate": 3.0899610797074707e-06, "Pretrain/Loss": 1.9792832136154175, "Pretrain/Loss (Raw)": 1.6906014680862427, "Pretrain/Step": 16114, "Pretrain/Step Time": 8.483587371185422} +{"Pretrain/Learning Rate": 3.0879170040779113e-06, "Pretrain/Loss": 1.9801627397537231, "Pretrain/Loss (Raw)": 2.001729965209961, "Pretrain/Step": 16115, "Pretrain/Step Time": 8.482350122183561} +{"Pretrain/Learning Rate": 3.0858735602678214e-06, "Pretrain/Loss": 1.9778227806091309, "Pretrain/Loss (Raw)": 1.59682035446167, "Pretrain/Step": 16116, "Pretrain/Step Time": 8.482204038649797} +{"Pretrain/Learning Rate": 3.0838307483361113e-06, "Pretrain/Loss": 1.9764235019683838, "Pretrain/Loss (Raw)": 1.922513484954834, "Pretrain/Step": 16117, "Pretrain/Step Time": 8.477685011923313} +{"Pretrain/Learning Rate": 3.081788568341695e-06, "Pretrain/Loss": 1.9765419960021973, "Pretrain/Loss (Raw)": 1.8452693223953247, "Pretrain/Step": 16118, "Pretrain/Step Time": 8.475619392469525} +{"Pretrain/Learning Rate": 3.0797470203434513e-06, "Pretrain/Loss": 1.9775186777114868, "Pretrain/Loss (Raw)": 2.1089274883270264, "Pretrain/Step": 16119, "Pretrain/Step Time": 8.48606557585299} +{"Pretrain/Learning Rate": 3.0777061044002547e-06, "Pretrain/Loss": 1.976943016052246, "Pretrain/Loss (Raw)": 1.8303381204605103, "Pretrain/Step": 16120, "Pretrain/Step Time": 8.486305136233568} +{"Pretrain/Learning Rate": 3.07566582057095e-06, "Pretrain/Loss": 1.9753491878509521, "Pretrain/Loss (Raw)": 1.877328634262085, "Pretrain/Step": 16121, "Pretrain/Step Time": 8.494899509474635} +{"Pretrain/Learning Rate": 3.0736261689143566e-06, "Pretrain/Loss": 1.975682020187378, "Pretrain/Loss (Raw)": 2.0424489974975586, "Pretrain/Step": 16122, "Pretrain/Step Time": 8.490861231461167} +{"Pretrain/Learning Rate": 3.0715871494893024e-06, "Pretrain/Loss": 1.9767708778381348, "Pretrain/Loss (Raw)": 2.108776330947876, "Pretrain/Step": 16123, "Pretrain/Step Time": 8.489791417494416} +{"Pretrain/Learning Rate": 3.069548762354571e-06, "Pretrain/Loss": 1.9776980876922607, "Pretrain/Loss (Raw)": 2.105674982070923, "Pretrain/Step": 16124, "Pretrain/Step Time": 8.488790201023221} +{"Pretrain/Learning Rate": 3.0675110075689432e-06, "Pretrain/Loss": 1.9787753820419312, "Pretrain/Loss (Raw)": 2.060574769973755, "Pretrain/Step": 16125, "Pretrain/Step Time": 8.48681023530662} +{"Pretrain/Learning Rate": 3.065473885191175e-06, "Pretrain/Loss": 1.9802440404891968, "Pretrain/Loss (Raw)": 2.1894428730010986, "Pretrain/Step": 16126, "Pretrain/Step Time": 8.48629666864872} +{"Pretrain/Learning Rate": 3.06343739528e-06, "Pretrain/Loss": 1.9813473224639893, "Pretrain/Loss (Raw)": 2.09053373336792, "Pretrain/Step": 16127, "Pretrain/Step Time": 8.486856561154127} +{"Pretrain/Learning Rate": 3.0614015378941487e-06, "Pretrain/Loss": 1.9808552265167236, "Pretrain/Loss (Raw)": 1.8932315111160278, "Pretrain/Step": 16128, "Pretrain/Step Time": 8.487799640744925} +{"Pretrain/Learning Rate": 3.059366313092313e-06, "Pretrain/Loss": 1.981400728225708, "Pretrain/Loss (Raw)": 1.9784525632858276, "Pretrain/Step": 16129, "Pretrain/Step Time": 8.48251498118043} +{"Pretrain/Learning Rate": 3.0573317209331874e-06, "Pretrain/Loss": 1.9801433086395264, "Pretrain/Loss (Raw)": 1.9089715480804443, "Pretrain/Step": 16130, "Pretrain/Step Time": 8.48981662467122} +{"Pretrain/Learning Rate": 3.055297761475434e-06, "Pretrain/Loss": 1.9758541584014893, "Pretrain/Loss (Raw)": 1.9110453128814697, "Pretrain/Step": 16131, "Pretrain/Step Time": 8.490097193047404} +{"Pretrain/Learning Rate": 3.0532644347776944e-06, "Pretrain/Loss": 1.975395917892456, "Pretrain/Loss (Raw)": 2.0471057891845703, "Pretrain/Step": 16132, "Pretrain/Step Time": 8.486805325374007} +{"Pretrain/Learning Rate": 3.051231740898608e-06, "Pretrain/Loss": 1.9741709232330322, "Pretrain/Loss (Raw)": 1.9662256240844727, "Pretrain/Step": 16133, "Pretrain/Step Time": 8.486917201429605} +{"Pretrain/Learning Rate": 3.0491996798967747e-06, "Pretrain/Loss": 1.9743564128875732, "Pretrain/Loss (Raw)": 1.9902225732803345, "Pretrain/Step": 16134, "Pretrain/Step Time": 8.48501362837851} +{"Pretrain/Learning Rate": 3.0471682518308008e-06, "Pretrain/Loss": 1.9757366180419922, "Pretrain/Loss (Raw)": 2.0940980911254883, "Pretrain/Step": 16135, "Pretrain/Step Time": 8.483292458578944} +{"Pretrain/Learning Rate": 3.045137456759256e-06, "Pretrain/Loss": 1.9765784740447998, "Pretrain/Loss (Raw)": 2.070378303527832, "Pretrain/Step": 16136, "Pretrain/Step Time": 8.481907293200493} +{"Pretrain/Learning Rate": 3.043107294740688e-06, "Pretrain/Loss": 1.9739227294921875, "Pretrain/Loss (Raw)": 2.123087167739868, "Pretrain/Step": 16137, "Pretrain/Step Time": 8.48749758116901} +{"Pretrain/Learning Rate": 3.04107776583365e-06, "Pretrain/Loss": 1.9737317562103271, "Pretrain/Loss (Raw)": 2.072153329849243, "Pretrain/Step": 16138, "Pretrain/Step Time": 8.488556625321507} +{"Pretrain/Learning Rate": 3.0390488700966474e-06, "Pretrain/Loss": 1.9758415222167969, "Pretrain/Loss (Raw)": 2.089292287826538, "Pretrain/Step": 16139, "Pretrain/Step Time": 8.484768135473132} +{"Pretrain/Learning Rate": 3.037020607588195e-06, "Pretrain/Loss": 1.977416753768921, "Pretrain/Loss (Raw)": 1.9977408647537231, "Pretrain/Step": 16140, "Pretrain/Step Time": 8.487146314233541} +{"Pretrain/Learning Rate": 3.0349929783667715e-06, "Pretrain/Loss": 1.978967308998108, "Pretrain/Loss (Raw)": 2.152313709259033, "Pretrain/Step": 16141, "Pretrain/Step Time": 8.481132788583636} +{"Pretrain/Learning Rate": 3.0329659824908345e-06, "Pretrain/Loss": 1.9783259630203247, "Pretrain/Loss (Raw)": 1.9530738592147827, "Pretrain/Step": 16142, "Pretrain/Step Time": 8.484314516186714} +{"Pretrain/Learning Rate": 3.0309396200188437e-06, "Pretrain/Loss": 1.9769256114959717, "Pretrain/Loss (Raw)": 1.8194845914840698, "Pretrain/Step": 16143, "Pretrain/Step Time": 8.489330384880304} +{"Pretrain/Learning Rate": 3.028913891009216e-06, "Pretrain/Loss": 1.9781248569488525, "Pretrain/Loss (Raw)": 2.102571725845337, "Pretrain/Step": 16144, "Pretrain/Step Time": 8.487060831859708} +{"Pretrain/Learning Rate": 3.0268887955203746e-06, "Pretrain/Loss": 1.975603699684143, "Pretrain/Loss (Raw)": 1.736348032951355, "Pretrain/Step": 16145, "Pretrain/Step Time": 8.491814872249961} +{"Pretrain/Learning Rate": 3.0248643336107054e-06, "Pretrain/Loss": 1.9780936241149902, "Pretrain/Loss (Raw)": 2.3132057189941406, "Pretrain/Step": 16146, "Pretrain/Step Time": 8.49077039025724} +{"Pretrain/Learning Rate": 3.0228405053385726e-06, "Pretrain/Loss": 1.9799730777740479, "Pretrain/Loss (Raw)": 2.2152340412139893, "Pretrain/Step": 16147, "Pretrain/Step Time": 8.494413958862424} +{"Pretrain/Learning Rate": 3.0208173107623473e-06, "Pretrain/Loss": 1.979367733001709, "Pretrain/Loss (Raw)": 1.840074062347412, "Pretrain/Step": 16148, "Pretrain/Step Time": 8.492304654791951} +{"Pretrain/Learning Rate": 3.0187947499403566e-06, "Pretrain/Loss": 1.9777026176452637, "Pretrain/Loss (Raw)": 1.71152925491333, "Pretrain/Step": 16149, "Pretrain/Step Time": 8.487904202193022} +{"Pretrain/Learning Rate": 3.01677282293093e-06, "Pretrain/Loss": 1.9791350364685059, "Pretrain/Loss (Raw)": 2.0856382846832275, "Pretrain/Step": 16150, "Pretrain/Step Time": 8.487698685377836} +{"Pretrain/Learning Rate": 3.014751529792359e-06, "Pretrain/Loss": 1.9788851737976074, "Pretrain/Loss (Raw)": 1.9502500295639038, "Pretrain/Step": 16151, "Pretrain/Step Time": 8.488714471459389} +{"Pretrain/Learning Rate": 3.012730870582925e-06, "Pretrain/Loss": 1.9835474491119385, "Pretrain/Loss (Raw)": 2.478062152862549, "Pretrain/Step": 16152, "Pretrain/Step Time": 8.48708575591445} +{"Pretrain/Learning Rate": 3.0107108453609035e-06, "Pretrain/Loss": 1.9859344959259033, "Pretrain/Loss (Raw)": 2.098310947418213, "Pretrain/Step": 16153, "Pretrain/Step Time": 8.490435229614377} +{"Pretrain/Learning Rate": 3.0086914541845255e-06, "Pretrain/Loss": 1.9854061603546143, "Pretrain/Loss (Raw)": 2.032836437225342, "Pretrain/Step": 16154, "Pretrain/Step Time": 8.493897169828415} +{"Pretrain/Learning Rate": 3.0066726971120314e-06, "Pretrain/Loss": 1.9863452911376953, "Pretrain/Loss (Raw)": 2.03776216506958, "Pretrain/Step": 16155, "Pretrain/Step Time": 8.49349008873105} +{"Pretrain/Learning Rate": 3.0046545742016264e-06, "Pretrain/Loss": 1.9877101182937622, "Pretrain/Loss (Raw)": 2.1143417358398438, "Pretrain/Step": 16156, "Pretrain/Step Time": 8.488054398447275} +{"Pretrain/Learning Rate": 3.002637085511498e-06, "Pretrain/Loss": 1.990412950515747, "Pretrain/Loss (Raw)": 2.287391424179077, "Pretrain/Step": 16157, "Pretrain/Step Time": 8.486866286024451} +{"Pretrain/Learning Rate": 3.0006202310998266e-06, "Pretrain/Loss": 1.9900833368301392, "Pretrain/Loss (Raw)": 1.9815905094146729, "Pretrain/Step": 16158, "Pretrain/Step Time": 8.486585872247815} +{"Pretrain/Learning Rate": 2.9986040110247556e-06, "Pretrain/Loss": 1.9913192987442017, "Pretrain/Loss (Raw)": 2.0065412521362305, "Pretrain/Step": 16159, "Pretrain/Step Time": 8.492639627307653} +{"Pretrain/Learning Rate": 2.996588425344432e-06, "Pretrain/Loss": 1.9912652969360352, "Pretrain/Loss (Raw)": 1.9448974132537842, "Pretrain/Step": 16160, "Pretrain/Step Time": 8.487287430092692} +{"Pretrain/Learning Rate": 2.9945734741169738e-06, "Pretrain/Loss": 1.993042230606079, "Pretrain/Loss (Raw)": 2.3252596855163574, "Pretrain/Step": 16161, "Pretrain/Step Time": 8.488632291555405} +{"Pretrain/Learning Rate": 2.992559157400468e-06, "Pretrain/Loss": 1.9951709508895874, "Pretrain/Loss (Raw)": 2.0248658657073975, "Pretrain/Step": 16162, "Pretrain/Step Time": 8.490357166156173} +{"Pretrain/Learning Rate": 2.990545475253012e-06, "Pretrain/Loss": 1.9920490980148315, "Pretrain/Loss (Raw)": 1.8484293222427368, "Pretrain/Step": 16163, "Pretrain/Step Time": 8.49151360616088} +{"Pretrain/Learning Rate": 2.988532427732654e-06, "Pretrain/Loss": 1.9931704998016357, "Pretrain/Loss (Raw)": 1.917630672454834, "Pretrain/Step": 16164, "Pretrain/Step Time": 8.49049411341548} +{"Pretrain/Learning Rate": 2.9865200148974535e-06, "Pretrain/Loss": 1.9916186332702637, "Pretrain/Loss (Raw)": 1.9930638074874878, "Pretrain/Step": 16165, "Pretrain/Step Time": 8.49206954240799} +{"Pretrain/Learning Rate": 2.9845082368054307e-06, "Pretrain/Loss": 1.9925017356872559, "Pretrain/Loss (Raw)": 2.2543716430664062, "Pretrain/Step": 16166, "Pretrain/Step Time": 8.4921854455024} +{"Pretrain/Learning Rate": 2.982497093514586e-06, "Pretrain/Loss": 1.994685411453247, "Pretrain/Loss (Raw)": 1.9147119522094727, "Pretrain/Step": 16167, "Pretrain/Step Time": 8.495710611343384} +{"Pretrain/Learning Rate": 2.980486585082923e-06, "Pretrain/Loss": 1.993679404258728, "Pretrain/Loss (Raw)": 1.9538265466690063, "Pretrain/Step": 16168, "Pretrain/Step Time": 8.494415124878287} +{"Pretrain/Learning Rate": 2.9784767115683983e-06, "Pretrain/Loss": 1.9932975769042969, "Pretrain/Loss (Raw)": 2.0544025897979736, "Pretrain/Step": 16169, "Pretrain/Step Time": 8.497175829485059} +{"Pretrain/Learning Rate": 2.976467473028982e-06, "Pretrain/Loss": 1.9933969974517822, "Pretrain/Loss (Raw)": 1.908196210861206, "Pretrain/Step": 16170, "Pretrain/Step Time": 8.496433179825544} +{"Pretrain/Learning Rate": 2.974458869522598e-06, "Pretrain/Loss": 1.994152545928955, "Pretrain/Loss (Raw)": 1.9969165325164795, "Pretrain/Step": 16171, "Pretrain/Step Time": 8.499939613044262} +{"Pretrain/Learning Rate": 2.9724509011071683e-06, "Pretrain/Loss": 1.9959458112716675, "Pretrain/Loss (Raw)": 2.1054303646087646, "Pretrain/Step": 16172, "Pretrain/Step Time": 8.496958451345563} +{"Pretrain/Learning Rate": 2.9704435678405863e-06, "Pretrain/Loss": 1.9937379360198975, "Pretrain/Loss (Raw)": 1.8275352716445923, "Pretrain/Step": 16173, "Pretrain/Step Time": 8.493423145264387} +{"Pretrain/Learning Rate": 2.9684368697807302e-06, "Pretrain/Loss": 1.9919553995132446, "Pretrain/Loss (Raw)": 1.747314691543579, "Pretrain/Step": 16174, "Pretrain/Step Time": 8.4932332765311} +{"Pretrain/Learning Rate": 2.9664308069854706e-06, "Pretrain/Loss": 1.9919615983963013, "Pretrain/Loss (Raw)": 1.9686312675476074, "Pretrain/Step": 16175, "Pretrain/Step Time": 8.495423328131437} +{"Pretrain/Learning Rate": 2.9644253795126394e-06, "Pretrain/Loss": 1.9925789833068848, "Pretrain/Loss (Raw)": 1.9761706590652466, "Pretrain/Step": 16176, "Pretrain/Step Time": 8.490741543471813} +{"Pretrain/Learning Rate": 2.9624205874200754e-06, "Pretrain/Loss": 1.9936375617980957, "Pretrain/Loss (Raw)": 1.9902251958847046, "Pretrain/Step": 16177, "Pretrain/Step Time": 8.492152934893966} +{"Pretrain/Learning Rate": 2.9604164307655723e-06, "Pretrain/Loss": 1.995583176612854, "Pretrain/Loss (Raw)": 2.3362841606140137, "Pretrain/Step": 16178, "Pretrain/Step Time": 8.495573826134205} +{"Pretrain/Learning Rate": 2.958412909606931e-06, "Pretrain/Loss": 1.9959155321121216, "Pretrain/Loss (Raw)": 2.059908390045166, "Pretrain/Step": 16179, "Pretrain/Step Time": 8.495943436399102} +{"Pretrain/Learning Rate": 2.9564100240019127e-06, "Pretrain/Loss": 1.9947021007537842, "Pretrain/Loss (Raw)": 1.8472142219543457, "Pretrain/Step": 16180, "Pretrain/Step Time": 8.497357776388526} +{"Pretrain/Learning Rate": 2.9544077740082692e-06, "Pretrain/Loss": 1.9981175661087036, "Pretrain/Loss (Raw)": 2.0226199626922607, "Pretrain/Step": 16181, "Pretrain/Step Time": 8.49705239199102} +{"Pretrain/Learning Rate": 2.9524061596837406e-06, "Pretrain/Loss": 2.000772714614868, "Pretrain/Loss (Raw)": 2.067366600036621, "Pretrain/Step": 16182, "Pretrain/Step Time": 8.49234845675528} +{"Pretrain/Learning Rate": 2.95040518108603e-06, "Pretrain/Loss": 2.001293659210205, "Pretrain/Loss (Raw)": 2.167473077774048, "Pretrain/Step": 16183, "Pretrain/Step Time": 8.494354302063584} +{"Pretrain/Learning Rate": 2.94840483827285e-06, "Pretrain/Loss": 2.004196882247925, "Pretrain/Loss (Raw)": 2.2869768142700195, "Pretrain/Step": 16184, "Pretrain/Step Time": 8.49184076860547} +{"Pretrain/Learning Rate": 2.9464051313018715e-06, "Pretrain/Loss": 2.001953601837158, "Pretrain/Loss (Raw)": 1.6472091674804688, "Pretrain/Step": 16185, "Pretrain/Step Time": 8.498853158205748} +{"Pretrain/Learning Rate": 2.9444060602307475e-06, "Pretrain/Loss": 2.0015437602996826, "Pretrain/Loss (Raw)": 1.7871074676513672, "Pretrain/Step": 16186, "Pretrain/Step Time": 8.496009474620223} +{"Pretrain/Learning Rate": 2.942407625117133e-06, "Pretrain/Loss": 2.002412796020508, "Pretrain/Loss (Raw)": 1.9594749212265015, "Pretrain/Step": 16187, "Pretrain/Step Time": 8.495868060737848} +{"Pretrain/Learning Rate": 2.940409826018639e-06, "Pretrain/Loss": 2.0043275356292725, "Pretrain/Loss (Raw)": 2.107220411300659, "Pretrain/Step": 16188, "Pretrain/Step Time": 8.496395375579596} +{"Pretrain/Learning Rate": 2.9384126629928845e-06, "Pretrain/Loss": 2.005397319793701, "Pretrain/Loss (Raw)": 1.6475849151611328, "Pretrain/Step": 16189, "Pretrain/Step Time": 8.49539265781641} +{"Pretrain/Learning Rate": 2.9364161360974444e-06, "Pretrain/Loss": 2.006507396697998, "Pretrain/Loss (Raw)": 1.9689353704452515, "Pretrain/Step": 16190, "Pretrain/Step Time": 8.494240259751678} +{"Pretrain/Learning Rate": 2.934420245389888e-06, "Pretrain/Loss": 1.9997891187667847, "Pretrain/Loss (Raw)": 1.3158899545669556, "Pretrain/Step": 16191, "Pretrain/Step Time": 8.496378989890218} +{"Pretrain/Learning Rate": 2.9324249909277733e-06, "Pretrain/Loss": 1.9996823072433472, "Pretrain/Loss (Raw)": 1.9871134757995605, "Pretrain/Step": 16192, "Pretrain/Step Time": 8.494601363316178} +{"Pretrain/Learning Rate": 2.9304303727686222e-06, "Pretrain/Loss": 1.9998743534088135, "Pretrain/Loss (Raw)": 2.1135027408599854, "Pretrain/Step": 16193, "Pretrain/Step Time": 8.499712161719799} +{"Pretrain/Learning Rate": 2.92843639096996e-06, "Pretrain/Loss": 1.9975898265838623, "Pretrain/Loss (Raw)": 1.7808518409729004, "Pretrain/Step": 16194, "Pretrain/Step Time": 8.501651534810662} +{"Pretrain/Learning Rate": 2.926443045589275e-06, "Pretrain/Loss": 1.9961652755737305, "Pretrain/Loss (Raw)": 1.9373873472213745, "Pretrain/Step": 16195, "Pretrain/Step Time": 8.500677874311805} +{"Pretrain/Learning Rate": 2.924450336684037e-06, "Pretrain/Loss": 1.9946660995483398, "Pretrain/Loss (Raw)": 2.0245361328125, "Pretrain/Step": 16196, "Pretrain/Step Time": 8.504928044974804} +{"Pretrain/Learning Rate": 2.922458264311717e-06, "Pretrain/Loss": 1.9930140972137451, "Pretrain/Loss (Raw)": 1.9385899305343628, "Pretrain/Step": 16197, "Pretrain/Step Time": 8.498955486342311} +{"Pretrain/Learning Rate": 2.9204668285297443e-06, "Pretrain/Loss": 1.9885108470916748, "Pretrain/Loss (Raw)": 1.5658196210861206, "Pretrain/Step": 16198, "Pretrain/Step Time": 8.498017443343997} +{"Pretrain/Learning Rate": 2.9184760293955503e-06, "Pretrain/Loss": 1.9877557754516602, "Pretrain/Loss (Raw)": 2.0253567695617676, "Pretrain/Step": 16199, "Pretrain/Step Time": 8.501264618709683} +{"Pretrain/Learning Rate": 2.916485866966534e-06, "Pretrain/Loss": 1.9886070489883423, "Pretrain/Loss (Raw)": 2.133011817932129, "Pretrain/Step": 16200, "Pretrain/Step Time": 8.504492765292525} +{"Pretrain/Learning Rate": 2.914496341300074e-06, "Pretrain/Loss": 1.9871008396148682, "Pretrain/Loss (Raw)": 1.9232406616210938, "Pretrain/Step": 16201, "Pretrain/Step Time": 8.500087849795818} +{"Pretrain/Learning Rate": 2.91250745245355e-06, "Pretrain/Loss": 1.9880493879318237, "Pretrain/Loss (Raw)": 2.0255088806152344, "Pretrain/Step": 16202, "Pretrain/Step Time": 8.502150300890207} +{"Pretrain/Learning Rate": 2.9105192004842963e-06, "Pretrain/Loss": 1.9847650527954102, "Pretrain/Loss (Raw)": 1.8352142572402954, "Pretrain/Step": 16203, "Pretrain/Step Time": 8.500512709841132} +{"Pretrain/Learning Rate": 2.9085315854496533e-06, "Pretrain/Loss": 1.9849034547805786, "Pretrain/Loss (Raw)": 1.9825199842453003, "Pretrain/Step": 16204, "Pretrain/Step Time": 8.498629406094551} +{"Pretrain/Learning Rate": 2.90654460740693e-06, "Pretrain/Loss": 1.982417345046997, "Pretrain/Loss (Raw)": 1.813224196434021, "Pretrain/Step": 16205, "Pretrain/Step Time": 8.499869169667363} +{"Pretrain/Learning Rate": 2.9045582664134123e-06, "Pretrain/Loss": 1.9798731803894043, "Pretrain/Loss (Raw)": 1.8472689390182495, "Pretrain/Step": 16206, "Pretrain/Step Time": 8.497515503317118} +{"Pretrain/Learning Rate": 2.902572562526387e-06, "Pretrain/Loss": 1.9771502017974854, "Pretrain/Loss (Raw)": 1.7974778413772583, "Pretrain/Step": 16207, "Pretrain/Step Time": 8.496331881731749} +{"Pretrain/Learning Rate": 2.9005874958030976e-06, "Pretrain/Loss": 1.976008415222168, "Pretrain/Loss (Raw)": 1.9700266122817993, "Pretrain/Step": 16208, "Pretrain/Step Time": 8.495115442201495} +{"Pretrain/Learning Rate": 2.8986030663007954e-06, "Pretrain/Loss": 1.9789295196533203, "Pretrain/Loss (Raw)": 2.034323215484619, "Pretrain/Step": 16209, "Pretrain/Step Time": 8.496321260929108} +{"Pretrain/Learning Rate": 2.8966192740766922e-06, "Pretrain/Loss": 1.9778082370758057, "Pretrain/Loss (Raw)": 1.8138452768325806, "Pretrain/Step": 16210, "Pretrain/Step Time": 8.49728536605835} +{"Pretrain/Learning Rate": 2.894636119187985e-06, "Pretrain/Loss": 1.9785709381103516, "Pretrain/Loss (Raw)": 2.047396659851074, "Pretrain/Step": 16211, "Pretrain/Step Time": 8.503157844766974} +{"Pretrain/Learning Rate": 2.892653601691869e-06, "Pretrain/Loss": 1.980691909790039, "Pretrain/Loss (Raw)": 2.1263840198516846, "Pretrain/Step": 16212, "Pretrain/Step Time": 8.499006984755397} +{"Pretrain/Learning Rate": 2.8906717216454937e-06, "Pretrain/Loss": 1.9806089401245117, "Pretrain/Loss (Raw)": 2.164799690246582, "Pretrain/Step": 16213, "Pretrain/Step Time": 8.502580719068646} +{"Pretrain/Learning Rate": 2.888690479106021e-06, "Pretrain/Loss": 1.9788787364959717, "Pretrain/Loss (Raw)": 1.7265652418136597, "Pretrain/Step": 16214, "Pretrain/Step Time": 8.498636046424508} +{"Pretrain/Learning Rate": 2.886709874130569e-06, "Pretrain/Loss": 1.979356288909912, "Pretrain/Loss (Raw)": 2.130234956741333, "Pretrain/Step": 16215, "Pretrain/Step Time": 8.49927425570786} +{"Pretrain/Learning Rate": 2.8847299067762455e-06, "Pretrain/Loss": 1.9822511672973633, "Pretrain/Loss (Raw)": 2.014991044998169, "Pretrain/Step": 16216, "Pretrain/Step Time": 8.498623698949814} +{"Pretrain/Learning Rate": 2.882750577100149e-06, "Pretrain/Loss": 1.9810402393341064, "Pretrain/Loss (Raw)": 1.9289344549179077, "Pretrain/Step": 16217, "Pretrain/Step Time": 8.498341338708997} +{"Pretrain/Learning Rate": 2.8807718851593447e-06, "Pretrain/Loss": 1.980060338973999, "Pretrain/Loss (Raw)": 2.0426318645477295, "Pretrain/Step": 16218, "Pretrain/Step Time": 8.496261222288013} +{"Pretrain/Learning Rate": 2.8787938310108925e-06, "Pretrain/Loss": 1.9812650680541992, "Pretrain/Loss (Raw)": 2.368767738342285, "Pretrain/Step": 16219, "Pretrain/Step Time": 8.498175635933876} +{"Pretrain/Learning Rate": 2.8768164147118276e-06, "Pretrain/Loss": 1.9819647073745728, "Pretrain/Loss (Raw)": 2.0720560550689697, "Pretrain/Step": 16220, "Pretrain/Step Time": 8.49678555317223} +{"Pretrain/Learning Rate": 2.8748396363191597e-06, "Pretrain/Loss": 1.9832603931427002, "Pretrain/Loss (Raw)": 2.1267082691192627, "Pretrain/Step": 16221, "Pretrain/Step Time": 8.496860064566135} +{"Pretrain/Learning Rate": 2.872863495889899e-06, "Pretrain/Loss": 1.983248233795166, "Pretrain/Loss (Raw)": 1.9957146644592285, "Pretrain/Step": 16222, "Pretrain/Step Time": 8.494922934100032} +{"Pretrain/Learning Rate": 2.870887993481014e-06, "Pretrain/Loss": 1.981705665588379, "Pretrain/Loss (Raw)": 1.8019659519195557, "Pretrain/Step": 16223, "Pretrain/Step Time": 8.491643004119396} +{"Pretrain/Learning Rate": 2.868913129149481e-06, "Pretrain/Loss": 1.9807167053222656, "Pretrain/Loss (Raw)": 1.9512176513671875, "Pretrain/Step": 16224, "Pretrain/Step Time": 8.491598192602396} +{"Pretrain/Learning Rate": 2.8669389029522377e-06, "Pretrain/Loss": 1.9823784828186035, "Pretrain/Loss (Raw)": 2.1970388889312744, "Pretrain/Step": 16225, "Pretrain/Step Time": 8.498089142143726} +{"Pretrain/Learning Rate": 2.8649653149461996e-06, "Pretrain/Loss": 1.9834479093551636, "Pretrain/Loss (Raw)": 2.0406606197357178, "Pretrain/Step": 16226, "Pretrain/Step Time": 8.49942304380238} +{"Pretrain/Learning Rate": 2.8629923651882883e-06, "Pretrain/Loss": 1.9848198890686035, "Pretrain/Loss (Raw)": 2.0603296756744385, "Pretrain/Step": 16227, "Pretrain/Step Time": 8.496896900236607} +{"Pretrain/Learning Rate": 2.861020053735383e-06, "Pretrain/Loss": 1.984632968902588, "Pretrain/Loss (Raw)": 2.012620449066162, "Pretrain/Step": 16228, "Pretrain/Step Time": 8.49751896224916} +{"Pretrain/Learning Rate": 2.8590483806443636e-06, "Pretrain/Loss": 1.9817900657653809, "Pretrain/Loss (Raw)": 1.686700463294983, "Pretrain/Step": 16229, "Pretrain/Step Time": 8.503476729616523} +{"Pretrain/Learning Rate": 2.857077345972073e-06, "Pretrain/Loss": 1.9805598258972168, "Pretrain/Loss (Raw)": 1.9545371532440186, "Pretrain/Step": 16230, "Pretrain/Step Time": 8.502374107018113} +{"Pretrain/Learning Rate": 2.8551069497753436e-06, "Pretrain/Loss": 1.982895851135254, "Pretrain/Loss (Raw)": 1.9967693090438843, "Pretrain/Step": 16231, "Pretrain/Step Time": 8.501293249428272} +{"Pretrain/Learning Rate": 2.8531371921109995e-06, "Pretrain/Loss": 1.9811017513275146, "Pretrain/Loss (Raw)": 1.8220351934432983, "Pretrain/Step": 16232, "Pretrain/Step Time": 8.50080700777471} +{"Pretrain/Learning Rate": 2.8511680730358287e-06, "Pretrain/Loss": 1.9794689416885376, "Pretrain/Loss (Raw)": 1.8084053993225098, "Pretrain/Step": 16233, "Pretrain/Step Time": 8.503131216391921} +{"Pretrain/Learning Rate": 2.849199592606613e-06, "Pretrain/Loss": 1.9788395166397095, "Pretrain/Loss (Raw)": 1.905924677848816, "Pretrain/Step": 16234, "Pretrain/Step Time": 8.500309973955154} +{"Pretrain/Learning Rate": 2.8472317508801166e-06, "Pretrain/Loss": 1.9773725271224976, "Pretrain/Loss (Raw)": 1.8229243755340576, "Pretrain/Step": 16235, "Pretrain/Step Time": 8.497094973921776} +{"Pretrain/Learning Rate": 2.845264547913068e-06, "Pretrain/Loss": 1.978549599647522, "Pretrain/Loss (Raw)": 1.881678819656372, "Pretrain/Step": 16236, "Pretrain/Step Time": 8.497253980487585} +{"Pretrain/Learning Rate": 2.8432979837622055e-06, "Pretrain/Loss": 1.9791395664215088, "Pretrain/Loss (Raw)": 1.8469345569610596, "Pretrain/Step": 16237, "Pretrain/Step Time": 8.499072702601552} +{"Pretrain/Learning Rate": 2.841332058484217e-06, "Pretrain/Loss": 1.9800012111663818, "Pretrain/Loss (Raw)": 2.0785462856292725, "Pretrain/Step": 16238, "Pretrain/Step Time": 8.494114911183715} +{"Pretrain/Learning Rate": 2.839366772135807e-06, "Pretrain/Loss": 1.9800143241882324, "Pretrain/Loss (Raw)": 1.9800009727478027, "Pretrain/Step": 16239, "Pretrain/Step Time": 8.494510950520635} +{"Pretrain/Learning Rate": 2.8374021247736306e-06, "Pretrain/Loss": 1.9817922115325928, "Pretrain/Loss (Raw)": 1.9917570352554321, "Pretrain/Step": 16240, "Pretrain/Step Time": 8.492907784879208} +{"Pretrain/Learning Rate": 2.8354381164543393e-06, "Pretrain/Loss": 1.9815185070037842, "Pretrain/Loss (Raw)": 1.9976269006729126, "Pretrain/Step": 16241, "Pretrain/Step Time": 8.495376890525222} +{"Pretrain/Learning Rate": 2.833474747234566e-06, "Pretrain/Loss": 1.985360026359558, "Pretrain/Loss (Raw)": 2.182321071624756, "Pretrain/Step": 16242, "Pretrain/Step Time": 8.495813651010394} +{"Pretrain/Learning Rate": 2.8315120171709204e-06, "Pretrain/Loss": 1.9844683408737183, "Pretrain/Loss (Raw)": 1.8875960111618042, "Pretrain/Step": 16243, "Pretrain/Step Time": 8.497269170358777} +{"Pretrain/Learning Rate": 2.829549926319999e-06, "Pretrain/Loss": 1.9866727590560913, "Pretrain/Loss (Raw)": 1.8789745569229126, "Pretrain/Step": 16244, "Pretrain/Step Time": 8.500249354168773} +{"Pretrain/Learning Rate": 2.8275884747383795e-06, "Pretrain/Loss": 1.986952543258667, "Pretrain/Loss (Raw)": 1.9583394527435303, "Pretrain/Step": 16245, "Pretrain/Step Time": 8.501859767362475} +{"Pretrain/Learning Rate": 2.8256276624826104e-06, "Pretrain/Loss": 1.988768219947815, "Pretrain/Loss (Raw)": 2.0776631832122803, "Pretrain/Step": 16246, "Pretrain/Step Time": 8.501558935269713} +{"Pretrain/Learning Rate": 2.8236674896092385e-06, "Pretrain/Loss": 1.9880681037902832, "Pretrain/Loss (Raw)": 2.0193240642547607, "Pretrain/Step": 16247, "Pretrain/Step Time": 8.493058623746037} +{"Pretrain/Learning Rate": 2.8217079561747794e-06, "Pretrain/Loss": 1.9889521598815918, "Pretrain/Loss (Raw)": 1.9435001611709595, "Pretrain/Step": 16248, "Pretrain/Step Time": 8.49586739577353} +{"Pretrain/Learning Rate": 2.819749062235741e-06, "Pretrain/Loss": 1.991034984588623, "Pretrain/Loss (Raw)": 2.143921136856079, "Pretrain/Step": 16249, "Pretrain/Step Time": 8.49201045744121} +{"Pretrain/Learning Rate": 2.817790807848594e-06, "Pretrain/Loss": 1.9912595748901367, "Pretrain/Loss (Raw)": 2.071190118789673, "Pretrain/Step": 16250, "Pretrain/Step Time": 8.495427062734962} +{"Pretrain/Learning Rate": 2.8158331930698224e-06, "Pretrain/Loss": 1.9893608093261719, "Pretrain/Loss (Raw)": 1.8657463788986206, "Pretrain/Step": 16251, "Pretrain/Step Time": 8.494348825886846} +{"Pretrain/Learning Rate": 2.8138762179558575e-06, "Pretrain/Loss": 1.9877617359161377, "Pretrain/Loss (Raw)": 1.9009997844696045, "Pretrain/Step": 16252, "Pretrain/Step Time": 8.49377035535872} +{"Pretrain/Learning Rate": 2.811919882563127e-06, "Pretrain/Loss": 1.9865543842315674, "Pretrain/Loss (Raw)": 1.9060357809066772, "Pretrain/Step": 16253, "Pretrain/Step Time": 8.494979716837406} +{"Pretrain/Learning Rate": 2.8099641869480527e-06, "Pretrain/Loss": 1.9854509830474854, "Pretrain/Loss (Raw)": 2.048184633255005, "Pretrain/Step": 16254, "Pretrain/Step Time": 8.495869468897581} +{"Pretrain/Learning Rate": 2.808009131167011e-06, "Pretrain/Loss": 1.9825694561004639, "Pretrain/Loss (Raw)": 1.7217093706130981, "Pretrain/Step": 16255, "Pretrain/Step Time": 8.499316483736038} +{"Pretrain/Learning Rate": 2.8060547152763905e-06, "Pretrain/Loss": 1.985048532485962, "Pretrain/Loss (Raw)": 2.210563898086548, "Pretrain/Step": 16256, "Pretrain/Step Time": 8.497852241620421} +{"Pretrain/Learning Rate": 2.8041009393325296e-06, "Pretrain/Loss": 1.984686017036438, "Pretrain/Loss (Raw)": 1.9320297241210938, "Pretrain/Step": 16257, "Pretrain/Step Time": 8.4954150095582} +{"Pretrain/Learning Rate": 2.802147803391775e-06, "Pretrain/Loss": 1.9847042560577393, "Pretrain/Loss (Raw)": 1.9113163948059082, "Pretrain/Step": 16258, "Pretrain/Step Time": 8.493143105879426} +{"Pretrain/Learning Rate": 2.8001953075104393e-06, "Pretrain/Loss": 1.9860538244247437, "Pretrain/Loss (Raw)": 2.083796262741089, "Pretrain/Step": 16259, "Pretrain/Step Time": 8.491996737197042} +{"Pretrain/Learning Rate": 2.7982434517448167e-06, "Pretrain/Loss": 1.986467957496643, "Pretrain/Loss (Raw)": 2.100104808807373, "Pretrain/Step": 16260, "Pretrain/Step Time": 8.494012236595154} +{"Pretrain/Learning Rate": 2.7962922361511988e-06, "Pretrain/Loss": 1.9871927499771118, "Pretrain/Loss (Raw)": 2.059004545211792, "Pretrain/Step": 16261, "Pretrain/Step Time": 8.49543085321784} +{"Pretrain/Learning Rate": 2.7943416607858374e-06, "Pretrain/Loss": 1.987572193145752, "Pretrain/Loss (Raw)": 2.0387959480285645, "Pretrain/Step": 16262, "Pretrain/Step Time": 8.497730437666178} +{"Pretrain/Learning Rate": 2.7923917257049848e-06, "Pretrain/Loss": 1.988464117050171, "Pretrain/Loss (Raw)": 2.2082576751708984, "Pretrain/Step": 16263, "Pretrain/Step Time": 8.499002182856202} +{"Pretrain/Learning Rate": 2.79044243096486e-06, "Pretrain/Loss": 1.9869358539581299, "Pretrain/Loss (Raw)": 1.8747661113739014, "Pretrain/Step": 16264, "Pretrain/Step Time": 8.503313761204481} +{"Pretrain/Learning Rate": 2.7884937766216675e-06, "Pretrain/Loss": 1.9876580238342285, "Pretrain/Loss (Raw)": 2.215526819229126, "Pretrain/Step": 16265, "Pretrain/Step Time": 8.499891912564635} +{"Pretrain/Learning Rate": 2.7865457627316045e-06, "Pretrain/Loss": 1.9852445125579834, "Pretrain/Loss (Raw)": 1.7632249593734741, "Pretrain/Step": 16266, "Pretrain/Step Time": 8.504173684865236} +{"Pretrain/Learning Rate": 2.7845983893508287e-06, "Pretrain/Loss": 1.9840699434280396, "Pretrain/Loss (Raw)": 1.9389441013336182, "Pretrain/Step": 16267, "Pretrain/Step Time": 8.506476121023297} +{"Pretrain/Learning Rate": 2.782651656535501e-06, "Pretrain/Loss": 1.9851566553115845, "Pretrain/Loss (Raw)": 2.1368424892425537, "Pretrain/Step": 16268, "Pretrain/Step Time": 8.505342982709408} +{"Pretrain/Learning Rate": 2.780705564341754e-06, "Pretrain/Loss": 1.9850499629974365, "Pretrain/Loss (Raw)": 2.138651132583618, "Pretrain/Step": 16269, "Pretrain/Step Time": 8.506219405680895} +{"Pretrain/Learning Rate": 2.77876011282569e-06, "Pretrain/Loss": 1.987683653831482, "Pretrain/Loss (Raw)": 2.290179967880249, "Pretrain/Step": 16270, "Pretrain/Step Time": 8.505019599571824} +{"Pretrain/Learning Rate": 2.7768153020434202e-06, "Pretrain/Loss": 1.9878277778625488, "Pretrain/Loss (Raw)": 1.8379337787628174, "Pretrain/Step": 16271, "Pretrain/Step Time": 8.501047963276505} +{"Pretrain/Learning Rate": 2.7748711320510102e-06, "Pretrain/Loss": 1.9891579151153564, "Pretrain/Loss (Raw)": 2.2728421688079834, "Pretrain/Step": 16272, "Pretrain/Step Time": 8.499968443065882} +{"Pretrain/Learning Rate": 2.7729276029045293e-06, "Pretrain/Loss": 1.9919239282608032, "Pretrain/Loss (Raw)": 2.0903749465942383, "Pretrain/Step": 16273, "Pretrain/Step Time": 8.500740630552173} +{"Pretrain/Learning Rate": 2.7709847146600102e-06, "Pretrain/Loss": 1.9891788959503174, "Pretrain/Loss (Raw)": 1.9618475437164307, "Pretrain/Step": 16274, "Pretrain/Step Time": 8.502102702856064} +{"Pretrain/Learning Rate": 2.76904246737347e-06, "Pretrain/Loss": 1.9873257875442505, "Pretrain/Loss (Raw)": 1.9780431985855103, "Pretrain/Step": 16275, "Pretrain/Step Time": 8.497695257887244} +{"Pretrain/Learning Rate": 2.7671008611009267e-06, "Pretrain/Loss": 1.988311767578125, "Pretrain/Loss (Raw)": 1.966288447380066, "Pretrain/Step": 16276, "Pretrain/Step Time": 8.498857190832496} +{"Pretrain/Learning Rate": 2.7651598958983506e-06, "Pretrain/Loss": 1.9912711381912231, "Pretrain/Loss (Raw)": 2.090320587158203, "Pretrain/Step": 16277, "Pretrain/Step Time": 8.499768985435367} +{"Pretrain/Learning Rate": 2.763219571821718e-06, "Pretrain/Loss": 1.9882588386535645, "Pretrain/Loss (Raw)": 1.7000442743301392, "Pretrain/Step": 16278, "Pretrain/Step Time": 8.49957443960011} +{"Pretrain/Learning Rate": 2.761279888926974e-06, "Pretrain/Loss": 1.9896306991577148, "Pretrain/Loss (Raw)": 2.125863552093506, "Pretrain/Step": 16279, "Pretrain/Step Time": 8.502209108322859} +{"Pretrain/Learning Rate": 2.759340847270042e-06, "Pretrain/Loss": 1.986240267753601, "Pretrain/Loss (Raw)": 2.044083833694458, "Pretrain/Step": 16280, "Pretrain/Step Time": 8.50392186269164} +{"Pretrain/Learning Rate": 2.7574024469068456e-06, "Pretrain/Loss": 1.9866480827331543, "Pretrain/Loss (Raw)": 2.1505212783813477, "Pretrain/Step": 16281, "Pretrain/Step Time": 8.500771755352616} +{"Pretrain/Learning Rate": 2.755464687893261e-06, "Pretrain/Loss": 1.9858908653259277, "Pretrain/Loss (Raw)": 1.9359052181243896, "Pretrain/Step": 16282, "Pretrain/Step Time": 8.49612077511847} +{"Pretrain/Learning Rate": 2.7535275702851776e-06, "Pretrain/Loss": 1.9848573207855225, "Pretrain/Loss (Raw)": 1.9054630994796753, "Pretrain/Step": 16283, "Pretrain/Step Time": 8.498082986101508} +{"Pretrain/Learning Rate": 2.7515910941384447e-06, "Pretrain/Loss": 1.9840056896209717, "Pretrain/Loss (Raw)": 2.0053505897521973, "Pretrain/Step": 16284, "Pretrain/Step Time": 8.500504551455379} +{"Pretrain/Learning Rate": 2.7496552595088933e-06, "Pretrain/Loss": 1.9804751873016357, "Pretrain/Loss (Raw)": 1.8354640007019043, "Pretrain/Step": 16285, "Pretrain/Step Time": 8.50063270330429} +{"Pretrain/Learning Rate": 2.74772006645235e-06, "Pretrain/Loss": 1.9800177812576294, "Pretrain/Loss (Raw)": 1.9230458736419678, "Pretrain/Step": 16286, "Pretrain/Step Time": 8.502477772533894} +{"Pretrain/Learning Rate": 2.745785515024607e-06, "Pretrain/Loss": 1.977644443511963, "Pretrain/Loss (Raw)": 1.702758550643921, "Pretrain/Step": 16287, "Pretrain/Step Time": 8.501283535733819} +{"Pretrain/Learning Rate": 2.7438516052814582e-06, "Pretrain/Loss": 1.9759384393692017, "Pretrain/Loss (Raw)": 1.7265359163284302, "Pretrain/Step": 16288, "Pretrain/Step Time": 8.502993503585458} +{"Pretrain/Learning Rate": 2.7419183372786568e-06, "Pretrain/Loss": 1.9731786251068115, "Pretrain/Loss (Raw)": 1.972001075744629, "Pretrain/Step": 16289, "Pretrain/Step Time": 8.498567143455148} +{"Pretrain/Learning Rate": 2.7399857110719436e-06, "Pretrain/Loss": 1.974429965019226, "Pretrain/Loss (Raw)": 2.1850247383117676, "Pretrain/Step": 16290, "Pretrain/Step Time": 8.497726174071431} +{"Pretrain/Learning Rate": 2.7380537267170576e-06, "Pretrain/Loss": 1.9752869606018066, "Pretrain/Loss (Raw)": 1.9581414461135864, "Pretrain/Step": 16291, "Pretrain/Step Time": 8.502000598236918} +{"Pretrain/Learning Rate": 2.7361223842696905e-06, "Pretrain/Loss": 1.9746865034103394, "Pretrain/Loss (Raw)": 1.8407748937606812, "Pretrain/Step": 16292, "Pretrain/Step Time": 8.503565646708012} +{"Pretrain/Learning Rate": 2.7341916837855473e-06, "Pretrain/Loss": 1.9763123989105225, "Pretrain/Loss (Raw)": 2.201169013977051, "Pretrain/Step": 16293, "Pretrain/Step Time": 8.498493308201432} +{"Pretrain/Learning Rate": 2.73226162532029e-06, "Pretrain/Loss": 1.9745153188705444, "Pretrain/Loss (Raw)": 2.0243382453918457, "Pretrain/Step": 16294, "Pretrain/Step Time": 8.4988494515419} +{"Pretrain/Learning Rate": 2.7303322089295647e-06, "Pretrain/Loss": 1.9746975898742676, "Pretrain/Loss (Raw)": 1.9380563497543335, "Pretrain/Step": 16295, "Pretrain/Step Time": 8.495712120085955} +{"Pretrain/Learning Rate": 2.7284034346690162e-06, "Pretrain/Loss": 1.9755802154541016, "Pretrain/Loss (Raw)": 2.0667929649353027, "Pretrain/Step": 16296, "Pretrain/Step Time": 8.499445140361786} +{"Pretrain/Learning Rate": 2.7264753025942504e-06, "Pretrain/Loss": 1.9762367010116577, "Pretrain/Loss (Raw)": 2.1384308338165283, "Pretrain/Step": 16297, "Pretrain/Step Time": 8.49763580225408} +{"Pretrain/Learning Rate": 2.724547812760872e-06, "Pretrain/Loss": 1.9761298894882202, "Pretrain/Loss (Raw)": 1.8945170640945435, "Pretrain/Step": 16298, "Pretrain/Step Time": 8.50316684693098} +{"Pretrain/Learning Rate": 2.7226209652244537e-06, "Pretrain/Loss": 1.9739958047866821, "Pretrain/Loss (Raw)": 1.7237566709518433, "Pretrain/Step": 16299, "Pretrain/Step Time": 8.499209461733699} +{"Pretrain/Learning Rate": 2.7206947600405514e-06, "Pretrain/Loss": 1.9725089073181152, "Pretrain/Loss (Raw)": 1.9151228666305542, "Pretrain/Step": 16300, "Pretrain/Step Time": 8.50108670629561} +{"Pretrain/Learning Rate": 2.7187691972647144e-06, "Pretrain/Loss": 1.9724831581115723, "Pretrain/Loss (Raw)": 1.8242236375808716, "Pretrain/Step": 16301, "Pretrain/Step Time": 8.496273884549737} +{"Pretrain/Learning Rate": 2.7168442769524543e-06, "Pretrain/Loss": 1.974968671798706, "Pretrain/Loss (Raw)": 2.065473794937134, "Pretrain/Step": 16302, "Pretrain/Step Time": 8.49770875647664} +{"Pretrain/Learning Rate": 2.714919999159285e-06, "Pretrain/Loss": 1.9758038520812988, "Pretrain/Loss (Raw)": 2.0755231380462646, "Pretrain/Step": 16303, "Pretrain/Step Time": 8.497390309348702} +{"Pretrain/Learning Rate": 2.7129963639406895e-06, "Pretrain/Loss": 1.9763808250427246, "Pretrain/Loss (Raw)": 2.0500402450561523, "Pretrain/Step": 16304, "Pretrain/Step Time": 8.498702879995108} +{"Pretrain/Learning Rate": 2.7110733713521296e-06, "Pretrain/Loss": 1.9758741855621338, "Pretrain/Loss (Raw)": 1.9253671169281006, "Pretrain/Step": 16305, "Pretrain/Step Time": 8.489641536027193} +{"Pretrain/Learning Rate": 2.709151021449058e-06, "Pretrain/Loss": 1.9735721349716187, "Pretrain/Loss (Raw)": 2.041619062423706, "Pretrain/Step": 16306, "Pretrain/Step Time": 8.491874247789383} +{"Pretrain/Learning Rate": 2.7072293142868993e-06, "Pretrain/Loss": 1.9718031883239746, "Pretrain/Loss (Raw)": 1.8334839344024658, "Pretrain/Step": 16307, "Pretrain/Step Time": 8.492361754179} +{"Pretrain/Learning Rate": 2.7053082499210707e-06, "Pretrain/Loss": 1.9738527536392212, "Pretrain/Loss (Raw)": 2.1095592975616455, "Pretrain/Step": 16308, "Pretrain/Step Time": 8.487164137884974} +{"Pretrain/Learning Rate": 2.7033878284069643e-06, "Pretrain/Loss": 1.9752953052520752, "Pretrain/Loss (Raw)": 2.2072594165802, "Pretrain/Step": 16309, "Pretrain/Step Time": 8.491675967350602} +{"Pretrain/Learning Rate": 2.7014680497999463e-06, "Pretrain/Loss": 1.9749490022659302, "Pretrain/Loss (Raw)": 2.0230438709259033, "Pretrain/Step": 16310, "Pretrain/Step Time": 8.488617425784469} +{"Pretrain/Learning Rate": 2.699548914155384e-06, "Pretrain/Loss": 1.9742103815078735, "Pretrain/Loss (Raw)": 2.0729269981384277, "Pretrain/Step": 16311, "Pretrain/Step Time": 8.489304969087243} +{"Pretrain/Learning Rate": 2.6976304215285993e-06, "Pretrain/Loss": 1.9721256494522095, "Pretrain/Loss (Raw)": 2.0201416015625, "Pretrain/Step": 16312, "Pretrain/Step Time": 8.493637695908546} +{"Pretrain/Learning Rate": 2.695712571974929e-06, "Pretrain/Loss": 1.9743496179580688, "Pretrain/Loss (Raw)": 1.9318662881851196, "Pretrain/Step": 16313, "Pretrain/Step Time": 8.489157393574715} +{"Pretrain/Learning Rate": 2.693795365549653e-06, "Pretrain/Loss": 1.9754945039749146, "Pretrain/Loss (Raw)": 1.933652400970459, "Pretrain/Step": 16314, "Pretrain/Step Time": 8.489225344732404} +{"Pretrain/Learning Rate": 2.691878802308073e-06, "Pretrain/Loss": 1.9771300554275513, "Pretrain/Loss (Raw)": 2.168826103210449, "Pretrain/Step": 16315, "Pretrain/Step Time": 8.49293651431799} +{"Pretrain/Learning Rate": 2.6899628823054383e-06, "Pretrain/Loss": 1.9788678884506226, "Pretrain/Loss (Raw)": 2.3296687602996826, "Pretrain/Step": 16316, "Pretrain/Step Time": 8.494813518598676} +{"Pretrain/Learning Rate": 2.688047605596991e-06, "Pretrain/Loss": 1.9812120199203491, "Pretrain/Loss (Raw)": 1.9476293325424194, "Pretrain/Step": 16317, "Pretrain/Step Time": 8.490753401070833} +{"Pretrain/Learning Rate": 2.6861329722379703e-06, "Pretrain/Loss": 1.9817354679107666, "Pretrain/Loss (Raw)": 2.0359554290771484, "Pretrain/Step": 16318, "Pretrain/Step Time": 8.491408376023173} +{"Pretrain/Learning Rate": 2.6842189822835677e-06, "Pretrain/Loss": 1.9870822429656982, "Pretrain/Loss (Raw)": 2.0002663135528564, "Pretrain/Step": 16319, "Pretrain/Step Time": 8.490644428879023} +{"Pretrain/Learning Rate": 2.682305635788984e-06, "Pretrain/Loss": 1.9864015579223633, "Pretrain/Loss (Raw)": 1.8999842405319214, "Pretrain/Step": 16320, "Pretrain/Step Time": 8.491571735590696} +{"Pretrain/Learning Rate": 2.6803929328093836e-06, "Pretrain/Loss": 1.9851775169372559, "Pretrain/Loss (Raw)": 1.9568276405334473, "Pretrain/Step": 16321, "Pretrain/Step Time": 8.484917482361197} +{"Pretrain/Learning Rate": 2.6784808733999163e-06, "Pretrain/Loss": 1.9887840747833252, "Pretrain/Loss (Raw)": 2.2424983978271484, "Pretrain/Step": 16322, "Pretrain/Step Time": 8.485182458534837} +{"Pretrain/Learning Rate": 2.6765694576157214e-06, "Pretrain/Loss": 1.988929271697998, "Pretrain/Loss (Raw)": 1.9559540748596191, "Pretrain/Step": 16323, "Pretrain/Step Time": 8.484357530251145} +{"Pretrain/Learning Rate": 2.674658685511902e-06, "Pretrain/Loss": 1.9870902299880981, "Pretrain/Loss (Raw)": 1.789150595664978, "Pretrain/Step": 16324, "Pretrain/Step Time": 8.48558278940618} +{"Pretrain/Learning Rate": 2.672748557143567e-06, "Pretrain/Loss": 1.9861854314804077, "Pretrain/Loss (Raw)": 1.8227638006210327, "Pretrain/Step": 16325, "Pretrain/Step Time": 8.487380040809512} +{"Pretrain/Learning Rate": 2.6708390725657894e-06, "Pretrain/Loss": 1.989823818206787, "Pretrain/Loss (Raw)": 2.0315511226654053, "Pretrain/Step": 16326, "Pretrain/Step Time": 8.480525761842728} +{"Pretrain/Learning Rate": 2.668930231833622e-06, "Pretrain/Loss": 1.987879991531372, "Pretrain/Loss (Raw)": 1.776528239250183, "Pretrain/Step": 16327, "Pretrain/Step Time": 8.483227226883173} +{"Pretrain/Learning Rate": 2.6670220350021117e-06, "Pretrain/Loss": 1.9866101741790771, "Pretrain/Loss (Raw)": 1.9704853296279907, "Pretrain/Step": 16328, "Pretrain/Step Time": 8.484502878040075} +{"Pretrain/Learning Rate": 2.6651144821262714e-06, "Pretrain/Loss": 1.9885468482971191, "Pretrain/Loss (Raw)": 2.1711339950561523, "Pretrain/Step": 16329, "Pretrain/Step Time": 8.484248215332627} +{"Pretrain/Learning Rate": 2.6632075732611174e-06, "Pretrain/Loss": 1.9879639148712158, "Pretrain/Loss (Raw)": 1.950895071029663, "Pretrain/Step": 16330, "Pretrain/Step Time": 8.483325129374862} +{"Pretrain/Learning Rate": 2.6613013084616252e-06, "Pretrain/Loss": 1.9904711246490479, "Pretrain/Loss (Raw)": 2.156137466430664, "Pretrain/Step": 16331, "Pretrain/Step Time": 8.487709047272801} +{"Pretrain/Learning Rate": 2.6593956877827563e-06, "Pretrain/Loss": 1.9917962551116943, "Pretrain/Loss (Raw)": 2.1521379947662354, "Pretrain/Step": 16332, "Pretrain/Step Time": 8.488754153251648} +{"Pretrain/Learning Rate": 2.65749071127947e-06, "Pretrain/Loss": 1.9939768314361572, "Pretrain/Loss (Raw)": 2.0923211574554443, "Pretrain/Step": 16333, "Pretrain/Step Time": 8.49102121219039} +{"Pretrain/Learning Rate": 2.6555863790066834e-06, "Pretrain/Loss": 1.9959973096847534, "Pretrain/Loss (Raw)": 2.105909585952759, "Pretrain/Step": 16334, "Pretrain/Step Time": 8.490927273407578} +{"Pretrain/Learning Rate": 2.6536826910193184e-06, "Pretrain/Loss": 1.9980010986328125, "Pretrain/Loss (Raw)": 2.0539567470550537, "Pretrain/Step": 16335, "Pretrain/Step Time": 8.492756642401218} +{"Pretrain/Learning Rate": 2.651779647372257e-06, "Pretrain/Loss": 1.9976556301116943, "Pretrain/Loss (Raw)": 1.9258043766021729, "Pretrain/Step": 16336, "Pretrain/Step Time": 8.489342907443643} +{"Pretrain/Learning Rate": 2.649877248120372e-06, "Pretrain/Loss": 1.9974193572998047, "Pretrain/Loss (Raw)": 2.004084825515747, "Pretrain/Step": 16337, "Pretrain/Step Time": 8.49019586108625} +{"Pretrain/Learning Rate": 2.647975493318525e-06, "Pretrain/Loss": 2.0019593238830566, "Pretrain/Loss (Raw)": 2.3949756622314453, "Pretrain/Step": 16338, "Pretrain/Step Time": 8.492545682936907} +{"Pretrain/Learning Rate": 2.6460743830215433e-06, "Pretrain/Loss": 2.0013840198516846, "Pretrain/Loss (Raw)": 1.9737372398376465, "Pretrain/Step": 16339, "Pretrain/Step Time": 8.486149832606316} +{"Pretrain/Learning Rate": 2.644173917284257e-06, "Pretrain/Loss": 2.0047531127929688, "Pretrain/Loss (Raw)": 2.557644844055176, "Pretrain/Step": 16340, "Pretrain/Step Time": 8.487562354654074} +{"Pretrain/Learning Rate": 2.6422740961614455e-06, "Pretrain/Loss": 2.0049993991851807, "Pretrain/Loss (Raw)": 2.1962947845458984, "Pretrain/Step": 16341, "Pretrain/Step Time": 8.483812922611833} +{"Pretrain/Learning Rate": 2.640374919707905e-06, "Pretrain/Loss": 2.008084297180176, "Pretrain/Loss (Raw)": 2.1214423179626465, "Pretrain/Step": 16342, "Pretrain/Step Time": 8.482848750427365} +{"Pretrain/Learning Rate": 2.638476387978392e-06, "Pretrain/Loss": 2.0053329467773438, "Pretrain/Loss (Raw)": 1.7780835628509521, "Pretrain/Step": 16343, "Pretrain/Step Time": 8.485785925760865} +{"Pretrain/Learning Rate": 2.636578501027645e-06, "Pretrain/Loss": 2.0045793056488037, "Pretrain/Loss (Raw)": 1.9185043573379517, "Pretrain/Step": 16344, "Pretrain/Step Time": 8.483132872730494} +{"Pretrain/Learning Rate": 2.634681258910393e-06, "Pretrain/Loss": 2.0051872730255127, "Pretrain/Loss (Raw)": 2.0067508220672607, "Pretrain/Step": 16345, "Pretrain/Step Time": 8.481789017096162} +{"Pretrain/Learning Rate": 2.632784661681337e-06, "Pretrain/Loss": 2.0039870738983154, "Pretrain/Loss (Raw)": 1.8890061378479004, "Pretrain/Step": 16346, "Pretrain/Step Time": 8.484719077125192} +{"Pretrain/Learning Rate": 2.630888709395174e-06, "Pretrain/Loss": 2.000795364379883, "Pretrain/Loss (Raw)": 1.960228443145752, "Pretrain/Step": 16347, "Pretrain/Step Time": 8.480255408212543} +{"Pretrain/Learning Rate": 2.6289934021065637e-06, "Pretrain/Loss": 1.9977740049362183, "Pretrain/Loss (Raw)": 1.6853320598602295, "Pretrain/Step": 16348, "Pretrain/Step Time": 8.488105982542038} +{"Pretrain/Learning Rate": 2.627098739870154e-06, "Pretrain/Loss": 1.995823621749878, "Pretrain/Loss (Raw)": 1.8770538568496704, "Pretrain/Step": 16349, "Pretrain/Step Time": 8.489566285163164} +{"Pretrain/Learning Rate": 2.6252047227405845e-06, "Pretrain/Loss": 1.995910882949829, "Pretrain/Loss (Raw)": 2.006894588470459, "Pretrain/Step": 16350, "Pretrain/Step Time": 8.489871734753251} +{"Pretrain/Learning Rate": 2.6233113507724587e-06, "Pretrain/Loss": 1.9990360736846924, "Pretrain/Loss (Raw)": 2.2019739151000977, "Pretrain/Step": 16351, "Pretrain/Step Time": 8.48970720730722} +{"Pretrain/Learning Rate": 2.6214186240203832e-06, "Pretrain/Loss": 1.9981820583343506, "Pretrain/Loss (Raw)": 1.84190034866333, "Pretrain/Step": 16352, "Pretrain/Step Time": 8.490184493362904} +{"Pretrain/Learning Rate": 2.619526542538922e-06, "Pretrain/Loss": 1.9957382678985596, "Pretrain/Loss (Raw)": 1.8842339515686035, "Pretrain/Step": 16353, "Pretrain/Step Time": 8.49005508236587} +{"Pretrain/Learning Rate": 2.617635106382632e-06, "Pretrain/Loss": 1.9959208965301514, "Pretrain/Loss (Raw)": 2.0640575885772705, "Pretrain/Step": 16354, "Pretrain/Step Time": 8.48840942978859} +{"Pretrain/Learning Rate": 2.615744315606061e-06, "Pretrain/Loss": 1.9945943355560303, "Pretrain/Loss (Raw)": 1.8905341625213623, "Pretrain/Step": 16355, "Pretrain/Step Time": 8.491050204262137} +{"Pretrain/Learning Rate": 2.6138541702637187e-06, "Pretrain/Loss": 1.995505452156067, "Pretrain/Loss (Raw)": 2.1292405128479004, "Pretrain/Step": 16356, "Pretrain/Step Time": 8.490923965349793} +{"Pretrain/Learning Rate": 2.6119646704101136e-06, "Pretrain/Loss": 1.998250126838684, "Pretrain/Loss (Raw)": 2.038011074066162, "Pretrain/Step": 16357, "Pretrain/Step Time": 8.484723379835486} +{"Pretrain/Learning Rate": 2.6100758160997247e-06, "Pretrain/Loss": 1.9976621866226196, "Pretrain/Loss (Raw)": 1.879273772239685, "Pretrain/Step": 16358, "Pretrain/Step Time": 8.487988650798798} +{"Pretrain/Learning Rate": 2.608187607387011e-06, "Pretrain/Loss": 1.9984787702560425, "Pretrain/Loss (Raw)": 2.1012940406799316, "Pretrain/Step": 16359, "Pretrain/Step Time": 8.487119406461716} +{"Pretrain/Learning Rate": 2.6063000443264292e-06, "Pretrain/Loss": 1.9999451637268066, "Pretrain/Loss (Raw)": 2.0097403526306152, "Pretrain/Step": 16360, "Pretrain/Step Time": 8.486203834414482} +{"Pretrain/Learning Rate": 2.604413126972391e-06, "Pretrain/Loss": 1.9986703395843506, "Pretrain/Loss (Raw)": 1.6452118158340454, "Pretrain/Step": 16361, "Pretrain/Step Time": 8.487565344199538} +{"Pretrain/Learning Rate": 2.6025268553793197e-06, "Pretrain/Loss": 1.9976575374603271, "Pretrain/Loss (Raw)": 1.7763084173202515, "Pretrain/Step": 16362, "Pretrain/Step Time": 8.486673237755895} +{"Pretrain/Learning Rate": 2.6006412296015968e-06, "Pretrain/Loss": 1.9985692501068115, "Pretrain/Loss (Raw)": 1.9396191835403442, "Pretrain/Step": 16363, "Pretrain/Step Time": 8.488427491858602} +{"Pretrain/Learning Rate": 2.5987562496935874e-06, "Pretrain/Loss": 1.9993942975997925, "Pretrain/Loss (Raw)": 1.9872833490371704, "Pretrain/Step": 16364, "Pretrain/Step Time": 8.490735583007336} +{"Pretrain/Learning Rate": 2.596871915709656e-06, "Pretrain/Loss": 2.00015926361084, "Pretrain/Loss (Raw)": 1.9448391199111938, "Pretrain/Step": 16365, "Pretrain/Step Time": 8.490760890766978} +{"Pretrain/Learning Rate": 2.594988227704126e-06, "Pretrain/Loss": 1.9996159076690674, "Pretrain/Loss (Raw)": 2.00901460647583, "Pretrain/Step": 16366, "Pretrain/Step Time": 8.496978532522917} +{"Pretrain/Learning Rate": 2.5931051857313175e-06, "Pretrain/Loss": 1.9997628927230835, "Pretrain/Loss (Raw)": 1.998797059059143, "Pretrain/Step": 16367, "Pretrain/Step Time": 8.49675628170371} +{"Pretrain/Learning Rate": 2.5912227898455268e-06, "Pretrain/Loss": 2.000352382659912, "Pretrain/Loss (Raw)": 2.0672028064727783, "Pretrain/Step": 16368, "Pretrain/Step Time": 8.49813386425376} +{"Pretrain/Learning Rate": 2.5893410401010258e-06, "Pretrain/Loss": 1.99900484085083, "Pretrain/Loss (Raw)": 1.8251761198043823, "Pretrain/Step": 16369, "Pretrain/Step Time": 8.501019563525915} +{"Pretrain/Learning Rate": 2.5874599365520806e-06, "Pretrain/Loss": 1.9973912239074707, "Pretrain/Loss (Raw)": 1.9757546186447144, "Pretrain/Step": 16370, "Pretrain/Step Time": 8.49849422648549} +{"Pretrain/Learning Rate": 2.5855794792529254e-06, "Pretrain/Loss": 1.9989581108093262, "Pretrain/Loss (Raw)": 2.0881600379943848, "Pretrain/Step": 16371, "Pretrain/Step Time": 8.49690213240683} +{"Pretrain/Learning Rate": 2.5836996682577885e-06, "Pretrain/Loss": 2.0034470558166504, "Pretrain/Loss (Raw)": 2.453572988510132, "Pretrain/Step": 16372, "Pretrain/Step Time": 8.495227053761482} +{"Pretrain/Learning Rate": 2.5818205036208687e-06, "Pretrain/Loss": 2.0033860206604004, "Pretrain/Loss (Raw)": 1.9505150318145752, "Pretrain/Step": 16373, "Pretrain/Step Time": 8.496201915666461} +{"Pretrain/Learning Rate": 2.5799419853963473e-06, "Pretrain/Loss": 2.0025298595428467, "Pretrain/Loss (Raw)": 1.9680843353271484, "Pretrain/Step": 16374, "Pretrain/Step Time": 8.496890228241682} +{"Pretrain/Learning Rate": 2.5780641136383982e-06, "Pretrain/Loss": 2.001896381378174, "Pretrain/Loss (Raw)": 1.9382288455963135, "Pretrain/Step": 16375, "Pretrain/Step Time": 8.49783743545413} +{"Pretrain/Learning Rate": 2.576186888401158e-06, "Pretrain/Loss": 2.0033164024353027, "Pretrain/Loss (Raw)": 2.1252481937408447, "Pretrain/Step": 16376, "Pretrain/Step Time": 8.49352640658617} +{"Pretrain/Learning Rate": 2.574310309738767e-06, "Pretrain/Loss": 2.0030863285064697, "Pretrain/Loss (Raw)": 2.1145122051239014, "Pretrain/Step": 16377, "Pretrain/Step Time": 8.490229459479451} +{"Pretrain/Learning Rate": 2.5724343777053237e-06, "Pretrain/Loss": 2.002627372741699, "Pretrain/Loss (Raw)": 2.0124242305755615, "Pretrain/Step": 16378, "Pretrain/Step Time": 8.490144334733486} +{"Pretrain/Learning Rate": 2.570559092354932e-06, "Pretrain/Loss": 2.002589702606201, "Pretrain/Loss (Raw)": 1.860935091972351, "Pretrain/Step": 16379, "Pretrain/Step Time": 8.488651309162378} +{"Pretrain/Learning Rate": 2.5686844537416543e-06, "Pretrain/Loss": 2.0049490928649902, "Pretrain/Loss (Raw)": 2.2029688358306885, "Pretrain/Step": 16380, "Pretrain/Step Time": 8.490158434957266} +{"Pretrain/Learning Rate": 2.5668104619195443e-06, "Pretrain/Loss": 2.0069022178649902, "Pretrain/Loss (Raw)": 2.1560416221618652, "Pretrain/Step": 16381, "Pretrain/Step Time": 8.488918857648969} +{"Pretrain/Learning Rate": 2.5649371169426424e-06, "Pretrain/Loss": 2.008047580718994, "Pretrain/Loss (Raw)": 2.194831609725952, "Pretrain/Step": 16382, "Pretrain/Step Time": 8.486767938360572} +{"Pretrain/Learning Rate": 2.5630644188649604e-06, "Pretrain/Loss": 2.0091326236724854, "Pretrain/Loss (Raw)": 1.860558271408081, "Pretrain/Step": 16383, "Pretrain/Step Time": 8.487660206854343} +{"Pretrain/Learning Rate": 2.561192367740503e-06, "Pretrain/Loss": 2.00610089302063, "Pretrain/Loss (Raw)": 1.8225001096725464, "Pretrain/Step": 16384, "Pretrain/Step Time": 8.486817821860313} +{"Pretrain/Learning Rate": 2.559320963623246e-06, "Pretrain/Loss": 2.006901741027832, "Pretrain/Loss (Raw)": 2.0345821380615234, "Pretrain/Step": 16385, "Pretrain/Step Time": 8.489565515890718} +{"Pretrain/Learning Rate": 2.557450206567144e-06, "Pretrain/Loss": 2.0080339908599854, "Pretrain/Loss (Raw)": 2.056213140487671, "Pretrain/Step": 16386, "Pretrain/Step Time": 8.489072017371655} +{"Pretrain/Learning Rate": 2.5555800966261504e-06, "Pretrain/Loss": 2.00685453414917, "Pretrain/Loss (Raw)": 1.9328045845031738, "Pretrain/Step": 16387, "Pretrain/Step Time": 8.491879601031542} +{"Pretrain/Learning Rate": 2.5537106338541757e-06, "Pretrain/Loss": 2.005904197692871, "Pretrain/Loss (Raw)": 1.9784796237945557, "Pretrain/Step": 16388, "Pretrain/Step Time": 8.48945738747716} +{"Pretrain/Learning Rate": 2.551841818305137e-06, "Pretrain/Loss": 2.0044219493865967, "Pretrain/Loss (Raw)": 1.8692750930786133, "Pretrain/Step": 16389, "Pretrain/Step Time": 8.489107502624393} +{"Pretrain/Learning Rate": 2.549973650032916e-06, "Pretrain/Loss": 2.0033059120178223, "Pretrain/Loss (Raw)": 1.8959476947784424, "Pretrain/Step": 16390, "Pretrain/Step Time": 8.489722665399313} +{"Pretrain/Learning Rate": 2.548106129091371e-06, "Pretrain/Loss": 2.0014002323150635, "Pretrain/Loss (Raw)": 1.9643080234527588, "Pretrain/Step": 16391, "Pretrain/Step Time": 8.486802406609058} +{"Pretrain/Learning Rate": 2.546239255534366e-06, "Pretrain/Loss": 2.0032055377960205, "Pretrain/Loss (Raw)": 2.1058545112609863, "Pretrain/Step": 16392, "Pretrain/Step Time": 8.484738931059837} +{"Pretrain/Learning Rate": 2.544373029415717e-06, "Pretrain/Loss": 2.0027637481689453, "Pretrain/Loss (Raw)": 2.159013509750366, "Pretrain/Step": 16393, "Pretrain/Step Time": 8.48293381743133} +{"Pretrain/Learning Rate": 2.5425074507892445e-06, "Pretrain/Loss": 2.0028560161590576, "Pretrain/Loss (Raw)": 1.775012731552124, "Pretrain/Step": 16394, "Pretrain/Step Time": 8.484016744419932} +{"Pretrain/Learning Rate": 2.5406425197087413e-06, "Pretrain/Loss": 2.002666473388672, "Pretrain/Loss (Raw)": 1.9146734476089478, "Pretrain/Step": 16395, "Pretrain/Step Time": 8.480141572654247} +{"Pretrain/Learning Rate": 2.5387782362279704e-06, "Pretrain/Loss": 2.000988721847534, "Pretrain/Loss (Raw)": 1.9220961332321167, "Pretrain/Step": 16396, "Pretrain/Step Time": 8.483621126040816} +{"Pretrain/Learning Rate": 2.5369146004007027e-06, "Pretrain/Loss": 1.998769760131836, "Pretrain/Loss (Raw)": 1.8546351194381714, "Pretrain/Step": 16397, "Pretrain/Step Time": 8.484151476994157} +{"Pretrain/Learning Rate": 2.5350516122806588e-06, "Pretrain/Loss": 1.9959574937820435, "Pretrain/Loss (Raw)": 1.9302141666412354, "Pretrain/Step": 16398, "Pretrain/Step Time": 8.482666794210672} +{"Pretrain/Learning Rate": 2.533189271921571e-06, "Pretrain/Loss": 1.9962875843048096, "Pretrain/Loss (Raw)": 1.8801612854003906, "Pretrain/Step": 16399, "Pretrain/Step Time": 8.483842063695192} +{"Pretrain/Learning Rate": 2.531327579377135e-06, "Pretrain/Loss": 1.9952905178070068, "Pretrain/Loss (Raw)": 2.145228147506714, "Pretrain/Step": 16400, "Pretrain/Step Time": 8.484884265810251} +{"Pretrain/Learning Rate": 2.5294665347010223e-06, "Pretrain/Loss": 1.9939028024673462, "Pretrain/Loss (Raw)": 1.9127483367919922, "Pretrain/Step": 16401, "Pretrain/Step Time": 8.482325399294496} +{"Pretrain/Learning Rate": 2.5276061379469056e-06, "Pretrain/Loss": 1.991652488708496, "Pretrain/Loss (Raw)": 1.6738098859786987, "Pretrain/Step": 16402, "Pretrain/Step Time": 8.482977420091629} +{"Pretrain/Learning Rate": 2.525746389168421e-06, "Pretrain/Loss": 1.9888012409210205, "Pretrain/Loss (Raw)": 1.613086462020874, "Pretrain/Step": 16403, "Pretrain/Step Time": 8.483021646738052} +{"Pretrain/Learning Rate": 2.5238872884191993e-06, "Pretrain/Loss": 1.9869542121887207, "Pretrain/Loss (Raw)": 1.729854702949524, "Pretrain/Step": 16404, "Pretrain/Step Time": 8.484635869041085} +{"Pretrain/Learning Rate": 2.522028835752843e-06, "Pretrain/Loss": 1.9858958721160889, "Pretrain/Loss (Raw)": 1.9548627138137817, "Pretrain/Step": 16405, "Pretrain/Step Time": 8.481218190863729} +{"Pretrain/Learning Rate": 2.5201710312229345e-06, "Pretrain/Loss": 1.9885952472686768, "Pretrain/Loss (Raw)": 2.0455825328826904, "Pretrain/Step": 16406, "Pretrain/Step Time": 8.478760097175837} +{"Pretrain/Learning Rate": 2.518313874883052e-06, "Pretrain/Loss": 1.9877793788909912, "Pretrain/Loss (Raw)": 2.0214133262634277, "Pretrain/Step": 16407, "Pretrain/Step Time": 8.481448529288173} +{"Pretrain/Learning Rate": 2.516457366786734e-06, "Pretrain/Loss": 1.9891481399536133, "Pretrain/Loss (Raw)": 2.2192797660827637, "Pretrain/Step": 16408, "Pretrain/Step Time": 8.47890935651958} +{"Pretrain/Learning Rate": 2.514601506987524e-06, "Pretrain/Loss": 1.9858818054199219, "Pretrain/Loss (Raw)": 1.7324516773223877, "Pretrain/Step": 16409, "Pretrain/Step Time": 8.482559381052852} +{"Pretrain/Learning Rate": 2.5127462955389285e-06, "Pretrain/Loss": 1.9853754043579102, "Pretrain/Loss (Raw)": 1.8710771799087524, "Pretrain/Step": 16410, "Pretrain/Step Time": 8.486528057605028} +{"Pretrain/Learning Rate": 2.5108917324944386e-06, "Pretrain/Loss": 1.987308382987976, "Pretrain/Loss (Raw)": 2.1528773307800293, "Pretrain/Step": 16411, "Pretrain/Step Time": 8.488721776753664} +{"Pretrain/Learning Rate": 2.5090378179075334e-06, "Pretrain/Loss": 1.9861037731170654, "Pretrain/Loss (Raw)": 1.8511494398117065, "Pretrain/Step": 16412, "Pretrain/Step Time": 8.486996199935675} +{"Pretrain/Learning Rate": 2.507184551831665e-06, "Pretrain/Loss": 1.9871251583099365, "Pretrain/Loss (Raw)": 1.9662305116653442, "Pretrain/Step": 16413, "Pretrain/Step Time": 8.487480403855443} +{"Pretrain/Learning Rate": 2.5053319343202763e-06, "Pretrain/Loss": 1.9862357378005981, "Pretrain/Loss (Raw)": 1.8091931343078613, "Pretrain/Step": 16414, "Pretrain/Step Time": 8.48875955119729} +{"Pretrain/Learning Rate": 2.503479965426786e-06, "Pretrain/Loss": 1.9901982545852661, "Pretrain/Loss (Raw)": 2.2099452018737793, "Pretrain/Step": 16415, "Pretrain/Step Time": 8.48117202334106} +{"Pretrain/Learning Rate": 2.5016286452045847e-06, "Pretrain/Loss": 1.9897615909576416, "Pretrain/Loss (Raw)": 1.6706445217132568, "Pretrain/Step": 16416, "Pretrain/Step Time": 8.481072017922997} +{"Pretrain/Learning Rate": 2.499777973707068e-06, "Pretrain/Loss": 1.9895671606063843, "Pretrain/Loss (Raw)": 1.947114109992981, "Pretrain/Step": 16417, "Pretrain/Step Time": 8.484053621068597} +{"Pretrain/Learning Rate": 2.497927950987586e-06, "Pretrain/Loss": 1.9872076511383057, "Pretrain/Loss (Raw)": 1.883008599281311, "Pretrain/Step": 16418, "Pretrain/Step Time": 8.481336388736963} +{"Pretrain/Learning Rate": 2.4960785770994923e-06, "Pretrain/Loss": 1.9882659912109375, "Pretrain/Loss (Raw)": 2.0936102867126465, "Pretrain/Step": 16419, "Pretrain/Step Time": 8.479209531098604} +{"Pretrain/Learning Rate": 2.494229852096111e-06, "Pretrain/Loss": 1.9897453784942627, "Pretrain/Loss (Raw)": 2.0301287174224854, "Pretrain/Step": 16420, "Pretrain/Step Time": 8.477358682081103} +{"Pretrain/Learning Rate": 2.492381776030739e-06, "Pretrain/Loss": 1.9885025024414062, "Pretrain/Loss (Raw)": 2.042099714279175, "Pretrain/Step": 16421, "Pretrain/Step Time": 8.476807277649641} +{"Pretrain/Learning Rate": 2.4905343489566773e-06, "Pretrain/Loss": 1.9876799583435059, "Pretrain/Loss (Raw)": 1.9190343618392944, "Pretrain/Step": 16422, "Pretrain/Step Time": 8.474265916272998} +{"Pretrain/Learning Rate": 2.488687570927187e-06, "Pretrain/Loss": 1.988168478012085, "Pretrain/Loss (Raw)": 2.0005977153778076, "Pretrain/Step": 16423, "Pretrain/Step Time": 8.47576050274074} +{"Pretrain/Learning Rate": 2.48684144199553e-06, "Pretrain/Loss": 1.9872547388076782, "Pretrain/Loss (Raw)": 1.9498343467712402, "Pretrain/Step": 16424, "Pretrain/Step Time": 8.474957412108779} +{"Pretrain/Learning Rate": 2.484995962214917e-06, "Pretrain/Loss": 1.988234281539917, "Pretrain/Loss (Raw)": 2.2638118267059326, "Pretrain/Step": 16425, "Pretrain/Step Time": 8.47682579047978} +{"Pretrain/Learning Rate": 2.4831511316385808e-06, "Pretrain/Loss": 1.9882874488830566, "Pretrain/Loss (Raw)": 1.9013241529464722, "Pretrain/Step": 16426, "Pretrain/Step Time": 8.474980665370822} +{"Pretrain/Learning Rate": 2.481306950319706e-06, "Pretrain/Loss": 1.9904297590255737, "Pretrain/Loss (Raw)": 1.9979698657989502, "Pretrain/Step": 16427, "Pretrain/Step Time": 8.478046698495746} +{"Pretrain/Learning Rate": 2.4794634183114674e-06, "Pretrain/Loss": 1.9915447235107422, "Pretrain/Loss (Raw)": 2.057842969894409, "Pretrain/Step": 16428, "Pretrain/Step Time": 8.478206172585487} +{"Pretrain/Learning Rate": 2.4776205356670302e-06, "Pretrain/Loss": 1.9912824630737305, "Pretrain/Loss (Raw)": 1.7906482219696045, "Pretrain/Step": 16429, "Pretrain/Step Time": 8.482405040413141} +{"Pretrain/Learning Rate": 2.475778302439524e-06, "Pretrain/Loss": 1.9923620223999023, "Pretrain/Loss (Raw)": 2.2036550045013428, "Pretrain/Step": 16430, "Pretrain/Step Time": 8.484891090542078} +{"Pretrain/Learning Rate": 2.473936718682074e-06, "Pretrain/Loss": 1.9919389486312866, "Pretrain/Loss (Raw)": 2.0213735103607178, "Pretrain/Step": 16431, "Pretrain/Step Time": 8.481751589104533} +{"Pretrain/Learning Rate": 2.472095784447781e-06, "Pretrain/Loss": 1.9908063411712646, "Pretrain/Loss (Raw)": 1.9050594568252563, "Pretrain/Step": 16432, "Pretrain/Step Time": 8.480644008144736} +{"Pretrain/Learning Rate": 2.4702554997897197e-06, "Pretrain/Loss": 1.992075800895691, "Pretrain/Loss (Raw)": 2.0878703594207764, "Pretrain/Step": 16433, "Pretrain/Step Time": 8.48433013446629} +{"Pretrain/Learning Rate": 2.4684158647609616e-06, "Pretrain/Loss": 1.990401268005371, "Pretrain/Loss (Raw)": 1.8272666931152344, "Pretrain/Step": 16434, "Pretrain/Step Time": 8.484159724786878} +{"Pretrain/Learning Rate": 2.466576879414545e-06, "Pretrain/Loss": 1.9951094388961792, "Pretrain/Loss (Raw)": 2.4361302852630615, "Pretrain/Step": 16435, "Pretrain/Step Time": 8.484282093122602} +{"Pretrain/Learning Rate": 2.464738543803505e-06, "Pretrain/Loss": 1.99272882938385, "Pretrain/Loss (Raw)": 1.8048534393310547, "Pretrain/Step": 16436, "Pretrain/Step Time": 8.489962263032794} +{"Pretrain/Learning Rate": 2.4629008579808406e-06, "Pretrain/Loss": 1.9910964965820312, "Pretrain/Loss (Raw)": 1.9983068704605103, "Pretrain/Step": 16437, "Pretrain/Step Time": 8.487197559326887} +{"Pretrain/Learning Rate": 2.4610638219995374e-06, "Pretrain/Loss": 1.989880084991455, "Pretrain/Loss (Raw)": 1.867348551750183, "Pretrain/Step": 16438, "Pretrain/Step Time": 8.489115936681628} +{"Pretrain/Learning Rate": 2.4592274359125783e-06, "Pretrain/Loss": 1.9899280071258545, "Pretrain/Loss (Raw)": 2.079066514968872, "Pretrain/Step": 16439, "Pretrain/Step Time": 8.484504910185933} +{"Pretrain/Learning Rate": 2.4573916997728985e-06, "Pretrain/Loss": 1.989858865737915, "Pretrain/Loss (Raw)": 2.0112860202789307, "Pretrain/Step": 16440, "Pretrain/Step Time": 8.48604210652411} +{"Pretrain/Learning Rate": 2.4555566136334416e-06, "Pretrain/Loss": 1.9892206192016602, "Pretrain/Loss (Raw)": 1.8501569032669067, "Pretrain/Step": 16441, "Pretrain/Step Time": 8.48603885807097} +{"Pretrain/Learning Rate": 2.4537221775471187e-06, "Pretrain/Loss": 1.990462064743042, "Pretrain/Loss (Raw)": 2.0925679206848145, "Pretrain/Step": 16442, "Pretrain/Step Time": 8.488960204645991} +{"Pretrain/Learning Rate": 2.451888391566817e-06, "Pretrain/Loss": 1.987833023071289, "Pretrain/Loss (Raw)": 1.8323060274124146, "Pretrain/Step": 16443, "Pretrain/Step Time": 8.487826503813267} +{"Pretrain/Learning Rate": 2.4500552557454234e-06, "Pretrain/Loss": 1.9849519729614258, "Pretrain/Loss (Raw)": 1.960913062095642, "Pretrain/Step": 16444, "Pretrain/Step Time": 8.485562974587083} +{"Pretrain/Learning Rate": 2.448222770135783e-06, "Pretrain/Loss": 1.9852445125579834, "Pretrain/Loss (Raw)": 1.9850707054138184, "Pretrain/Step": 16445, "Pretrain/Step Time": 8.49107115343213} +{"Pretrain/Learning Rate": 2.446390934790749e-06, "Pretrain/Loss": 1.9851619005203247, "Pretrain/Loss (Raw)": 2.0253713130950928, "Pretrain/Step": 16446, "Pretrain/Step Time": 8.489675445482135} +{"Pretrain/Learning Rate": 2.4445597497631257e-06, "Pretrain/Loss": 1.9829802513122559, "Pretrain/Loss (Raw)": 1.7210164070129395, "Pretrain/Step": 16447, "Pretrain/Step Time": 8.489187838509679} +{"Pretrain/Learning Rate": 2.4427292151057268e-06, "Pretrain/Loss": 1.9848148822784424, "Pretrain/Loss (Raw)": 2.1348135471343994, "Pretrain/Step": 16448, "Pretrain/Step Time": 8.48988202214241} +{"Pretrain/Learning Rate": 2.4408993308713323e-06, "Pretrain/Loss": 1.9855823516845703, "Pretrain/Loss (Raw)": 2.0550780296325684, "Pretrain/Step": 16449, "Pretrain/Step Time": 8.49374857917428} +{"Pretrain/Learning Rate": 2.4390700971126947e-06, "Pretrain/Loss": 1.9835350513458252, "Pretrain/Loss (Raw)": 1.9804401397705078, "Pretrain/Step": 16450, "Pretrain/Step Time": 8.495048115029931} +{"Pretrain/Learning Rate": 2.437241513882571e-06, "Pretrain/Loss": 1.9841948747634888, "Pretrain/Loss (Raw)": 2.0403993129730225, "Pretrain/Step": 16451, "Pretrain/Step Time": 8.49231425859034} +{"Pretrain/Learning Rate": 2.4354135812336782e-06, "Pretrain/Loss": 1.9872899055480957, "Pretrain/Loss (Raw)": 2.18532657623291, "Pretrain/Step": 16452, "Pretrain/Step Time": 8.492190090939403} +{"Pretrain/Learning Rate": 2.4335862992187347e-06, "Pretrain/Loss": 1.9877121448516846, "Pretrain/Loss (Raw)": 1.876810073852539, "Pretrain/Step": 16453, "Pretrain/Step Time": 8.492896994575858} +{"Pretrain/Learning Rate": 2.431759667890418e-06, "Pretrain/Loss": 1.986947774887085, "Pretrain/Loss (Raw)": 1.9337050914764404, "Pretrain/Step": 16454, "Pretrain/Step Time": 8.491957746446133} +{"Pretrain/Learning Rate": 2.4299336873014e-06, "Pretrain/Loss": 1.987879991531372, "Pretrain/Loss (Raw)": 1.8958579301834106, "Pretrain/Step": 16455, "Pretrain/Step Time": 8.487536014989018} +{"Pretrain/Learning Rate": 2.4281083575043385e-06, "Pretrain/Loss": 1.9837690591812134, "Pretrain/Loss (Raw)": 1.4442815780639648, "Pretrain/Step": 16456, "Pretrain/Step Time": 8.488488778471947} +{"Pretrain/Learning Rate": 2.4262836785518524e-06, "Pretrain/Loss": 1.9819058179855347, "Pretrain/Loss (Raw)": 1.9326367378234863, "Pretrain/Step": 16457, "Pretrain/Step Time": 8.487577693536878} +{"Pretrain/Learning Rate": 2.4244596504965716e-06, "Pretrain/Loss": 1.9821693897247314, "Pretrain/Loss (Raw)": 1.9846426248550415, "Pretrain/Step": 16458, "Pretrain/Step Time": 8.490425769239664} +{"Pretrain/Learning Rate": 2.4226362733910794e-06, "Pretrain/Loss": 1.9815869331359863, "Pretrain/Loss (Raw)": 2.081573486328125, "Pretrain/Step": 16459, "Pretrain/Step Time": 8.484017856419086} +{"Pretrain/Learning Rate": 2.4208135472879504e-06, "Pretrain/Loss": 1.9783462285995483, "Pretrain/Loss (Raw)": 1.7373342514038086, "Pretrain/Step": 16460, "Pretrain/Step Time": 8.48732609860599} +{"Pretrain/Learning Rate": 2.4189914722397485e-06, "Pretrain/Loss": 1.9789764881134033, "Pretrain/Loss (Raw)": 2.1729891300201416, "Pretrain/Step": 16461, "Pretrain/Step Time": 8.48384515196085} +{"Pretrain/Learning Rate": 2.4171700482990057e-06, "Pretrain/Loss": 1.9785220623016357, "Pretrain/Loss (Raw)": 2.047734498977661, "Pretrain/Step": 16462, "Pretrain/Step Time": 8.485410621389747} +{"Pretrain/Learning Rate": 2.41534927551825e-06, "Pretrain/Loss": 1.9787967205047607, "Pretrain/Loss (Raw)": 2.0891215801239014, "Pretrain/Step": 16463, "Pretrain/Step Time": 8.484299965202808} +{"Pretrain/Learning Rate": 2.4135291539499754e-06, "Pretrain/Loss": 1.9789835214614868, "Pretrain/Loss (Raw)": 1.9497191905975342, "Pretrain/Step": 16464, "Pretrain/Step Time": 8.486282531172037} +{"Pretrain/Learning Rate": 2.4117096836466624e-06, "Pretrain/Loss": 1.9798028469085693, "Pretrain/Loss (Raw)": 2.1089603900909424, "Pretrain/Step": 16465, "Pretrain/Step Time": 8.483263209462166} +{"Pretrain/Learning Rate": 2.40989086466078e-06, "Pretrain/Loss": 1.9760510921478271, "Pretrain/Loss (Raw)": 1.9147366285324097, "Pretrain/Step": 16466, "Pretrain/Step Time": 8.482102019712329} +{"Pretrain/Learning Rate": 2.4080726970447664e-06, "Pretrain/Loss": 1.9754456281661987, "Pretrain/Loss (Raw)": 1.896240472793579, "Pretrain/Step": 16467, "Pretrain/Step Time": 8.487105621024966} +{"Pretrain/Learning Rate": 2.4062551808510553e-06, "Pretrain/Loss": 1.970927119255066, "Pretrain/Loss (Raw)": 1.9792884588241577, "Pretrain/Step": 16468, "Pretrain/Step Time": 8.485446978360415} +{"Pretrain/Learning Rate": 2.404438316132046e-06, "Pretrain/Loss": 1.969717264175415, "Pretrain/Loss (Raw)": 2.0414299964904785, "Pretrain/Step": 16469, "Pretrain/Step Time": 8.484718631953001} +{"Pretrain/Learning Rate": 2.4026221029401274e-06, "Pretrain/Loss": 1.9685447216033936, "Pretrain/Loss (Raw)": 1.9713467359542847, "Pretrain/Step": 16470, "Pretrain/Step Time": 8.485261494293809} +{"Pretrain/Learning Rate": 2.4008065413276716e-06, "Pretrain/Loss": 1.969748854637146, "Pretrain/Loss (Raw)": 1.9322054386138916, "Pretrain/Step": 16471, "Pretrain/Step Time": 8.488663956522942} +{"Pretrain/Learning Rate": 2.3989916313470252e-06, "Pretrain/Loss": 1.9706320762634277, "Pretrain/Loss (Raw)": 2.0315797328948975, "Pretrain/Step": 16472, "Pretrain/Step Time": 8.486365793272853} +{"Pretrain/Learning Rate": 2.397177373050527e-06, "Pretrain/Loss": 1.9706833362579346, "Pretrain/Loss (Raw)": 2.0132927894592285, "Pretrain/Step": 16473, "Pretrain/Step Time": 8.490549584850669} +{"Pretrain/Learning Rate": 2.3953637664904855e-06, "Pretrain/Loss": 1.971389889717102, "Pretrain/Loss (Raw)": 1.9794528484344482, "Pretrain/Step": 16474, "Pretrain/Step Time": 8.487467462196946} +{"Pretrain/Learning Rate": 2.3935508117191892e-06, "Pretrain/Loss": 1.9699101448059082, "Pretrain/Loss (Raw)": 1.7708117961883545, "Pretrain/Step": 16475, "Pretrain/Step Time": 8.49187322333455} +{"Pretrain/Learning Rate": 2.3917385087889238e-06, "Pretrain/Loss": 1.9719046354293823, "Pretrain/Loss (Raw)": 1.9406416416168213, "Pretrain/Step": 16476, "Pretrain/Step Time": 8.484618565067649} +{"Pretrain/Learning Rate": 2.3899268577519367e-06, "Pretrain/Loss": 1.9715006351470947, "Pretrain/Loss (Raw)": 1.825334072113037, "Pretrain/Step": 16477, "Pretrain/Step Time": 8.488786090165377} +{"Pretrain/Learning Rate": 2.3881158586604724e-06, "Pretrain/Loss": 1.9740427732467651, "Pretrain/Loss (Raw)": 2.3322954177856445, "Pretrain/Step": 16478, "Pretrain/Step Time": 8.490934409201145} +{"Pretrain/Learning Rate": 2.38630551156675e-06, "Pretrain/Loss": 1.9706487655639648, "Pretrain/Loss (Raw)": 1.767540693283081, "Pretrain/Step": 16479, "Pretrain/Step Time": 8.492169167846441} +{"Pretrain/Learning Rate": 2.384495816522958e-06, "Pretrain/Loss": 1.971935749053955, "Pretrain/Loss (Raw)": 2.0066335201263428, "Pretrain/Step": 16480, "Pretrain/Step Time": 8.492049554362893} +{"Pretrain/Learning Rate": 2.382686773581294e-06, "Pretrain/Loss": 1.9721424579620361, "Pretrain/Loss (Raw)": 1.9106801748275757, "Pretrain/Step": 16481, "Pretrain/Step Time": 8.485752262175083} +{"Pretrain/Learning Rate": 2.380878382793908e-06, "Pretrain/Loss": 1.9694924354553223, "Pretrain/Loss (Raw)": 1.724865198135376, "Pretrain/Step": 16482, "Pretrain/Step Time": 8.486219948157668} +{"Pretrain/Learning Rate": 2.3790706442129496e-06, "Pretrain/Loss": 1.9692915678024292, "Pretrain/Loss (Raw)": 1.8648194074630737, "Pretrain/Step": 16483, "Pretrain/Step Time": 8.484311178326607} +{"Pretrain/Learning Rate": 2.3772635578905467e-06, "Pretrain/Loss": 1.9686594009399414, "Pretrain/Loss (Raw)": 2.0483286380767822, "Pretrain/Step": 16484, "Pretrain/Step Time": 8.484943274408579} +{"Pretrain/Learning Rate": 2.3754571238787937e-06, "Pretrain/Loss": 1.9689667224884033, "Pretrain/Loss (Raw)": 2.077341318130493, "Pretrain/Step": 16485, "Pretrain/Step Time": 8.48931378684938} +{"Pretrain/Learning Rate": 2.373651342229791e-06, "Pretrain/Loss": 1.9691276550292969, "Pretrain/Loss (Raw)": 1.8998844623565674, "Pretrain/Step": 16486, "Pretrain/Step Time": 8.48679582029581} +{"Pretrain/Learning Rate": 2.371846212995596e-06, "Pretrain/Loss": 1.965995192527771, "Pretrain/Loss (Raw)": 1.7003251314163208, "Pretrain/Step": 16487, "Pretrain/Step Time": 8.487857239320874} +{"Pretrain/Learning Rate": 2.3700417362282707e-06, "Pretrain/Loss": 1.9662823677062988, "Pretrain/Loss (Raw)": 2.0465002059936523, "Pretrain/Step": 16488, "Pretrain/Step Time": 8.486520398408175} +{"Pretrain/Learning Rate": 2.368237911979837e-06, "Pretrain/Loss": 1.972726821899414, "Pretrain/Loss (Raw)": 2.470101833343506, "Pretrain/Step": 16489, "Pretrain/Step Time": 8.48532253690064} +{"Pretrain/Learning Rate": 2.3664347403023037e-06, "Pretrain/Loss": 1.9738285541534424, "Pretrain/Loss (Raw)": 1.9173380136489868, "Pretrain/Step": 16490, "Pretrain/Step Time": 8.48864196613431} +{"Pretrain/Learning Rate": 2.364632221247673e-06, "Pretrain/Loss": 1.9741747379302979, "Pretrain/Loss (Raw)": 1.9839316606521606, "Pretrain/Step": 16491, "Pretrain/Step Time": 8.486136706545949} +{"Pretrain/Learning Rate": 2.362830354867912e-06, "Pretrain/Loss": 1.9737497568130493, "Pretrain/Loss (Raw)": 1.9328900575637817, "Pretrain/Step": 16492, "Pretrain/Step Time": 8.486443929374218} +{"Pretrain/Learning Rate": 2.3610291412149847e-06, "Pretrain/Loss": 1.972499132156372, "Pretrain/Loss (Raw)": 1.7847392559051514, "Pretrain/Step": 16493, "Pretrain/Step Time": 8.49064901843667} +{"Pretrain/Learning Rate": 2.359228580340822e-06, "Pretrain/Loss": 1.9739727973937988, "Pretrain/Loss (Raw)": 2.1976709365844727, "Pretrain/Step": 16494, "Pretrain/Step Time": 8.485007362440228} +{"Pretrain/Learning Rate": 2.3574286722973377e-06, "Pretrain/Loss": 1.9757837057113647, "Pretrain/Loss (Raw)": 2.2305755615234375, "Pretrain/Step": 16495, "Pretrain/Step Time": 8.48804609850049} +{"Pretrain/Learning Rate": 2.3556294171364403e-06, "Pretrain/Loss": 1.9750711917877197, "Pretrain/Loss (Raw)": 1.9760026931762695, "Pretrain/Step": 16496, "Pretrain/Step Time": 8.483665505424142} +{"Pretrain/Learning Rate": 2.353830814910002e-06, "Pretrain/Loss": 1.975820541381836, "Pretrain/Loss (Raw)": 1.9210851192474365, "Pretrain/Step": 16497, "Pretrain/Step Time": 8.481078192591667} +{"Pretrain/Learning Rate": 2.3520328656698927e-06, "Pretrain/Loss": 1.977105736732483, "Pretrain/Loss (Raw)": 2.1402676105499268, "Pretrain/Step": 16498, "Pretrain/Step Time": 8.479271141812205} +{"Pretrain/Learning Rate": 2.3502355694679486e-06, "Pretrain/Loss": 1.9743727445602417, "Pretrain/Loss (Raw)": 1.7383350133895874, "Pretrain/Step": 16499, "Pretrain/Step Time": 8.485942229628563} +{"Pretrain/Learning Rate": 2.348438926355989e-06, "Pretrain/Loss": 1.970052719116211, "Pretrain/Loss (Raw)": 1.9006105661392212, "Pretrain/Step": 16500, "Pretrain/Step Time": 8.481063881888986} +{"Pretrain/Learning Rate": 2.3466429363858316e-06, "Pretrain/Loss": 1.9720709323883057, "Pretrain/Loss (Raw)": 2.2088520526885986, "Pretrain/Step": 16501, "Pretrain/Step Time": 8.480253044515848} +{"Pretrain/Learning Rate": 2.3448475996092483e-06, "Pretrain/Loss": 1.9715461730957031, "Pretrain/Loss (Raw)": 1.9009076356887817, "Pretrain/Step": 16502, "Pretrain/Step Time": 8.47947989962995} +{"Pretrain/Learning Rate": 2.34305291607802e-06, "Pretrain/Loss": 1.9703161716461182, "Pretrain/Loss (Raw)": 1.7807904481887817, "Pretrain/Step": 16503, "Pretrain/Step Time": 8.478431334719062} +{"Pretrain/Learning Rate": 2.341258885843889e-06, "Pretrain/Loss": 1.969406247138977, "Pretrain/Loss (Raw)": 2.0087854862213135, "Pretrain/Step": 16504, "Pretrain/Step Time": 8.479865454137325} +{"Pretrain/Learning Rate": 2.33946550895858e-06, "Pretrain/Loss": 1.9680745601654053, "Pretrain/Loss (Raw)": 1.9440486431121826, "Pretrain/Step": 16505, "Pretrain/Step Time": 8.480001231655478} +{"Pretrain/Learning Rate": 2.337672785473813e-06, "Pretrain/Loss": 1.9698772430419922, "Pretrain/Loss (Raw)": 2.243164300918579, "Pretrain/Step": 16506, "Pretrain/Step Time": 8.482710072770715} +{"Pretrain/Learning Rate": 2.3358807154412686e-06, "Pretrain/Loss": 1.970031499862671, "Pretrain/Loss (Raw)": 1.8806933164596558, "Pretrain/Step": 16507, "Pretrain/Step Time": 8.484682247042656} +{"Pretrain/Learning Rate": 2.334089298912634e-06, "Pretrain/Loss": 1.966928482055664, "Pretrain/Loss (Raw)": 1.8057910203933716, "Pretrain/Step": 16508, "Pretrain/Step Time": 8.48753571510315} +{"Pretrain/Learning Rate": 2.3322985359395535e-06, "Pretrain/Loss": 1.9640520811080933, "Pretrain/Loss (Raw)": 1.7878364324569702, "Pretrain/Step": 16509, "Pretrain/Step Time": 8.488887095823884} +{"Pretrain/Learning Rate": 2.3305084265736686e-06, "Pretrain/Loss": 1.962787389755249, "Pretrain/Loss (Raw)": 2.0329654216766357, "Pretrain/Step": 16510, "Pretrain/Step Time": 8.490729659795761} +{"Pretrain/Learning Rate": 2.3287189708665836e-06, "Pretrain/Loss": 1.966238021850586, "Pretrain/Loss (Raw)": 2.302232503890991, "Pretrain/Step": 16511, "Pretrain/Step Time": 8.485394269227982} +{"Pretrain/Learning Rate": 2.326930168869912e-06, "Pretrain/Loss": 1.9677913188934326, "Pretrain/Loss (Raw)": 2.021333932876587, "Pretrain/Step": 16512, "Pretrain/Step Time": 8.487953003495932} +{"Pretrain/Learning Rate": 2.3251420206352264e-06, "Pretrain/Loss": 1.9668457508087158, "Pretrain/Loss (Raw)": 1.9135395288467407, "Pretrain/Step": 16513, "Pretrain/Step Time": 8.48867717012763} +{"Pretrain/Learning Rate": 2.3233545262140775e-06, "Pretrain/Loss": 1.9652314186096191, "Pretrain/Loss (Raw)": 1.8495787382125854, "Pretrain/Step": 16514, "Pretrain/Step Time": 8.487914744764566} +{"Pretrain/Learning Rate": 2.3215676856580242e-06, "Pretrain/Loss": 1.9651780128479004, "Pretrain/Loss (Raw)": 1.9259635210037231, "Pretrain/Step": 16515, "Pretrain/Step Time": 8.485835067927837} +{"Pretrain/Learning Rate": 2.319781499018572e-06, "Pretrain/Loss": 1.9639639854431152, "Pretrain/Loss (Raw)": 1.823101282119751, "Pretrain/Step": 16516, "Pretrain/Step Time": 8.49079792946577} +{"Pretrain/Learning Rate": 2.317995966347236e-06, "Pretrain/Loss": 1.963326334953308, "Pretrain/Loss (Raw)": 1.7876423597335815, "Pretrain/Step": 16517, "Pretrain/Step Time": 8.496394982561469} +{"Pretrain/Learning Rate": 2.3162110876954967e-06, "Pretrain/Loss": 1.9630439281463623, "Pretrain/Loss (Raw)": 1.859802007675171, "Pretrain/Step": 16518, "Pretrain/Step Time": 8.491005145013332} +{"Pretrain/Learning Rate": 2.3144268631148157e-06, "Pretrain/Loss": 1.9639852046966553, "Pretrain/Loss (Raw)": 2.0847771167755127, "Pretrain/Step": 16519, "Pretrain/Step Time": 8.4917167481035} +{"Pretrain/Learning Rate": 2.312643292656649e-06, "Pretrain/Loss": 1.9638770818710327, "Pretrain/Loss (Raw)": 2.092036724090576, "Pretrain/Step": 16520, "Pretrain/Step Time": 8.494665201753378} +{"Pretrain/Learning Rate": 2.3108603763724146e-06, "Pretrain/Loss": 1.9612908363342285, "Pretrain/Loss (Raw)": 1.827970266342163, "Pretrain/Step": 16521, "Pretrain/Step Time": 8.494907950982451} +{"Pretrain/Learning Rate": 2.3090781143135314e-06, "Pretrain/Loss": 1.965039610862732, "Pretrain/Loss (Raw)": 2.2548470497131348, "Pretrain/Step": 16522, "Pretrain/Step Time": 8.490671135485172} +{"Pretrain/Learning Rate": 2.307296506531384e-06, "Pretrain/Loss": 1.9669562578201294, "Pretrain/Loss (Raw)": 2.1600186824798584, "Pretrain/Step": 16523, "Pretrain/Step Time": 8.494386794045568} +{"Pretrain/Learning Rate": 2.3055155530773394e-06, "Pretrain/Loss": 1.9688234329223633, "Pretrain/Loss (Raw)": 2.1610894203186035, "Pretrain/Step": 16524, "Pretrain/Step Time": 8.495090140029788} +{"Pretrain/Learning Rate": 2.3037352540027616e-06, "Pretrain/Loss": 1.9688458442687988, "Pretrain/Loss (Raw)": 1.8574879169464111, "Pretrain/Step": 16525, "Pretrain/Step Time": 8.498431958258152} +{"Pretrain/Learning Rate": 2.3019556093589717e-06, "Pretrain/Loss": 1.967379093170166, "Pretrain/Loss (Raw)": 1.742476224899292, "Pretrain/Step": 16526, "Pretrain/Step Time": 8.501037465408444} +{"Pretrain/Learning Rate": 2.3001766191972973e-06, "Pretrain/Loss": 1.967560052871704, "Pretrain/Loss (Raw)": 1.9033399820327759, "Pretrain/Step": 16527, "Pretrain/Step Time": 8.498180279508233} +{"Pretrain/Learning Rate": 2.2983982835690254e-06, "Pretrain/Loss": 1.966110110282898, "Pretrain/Loss (Raw)": 1.9596236944198608, "Pretrain/Step": 16528, "Pretrain/Step Time": 8.495852338150144} +{"Pretrain/Learning Rate": 2.2966206025254316e-06, "Pretrain/Loss": 1.966308832168579, "Pretrain/Loss (Raw)": 1.9381996393203735, "Pretrain/Step": 16529, "Pretrain/Step Time": 8.494414016604424} +{"Pretrain/Learning Rate": 2.2948435761177835e-06, "Pretrain/Loss": 1.9697794914245605, "Pretrain/Loss (Raw)": 2.118032932281494, "Pretrain/Step": 16530, "Pretrain/Step Time": 8.495426984503865} +{"Pretrain/Learning Rate": 2.293067204397309e-06, "Pretrain/Loss": 1.9730124473571777, "Pretrain/Loss (Raw)": 2.026900053024292, "Pretrain/Step": 16531, "Pretrain/Step Time": 8.494763426482677} +{"Pretrain/Learning Rate": 2.29129148741524e-06, "Pretrain/Loss": 1.9738894701004028, "Pretrain/Loss (Raw)": 1.842124104499817, "Pretrain/Step": 16532, "Pretrain/Step Time": 8.495873456820846} +{"Pretrain/Learning Rate": 2.289516425222771e-06, "Pretrain/Loss": 1.976354718208313, "Pretrain/Loss (Raw)": 2.270404577255249, "Pretrain/Step": 16533, "Pretrain/Step Time": 8.49937130510807} +{"Pretrain/Learning Rate": 2.2877420178710806e-06, "Pretrain/Loss": 1.9732540845870972, "Pretrain/Loss (Raw)": 1.6487065553665161, "Pretrain/Step": 16534, "Pretrain/Step Time": 8.502190798521042} +{"Pretrain/Learning Rate": 2.2859682654113452e-06, "Pretrain/Loss": 1.9737164974212646, "Pretrain/Loss (Raw)": 2.080615997314453, "Pretrain/Step": 16535, "Pretrain/Step Time": 8.495655097067356} +{"Pretrain/Learning Rate": 2.284195167894698e-06, "Pretrain/Loss": 1.9715216159820557, "Pretrain/Loss (Raw)": 1.9383258819580078, "Pretrain/Step": 16536, "Pretrain/Step Time": 8.496629809960723} +{"Pretrain/Learning Rate": 2.282422725372271e-06, "Pretrain/Loss": 1.972367763519287, "Pretrain/Loss (Raw)": 1.8407617807388306, "Pretrain/Step": 16537, "Pretrain/Step Time": 8.4923578761518} +{"Pretrain/Learning Rate": 2.2806509378951735e-06, "Pretrain/Loss": 1.9729509353637695, "Pretrain/Loss (Raw)": 1.9457162618637085, "Pretrain/Step": 16538, "Pretrain/Step Time": 8.489445336163044} +{"Pretrain/Learning Rate": 2.2788798055144834e-06, "Pretrain/Loss": 1.9725463390350342, "Pretrain/Loss (Raw)": 2.1011013984680176, "Pretrain/Step": 16539, "Pretrain/Step Time": 8.49251377955079} +{"Pretrain/Learning Rate": 2.277109328281282e-06, "Pretrain/Loss": 1.9731475114822388, "Pretrain/Loss (Raw)": 1.9280881881713867, "Pretrain/Step": 16540, "Pretrain/Step Time": 8.497414307668805} +{"Pretrain/Learning Rate": 2.27533950624661e-06, "Pretrain/Loss": 1.973313808441162, "Pretrain/Loss (Raw)": 1.9875019788742065, "Pretrain/Step": 16541, "Pretrain/Step Time": 8.495174955576658} +{"Pretrain/Learning Rate": 2.2735703394615087e-06, "Pretrain/Loss": 1.9747262001037598, "Pretrain/Loss (Raw)": 1.990006685256958, "Pretrain/Step": 16542, "Pretrain/Step Time": 8.496374452486634} +{"Pretrain/Learning Rate": 2.2718018279769826e-06, "Pretrain/Loss": 1.9741123914718628, "Pretrain/Loss (Raw)": 2.1313703060150146, "Pretrain/Step": 16543, "Pretrain/Step Time": 8.50705149397254} +{"Pretrain/Learning Rate": 2.2700339718440268e-06, "Pretrain/Loss": 1.9769654273986816, "Pretrain/Loss (Raw)": 2.0358335971832275, "Pretrain/Step": 16544, "Pretrain/Step Time": 8.505091896280646} +{"Pretrain/Learning Rate": 2.2682667711136225e-06, "Pretrain/Loss": 1.9769978523254395, "Pretrain/Loss (Raw)": 1.9512721300125122, "Pretrain/Step": 16545, "Pretrain/Step Time": 8.505407864227891} +{"Pretrain/Learning Rate": 2.2665002258367153e-06, "Pretrain/Loss": 1.9769556522369385, "Pretrain/Loss (Raw)": 1.8776054382324219, "Pretrain/Step": 16546, "Pretrain/Step Time": 8.505069253966212} +{"Pretrain/Learning Rate": 2.264734336064253e-06, "Pretrain/Loss": 1.9755165576934814, "Pretrain/Loss (Raw)": 1.9093883037567139, "Pretrain/Step": 16547, "Pretrain/Step Time": 8.505909154191613} +{"Pretrain/Learning Rate": 2.2629691018471484e-06, "Pretrain/Loss": 1.9738191366195679, "Pretrain/Loss (Raw)": 1.8128682374954224, "Pretrain/Step": 16548, "Pretrain/Step Time": 8.507471576333046} +{"Pretrain/Learning Rate": 2.261204523236296e-06, "Pretrain/Loss": 1.974023461341858, "Pretrain/Loss (Raw)": 2.0682432651519775, "Pretrain/Step": 16549, "Pretrain/Step Time": 8.510642712935805} +{"Pretrain/Learning Rate": 2.259440600282589e-06, "Pretrain/Loss": 1.974349021911621, "Pretrain/Loss (Raw)": 1.9607093334197998, "Pretrain/Step": 16550, "Pretrain/Step Time": 8.509373372420669} +{"Pretrain/Learning Rate": 2.257677333036873e-06, "Pretrain/Loss": 1.9726386070251465, "Pretrain/Loss (Raw)": 1.781674861907959, "Pretrain/Step": 16551, "Pretrain/Step Time": 8.507976090535522} +{"Pretrain/Learning Rate": 2.2559147215500067e-06, "Pretrain/Loss": 1.9733521938323975, "Pretrain/Loss (Raw)": 2.0411558151245117, "Pretrain/Step": 16552, "Pretrain/Step Time": 8.50882676616311} +{"Pretrain/Learning Rate": 2.2541527658728023e-06, "Pretrain/Loss": 1.974501609802246, "Pretrain/Loss (Raw)": 2.4109556674957275, "Pretrain/Step": 16553, "Pretrain/Step Time": 8.509313574060798} +{"Pretrain/Learning Rate": 2.252391466056067e-06, "Pretrain/Loss": 1.9752793312072754, "Pretrain/Loss (Raw)": 2.0008702278137207, "Pretrain/Step": 16554, "Pretrain/Step Time": 8.505390994250774} +{"Pretrain/Learning Rate": 2.25063082215059e-06, "Pretrain/Loss": 1.9743046760559082, "Pretrain/Loss (Raw)": 1.8732179403305054, "Pretrain/Step": 16555, "Pretrain/Step Time": 8.50496349669993} +{"Pretrain/Learning Rate": 2.2488708342071314e-06, "Pretrain/Loss": 1.974098801612854, "Pretrain/Loss (Raw)": 2.0314865112304688, "Pretrain/Step": 16556, "Pretrain/Step Time": 8.509692708030343} +{"Pretrain/Learning Rate": 2.24711150227645e-06, "Pretrain/Loss": 1.9772753715515137, "Pretrain/Loss (Raw)": 2.1972496509552, "Pretrain/Step": 16557, "Pretrain/Step Time": 8.506749238818884} +{"Pretrain/Learning Rate": 2.2453528264092693e-06, "Pretrain/Loss": 1.9746276140213013, "Pretrain/Loss (Raw)": 1.8647501468658447, "Pretrain/Step": 16558, "Pretrain/Step Time": 8.502645641565323} +{"Pretrain/Learning Rate": 2.2435948066562904e-06, "Pretrain/Loss": 1.9749202728271484, "Pretrain/Loss (Raw)": 2.058823585510254, "Pretrain/Step": 16559, "Pretrain/Step Time": 8.50654062256217} +{"Pretrain/Learning Rate": 2.2418374430682203e-06, "Pretrain/Loss": 1.9759106636047363, "Pretrain/Loss (Raw)": 2.0318214893341064, "Pretrain/Step": 16560, "Pretrain/Step Time": 8.504818800836802} +{"Pretrain/Learning Rate": 2.240080735695721e-06, "Pretrain/Loss": 1.9730966091156006, "Pretrain/Loss (Raw)": 1.72769296169281, "Pretrain/Step": 16561, "Pretrain/Step Time": 8.506412280723453} +{"Pretrain/Learning Rate": 2.238324684589452e-06, "Pretrain/Loss": 1.9742484092712402, "Pretrain/Loss (Raw)": 1.9746942520141602, "Pretrain/Step": 16562, "Pretrain/Step Time": 8.502541441470385} +{"Pretrain/Learning Rate": 2.2365692898000444e-06, "Pretrain/Loss": 1.9704601764678955, "Pretrain/Loss (Raw)": 1.9512336254119873, "Pretrain/Step": 16563, "Pretrain/Step Time": 8.501362225040793} +{"Pretrain/Learning Rate": 2.234814551378109e-06, "Pretrain/Loss": 1.9715275764465332, "Pretrain/Loss (Raw)": 1.9414726495742798, "Pretrain/Step": 16564, "Pretrain/Step Time": 8.49833707138896} +{"Pretrain/Learning Rate": 2.2330604693742542e-06, "Pretrain/Loss": 1.9726588726043701, "Pretrain/Loss (Raw)": 2.143110990524292, "Pretrain/Step": 16565, "Pretrain/Step Time": 8.49611714296043} +{"Pretrain/Learning Rate": 2.2313070438390454e-06, "Pretrain/Loss": 1.9762022495269775, "Pretrain/Loss (Raw)": 2.32090163230896, "Pretrain/Step": 16566, "Pretrain/Step Time": 8.494637375697494} +{"Pretrain/Learning Rate": 2.2295542748230506e-06, "Pretrain/Loss": 1.9741302728652954, "Pretrain/Loss (Raw)": 1.8138583898544312, "Pretrain/Step": 16567, "Pretrain/Step Time": 8.499072900041938} +{"Pretrain/Learning Rate": 2.2278021623768074e-06, "Pretrain/Loss": 1.974995493888855, "Pretrain/Loss (Raw)": 2.122023820877075, "Pretrain/Step": 16568, "Pretrain/Step Time": 8.493811931461096} +{"Pretrain/Learning Rate": 2.226050706550831e-06, "Pretrain/Loss": 1.975572109222412, "Pretrain/Loss (Raw)": 1.9239860773086548, "Pretrain/Step": 16569, "Pretrain/Step Time": 8.497563807293773} +{"Pretrain/Learning Rate": 2.224299907395633e-06, "Pretrain/Loss": 1.97502601146698, "Pretrain/Loss (Raw)": 2.022643804550171, "Pretrain/Step": 16570, "Pretrain/Step Time": 8.49502551741898} +{"Pretrain/Learning Rate": 2.2225497649616873e-06, "Pretrain/Loss": 1.9766392707824707, "Pretrain/Loss (Raw)": 2.038821220397949, "Pretrain/Step": 16571, "Pretrain/Step Time": 8.497446589171886} +{"Pretrain/Learning Rate": 2.220800279299465e-06, "Pretrain/Loss": 1.977828025817871, "Pretrain/Loss (Raw)": 2.113072633743286, "Pretrain/Step": 16572, "Pretrain/Step Time": 8.501460677012801} +{"Pretrain/Learning Rate": 2.2190514504594086e-06, "Pretrain/Loss": 1.9787213802337646, "Pretrain/Loss (Raw)": 2.0994009971618652, "Pretrain/Step": 16573, "Pretrain/Step Time": 8.5007300414145} +{"Pretrain/Learning Rate": 2.217303278491939e-06, "Pretrain/Loss": 1.9774216413497925, "Pretrain/Loss (Raw)": 1.8590153455734253, "Pretrain/Step": 16574, "Pretrain/Step Time": 8.49812433309853} +{"Pretrain/Learning Rate": 2.2155557634474745e-06, "Pretrain/Loss": 1.9772720336914062, "Pretrain/Loss (Raw)": 1.7018706798553467, "Pretrain/Step": 16575, "Pretrain/Step Time": 8.500500362366438} +{"Pretrain/Learning Rate": 2.2138089053763913e-06, "Pretrain/Loss": 1.9775803089141846, "Pretrain/Loss (Raw)": 2.1742656230926514, "Pretrain/Step": 16576, "Pretrain/Step Time": 8.500084115192294} +{"Pretrain/Learning Rate": 2.212062704329071e-06, "Pretrain/Loss": 1.9787660837173462, "Pretrain/Loss (Raw)": 2.2068636417388916, "Pretrain/Step": 16577, "Pretrain/Step Time": 8.49794209934771} +{"Pretrain/Learning Rate": 2.21031716035586e-06, "Pretrain/Loss": 1.9781699180603027, "Pretrain/Loss (Raw)": 1.9041165113449097, "Pretrain/Step": 16578, "Pretrain/Step Time": 8.495608516037464} +{"Pretrain/Learning Rate": 2.2085722735070814e-06, "Pretrain/Loss": 1.9764058589935303, "Pretrain/Loss (Raw)": 1.8146106004714966, "Pretrain/Step": 16579, "Pretrain/Step Time": 8.500341111794114} +{"Pretrain/Learning Rate": 2.2068280438330564e-06, "Pretrain/Loss": 1.9739744663238525, "Pretrain/Loss (Raw)": 1.8741158246994019, "Pretrain/Step": 16580, "Pretrain/Step Time": 8.49970425106585} +{"Pretrain/Learning Rate": 2.205084471384075e-06, "Pretrain/Loss": 1.9756025075912476, "Pretrain/Loss (Raw)": 2.085188388824463, "Pretrain/Step": 16581, "Pretrain/Step Time": 8.496142351999879} +{"Pretrain/Learning Rate": 2.2033415562104196e-06, "Pretrain/Loss": 1.9758026599884033, "Pretrain/Loss (Raw)": 1.9593234062194824, "Pretrain/Step": 16582, "Pretrain/Step Time": 8.499692438170314} +{"Pretrain/Learning Rate": 2.2015992983623336e-06, "Pretrain/Loss": 1.9797979593276978, "Pretrain/Loss (Raw)": 2.407264232635498, "Pretrain/Step": 16583, "Pretrain/Step Time": 8.497472181916237} +{"Pretrain/Learning Rate": 2.199857697890062e-06, "Pretrain/Loss": 1.9846380949020386, "Pretrain/Loss (Raw)": 2.063814640045166, "Pretrain/Step": 16584, "Pretrain/Step Time": 8.497742814943194} +{"Pretrain/Learning Rate": 2.1981167548438237e-06, "Pretrain/Loss": 1.9858031272888184, "Pretrain/Loss (Raw)": 2.0817601680755615, "Pretrain/Step": 16585, "Pretrain/Step Time": 8.499705808237195} +{"Pretrain/Learning Rate": 2.196376469273809e-06, "Pretrain/Loss": 1.985489010810852, "Pretrain/Loss (Raw)": 1.9444255828857422, "Pretrain/Step": 16586, "Pretrain/Step Time": 8.498117139562964} +{"Pretrain/Learning Rate": 2.1946368412302103e-06, "Pretrain/Loss": 1.9862943887710571, "Pretrain/Loss (Raw)": 2.184680938720703, "Pretrain/Step": 16587, "Pretrain/Step Time": 8.497020289301872} +{"Pretrain/Learning Rate": 2.192897870763175e-06, "Pretrain/Loss": 1.9872218370437622, "Pretrain/Loss (Raw)": 1.8560423851013184, "Pretrain/Step": 16588, "Pretrain/Step Time": 8.497620960697532} +{"Pretrain/Learning Rate": 2.1911595579228534e-06, "Pretrain/Loss": 1.9860961437225342, "Pretrain/Loss (Raw)": 2.028897762298584, "Pretrain/Step": 16589, "Pretrain/Step Time": 8.498593537136912} +{"Pretrain/Learning Rate": 2.18942190275937e-06, "Pretrain/Loss": 1.9857869148254395, "Pretrain/Loss (Raw)": 2.008155107498169, "Pretrain/Step": 16590, "Pretrain/Step Time": 8.500764546915889} +{"Pretrain/Learning Rate": 2.1876849053228204e-06, "Pretrain/Loss": 1.9880958795547485, "Pretrain/Loss (Raw)": 2.384657859802246, "Pretrain/Step": 16591, "Pretrain/Step Time": 8.501574616879225} +{"Pretrain/Learning Rate": 2.185948565663301e-06, "Pretrain/Loss": 1.9895164966583252, "Pretrain/Loss (Raw)": 2.131563663482666, "Pretrain/Step": 16592, "Pretrain/Step Time": 8.499829739332199} +{"Pretrain/Learning Rate": 2.184212883830869e-06, "Pretrain/Loss": 1.9878966808319092, "Pretrain/Loss (Raw)": 1.901620864868164, "Pretrain/Step": 16593, "Pretrain/Step Time": 8.501107659190893} +{"Pretrain/Learning Rate": 2.1824778598755755e-06, "Pretrain/Loss": 1.9875330924987793, "Pretrain/Loss (Raw)": 1.8682103157043457, "Pretrain/Step": 16594, "Pretrain/Step Time": 8.499142898246646} +{"Pretrain/Learning Rate": 2.1807434938474453e-06, "Pretrain/Loss": 1.9887707233428955, "Pretrain/Loss (Raw)": 2.054654121398926, "Pretrain/Step": 16595, "Pretrain/Step Time": 8.497273709625006} +{"Pretrain/Learning Rate": 2.179009785796493e-06, "Pretrain/Loss": 1.9884557723999023, "Pretrain/Loss (Raw)": 1.9389653205871582, "Pretrain/Step": 16596, "Pretrain/Step Time": 8.497393047437072} +{"Pretrain/Learning Rate": 2.177276735772704e-06, "Pretrain/Loss": 1.9876943826675415, "Pretrain/Loss (Raw)": 1.943975806236267, "Pretrain/Step": 16597, "Pretrain/Step Time": 8.49791688658297} +{"Pretrain/Learning Rate": 2.1755443438260496e-06, "Pretrain/Loss": 1.9907035827636719, "Pretrain/Loss (Raw)": 2.3565196990966797, "Pretrain/Step": 16598, "Pretrain/Step Time": 8.503176905214787} +{"Pretrain/Learning Rate": 2.173812610006487e-06, "Pretrain/Loss": 1.9902095794677734, "Pretrain/Loss (Raw)": 1.8689733743667603, "Pretrain/Step": 16599, "Pretrain/Step Time": 8.498570278286934} +{"Pretrain/Learning Rate": 2.17208153436394e-06, "Pretrain/Loss": 1.9916082620620728, "Pretrain/Loss (Raw)": 2.210618019104004, "Pretrain/Step": 16600, "Pretrain/Step Time": 8.499646266922355} +{"Pretrain/Learning Rate": 2.1703511169483382e-06, "Pretrain/Loss": 1.9926059246063232, "Pretrain/Loss (Raw)": 2.140986442565918, "Pretrain/Step": 16601, "Pretrain/Step Time": 8.495737301185727} +{"Pretrain/Learning Rate": 2.1686213578095638e-06, "Pretrain/Loss": 1.993252158164978, "Pretrain/Loss (Raw)": 2.06217622756958, "Pretrain/Step": 16602, "Pretrain/Step Time": 8.50255911424756} +{"Pretrain/Learning Rate": 2.1668922569974963e-06, "Pretrain/Loss": 1.9943336248397827, "Pretrain/Loss (Raw)": 1.9092470407485962, "Pretrain/Step": 16603, "Pretrain/Step Time": 8.500252099707723} +{"Pretrain/Learning Rate": 2.165163814561996e-06, "Pretrain/Loss": 1.9955239295959473, "Pretrain/Loss (Raw)": 2.0929837226867676, "Pretrain/Step": 16604, "Pretrain/Step Time": 8.496817026287317} +{"Pretrain/Learning Rate": 2.1634360305528956e-06, "Pretrain/Loss": 1.9978151321411133, "Pretrain/Loss (Raw)": 2.1186070442199707, "Pretrain/Step": 16605, "Pretrain/Step Time": 8.500189777463675} +{"Pretrain/Learning Rate": 2.161708905020024e-06, "Pretrain/Loss": 1.9953314065933228, "Pretrain/Loss (Raw)": 2.014397382736206, "Pretrain/Step": 16606, "Pretrain/Step Time": 8.498798619955778} +{"Pretrain/Learning Rate": 2.159982438013178e-06, "Pretrain/Loss": 1.9950073957443237, "Pretrain/Loss (Raw)": 1.726055383682251, "Pretrain/Step": 16607, "Pretrain/Step Time": 8.501442534849048} +{"Pretrain/Learning Rate": 2.158256629582131e-06, "Pretrain/Loss": 1.995809555053711, "Pretrain/Loss (Raw)": 2.1093063354492188, "Pretrain/Step": 16608, "Pretrain/Step Time": 8.498856073245406} +{"Pretrain/Learning Rate": 2.156531479776655e-06, "Pretrain/Loss": 1.99664306640625, "Pretrain/Loss (Raw)": 2.017362356185913, "Pretrain/Step": 16609, "Pretrain/Step Time": 8.503515724092722} +{"Pretrain/Learning Rate": 2.1548069886464878e-06, "Pretrain/Loss": 1.999630331993103, "Pretrain/Loss (Raw)": 2.1072611808776855, "Pretrain/Step": 16610, "Pretrain/Step Time": 8.502036483958364} +{"Pretrain/Learning Rate": 2.1530831562413587e-06, "Pretrain/Loss": 2.000332832336426, "Pretrain/Loss (Raw)": 1.9547187089920044, "Pretrain/Step": 16611, "Pretrain/Step Time": 8.501295283436775} +{"Pretrain/Learning Rate": 2.1513599826109705e-06, "Pretrain/Loss": 2.0002472400665283, "Pretrain/Loss (Raw)": 2.037372589111328, "Pretrain/Step": 16612, "Pretrain/Step Time": 8.503066327422857} +{"Pretrain/Learning Rate": 2.1496374678050076e-06, "Pretrain/Loss": 1.9975937604904175, "Pretrain/Loss (Raw)": 1.7377039194107056, "Pretrain/Step": 16613, "Pretrain/Step Time": 8.503815986216068} +{"Pretrain/Learning Rate": 2.1479156118731442e-06, "Pretrain/Loss": 1.9997609853744507, "Pretrain/Loss (Raw)": 2.1772966384887695, "Pretrain/Step": 16614, "Pretrain/Step Time": 8.501071417704225} +{"Pretrain/Learning Rate": 2.1461944148650186e-06, "Pretrain/Loss": 2.0029497146606445, "Pretrain/Loss (Raw)": 2.1084671020507812, "Pretrain/Step": 16615, "Pretrain/Step Time": 8.50359171256423} +{"Pretrain/Learning Rate": 2.144473876830272e-06, "Pretrain/Loss": 2.0013208389282227, "Pretrain/Loss (Raw)": 1.838001012802124, "Pretrain/Step": 16616, "Pretrain/Step Time": 8.501774564385414} +{"Pretrain/Learning Rate": 2.1427539978185086e-06, "Pretrain/Loss": 2.0006790161132812, "Pretrain/Loss (Raw)": 2.3879575729370117, "Pretrain/Step": 16617, "Pretrain/Step Time": 8.505586422979832} +{"Pretrain/Learning Rate": 2.141034777879314e-06, "Pretrain/Loss": 1.9987493753433228, "Pretrain/Loss (Raw)": 1.6703505516052246, "Pretrain/Step": 16618, "Pretrain/Step Time": 8.504138009622693} +{"Pretrain/Learning Rate": 2.1393162170622733e-06, "Pretrain/Loss": 1.9991424083709717, "Pretrain/Loss (Raw)": 2.0342507362365723, "Pretrain/Step": 16619, "Pretrain/Step Time": 8.506482776254416} +{"Pretrain/Learning Rate": 2.1375983154169304e-06, "Pretrain/Loss": 2.000020980834961, "Pretrain/Loss (Raw)": 2.045323610305786, "Pretrain/Step": 16620, "Pretrain/Step Time": 8.503702279180288} +{"Pretrain/Learning Rate": 2.1358810729928265e-06, "Pretrain/Loss": 2.0018343925476074, "Pretrain/Loss (Raw)": 2.0168609619140625, "Pretrain/Step": 16621, "Pretrain/Step Time": 8.498739188537002} +{"Pretrain/Learning Rate": 2.134164489839474e-06, "Pretrain/Loss": 1.9991986751556396, "Pretrain/Loss (Raw)": 1.8603017330169678, "Pretrain/Step": 16622, "Pretrain/Step Time": 8.502122787758708} +{"Pretrain/Learning Rate": 2.132448566006365e-06, "Pretrain/Loss": 1.997660756111145, "Pretrain/Loss (Raw)": 2.033714532852173, "Pretrain/Step": 16623, "Pretrain/Step Time": 8.502034293487668} +{"Pretrain/Learning Rate": 2.1307333015429835e-06, "Pretrain/Loss": 2.0008625984191895, "Pretrain/Loss (Raw)": 2.3858704566955566, "Pretrain/Step": 16624, "Pretrain/Step Time": 8.50478763319552} +{"Pretrain/Learning Rate": 2.129018696498783e-06, "Pretrain/Loss": 2.0001919269561768, "Pretrain/Loss (Raw)": 1.8352147340774536, "Pretrain/Step": 16625, "Pretrain/Step Time": 8.501575972884893} +{"Pretrain/Learning Rate": 2.127304750923209e-06, "Pretrain/Loss": 2.0003137588500977, "Pretrain/Loss (Raw)": 2.1558547019958496, "Pretrain/Step": 16626, "Pretrain/Step Time": 8.502184053882957} +{"Pretrain/Learning Rate": 2.1255914648656782e-06, "Pretrain/Loss": 2.0024847984313965, "Pretrain/Loss (Raw)": 2.016260862350464, "Pretrain/Step": 16627, "Pretrain/Step Time": 8.495643695816398} +{"Pretrain/Learning Rate": 2.123878838375587e-06, "Pretrain/Loss": 2.002603769302368, "Pretrain/Loss (Raw)": 1.9157962799072266, "Pretrain/Step": 16628, "Pretrain/Step Time": 8.49593660235405} +{"Pretrain/Learning Rate": 2.122166871502329e-06, "Pretrain/Loss": 2.001894950866699, "Pretrain/Loss (Raw)": 2.118117332458496, "Pretrain/Step": 16629, "Pretrain/Step Time": 8.494040861725807} +{"Pretrain/Learning Rate": 2.1204555642952567e-06, "Pretrain/Loss": 1.9965773820877075, "Pretrain/Loss (Raw)": 1.2202845811843872, "Pretrain/Step": 16630, "Pretrain/Step Time": 8.496295491233468} +{"Pretrain/Learning Rate": 2.118744916803722e-06, "Pretrain/Loss": 1.9988205432891846, "Pretrain/Loss (Raw)": 2.067909002304077, "Pretrain/Step": 16631, "Pretrain/Step Time": 8.499707298353314} +{"Pretrain/Learning Rate": 2.1170349290770497e-06, "Pretrain/Loss": 1.9985097646713257, "Pretrain/Loss (Raw)": 1.969016194343567, "Pretrain/Step": 16632, "Pretrain/Step Time": 8.497675500810146} +{"Pretrain/Learning Rate": 2.115325601164539e-06, "Pretrain/Loss": 1.9979503154754639, "Pretrain/Loss (Raw)": 1.8724334239959717, "Pretrain/Step": 16633, "Pretrain/Step Time": 8.49816220253706} +{"Pretrain/Learning Rate": 2.1136169331154835e-06, "Pretrain/Loss": 1.9941072463989258, "Pretrain/Loss (Raw)": 1.7512449026107788, "Pretrain/Step": 16634, "Pretrain/Step Time": 8.496007272973657} +{"Pretrain/Learning Rate": 2.11190892497915e-06, "Pretrain/Loss": 1.99635648727417, "Pretrain/Loss (Raw)": 2.168586254119873, "Pretrain/Step": 16635, "Pretrain/Step Time": 8.495481755584478} +{"Pretrain/Learning Rate": 2.110201576804788e-06, "Pretrain/Loss": 1.9981260299682617, "Pretrain/Loss (Raw)": 2.0323307514190674, "Pretrain/Step": 16636, "Pretrain/Step Time": 8.494161074981093} +{"Pretrain/Learning Rate": 2.1084948886416295e-06, "Pretrain/Loss": 2.0020318031311035, "Pretrain/Loss (Raw)": 2.2877390384674072, "Pretrain/Step": 16637, "Pretrain/Step Time": 8.4966352134943} +{"Pretrain/Learning Rate": 2.1067888605388774e-06, "Pretrain/Loss": 2.001152992248535, "Pretrain/Loss (Raw)": 1.9204879999160767, "Pretrain/Step": 16638, "Pretrain/Step Time": 8.496908342465758} +{"Pretrain/Learning Rate": 2.1050834925457368e-06, "Pretrain/Loss": 1.9950149059295654, "Pretrain/Loss (Raw)": 1.5165438652038574, "Pretrain/Step": 16639, "Pretrain/Step Time": 8.502629214897752} +{"Pretrain/Learning Rate": 2.1033787847113685e-06, "Pretrain/Loss": 1.9935181140899658, "Pretrain/Loss (Raw)": 1.8297683000564575, "Pretrain/Step": 16640, "Pretrain/Step Time": 8.502739030867815} +{"Pretrain/Learning Rate": 2.1016747370849353e-06, "Pretrain/Loss": 1.9943013191223145, "Pretrain/Loss (Raw)": 2.013789415359497, "Pretrain/Step": 16641, "Pretrain/Step Time": 8.49984927661717} +{"Pretrain/Learning Rate": 2.0999713497155683e-06, "Pretrain/Loss": 1.9946975708007812, "Pretrain/Loss (Raw)": 1.9002901315689087, "Pretrain/Step": 16642, "Pretrain/Step Time": 8.497712889686227} +{"Pretrain/Learning Rate": 2.0982686226523803e-06, "Pretrain/Loss": 1.9968887567520142, "Pretrain/Loss (Raw)": 2.2064437866210938, "Pretrain/Step": 16643, "Pretrain/Step Time": 8.497289603576064} +{"Pretrain/Learning Rate": 2.0965665559444763e-06, "Pretrain/Loss": 1.9990389347076416, "Pretrain/Loss (Raw)": 2.09831166267395, "Pretrain/Step": 16644, "Pretrain/Step Time": 8.49550231359899} +{"Pretrain/Learning Rate": 2.0948651496409263e-06, "Pretrain/Loss": 2.0009689331054688, "Pretrain/Loss (Raw)": 2.0346806049346924, "Pretrain/Step": 16645, "Pretrain/Step Time": 8.49507450684905} +{"Pretrain/Learning Rate": 2.0931644037907983e-06, "Pretrain/Loss": 2.0035343170166016, "Pretrain/Loss (Raw)": 2.188171148300171, "Pretrain/Step": 16646, "Pretrain/Step Time": 8.496927941218019} +{"Pretrain/Learning Rate": 2.091464318443118e-06, "Pretrain/Loss": 2.0027527809143066, "Pretrain/Loss (Raw)": 1.9847328662872314, "Pretrain/Step": 16647, "Pretrain/Step Time": 8.499711342155933} +{"Pretrain/Learning Rate": 2.0897648936469226e-06, "Pretrain/Loss": 2.003023862838745, "Pretrain/Loss (Raw)": 2.1267571449279785, "Pretrain/Step": 16648, "Pretrain/Step Time": 8.49476832151413} +{"Pretrain/Learning Rate": 2.088066129451205e-06, "Pretrain/Loss": 2.003561496734619, "Pretrain/Loss (Raw)": 1.896795392036438, "Pretrain/Step": 16649, "Pretrain/Step Time": 8.496117169037461} +{"Pretrain/Learning Rate": 2.0863680259049416e-06, "Pretrain/Loss": 2.00175142288208, "Pretrain/Loss (Raw)": 2.02315616607666, "Pretrain/Step": 16650, "Pretrain/Step Time": 8.493307318538427} +{"Pretrain/Learning Rate": 2.0846705830571106e-06, "Pretrain/Loss": 2.000448226928711, "Pretrain/Loss (Raw)": 1.9931889772415161, "Pretrain/Step": 16651, "Pretrain/Step Time": 8.49239033460617} +{"Pretrain/Learning Rate": 2.0829738009566446e-06, "Pretrain/Loss": 1.9983489513397217, "Pretrain/Loss (Raw)": 1.8924150466918945, "Pretrain/Step": 16652, "Pretrain/Step Time": 8.491104459390044} +{"Pretrain/Learning Rate": 2.081277679652477e-06, "Pretrain/Loss": 1.9980645179748535, "Pretrain/Loss (Raw)": 1.8210688829421997, "Pretrain/Step": 16653, "Pretrain/Step Time": 8.48978828266263} +{"Pretrain/Learning Rate": 2.07958221919351e-06, "Pretrain/Loss": 1.9997565746307373, "Pretrain/Loss (Raw)": 1.9590445756912231, "Pretrain/Step": 16654, "Pretrain/Step Time": 8.49580148793757} +{"Pretrain/Learning Rate": 2.0778874196286296e-06, "Pretrain/Loss": 2.000044107437134, "Pretrain/Loss (Raw)": 1.940146803855896, "Pretrain/Step": 16655, "Pretrain/Step Time": 8.495466284453869} +{"Pretrain/Learning Rate": 2.076193281006708e-06, "Pretrain/Loss": 1.9988406896591187, "Pretrain/Loss (Raw)": 1.805586814880371, "Pretrain/Step": 16656, "Pretrain/Step Time": 8.497404545545578} +{"Pretrain/Learning Rate": 2.074499803376592e-06, "Pretrain/Loss": 1.9987521171569824, "Pretrain/Loss (Raw)": 1.9268662929534912, "Pretrain/Step": 16657, "Pretrain/Step Time": 8.496591363102198} +{"Pretrain/Learning Rate": 2.072806986787115e-06, "Pretrain/Loss": 1.9985651969909668, "Pretrain/Loss (Raw)": 2.094090461730957, "Pretrain/Step": 16658, "Pretrain/Step Time": 8.492792524397373} +{"Pretrain/Learning Rate": 2.0711148312870854e-06, "Pretrain/Loss": 1.9983948469161987, "Pretrain/Loss (Raw)": 2.005101442337036, "Pretrain/Step": 16659, "Pretrain/Step Time": 8.49171482771635} +{"Pretrain/Learning Rate": 2.069423336925294e-06, "Pretrain/Loss": 1.9986419677734375, "Pretrain/Loss (Raw)": 1.873759388923645, "Pretrain/Step": 16660, "Pretrain/Step Time": 8.490517361089587} +{"Pretrain/Learning Rate": 2.0677325037505165e-06, "Pretrain/Loss": 1.9961663484573364, "Pretrain/Loss (Raw)": 1.9535375833511353, "Pretrain/Step": 16661, "Pretrain/Step Time": 8.490021688863635} +{"Pretrain/Learning Rate": 2.0660423318115047e-06, "Pretrain/Loss": 1.9979826211929321, "Pretrain/Loss (Raw)": 1.881170392036438, "Pretrain/Step": 16662, "Pretrain/Step Time": 8.495160425081849} +{"Pretrain/Learning Rate": 2.064352821156998e-06, "Pretrain/Loss": 1.9995800256729126, "Pretrain/Loss (Raw)": 2.285095691680908, "Pretrain/Step": 16663, "Pretrain/Step Time": 8.496867766603827} +{"Pretrain/Learning Rate": 2.06266397183571e-06, "Pretrain/Loss": 1.9993901252746582, "Pretrain/Loss (Raw)": 1.914023995399475, "Pretrain/Step": 16664, "Pretrain/Step Time": 8.49931145645678} +{"Pretrain/Learning Rate": 2.060975783896332e-06, "Pretrain/Loss": 2.0020885467529297, "Pretrain/Loss (Raw)": 2.1861658096313477, "Pretrain/Step": 16665, "Pretrain/Step Time": 8.501892112195492} +{"Pretrain/Learning Rate": 2.0592882573875485e-06, "Pretrain/Loss": 2.0030627250671387, "Pretrain/Loss (Raw)": 2.070406436920166, "Pretrain/Step": 16666, "Pretrain/Step Time": 8.500141683965921} +{"Pretrain/Learning Rate": 2.0576013923580133e-06, "Pretrain/Loss": 2.00108003616333, "Pretrain/Loss (Raw)": 1.847313404083252, "Pretrain/Step": 16667, "Pretrain/Step Time": 8.493107656016946} +{"Pretrain/Learning Rate": 2.055915188856375e-06, "Pretrain/Loss": 2.000929832458496, "Pretrain/Loss (Raw)": 1.9088488817214966, "Pretrain/Step": 16668, "Pretrain/Step Time": 8.489525441080332} +{"Pretrain/Learning Rate": 2.054229646931244e-06, "Pretrain/Loss": 2.0010645389556885, "Pretrain/Loss (Raw)": 2.004762649536133, "Pretrain/Step": 16669, "Pretrain/Step Time": 8.494790205731988} +{"Pretrain/Learning Rate": 2.052544766631223e-06, "Pretrain/Loss": 1.9993873834609985, "Pretrain/Loss (Raw)": 1.7753082513809204, "Pretrain/Step": 16670, "Pretrain/Step Time": 8.493089962750673} +{"Pretrain/Learning Rate": 2.0508605480049015e-06, "Pretrain/Loss": 2.0009500980377197, "Pretrain/Loss (Raw)": 2.331411361694336, "Pretrain/Step": 16671, "Pretrain/Step Time": 8.487655410543084} +{"Pretrain/Learning Rate": 2.049176991100832e-06, "Pretrain/Loss": 2.000129222869873, "Pretrain/Loss (Raw)": 1.9307589530944824, "Pretrain/Step": 16672, "Pretrain/Step Time": 8.486941920593381} +{"Pretrain/Learning Rate": 2.0474940959675727e-06, "Pretrain/Loss": 1.999948263168335, "Pretrain/Loss (Raw)": 1.928125262260437, "Pretrain/Step": 16673, "Pretrain/Step Time": 8.48795959353447} +{"Pretrain/Learning Rate": 2.0458118626536375e-06, "Pretrain/Loss": 2.001220941543579, "Pretrain/Loss (Raw)": 2.0404934883117676, "Pretrain/Step": 16674, "Pretrain/Step Time": 8.491709282621741} +{"Pretrain/Learning Rate": 2.0441302912075298e-06, "Pretrain/Loss": 2.0022873878479004, "Pretrain/Loss (Raw)": 2.0459039211273193, "Pretrain/Step": 16675, "Pretrain/Step Time": 8.489085171371698} +{"Pretrain/Learning Rate": 2.0424493816777496e-06, "Pretrain/Loss": 2.003671884536743, "Pretrain/Loss (Raw)": 1.9900668859481812, "Pretrain/Step": 16676, "Pretrain/Step Time": 8.486683085560799} +{"Pretrain/Learning Rate": 2.0407691341127575e-06, "Pretrain/Loss": 2.004258632659912, "Pretrain/Loss (Raw)": 2.1433775424957275, "Pretrain/Step": 16677, "Pretrain/Step Time": 8.485292507335544} +{"Pretrain/Learning Rate": 2.0390895485610017e-06, "Pretrain/Loss": 2.003021717071533, "Pretrain/Loss (Raw)": 1.8023658990859985, "Pretrain/Step": 16678, "Pretrain/Step Time": 8.49230552278459} +{"Pretrain/Learning Rate": 2.037410625070907e-06, "Pretrain/Loss": 2.0033082962036133, "Pretrain/Loss (Raw)": 1.8183642625808716, "Pretrain/Step": 16679, "Pretrain/Step Time": 8.491592613980174} +{"Pretrain/Learning Rate": 2.0357323636908956e-06, "Pretrain/Loss": 2.0028793811798096, "Pretrain/Loss (Raw)": 1.9862416982650757, "Pretrain/Step": 16680, "Pretrain/Step Time": 8.490052007138729} +{"Pretrain/Learning Rate": 2.0340547644693506e-06, "Pretrain/Loss": 2.000283718109131, "Pretrain/Loss (Raw)": 2.0787277221679688, "Pretrain/Step": 16681, "Pretrain/Step Time": 8.490799127146602} +{"Pretrain/Learning Rate": 2.0323778274546428e-06, "Pretrain/Loss": 2.000765562057495, "Pretrain/Loss (Raw)": 2.062516212463379, "Pretrain/Step": 16682, "Pretrain/Step Time": 8.48899051360786} +{"Pretrain/Learning Rate": 2.030701552695136e-06, "Pretrain/Loss": 2.0010249614715576, "Pretrain/Loss (Raw)": 1.9064302444458008, "Pretrain/Step": 16683, "Pretrain/Step Time": 8.48656765371561} +{"Pretrain/Learning Rate": 2.029025940239149e-06, "Pretrain/Loss": 2.0009875297546387, "Pretrain/Loss (Raw)": 2.026698112487793, "Pretrain/Step": 16684, "Pretrain/Step Time": 8.480207197368145} +{"Pretrain/Learning Rate": 2.027350990135013e-06, "Pretrain/Loss": 1.9961321353912354, "Pretrain/Loss (Raw)": 1.5757704973220825, "Pretrain/Step": 16685, "Pretrain/Step Time": 8.485443010926247} +{"Pretrain/Learning Rate": 2.0256767024310147e-06, "Pretrain/Loss": 1.9982597827911377, "Pretrain/Loss (Raw)": 2.137080669403076, "Pretrain/Step": 16686, "Pretrain/Step Time": 8.486603830009699} +{"Pretrain/Learning Rate": 2.024003077175429e-06, "Pretrain/Loss": 1.999147653579712, "Pretrain/Loss (Raw)": 2.172450065612793, "Pretrain/Step": 16687, "Pretrain/Step Time": 8.483506022021174} +{"Pretrain/Learning Rate": 2.0223301144165237e-06, "Pretrain/Loss": 1.9978471994400024, "Pretrain/Loss (Raw)": 1.8653693199157715, "Pretrain/Step": 16688, "Pretrain/Step Time": 8.486278438940644} +{"Pretrain/Learning Rate": 2.0206578142025256e-06, "Pretrain/Loss": 1.9985191822052002, "Pretrain/Loss (Raw)": 1.8137249946594238, "Pretrain/Step": 16689, "Pretrain/Step Time": 8.484785787761211} +{"Pretrain/Learning Rate": 2.0189861765816638e-06, "Pretrain/Loss": 1.9999792575836182, "Pretrain/Loss (Raw)": 2.161571741104126, "Pretrain/Step": 16690, "Pretrain/Step Time": 8.485167901962996} +{"Pretrain/Learning Rate": 2.017315201602135e-06, "Pretrain/Loss": 1.9995144605636597, "Pretrain/Loss (Raw)": 1.8917430639266968, "Pretrain/Step": 16691, "Pretrain/Step Time": 8.487564746290445} +{"Pretrain/Learning Rate": 2.0156448893121184e-06, "Pretrain/Loss": 2.0004851818084717, "Pretrain/Loss (Raw)": 2.0657145977020264, "Pretrain/Step": 16692, "Pretrain/Step Time": 8.483921000733972} +{"Pretrain/Learning Rate": 2.013975239759783e-06, "Pretrain/Loss": 1.999435305595398, "Pretrain/Loss (Raw)": 2.0087502002716064, "Pretrain/Step": 16693, "Pretrain/Step Time": 8.490806490182877} +{"Pretrain/Learning Rate": 2.0123062529932596e-06, "Pretrain/Loss": 1.9964927434921265, "Pretrain/Loss (Raw)": 1.9442418813705444, "Pretrain/Step": 16694, "Pretrain/Step Time": 8.492149997502565} +{"Pretrain/Learning Rate": 2.010637929060688e-06, "Pretrain/Loss": 1.9976742267608643, "Pretrain/Loss (Raw)": 1.9650776386260986, "Pretrain/Step": 16695, "Pretrain/Step Time": 8.489360375329852} +{"Pretrain/Learning Rate": 2.008970268010163e-06, "Pretrain/Loss": 1.9950697422027588, "Pretrain/Loss (Raw)": 1.7886700630187988, "Pretrain/Step": 16696, "Pretrain/Step Time": 8.496351197361946} +{"Pretrain/Learning Rate": 2.007303269889768e-06, "Pretrain/Loss": 1.9940698146820068, "Pretrain/Loss (Raw)": 1.7960013151168823, "Pretrain/Step": 16697, "Pretrain/Step Time": 8.49280241690576} +{"Pretrain/Learning Rate": 2.005636934747582e-06, "Pretrain/Loss": 1.9930542707443237, "Pretrain/Loss (Raw)": 1.8926408290863037, "Pretrain/Step": 16698, "Pretrain/Step Time": 8.494015356525779} +{"Pretrain/Learning Rate": 2.0039712626316375e-06, "Pretrain/Loss": 1.9918830394744873, "Pretrain/Loss (Raw)": 1.8889063596725464, "Pretrain/Step": 16699, "Pretrain/Step Time": 8.48697423376143} +{"Pretrain/Learning Rate": 2.002306253589975e-06, "Pretrain/Loss": 1.990700125694275, "Pretrain/Loss (Raw)": 1.9616589546203613, "Pretrain/Step": 16700, "Pretrain/Step Time": 8.486411454156041} +{"Pretrain/Learning Rate": 2.000641907670603e-06, "Pretrain/Loss": 1.989108681678772, "Pretrain/Loss (Raw)": 1.8957006931304932, "Pretrain/Step": 16701, "Pretrain/Step Time": 8.48619306460023} +{"Pretrain/Learning Rate": 1.9989782249214995e-06, "Pretrain/Loss": 1.9905067682266235, "Pretrain/Loss (Raw)": 2.037966251373291, "Pretrain/Step": 16702, "Pretrain/Step Time": 8.492782037705183} +{"Pretrain/Learning Rate": 1.9973152053906515e-06, "Pretrain/Loss": 1.9920170307159424, "Pretrain/Loss (Raw)": 1.895177960395813, "Pretrain/Step": 16703, "Pretrain/Step Time": 8.490108696743846} +{"Pretrain/Learning Rate": 1.995652849125998e-06, "Pretrain/Loss": 1.9909905195236206, "Pretrain/Loss (Raw)": 2.0428669452667236, "Pretrain/Step": 16704, "Pretrain/Step Time": 8.488828340545297} +{"Pretrain/Learning Rate": 1.9939911561754815e-06, "Pretrain/Loss": 1.9864461421966553, "Pretrain/Loss (Raw)": 1.6251965761184692, "Pretrain/Step": 16705, "Pretrain/Step Time": 8.496873129159212} +{"Pretrain/Learning Rate": 1.992330126587011e-06, "Pretrain/Loss": 1.9865505695343018, "Pretrain/Loss (Raw)": 1.9174765348434448, "Pretrain/Step": 16706, "Pretrain/Step Time": 8.496949827298522} +{"Pretrain/Learning Rate": 1.990669760408481e-06, "Pretrain/Loss": 1.9897119998931885, "Pretrain/Loss (Raw)": 2.2192866802215576, "Pretrain/Step": 16707, "Pretrain/Step Time": 8.494024766609073} +{"Pretrain/Learning Rate": 1.9890100576877707e-06, "Pretrain/Loss": 1.9898576736450195, "Pretrain/Loss (Raw)": 1.8927499055862427, "Pretrain/Step": 16708, "Pretrain/Step Time": 8.494504995644093} +{"Pretrain/Learning Rate": 1.987351018472727e-06, "Pretrain/Loss": 1.9882018566131592, "Pretrain/Loss (Raw)": 1.873258352279663, "Pretrain/Step": 16709, "Pretrain/Step Time": 8.494924049824476} +{"Pretrain/Learning Rate": 1.9856926428112014e-06, "Pretrain/Loss": 1.9908679723739624, "Pretrain/Loss (Raw)": 2.300572395324707, "Pretrain/Step": 16710, "Pretrain/Step Time": 8.496142806485295} +{"Pretrain/Learning Rate": 1.984034930750997e-06, "Pretrain/Loss": 1.98787522315979, "Pretrain/Loss (Raw)": 2.0241806507110596, "Pretrain/Step": 16711, "Pretrain/Step Time": 8.499153383076191} +{"Pretrain/Learning Rate": 1.982377882339928e-06, "Pretrain/Loss": 1.9879108667373657, "Pretrain/Loss (Raw)": 2.0683929920196533, "Pretrain/Step": 16712, "Pretrain/Step Time": 8.499869113788009} +{"Pretrain/Learning Rate": 1.980721497625765e-06, "Pretrain/Loss": 1.986793041229248, "Pretrain/Loss (Raw)": 1.9386887550354004, "Pretrain/Step": 16713, "Pretrain/Step Time": 8.499673577025533} +{"Pretrain/Learning Rate": 1.9790657766562635e-06, "Pretrain/Loss": 1.986548900604248, "Pretrain/Loss (Raw)": 1.9131629467010498, "Pretrain/Step": 16714, "Pretrain/Step Time": 8.501072438433766} +{"Pretrain/Learning Rate": 1.977410719479178e-06, "Pretrain/Loss": 1.9862287044525146, "Pretrain/Loss (Raw)": 2.143697500228882, "Pretrain/Step": 16715, "Pretrain/Step Time": 8.49921951815486} +{"Pretrain/Learning Rate": 1.9757563261422223e-06, "Pretrain/Loss": 1.9882280826568604, "Pretrain/Loss (Raw)": 2.111955404281616, "Pretrain/Step": 16716, "Pretrain/Step Time": 8.49892227910459} +{"Pretrain/Learning Rate": 1.9741025966931033e-06, "Pretrain/Loss": 1.9888052940368652, "Pretrain/Loss (Raw)": 2.1027934551239014, "Pretrain/Step": 16717, "Pretrain/Step Time": 8.4978341832757} +{"Pretrain/Learning Rate": 1.9724495311795042e-06, "Pretrain/Loss": 1.9891114234924316, "Pretrain/Loss (Raw)": 2.047332763671875, "Pretrain/Step": 16718, "Pretrain/Step Time": 8.492838986217976} +{"Pretrain/Learning Rate": 1.970797129649085e-06, "Pretrain/Loss": 1.9847971200942993, "Pretrain/Loss (Raw)": 1.8324352502822876, "Pretrain/Step": 16719, "Pretrain/Step Time": 8.49166714027524} +{"Pretrain/Learning Rate": 1.9691453921495016e-06, "Pretrain/Loss": 1.983819603919983, "Pretrain/Loss (Raw)": 2.00643253326416, "Pretrain/Step": 16720, "Pretrain/Step Time": 8.500012956559658} +{"Pretrain/Learning Rate": 1.967494318728369e-06, "Pretrain/Loss": 1.9829206466674805, "Pretrain/Loss (Raw)": 1.7865604162216187, "Pretrain/Step": 16721, "Pretrain/Step Time": 8.499162688851357} +{"Pretrain/Learning Rate": 1.965843909433307e-06, "Pretrain/Loss": 1.98313570022583, "Pretrain/Loss (Raw)": 1.895734190940857, "Pretrain/Step": 16722, "Pretrain/Step Time": 8.49987062625587} +{"Pretrain/Learning Rate": 1.964194164311897e-06, "Pretrain/Loss": 1.9840049743652344, "Pretrain/Loss (Raw)": 2.165919303894043, "Pretrain/Step": 16723, "Pretrain/Step Time": 8.500975742936134} +{"Pretrain/Learning Rate": 1.962545083411704e-06, "Pretrain/Loss": 1.9866151809692383, "Pretrain/Loss (Raw)": 2.2730636596679688, "Pretrain/Step": 16724, "Pretrain/Step Time": 8.50205965526402} +{"Pretrain/Learning Rate": 1.9608966667802903e-06, "Pretrain/Loss": 1.984999179840088, "Pretrain/Loss (Raw)": 1.7371306419372559, "Pretrain/Step": 16725, "Pretrain/Step Time": 8.503011191263795} +{"Pretrain/Learning Rate": 1.9592489144651727e-06, "Pretrain/Loss": 1.9828009605407715, "Pretrain/Loss (Raw)": 2.0751490592956543, "Pretrain/Step": 16726, "Pretrain/Step Time": 8.499436881393194} +{"Pretrain/Learning Rate": 1.9576018265138747e-06, "Pretrain/Loss": 1.9832775592803955, "Pretrain/Loss (Raw)": 1.9299787282943726, "Pretrain/Step": 16727, "Pretrain/Step Time": 8.497841058298945} +{"Pretrain/Learning Rate": 1.9559554029738857e-06, "Pretrain/Loss": 1.9825727939605713, "Pretrain/Loss (Raw)": 2.120406150817871, "Pretrain/Step": 16728, "Pretrain/Step Time": 8.498732475563884} +{"Pretrain/Learning Rate": 1.954309643892671e-06, "Pretrain/Loss": 1.979529619216919, "Pretrain/Loss (Raw)": 1.75147545337677, "Pretrain/Step": 16729, "Pretrain/Step Time": 8.50225698389113} +{"Pretrain/Learning Rate": 1.9526645493176983e-06, "Pretrain/Loss": 1.980134129524231, "Pretrain/Loss (Raw)": 2.1395466327667236, "Pretrain/Step": 16730, "Pretrain/Step Time": 8.497137691825628} +{"Pretrain/Learning Rate": 1.9510201192963902e-06, "Pretrain/Loss": 1.9792943000793457, "Pretrain/Loss (Raw)": 1.8017449378967285, "Pretrain/Step": 16731, "Pretrain/Step Time": 8.49490712210536} +{"Pretrain/Learning Rate": 1.9493763538761726e-06, "Pretrain/Loss": 1.9775898456573486, "Pretrain/Loss (Raw)": 1.8748047351837158, "Pretrain/Step": 16732, "Pretrain/Step Time": 8.496471263468266} +{"Pretrain/Learning Rate": 1.947733253104439e-06, "Pretrain/Loss": 1.975083351135254, "Pretrain/Loss (Raw)": 1.7977896928787231, "Pretrain/Step": 16733, "Pretrain/Step Time": 8.4919970985502} +{"Pretrain/Learning Rate": 1.946090817028562e-06, "Pretrain/Loss": 1.9739041328430176, "Pretrain/Loss (Raw)": 1.8634499311447144, "Pretrain/Step": 16734, "Pretrain/Step Time": 8.491931937634945} +{"Pretrain/Learning Rate": 1.944449045695909e-06, "Pretrain/Loss": 1.9745762348175049, "Pretrain/Loss (Raw)": 1.8120818138122559, "Pretrain/Step": 16735, "Pretrain/Step Time": 8.487211683765054} +{"Pretrain/Learning Rate": 1.9428079391538097e-06, "Pretrain/Loss": 1.9728745222091675, "Pretrain/Loss (Raw)": 1.8914897441864014, "Pretrain/Step": 16736, "Pretrain/Step Time": 8.489649092778563} +{"Pretrain/Learning Rate": 1.941167497449595e-06, "Pretrain/Loss": 1.9697978496551514, "Pretrain/Loss (Raw)": 1.623548150062561, "Pretrain/Step": 16737, "Pretrain/Step Time": 8.486375039443374} +{"Pretrain/Learning Rate": 1.939527720630557e-06, "Pretrain/Loss": 1.967108130455017, "Pretrain/Loss (Raw)": 1.762974500656128, "Pretrain/Step": 16738, "Pretrain/Step Time": 8.487959031015635} +{"Pretrain/Learning Rate": 1.937888608743979e-06, "Pretrain/Loss": 1.965266227722168, "Pretrain/Loss (Raw)": 1.7189491987228394, "Pretrain/Step": 16739, "Pretrain/Step Time": 8.486921846866608} +{"Pretrain/Learning Rate": 1.9362501618371277e-06, "Pretrain/Loss": 1.9656651020050049, "Pretrain/Loss (Raw)": 2.088442087173462, "Pretrain/Step": 16740, "Pretrain/Step Time": 8.484540367498994} +{"Pretrain/Learning Rate": 1.934612379957243e-06, "Pretrain/Loss": 1.9682648181915283, "Pretrain/Loss (Raw)": 2.070451259613037, "Pretrain/Step": 16741, "Pretrain/Step Time": 8.483042733743787} +{"Pretrain/Learning Rate": 1.9329752631515513e-06, "Pretrain/Loss": 1.965518593788147, "Pretrain/Loss (Raw)": 1.8257946968078613, "Pretrain/Step": 16742, "Pretrain/Step Time": 8.484978584572673} +{"Pretrain/Learning Rate": 1.9313388114672563e-06, "Pretrain/Loss": 1.9645938873291016, "Pretrain/Loss (Raw)": 1.9901090860366821, "Pretrain/Step": 16743, "Pretrain/Step Time": 8.48450850136578} +{"Pretrain/Learning Rate": 1.929703024951543e-06, "Pretrain/Loss": 1.9655033349990845, "Pretrain/Loss (Raw)": 1.9544100761413574, "Pretrain/Step": 16744, "Pretrain/Step Time": 8.486685758456588} +{"Pretrain/Learning Rate": 1.9280679036515813e-06, "Pretrain/Loss": 1.962012767791748, "Pretrain/Loss (Raw)": 1.9411613941192627, "Pretrain/Step": 16745, "Pretrain/Step Time": 8.48023466579616} +{"Pretrain/Learning Rate": 1.9264334476145146e-06, "Pretrain/Loss": 1.9635568857192993, "Pretrain/Loss (Raw)": 1.86801016330719, "Pretrain/Step": 16746, "Pretrain/Step Time": 8.481602769345045} +{"Pretrain/Learning Rate": 1.9247996568874773e-06, "Pretrain/Loss": 1.9639403820037842, "Pretrain/Loss (Raw)": 2.083314895629883, "Pretrain/Step": 16747, "Pretrain/Step Time": 8.481442760676146} +{"Pretrain/Learning Rate": 1.923166531517573e-06, "Pretrain/Loss": 1.9629310369491577, "Pretrain/Loss (Raw)": 1.9161349534988403, "Pretrain/Step": 16748, "Pretrain/Step Time": 8.479199472814798} +{"Pretrain/Learning Rate": 1.921534071551892e-06, "Pretrain/Loss": 1.9635258913040161, "Pretrain/Loss (Raw)": 2.0930001735687256, "Pretrain/Step": 16749, "Pretrain/Step Time": 8.483497953042388} +{"Pretrain/Learning Rate": 1.919902277037511e-06, "Pretrain/Loss": 1.964966893196106, "Pretrain/Loss (Raw)": 2.0447585582733154, "Pretrain/Step": 16750, "Pretrain/Step Time": 8.483731172978878} +{"Pretrain/Learning Rate": 1.918271148021472e-06, "Pretrain/Loss": 1.969405174255371, "Pretrain/Loss (Raw)": 2.6018152236938477, "Pretrain/Step": 16751, "Pretrain/Step Time": 8.48320729099214} +{"Pretrain/Learning Rate": 1.916640684550816e-06, "Pretrain/Loss": 1.9661598205566406, "Pretrain/Loss (Raw)": 1.9704591035842896, "Pretrain/Step": 16752, "Pretrain/Step Time": 8.48480780981481} +{"Pretrain/Learning Rate": 1.9150108866725554e-06, "Pretrain/Loss": 1.9703447818756104, "Pretrain/Loss (Raw)": 2.370884418487549, "Pretrain/Step": 16753, "Pretrain/Step Time": 8.489546447992325} +{"Pretrain/Learning Rate": 1.913381754433677e-06, "Pretrain/Loss": 1.9705990552902222, "Pretrain/Loss (Raw)": 2.188413619995117, "Pretrain/Step": 16754, "Pretrain/Step Time": 8.49095700122416} +{"Pretrain/Learning Rate": 1.9117532878811655e-06, "Pretrain/Loss": 1.971578598022461, "Pretrain/Loss (Raw)": 2.1416237354278564, "Pretrain/Step": 16755, "Pretrain/Step Time": 8.492959154769778} +{"Pretrain/Learning Rate": 1.9101254870619646e-06, "Pretrain/Loss": 1.9717549085617065, "Pretrain/Loss (Raw)": 1.9383869171142578, "Pretrain/Step": 16756, "Pretrain/Step Time": 8.498118476942182} +{"Pretrain/Learning Rate": 1.908498352023025e-06, "Pretrain/Loss": 1.9708788394927979, "Pretrain/Loss (Raw)": 2.00596022605896, "Pretrain/Step": 16757, "Pretrain/Step Time": 8.498665392398834} +{"Pretrain/Learning Rate": 1.9068718828112564e-06, "Pretrain/Loss": 1.9760792255401611, "Pretrain/Loss (Raw)": 1.8859533071517944, "Pretrain/Step": 16758, "Pretrain/Step Time": 8.496205063536763} +{"Pretrain/Learning Rate": 1.905246079473555e-06, "Pretrain/Loss": 1.9750479459762573, "Pretrain/Loss (Raw)": 1.9359034299850464, "Pretrain/Step": 16759, "Pretrain/Step Time": 8.491838049143553} +{"Pretrain/Learning Rate": 1.9036209420568052e-06, "Pretrain/Loss": 1.9768569469451904, "Pretrain/Loss (Raw)": 2.2005648612976074, "Pretrain/Step": 16760, "Pretrain/Step Time": 8.495749525725842} +{"Pretrain/Learning Rate": 1.9019964706078614e-06, "Pretrain/Loss": 1.9773987531661987, "Pretrain/Loss (Raw)": 1.9417897462844849, "Pretrain/Step": 16761, "Pretrain/Step Time": 8.502138253301382} +{"Pretrain/Learning Rate": 1.9003726651735692e-06, "Pretrain/Loss": 1.979744553565979, "Pretrain/Loss (Raw)": 2.051502227783203, "Pretrain/Step": 16762, "Pretrain/Step Time": 8.499218937009573} +{"Pretrain/Learning Rate": 1.8987495258007414e-06, "Pretrain/Loss": 1.9789230823516846, "Pretrain/Loss (Raw)": 2.0634233951568604, "Pretrain/Step": 16763, "Pretrain/Step Time": 8.500278249382973} +{"Pretrain/Learning Rate": 1.8971270525361906e-06, "Pretrain/Loss": 1.9791947603225708, "Pretrain/Loss (Raw)": 2.0671205520629883, "Pretrain/Step": 16764, "Pretrain/Step Time": 8.499815287068486} +{"Pretrain/Learning Rate": 1.8955052454266958e-06, "Pretrain/Loss": 1.976332664489746, "Pretrain/Loss (Raw)": 1.9213957786560059, "Pretrain/Step": 16765, "Pretrain/Step Time": 8.494781084358692} +{"Pretrain/Learning Rate": 1.8938841045190143e-06, "Pretrain/Loss": 1.9767035245895386, "Pretrain/Loss (Raw)": 1.9679478406906128, "Pretrain/Step": 16766, "Pretrain/Step Time": 8.496457712724805} +{"Pretrain/Learning Rate": 1.8922636298599e-06, "Pretrain/Loss": 1.9801836013793945, "Pretrain/Loss (Raw)": 1.9619860649108887, "Pretrain/Step": 16767, "Pretrain/Step Time": 8.494421249255538} +{"Pretrain/Learning Rate": 1.8906438214960686e-06, "Pretrain/Loss": 1.9809757471084595, "Pretrain/Loss (Raw)": 1.9311625957489014, "Pretrain/Step": 16768, "Pretrain/Step Time": 8.49648792296648} +{"Pretrain/Learning Rate": 1.8890246794742384e-06, "Pretrain/Loss": 1.9809945821762085, "Pretrain/Loss (Raw)": 2.01621413230896, "Pretrain/Step": 16769, "Pretrain/Step Time": 8.502875111997128} +{"Pretrain/Learning Rate": 1.8874062038410856e-06, "Pretrain/Loss": 1.9815417528152466, "Pretrain/Loss (Raw)": 1.9703279733657837, "Pretrain/Step": 16770, "Pretrain/Step Time": 8.501612255349755} +{"Pretrain/Learning Rate": 1.8857883946432813e-06, "Pretrain/Loss": 1.9794466495513916, "Pretrain/Loss (Raw)": 1.9382573366165161, "Pretrain/Step": 16771, "Pretrain/Step Time": 8.502410588786006} +{"Pretrain/Learning Rate": 1.8841712519274773e-06, "Pretrain/Loss": 1.9792078733444214, "Pretrain/Loss (Raw)": 2.067763328552246, "Pretrain/Step": 16772, "Pretrain/Step Time": 8.503481812775135} +{"Pretrain/Learning Rate": 1.8825547757402945e-06, "Pretrain/Loss": 1.9786162376403809, "Pretrain/Loss (Raw)": 1.958954930305481, "Pretrain/Step": 16773, "Pretrain/Step Time": 8.49780766479671} +{"Pretrain/Learning Rate": 1.8809389661283538e-06, "Pretrain/Loss": 1.977588415145874, "Pretrain/Loss (Raw)": 2.056596517562866, "Pretrain/Step": 16774, "Pretrain/Step Time": 8.495549287647009} +{"Pretrain/Learning Rate": 1.8793238231382375e-06, "Pretrain/Loss": 1.9779647588729858, "Pretrain/Loss (Raw)": 2.0329082012176514, "Pretrain/Step": 16775, "Pretrain/Step Time": 8.493569139391184} +{"Pretrain/Learning Rate": 1.877709346816517e-06, "Pretrain/Loss": 1.976426601409912, "Pretrain/Loss (Raw)": 1.9298629760742188, "Pretrain/Step": 16776, "Pretrain/Step Time": 8.497117640450597} +{"Pretrain/Learning Rate": 1.8760955372097515e-06, "Pretrain/Loss": 1.978910207748413, "Pretrain/Loss (Raw)": 2.214717388153076, "Pretrain/Step": 16777, "Pretrain/Step Time": 8.497737381607294} +{"Pretrain/Learning Rate": 1.8744823943644657e-06, "Pretrain/Loss": 1.978208065032959, "Pretrain/Loss (Raw)": 1.933261752128601, "Pretrain/Step": 16778, "Pretrain/Step Time": 8.500763919204473} +{"Pretrain/Learning Rate": 1.872869918327183e-06, "Pretrain/Loss": 1.9792160987854004, "Pretrain/Loss (Raw)": 2.1222293376922607, "Pretrain/Step": 16779, "Pretrain/Step Time": 8.500373251736164} +{"Pretrain/Learning Rate": 1.8712581091443888e-06, "Pretrain/Loss": 1.980247974395752, "Pretrain/Loss (Raw)": 2.0244951248168945, "Pretrain/Step": 16780, "Pretrain/Step Time": 8.496614748612046} +{"Pretrain/Learning Rate": 1.869646966862565e-06, "Pretrain/Loss": 1.9823070764541626, "Pretrain/Loss (Raw)": 2.084644079208374, "Pretrain/Step": 16781, "Pretrain/Step Time": 8.49651019461453} +{"Pretrain/Learning Rate": 1.8680364915281634e-06, "Pretrain/Loss": 1.984006404876709, "Pretrain/Loss (Raw)": 2.176532030105591, "Pretrain/Step": 16782, "Pretrain/Step Time": 8.489769905805588} +{"Pretrain/Learning Rate": 1.866426683187622e-06, "Pretrain/Loss": 1.9851515293121338, "Pretrain/Loss (Raw)": 2.086733341217041, "Pretrain/Step": 16783, "Pretrain/Step Time": 8.488410525023937} +{"Pretrain/Learning Rate": 1.864817541887362e-06, "Pretrain/Loss": 1.9845263957977295, "Pretrain/Loss (Raw)": 1.7255685329437256, "Pretrain/Step": 16784, "Pretrain/Step Time": 8.494026871398091} +{"Pretrain/Learning Rate": 1.863209067673774e-06, "Pretrain/Loss": 1.985098123550415, "Pretrain/Loss (Raw)": 2.0000438690185547, "Pretrain/Step": 16785, "Pretrain/Step Time": 8.494044221937656} +{"Pretrain/Learning Rate": 1.861601260593246e-06, "Pretrain/Loss": 1.9831327199935913, "Pretrain/Loss (Raw)": 1.8425205945968628, "Pretrain/Step": 16786, "Pretrain/Step Time": 8.494917504489422} +{"Pretrain/Learning Rate": 1.859994120692135e-06, "Pretrain/Loss": 1.982677936553955, "Pretrain/Loss (Raw)": 1.9469026327133179, "Pretrain/Step": 16787, "Pretrain/Step Time": 8.498169902712107} +{"Pretrain/Learning Rate": 1.8583876480167767e-06, "Pretrain/Loss": 1.9834638833999634, "Pretrain/Loss (Raw)": 1.9743436574935913, "Pretrain/Step": 16788, "Pretrain/Step Time": 8.499358559027314} +{"Pretrain/Learning Rate": 1.8567818426135004e-06, "Pretrain/Loss": 1.9833433628082275, "Pretrain/Loss (Raw)": 1.9381352663040161, "Pretrain/Step": 16789, "Pretrain/Step Time": 8.498574044555426} +{"Pretrain/Learning Rate": 1.8551767045286022e-06, "Pretrain/Loss": 1.9841976165771484, "Pretrain/Loss (Raw)": 1.9905015230178833, "Pretrain/Step": 16790, "Pretrain/Step Time": 8.492307348176837} +{"Pretrain/Learning Rate": 1.8535722338083704e-06, "Pretrain/Loss": 1.9835606813430786, "Pretrain/Loss (Raw)": 2.203564167022705, "Pretrain/Step": 16791, "Pretrain/Step Time": 8.490204242989421} +{"Pretrain/Learning Rate": 1.8519684304990653e-06, "Pretrain/Loss": 1.9850565195083618, "Pretrain/Loss (Raw)": 2.1054904460906982, "Pretrain/Step": 16792, "Pretrain/Step Time": 8.491559011861682} +{"Pretrain/Learning Rate": 1.8503652946469303e-06, "Pretrain/Loss": 1.985409140586853, "Pretrain/Loss (Raw)": 2.231318235397339, "Pretrain/Step": 16793, "Pretrain/Step Time": 8.48859565705061} +{"Pretrain/Learning Rate": 1.8487628262981948e-06, "Pretrain/Loss": 1.9858999252319336, "Pretrain/Loss (Raw)": 2.133211612701416, "Pretrain/Step": 16794, "Pretrain/Step Time": 8.49174347706139} +{"Pretrain/Learning Rate": 1.8471610254990613e-06, "Pretrain/Loss": 1.9858794212341309, "Pretrain/Loss (Raw)": 1.8446851968765259, "Pretrain/Step": 16795, "Pretrain/Step Time": 8.491888668388128} +{"Pretrain/Learning Rate": 1.8455598922957201e-06, "Pretrain/Loss": 1.9848685264587402, "Pretrain/Loss (Raw)": 1.7794462442398071, "Pretrain/Step": 16796, "Pretrain/Step Time": 8.492254117503762} +{"Pretrain/Learning Rate": 1.8439594267343374e-06, "Pretrain/Loss": 1.9853533506393433, "Pretrain/Loss (Raw)": 2.0668489933013916, "Pretrain/Step": 16797, "Pretrain/Step Time": 8.490261347964406} +{"Pretrain/Learning Rate": 1.842359628861054e-06, "Pretrain/Loss": 1.9861717224121094, "Pretrain/Loss (Raw)": 1.880033254623413, "Pretrain/Step": 16798, "Pretrain/Step Time": 8.493885468691587} +{"Pretrain/Learning Rate": 1.8407604987220133e-06, "Pretrain/Loss": 1.9813220500946045, "Pretrain/Loss (Raw)": 1.7106765508651733, "Pretrain/Step": 16799, "Pretrain/Step Time": 8.491960313171148} +{"Pretrain/Learning Rate": 1.8391620363633094e-06, "Pretrain/Loss": 1.9838485717773438, "Pretrain/Loss (Raw)": 2.2541463375091553, "Pretrain/Step": 16800, "Pretrain/Step Time": 8.495721792802215} +{"Pretrain/Learning Rate": 1.8375642418310496e-06, "Pretrain/Loss": 1.9834840297698975, "Pretrain/Loss (Raw)": 1.8814563751220703, "Pretrain/Step": 16801, "Pretrain/Step Time": 8.490013247355819} +{"Pretrain/Learning Rate": 1.8359671151712916e-06, "Pretrain/Loss": 1.985358715057373, "Pretrain/Loss (Raw)": 2.2804532051086426, "Pretrain/Step": 16802, "Pretrain/Step Time": 8.493513138964772} +{"Pretrain/Learning Rate": 1.8343706564300927e-06, "Pretrain/Loss": 1.9839658737182617, "Pretrain/Loss (Raw)": 1.8676289319992065, "Pretrain/Step": 16803, "Pretrain/Step Time": 8.49354655481875} +{"Pretrain/Learning Rate": 1.832774865653486e-06, "Pretrain/Loss": 1.9838981628417969, "Pretrain/Loss (Raw)": 1.981378197669983, "Pretrain/Step": 16804, "Pretrain/Step Time": 8.4946198053658} +{"Pretrain/Learning Rate": 1.8311797428874817e-06, "Pretrain/Loss": 1.9815350770950317, "Pretrain/Loss (Raw)": 1.8409253358840942, "Pretrain/Step": 16805, "Pretrain/Step Time": 8.495825659483671} +{"Pretrain/Learning Rate": 1.8295852881780817e-06, "Pretrain/Loss": 1.982557773590088, "Pretrain/Loss (Raw)": 1.9332648515701294, "Pretrain/Step": 16806, "Pretrain/Step Time": 8.4915872476995} +{"Pretrain/Learning Rate": 1.8279915015712522e-06, "Pretrain/Loss": 1.98787522315979, "Pretrain/Loss (Raw)": 2.499000310897827, "Pretrain/Step": 16807, "Pretrain/Step Time": 8.492611328139901} +{"Pretrain/Learning Rate": 1.8263983831129512e-06, "Pretrain/Loss": 1.9867202043533325, "Pretrain/Loss (Raw)": 1.8383907079696655, "Pretrain/Step": 16808, "Pretrain/Step Time": 8.493986532092094} +{"Pretrain/Learning Rate": 1.8248059328491217e-06, "Pretrain/Loss": 1.9868378639221191, "Pretrain/Loss (Raw)": 2.093808889389038, "Pretrain/Step": 16809, "Pretrain/Step Time": 8.492186959832907} +{"Pretrain/Learning Rate": 1.8232141508256696e-06, "Pretrain/Loss": 1.9870645999908447, "Pretrain/Loss (Raw)": 2.0915095806121826, "Pretrain/Step": 16810, "Pretrain/Step Time": 8.49274849705398} +{"Pretrain/Learning Rate": 1.8216230370885017e-06, "Pretrain/Loss": 1.9867644309997559, "Pretrain/Loss (Raw)": 1.868022084236145, "Pretrain/Step": 16811, "Pretrain/Step Time": 8.491155920550227} +{"Pretrain/Learning Rate": 1.820032591683496e-06, "Pretrain/Loss": 1.9853407144546509, "Pretrain/Loss (Raw)": 1.8444565534591675, "Pretrain/Step": 16812, "Pretrain/Step Time": 8.490291357040405} +{"Pretrain/Learning Rate": 1.818442814656507e-06, "Pretrain/Loss": 1.9868489503860474, "Pretrain/Loss (Raw)": 1.768837332725525, "Pretrain/Step": 16813, "Pretrain/Step Time": 8.486511688679457} +{"Pretrain/Learning Rate": 1.8168537060533787e-06, "Pretrain/Loss": 1.9845035076141357, "Pretrain/Loss (Raw)": 1.8368586301803589, "Pretrain/Step": 16814, "Pretrain/Step Time": 8.486135508865118} +{"Pretrain/Learning Rate": 1.815265265919927e-06, "Pretrain/Loss": 1.9820884466171265, "Pretrain/Loss (Raw)": 1.8633337020874023, "Pretrain/Step": 16815, "Pretrain/Step Time": 8.489638829603791} +{"Pretrain/Learning Rate": 1.813677494301963e-06, "Pretrain/Loss": 1.9820133447647095, "Pretrain/Loss (Raw)": 1.8557448387145996, "Pretrain/Step": 16816, "Pretrain/Step Time": 8.488380087539554} +{"Pretrain/Learning Rate": 1.8120903912452636e-06, "Pretrain/Loss": 1.9838073253631592, "Pretrain/Loss (Raw)": 2.0433437824249268, "Pretrain/Step": 16817, "Pretrain/Step Time": 8.487410377711058} +{"Pretrain/Learning Rate": 1.810503956795584e-06, "Pretrain/Loss": 1.983887791633606, "Pretrain/Loss (Raw)": 2.171884059906006, "Pretrain/Step": 16818, "Pretrain/Step Time": 8.493667991831899} +{"Pretrain/Learning Rate": 1.8089181909986818e-06, "Pretrain/Loss": 1.9848501682281494, "Pretrain/Loss (Raw)": 2.014941453933716, "Pretrain/Step": 16819, "Pretrain/Step Time": 8.489978522062302} +{"Pretrain/Learning Rate": 1.8073330939002708e-06, "Pretrain/Loss": 1.984452486038208, "Pretrain/Loss (Raw)": 2.01478910446167, "Pretrain/Step": 16820, "Pretrain/Step Time": 8.494772471487522} +{"Pretrain/Learning Rate": 1.8057486655460643e-06, "Pretrain/Loss": 1.9839386940002441, "Pretrain/Loss (Raw)": 1.942983865737915, "Pretrain/Step": 16821, "Pretrain/Step Time": 8.494305051863194} +{"Pretrain/Learning Rate": 1.8041649059817422e-06, "Pretrain/Loss": 1.9837418794631958, "Pretrain/Loss (Raw)": 1.9190617799758911, "Pretrain/Step": 16822, "Pretrain/Step Time": 8.494273075833917} +{"Pretrain/Learning Rate": 1.8025818152529712e-06, "Pretrain/Loss": 1.9818247556686401, "Pretrain/Loss (Raw)": 1.719693660736084, "Pretrain/Step": 16823, "Pretrain/Step Time": 8.49338306300342} +{"Pretrain/Learning Rate": 1.8009993934054031e-06, "Pretrain/Loss": 1.9835494756698608, "Pretrain/Loss (Raw)": 2.009416103363037, "Pretrain/Step": 16824, "Pretrain/Step Time": 8.484856078401208} +{"Pretrain/Learning Rate": 1.7994176404846603e-06, "Pretrain/Loss": 1.9872241020202637, "Pretrain/Loss (Raw)": 2.266347646713257, "Pretrain/Step": 16825, "Pretrain/Step Time": 8.490188701078296} +{"Pretrain/Learning Rate": 1.7978365565363586e-06, "Pretrain/Loss": 1.9878385066986084, "Pretrain/Loss (Raw)": 1.9712892770767212, "Pretrain/Step": 16826, "Pretrain/Step Time": 8.487242545932531} +{"Pretrain/Learning Rate": 1.7962561416060842e-06, "Pretrain/Loss": 1.9889469146728516, "Pretrain/Loss (Raw)": 2.030785083770752, "Pretrain/Step": 16827, "Pretrain/Step Time": 8.487482216209173} +{"Pretrain/Learning Rate": 1.7946763957394002e-06, "Pretrain/Loss": 1.989640712738037, "Pretrain/Loss (Raw)": 2.0504767894744873, "Pretrain/Step": 16828, "Pretrain/Step Time": 8.4846181999892} +{"Pretrain/Learning Rate": 1.793097318981868e-06, "Pretrain/Loss": 1.989409327507019, "Pretrain/Loss (Raw)": 1.8660613298416138, "Pretrain/Step": 16829, "Pretrain/Step Time": 8.482721157371998} +{"Pretrain/Learning Rate": 1.7915189113790115e-06, "Pretrain/Loss": 1.989932656288147, "Pretrain/Loss (Raw)": 2.1049726009368896, "Pretrain/Step": 16830, "Pretrain/Step Time": 8.480294832959771} +{"Pretrain/Learning Rate": 1.7899411729763504e-06, "Pretrain/Loss": 1.9911646842956543, "Pretrain/Loss (Raw)": 2.0528945922851562, "Pretrain/Step": 16831, "Pretrain/Step Time": 8.483655652031302} +{"Pretrain/Learning Rate": 1.7883641038193733e-06, "Pretrain/Loss": 1.9917373657226562, "Pretrain/Loss (Raw)": 2.116136074066162, "Pretrain/Step": 16832, "Pretrain/Step Time": 8.484017040580511} +{"Pretrain/Learning Rate": 1.7867877039535492e-06, "Pretrain/Loss": 1.9943801164627075, "Pretrain/Loss (Raw)": 1.963475227355957, "Pretrain/Step": 16833, "Pretrain/Step Time": 8.477401811629534} +{"Pretrain/Learning Rate": 1.7852119734243444e-06, "Pretrain/Loss": 1.9948878288269043, "Pretrain/Loss (Raw)": 1.9824706315994263, "Pretrain/Step": 16834, "Pretrain/Step Time": 8.48080788180232} +{"Pretrain/Learning Rate": 1.7836369122771812e-06, "Pretrain/Loss": 1.992469072341919, "Pretrain/Loss (Raw)": 1.9096893072128296, "Pretrain/Step": 16835, "Pretrain/Step Time": 8.481877783313394} +{"Pretrain/Learning Rate": 1.7820625205574843e-06, "Pretrain/Loss": 1.9931786060333252, "Pretrain/Loss (Raw)": 1.9835723638534546, "Pretrain/Step": 16836, "Pretrain/Step Time": 8.485370561480522} +{"Pretrain/Learning Rate": 1.7804887983106478e-06, "Pretrain/Loss": 1.9938483238220215, "Pretrain/Loss (Raw)": 1.9589611291885376, "Pretrain/Step": 16837, "Pretrain/Step Time": 8.487314274534583} +{"Pretrain/Learning Rate": 1.7789157455820438e-06, "Pretrain/Loss": 1.9914401769638062, "Pretrain/Loss (Raw)": 1.9923487901687622, "Pretrain/Step": 16838, "Pretrain/Step Time": 8.48862073943019} +{"Pretrain/Learning Rate": 1.7773433624170389e-06, "Pretrain/Loss": 1.992613673210144, "Pretrain/Loss (Raw)": 2.174391508102417, "Pretrain/Step": 16839, "Pretrain/Step Time": 8.485372746363282} +{"Pretrain/Learning Rate": 1.7757716488609633e-06, "Pretrain/Loss": 1.9912077188491821, "Pretrain/Loss (Raw)": 1.8884159326553345, "Pretrain/Step": 16840, "Pretrain/Step Time": 8.483003847301006} +{"Pretrain/Learning Rate": 1.7742006049591447e-06, "Pretrain/Loss": 1.9906853437423706, "Pretrain/Loss (Raw)": 1.8718348741531372, "Pretrain/Step": 16841, "Pretrain/Step Time": 8.483880886808038} +{"Pretrain/Learning Rate": 1.7726302307568777e-06, "Pretrain/Loss": 1.989784836769104, "Pretrain/Loss (Raw)": 1.7978874444961548, "Pretrain/Step": 16842, "Pretrain/Step Time": 8.483163394033909} +{"Pretrain/Learning Rate": 1.7710605262994395e-06, "Pretrain/Loss": 1.98954176902771, "Pretrain/Loss (Raw)": 2.11257266998291, "Pretrain/Step": 16843, "Pretrain/Step Time": 8.490717245265841} +{"Pretrain/Learning Rate": 1.7694914916320997e-06, "Pretrain/Loss": 1.9885621070861816, "Pretrain/Loss (Raw)": 1.9865713119506836, "Pretrain/Step": 16844, "Pretrain/Step Time": 8.487446280196309} +{"Pretrain/Learning Rate": 1.7679231268000972e-06, "Pretrain/Loss": 1.9876718521118164, "Pretrain/Loss (Raw)": 1.9888341426849365, "Pretrain/Step": 16845, "Pretrain/Step Time": 8.486659349873662} +{"Pretrain/Learning Rate": 1.7663554318486514e-06, "Pretrain/Loss": 1.9864457845687866, "Pretrain/Loss (Raw)": 1.89041006565094, "Pretrain/Step": 16846, "Pretrain/Step Time": 8.489011235535145} +{"Pretrain/Learning Rate": 1.7647884068229676e-06, "Pretrain/Loss": 1.9907920360565186, "Pretrain/Loss (Raw)": 2.3887598514556885, "Pretrain/Step": 16847, "Pretrain/Step Time": 8.492978369817138} +{"Pretrain/Learning Rate": 1.763222051768232e-06, "Pretrain/Loss": 1.9902245998382568, "Pretrain/Loss (Raw)": 1.9337869882583618, "Pretrain/Step": 16848, "Pretrain/Step Time": 8.492649720981717} +{"Pretrain/Learning Rate": 1.7616563667296055e-06, "Pretrain/Loss": 1.9906336069107056, "Pretrain/Loss (Raw)": 1.8389310836791992, "Pretrain/Step": 16849, "Pretrain/Step Time": 8.495504166930914} +{"Pretrain/Learning Rate": 1.7600913517522383e-06, "Pretrain/Loss": 1.9911673069000244, "Pretrain/Loss (Raw)": 1.9640333652496338, "Pretrain/Step": 16850, "Pretrain/Step Time": 8.495981240645051} +{"Pretrain/Learning Rate": 1.7585270068812553e-06, "Pretrain/Loss": 1.9873464107513428, "Pretrain/Loss (Raw)": 1.6768410205841064, "Pretrain/Step": 16851, "Pretrain/Step Time": 8.49045423604548} +{"Pretrain/Learning Rate": 1.7569633321617569e-06, "Pretrain/Loss": 1.9869775772094727, "Pretrain/Loss (Raw)": 2.22587513923645, "Pretrain/Step": 16852, "Pretrain/Step Time": 8.493191186338663} +{"Pretrain/Learning Rate": 1.755400327638837e-06, "Pretrain/Loss": 1.990020513534546, "Pretrain/Loss (Raw)": 2.1266071796417236, "Pretrain/Step": 16853, "Pretrain/Step Time": 8.497233401983976} +{"Pretrain/Learning Rate": 1.7538379933575628e-06, "Pretrain/Loss": 1.9898629188537598, "Pretrain/Loss (Raw)": 2.054990530014038, "Pretrain/Step": 16854, "Pretrain/Step Time": 8.496117506176233} +{"Pretrain/Learning Rate": 1.752276329362984e-06, "Pretrain/Loss": 1.9903762340545654, "Pretrain/Loss (Raw)": 1.995676875114441, "Pretrain/Step": 16855, "Pretrain/Step Time": 8.49554742500186} +{"Pretrain/Learning Rate": 1.7507153357001287e-06, "Pretrain/Loss": 1.9898322820663452, "Pretrain/Loss (Raw)": 2.0507867336273193, "Pretrain/Step": 16856, "Pretrain/Step Time": 8.499243006110191} +{"Pretrain/Learning Rate": 1.7491550124140028e-06, "Pretrain/Loss": 1.9906857013702393, "Pretrain/Loss (Raw)": 1.86070716381073, "Pretrain/Step": 16857, "Pretrain/Step Time": 8.495340168476105} +{"Pretrain/Learning Rate": 1.7475953595496086e-06, "Pretrain/Loss": 1.9905452728271484, "Pretrain/Loss (Raw)": 2.1215624809265137, "Pretrain/Step": 16858, "Pretrain/Step Time": 8.495783876627684} +{"Pretrain/Learning Rate": 1.7460363771519023e-06, "Pretrain/Loss": 1.9896519184112549, "Pretrain/Loss (Raw)": 1.6873799562454224, "Pretrain/Step": 16859, "Pretrain/Step Time": 8.500644750893116} +{"Pretrain/Learning Rate": 1.7444780652658505e-06, "Pretrain/Loss": 1.9905847311019897, "Pretrain/Loss (Raw)": 1.9942303895950317, "Pretrain/Step": 16860, "Pretrain/Step Time": 8.50107428431511} +{"Pretrain/Learning Rate": 1.7429204239363783e-06, "Pretrain/Loss": 1.9907240867614746, "Pretrain/Loss (Raw)": 1.8156323432922363, "Pretrain/Step": 16861, "Pretrain/Step Time": 8.49959504045546} +{"Pretrain/Learning Rate": 1.7413634532083973e-06, "Pretrain/Loss": 1.990845799446106, "Pretrain/Loss (Raw)": 1.8790267705917358, "Pretrain/Step": 16862, "Pretrain/Step Time": 8.4972043056041} +{"Pretrain/Learning Rate": 1.7398071531268072e-06, "Pretrain/Loss": 1.9930297136306763, "Pretrain/Loss (Raw)": 2.0916144847869873, "Pretrain/Step": 16863, "Pretrain/Step Time": 8.498157639056444} +{"Pretrain/Learning Rate": 1.7382515237364782e-06, "Pretrain/Loss": 1.9925895929336548, "Pretrain/Loss (Raw)": 1.835159182548523, "Pretrain/Step": 16864, "Pretrain/Step Time": 8.500961190089583} +{"Pretrain/Learning Rate": 1.7366965650822714e-06, "Pretrain/Loss": 1.99448823928833, "Pretrain/Loss (Raw)": 1.8665707111358643, "Pretrain/Step": 16865, "Pretrain/Step Time": 8.501775812357664} +{"Pretrain/Learning Rate": 1.7351422772090203e-06, "Pretrain/Loss": 1.9958512783050537, "Pretrain/Loss (Raw)": 1.9374418258666992, "Pretrain/Step": 16866, "Pretrain/Step Time": 8.502462418749928} +{"Pretrain/Learning Rate": 1.7335886601615363e-06, "Pretrain/Loss": 1.9987409114837646, "Pretrain/Loss (Raw)": 2.0888233184814453, "Pretrain/Step": 16867, "Pretrain/Step Time": 8.504120720550418} +{"Pretrain/Learning Rate": 1.7320357139846283e-06, "Pretrain/Loss": 1.9979629516601562, "Pretrain/Loss (Raw)": 1.9888684749603271, "Pretrain/Step": 16868, "Pretrain/Step Time": 8.505987785756588} +{"Pretrain/Learning Rate": 1.73048343872306e-06, "Pretrain/Loss": 1.9967089891433716, "Pretrain/Loss (Raw)": 1.9099394083023071, "Pretrain/Step": 16869, "Pretrain/Step Time": 8.505035964772105} +{"Pretrain/Learning Rate": 1.7289318344216015e-06, "Pretrain/Loss": 1.997268795967102, "Pretrain/Loss (Raw)": 1.8974616527557373, "Pretrain/Step": 16870, "Pretrain/Step Time": 8.502420766279101} +{"Pretrain/Learning Rate": 1.727380901124992e-06, "Pretrain/Loss": 1.9989054203033447, "Pretrain/Loss (Raw)": 2.1995677947998047, "Pretrain/Step": 16871, "Pretrain/Step Time": 8.50116484425962} +{"Pretrain/Learning Rate": 1.7258306388779427e-06, "Pretrain/Loss": 2.0004220008850098, "Pretrain/Loss (Raw)": 2.148538589477539, "Pretrain/Step": 16872, "Pretrain/Step Time": 8.50362373702228} +{"Pretrain/Learning Rate": 1.7242810477251626e-06, "Pretrain/Loss": 2.0032315254211426, "Pretrain/Loss (Raw)": 2.300788640975952, "Pretrain/Step": 16873, "Pretrain/Step Time": 8.503858203068376} +{"Pretrain/Learning Rate": 1.7227321277113268e-06, "Pretrain/Loss": 2.0036721229553223, "Pretrain/Loss (Raw)": 1.9244170188903809, "Pretrain/Step": 16874, "Pretrain/Step Time": 8.505969328805804} +{"Pretrain/Learning Rate": 1.7211838788811052e-06, "Pretrain/Loss": 2.0021510124206543, "Pretrain/Loss (Raw)": 1.888617753982544, "Pretrain/Step": 16875, "Pretrain/Step Time": 8.50307060033083} +{"Pretrain/Learning Rate": 1.7196363012791345e-06, "Pretrain/Loss": 2.002289295196533, "Pretrain/Loss (Raw)": 1.9338278770446777, "Pretrain/Step": 16876, "Pretrain/Step Time": 8.505574794486165} +{"Pretrain/Learning Rate": 1.718089394950037e-06, "Pretrain/Loss": 2.0017993450164795, "Pretrain/Loss (Raw)": 2.030294418334961, "Pretrain/Step": 16877, "Pretrain/Step Time": 8.500708477571607} +{"Pretrain/Learning Rate": 1.7165431599384218e-06, "Pretrain/Loss": 2.002241611480713, "Pretrain/Loss (Raw)": 2.1013715267181396, "Pretrain/Step": 16878, "Pretrain/Step Time": 8.500600706785917} +{"Pretrain/Learning Rate": 1.714997596288867e-06, "Pretrain/Loss": 1.9962716102600098, "Pretrain/Loss (Raw)": 1.8376295566558838, "Pretrain/Step": 16879, "Pretrain/Step Time": 8.497230092063546} +{"Pretrain/Learning Rate": 1.713452704045948e-06, "Pretrain/Loss": 1.9954559803009033, "Pretrain/Loss (Raw)": 1.8660739660263062, "Pretrain/Step": 16880, "Pretrain/Step Time": 8.501640385016799} +{"Pretrain/Learning Rate": 1.7119084832542014e-06, "Pretrain/Loss": 1.9924085140228271, "Pretrain/Loss (Raw)": 1.9807958602905273, "Pretrain/Step": 16881, "Pretrain/Step Time": 8.49976484850049} +{"Pretrain/Learning Rate": 1.7103649339581528e-06, "Pretrain/Loss": 1.9932291507720947, "Pretrain/Loss (Raw)": 2.2934513092041016, "Pretrain/Step": 16882, "Pretrain/Step Time": 8.497688014060259} +{"Pretrain/Learning Rate": 1.7088220562023193e-06, "Pretrain/Loss": 1.993391752243042, "Pretrain/Loss (Raw)": 2.162443161010742, "Pretrain/Step": 16883, "Pretrain/Step Time": 8.49931245855987} +{"Pretrain/Learning Rate": 1.7072798500311764e-06, "Pretrain/Loss": 1.992762804031372, "Pretrain/Loss (Raw)": 1.857886791229248, "Pretrain/Step": 16884, "Pretrain/Step Time": 8.497195456176996} +{"Pretrain/Learning Rate": 1.7057383154892054e-06, "Pretrain/Loss": 1.9911631345748901, "Pretrain/Loss (Raw)": 1.801192045211792, "Pretrain/Step": 16885, "Pretrain/Step Time": 8.499175475910306} +{"Pretrain/Learning Rate": 1.7041974526208483e-06, "Pretrain/Loss": 1.9921414852142334, "Pretrain/Loss (Raw)": 2.0111939907073975, "Pretrain/Step": 16886, "Pretrain/Step Time": 8.500673521310091} +{"Pretrain/Learning Rate": 1.7026572614705277e-06, "Pretrain/Loss": 1.993547797203064, "Pretrain/Loss (Raw)": 2.115907907485962, "Pretrain/Step": 16887, "Pretrain/Step Time": 8.4991489443928} +{"Pretrain/Learning Rate": 1.7011177420826697e-06, "Pretrain/Loss": 1.991426706314087, "Pretrain/Loss (Raw)": 1.929064154624939, "Pretrain/Step": 16888, "Pretrain/Step Time": 8.49824097007513} +{"Pretrain/Learning Rate": 1.6995788945016494e-06, "Pretrain/Loss": 1.991438865661621, "Pretrain/Loss (Raw)": 1.943363070487976, "Pretrain/Step": 16889, "Pretrain/Step Time": 8.492746263742447} +{"Pretrain/Learning Rate": 1.6980407187718511e-06, "Pretrain/Loss": 1.9900718927383423, "Pretrain/Loss (Raw)": 1.8765122890472412, "Pretrain/Step": 16890, "Pretrain/Step Time": 8.493932943791151} +{"Pretrain/Learning Rate": 1.6965032149376225e-06, "Pretrain/Loss": 1.9905664920806885, "Pretrain/Loss (Raw)": 2.1267406940460205, "Pretrain/Step": 16891, "Pretrain/Step Time": 8.491048723459244} +{"Pretrain/Learning Rate": 1.694966383043292e-06, "Pretrain/Loss": 1.9882783889770508, "Pretrain/Loss (Raw)": 1.774245262145996, "Pretrain/Step": 16892, "Pretrain/Step Time": 8.49055390432477} +{"Pretrain/Learning Rate": 1.6934302231331828e-06, "Pretrain/Loss": 1.9891990423202515, "Pretrain/Loss (Raw)": 2.0392372608184814, "Pretrain/Step": 16893, "Pretrain/Step Time": 8.492158006876707} +{"Pretrain/Learning Rate": 1.6918947352515757e-06, "Pretrain/Loss": 1.9902076721191406, "Pretrain/Loss (Raw)": 2.0970590114593506, "Pretrain/Step": 16894, "Pretrain/Step Time": 8.491717336699367} +{"Pretrain/Learning Rate": 1.6903599194427578e-06, "Pretrain/Loss": 1.989187240600586, "Pretrain/Loss (Raw)": 1.8313590288162231, "Pretrain/Step": 16895, "Pretrain/Step Time": 8.489987034350634} +{"Pretrain/Learning Rate": 1.6888257757509795e-06, "Pretrain/Loss": 1.9888901710510254, "Pretrain/Loss (Raw)": 1.8931268453598022, "Pretrain/Step": 16896, "Pretrain/Step Time": 8.488187646493316} +{"Pretrain/Learning Rate": 1.6872923042204725e-06, "Pretrain/Loss": 1.9873697757720947, "Pretrain/Loss (Raw)": 1.8216272592544556, "Pretrain/Step": 16897, "Pretrain/Step Time": 8.482829447835684} +{"Pretrain/Learning Rate": 1.6857595048954621e-06, "Pretrain/Loss": 1.988086223602295, "Pretrain/Loss (Raw)": 2.0620131492614746, "Pretrain/Step": 16898, "Pretrain/Step Time": 8.484444115310907} +{"Pretrain/Learning Rate": 1.6842273778201356e-06, "Pretrain/Loss": 1.9887316226959229, "Pretrain/Loss (Raw)": 2.0208733081817627, "Pretrain/Step": 16899, "Pretrain/Step Time": 8.484149472787976} +{"Pretrain/Learning Rate": 1.6826959230386824e-06, "Pretrain/Loss": 1.9879531860351562, "Pretrain/Loss (Raw)": 1.9681370258331299, "Pretrain/Step": 16900, "Pretrain/Step Time": 8.484869601204991} +{"Pretrain/Learning Rate": 1.6811651405952533e-06, "Pretrain/Loss": 1.9886555671691895, "Pretrain/Loss (Raw)": 2.0488367080688477, "Pretrain/Step": 16901, "Pretrain/Step Time": 8.486352298408747} +{"Pretrain/Learning Rate": 1.6796350305339852e-06, "Pretrain/Loss": 1.9893763065338135, "Pretrain/Loss (Raw)": 2.148862361907959, "Pretrain/Step": 16902, "Pretrain/Step Time": 8.487709328532219} +{"Pretrain/Learning Rate": 1.6781055928990042e-06, "Pretrain/Loss": 1.989795207977295, "Pretrain/Loss (Raw)": 2.0865378379821777, "Pretrain/Step": 16903, "Pretrain/Step Time": 8.493086036294699} +{"Pretrain/Learning Rate": 1.6765768277344024e-06, "Pretrain/Loss": 1.9911967515945435, "Pretrain/Loss (Raw)": 2.1092498302459717, "Pretrain/Step": 16904, "Pretrain/Step Time": 8.49076054431498} +{"Pretrain/Learning Rate": 1.6750487350842725e-06, "Pretrain/Loss": 1.990558385848999, "Pretrain/Loss (Raw)": 2.133012533187866, "Pretrain/Step": 16905, "Pretrain/Step Time": 8.489398889243603} +{"Pretrain/Learning Rate": 1.6735213149926682e-06, "Pretrain/Loss": 1.9904460906982422, "Pretrain/Loss (Raw)": 1.9188761711120605, "Pretrain/Step": 16906, "Pretrain/Step Time": 8.485118916258216} +{"Pretrain/Learning Rate": 1.6719945675036292e-06, "Pretrain/Loss": 1.9901154041290283, "Pretrain/Loss (Raw)": 2.0799190998077393, "Pretrain/Step": 16907, "Pretrain/Step Time": 8.489387502893806} +{"Pretrain/Learning Rate": 1.670468492661187e-06, "Pretrain/Loss": 1.9897514581680298, "Pretrain/Loss (Raw)": 1.9779020547866821, "Pretrain/Step": 16908, "Pretrain/Step Time": 8.489676399156451} +{"Pretrain/Learning Rate": 1.6689430905093311e-06, "Pretrain/Loss": 1.988612413406372, "Pretrain/Loss (Raw)": 1.9388558864593506, "Pretrain/Step": 16909, "Pretrain/Step Time": 8.490415496751666} +{"Pretrain/Learning Rate": 1.6674183610920629e-06, "Pretrain/Loss": 1.984750747680664, "Pretrain/Loss (Raw)": 1.6822388172149658, "Pretrain/Step": 16910, "Pretrain/Step Time": 8.491306472569704} +{"Pretrain/Learning Rate": 1.665894304453336e-06, "Pretrain/Loss": 1.984339952468872, "Pretrain/Loss (Raw)": 2.0341484546661377, "Pretrain/Step": 16911, "Pretrain/Step Time": 8.494541944935918} +{"Pretrain/Learning Rate": 1.6643709206370927e-06, "Pretrain/Loss": 1.9863824844360352, "Pretrain/Loss (Raw)": 1.9869980812072754, "Pretrain/Step": 16912, "Pretrain/Step Time": 8.48749339953065} +{"Pretrain/Learning Rate": 1.6628482096872678e-06, "Pretrain/Loss": 1.988393783569336, "Pretrain/Loss (Raw)": 2.2574939727783203, "Pretrain/Step": 16913, "Pretrain/Step Time": 8.488740308210254} +{"Pretrain/Learning Rate": 1.661326171647759e-06, "Pretrain/Loss": 1.9905725717544556, "Pretrain/Loss (Raw)": 2.1214041709899902, "Pretrain/Step": 16914, "Pretrain/Step Time": 8.487779423594475} +{"Pretrain/Learning Rate": 1.6598048065624594e-06, "Pretrain/Loss": 1.9910075664520264, "Pretrain/Loss (Raw)": 2.002580165863037, "Pretrain/Step": 16915, "Pretrain/Step Time": 8.492748092859983} +{"Pretrain/Learning Rate": 1.6582841144752336e-06, "Pretrain/Loss": 1.9901838302612305, "Pretrain/Loss (Raw)": 1.8689074516296387, "Pretrain/Step": 16916, "Pretrain/Step Time": 8.491341212764382} +{"Pretrain/Learning Rate": 1.656764095429933e-06, "Pretrain/Loss": 1.9917380809783936, "Pretrain/Loss (Raw)": 2.1370928287506104, "Pretrain/Step": 16917, "Pretrain/Step Time": 8.490743432193995} +{"Pretrain/Learning Rate": 1.6552447494703833e-06, "Pretrain/Loss": 1.9909766912460327, "Pretrain/Loss (Raw)": 1.8930400609970093, "Pretrain/Step": 16918, "Pretrain/Step Time": 8.489141682162881} +{"Pretrain/Learning Rate": 1.653726076640391e-06, "Pretrain/Loss": 1.9891560077667236, "Pretrain/Loss (Raw)": 1.9705042839050293, "Pretrain/Step": 16919, "Pretrain/Step Time": 8.493711728602648} +{"Pretrain/Learning Rate": 1.652208076983755e-06, "Pretrain/Loss": 1.9885337352752686, "Pretrain/Loss (Raw)": 2.0258336067199707, "Pretrain/Step": 16920, "Pretrain/Step Time": 8.490249855443835} +{"Pretrain/Learning Rate": 1.6506907505442344e-06, "Pretrain/Loss": 1.9905022382736206, "Pretrain/Loss (Raw)": 2.4833052158355713, "Pretrain/Step": 16921, "Pretrain/Step Time": 8.493868051096797} +{"Pretrain/Learning Rate": 1.6491740973655883e-06, "Pretrain/Loss": 1.9899017810821533, "Pretrain/Loss (Raw)": 2.056352376937866, "Pretrain/Step": 16922, "Pretrain/Step Time": 8.492644699290395} +{"Pretrain/Learning Rate": 1.647658117491549e-06, "Pretrain/Loss": 1.991145372390747, "Pretrain/Loss (Raw)": 2.003861665725708, "Pretrain/Step": 16923, "Pretrain/Step Time": 8.494374234229326} +{"Pretrain/Learning Rate": 1.64614281096582e-06, "Pretrain/Loss": 1.9946472644805908, "Pretrain/Loss (Raw)": 2.2276997566223145, "Pretrain/Step": 16924, "Pretrain/Step Time": 8.493287282064557} +{"Pretrain/Learning Rate": 1.6446281778321026e-06, "Pretrain/Loss": 1.9941942691802979, "Pretrain/Loss (Raw)": 2.0088484287261963, "Pretrain/Step": 16925, "Pretrain/Step Time": 8.492618067190051} +{"Pretrain/Learning Rate": 1.6431142181340647e-06, "Pretrain/Loss": 1.9950287342071533, "Pretrain/Loss (Raw)": 1.9868413209915161, "Pretrain/Step": 16926, "Pretrain/Step Time": 8.491258664056659} +{"Pretrain/Learning Rate": 1.6416009319153658e-06, "Pretrain/Loss": 1.9957268238067627, "Pretrain/Loss (Raw)": 1.8000508546829224, "Pretrain/Step": 16927, "Pretrain/Step Time": 8.49074107222259} +{"Pretrain/Learning Rate": 1.6400883192196376e-06, "Pretrain/Loss": 1.9911366701126099, "Pretrain/Loss (Raw)": 1.6665894985198975, "Pretrain/Step": 16928, "Pretrain/Step Time": 8.493130063638091} +{"Pretrain/Learning Rate": 1.638576380090498e-06, "Pretrain/Loss": 1.9917964935302734, "Pretrain/Loss (Raw)": 1.9659144878387451, "Pretrain/Step": 16929, "Pretrain/Step Time": 8.497512739151716} +{"Pretrain/Learning Rate": 1.637065114571537e-06, "Pretrain/Loss": 1.98957359790802, "Pretrain/Loss (Raw)": 1.9959317445755005, "Pretrain/Step": 16930, "Pretrain/Step Time": 8.49269157461822} +{"Pretrain/Learning Rate": 1.6355545227063285e-06, "Pretrain/Loss": 1.9883689880371094, "Pretrain/Loss (Raw)": 1.7134350538253784, "Pretrain/Step": 16931, "Pretrain/Step Time": 8.493921615183353} +{"Pretrain/Learning Rate": 1.63404460453844e-06, "Pretrain/Loss": 1.986149549484253, "Pretrain/Loss (Raw)": 1.697303056716919, "Pretrain/Step": 16932, "Pretrain/Step Time": 8.4932720977813} +{"Pretrain/Learning Rate": 1.632535360111398e-06, "Pretrain/Loss": 1.9885859489440918, "Pretrain/Loss (Raw)": 2.152761697769165, "Pretrain/Step": 16933, "Pretrain/Step Time": 8.496742069721222} +{"Pretrain/Learning Rate": 1.6310267894687315e-06, "Pretrain/Loss": 1.9884779453277588, "Pretrain/Loss (Raw)": 1.9194459915161133, "Pretrain/Step": 16934, "Pretrain/Step Time": 8.491526952013373} +{"Pretrain/Learning Rate": 1.6295188926539335e-06, "Pretrain/Loss": 1.983866572380066, "Pretrain/Loss (Raw)": 1.9087470769882202, "Pretrain/Step": 16935, "Pretrain/Step Time": 8.495860882103443} +{"Pretrain/Learning Rate": 1.6280116697104802e-06, "Pretrain/Loss": 1.983529806137085, "Pretrain/Loss (Raw)": 1.795289397239685, "Pretrain/Step": 16936, "Pretrain/Step Time": 8.494283463805914} +{"Pretrain/Learning Rate": 1.6265051206818371e-06, "Pretrain/Loss": 1.9807325601577759, "Pretrain/Loss (Raw)": 1.7357598543167114, "Pretrain/Step": 16937, "Pretrain/Step Time": 8.495128694921732} +{"Pretrain/Learning Rate": 1.624999245611436e-06, "Pretrain/Loss": 1.9800665378570557, "Pretrain/Loss (Raw)": 2.006258964538574, "Pretrain/Step": 16938, "Pretrain/Step Time": 8.496435783803463} +{"Pretrain/Learning Rate": 1.6234940445427088e-06, "Pretrain/Loss": 1.9797184467315674, "Pretrain/Loss (Raw)": 1.823458194732666, "Pretrain/Step": 16939, "Pretrain/Step Time": 8.495571985840797} +{"Pretrain/Learning Rate": 1.6219895175190513e-06, "Pretrain/Loss": 1.9807772636413574, "Pretrain/Loss (Raw)": 1.9799830913543701, "Pretrain/Step": 16940, "Pretrain/Step Time": 8.499653415754437} +{"Pretrain/Learning Rate": 1.620485664583843e-06, "Pretrain/Loss": 1.9826693534851074, "Pretrain/Loss (Raw)": 2.01103138923645, "Pretrain/Step": 16941, "Pretrain/Step Time": 8.497416615486145} +{"Pretrain/Learning Rate": 1.6189824857804515e-06, "Pretrain/Loss": 1.9836554527282715, "Pretrain/Loss (Raw)": 1.9630661010742188, "Pretrain/Step": 16942, "Pretrain/Step Time": 8.498507659882307} +{"Pretrain/Learning Rate": 1.6174799811522117e-06, "Pretrain/Loss": 1.9837336540222168, "Pretrain/Loss (Raw)": 1.8733505010604858, "Pretrain/Step": 16943, "Pretrain/Step Time": 8.492940597236156} +{"Pretrain/Learning Rate": 1.6159781507424614e-06, "Pretrain/Loss": 1.9847397804260254, "Pretrain/Loss (Raw)": 1.984535574913025, "Pretrain/Step": 16944, "Pretrain/Step Time": 8.496026935055852} +{"Pretrain/Learning Rate": 1.6144769945944938e-06, "Pretrain/Loss": 1.982692003250122, "Pretrain/Loss (Raw)": 1.7812223434448242, "Pretrain/Step": 16945, "Pretrain/Step Time": 8.498086573556066} +{"Pretrain/Learning Rate": 1.6129765127515933e-06, "Pretrain/Loss": 1.9811965227127075, "Pretrain/Loss (Raw)": 1.9804764986038208, "Pretrain/Step": 16946, "Pretrain/Step Time": 8.492777314037085} +{"Pretrain/Learning Rate": 1.6114767052570311e-06, "Pretrain/Loss": 1.9838519096374512, "Pretrain/Loss (Raw)": 2.354822874069214, "Pretrain/Step": 16947, "Pretrain/Step Time": 8.494339153170586} +{"Pretrain/Learning Rate": 1.609977572154045e-06, "Pretrain/Loss": 1.9841670989990234, "Pretrain/Loss (Raw)": 2.055133581161499, "Pretrain/Step": 16948, "Pretrain/Step Time": 8.495547510683537} +{"Pretrain/Learning Rate": 1.6084791134858751e-06, "Pretrain/Loss": 1.984709620475769, "Pretrain/Loss (Raw)": 2.0124101638793945, "Pretrain/Step": 16949, "Pretrain/Step Time": 8.490412089973688} +{"Pretrain/Learning Rate": 1.6069813292957176e-06, "Pretrain/Loss": 1.9843077659606934, "Pretrain/Loss (Raw)": 1.867641806602478, "Pretrain/Step": 16950, "Pretrain/Step Time": 8.489767586812377} +{"Pretrain/Learning Rate": 1.6054842196267571e-06, "Pretrain/Loss": 1.9859511852264404, "Pretrain/Loss (Raw)": 1.9300529956817627, "Pretrain/Step": 16951, "Pretrain/Step Time": 8.491825725883245} +{"Pretrain/Learning Rate": 1.6039877845221735e-06, "Pretrain/Loss": 1.9876036643981934, "Pretrain/Loss (Raw)": 2.220935106277466, "Pretrain/Step": 16952, "Pretrain/Step Time": 8.496719559654593} +{"Pretrain/Learning Rate": 1.602492024025104e-06, "Pretrain/Loss": 1.9856176376342773, "Pretrain/Loss (Raw)": 2.012126922607422, "Pretrain/Step": 16953, "Pretrain/Step Time": 8.496858846396208} +{"Pretrain/Learning Rate": 1.6009969381786866e-06, "Pretrain/Loss": 1.98576021194458, "Pretrain/Loss (Raw)": 1.989542007446289, "Pretrain/Step": 16954, "Pretrain/Step Time": 8.497615026310086} +{"Pretrain/Learning Rate": 1.5995025270260256e-06, "Pretrain/Loss": 1.9852409362792969, "Pretrain/Loss (Raw)": 1.9643160104751587, "Pretrain/Step": 16955, "Pretrain/Step Time": 8.499138565734029} +{"Pretrain/Learning Rate": 1.5980087906102115e-06, "Pretrain/Loss": 1.9849776029586792, "Pretrain/Loss (Raw)": 2.016765832901001, "Pretrain/Step": 16956, "Pretrain/Step Time": 8.50094592757523} +{"Pretrain/Learning Rate": 1.596515728974321e-06, "Pretrain/Loss": 1.9865353107452393, "Pretrain/Loss (Raw)": 2.065432071685791, "Pretrain/Step": 16957, "Pretrain/Step Time": 8.500263683497906} +{"Pretrain/Learning Rate": 1.5950233421613947e-06, "Pretrain/Loss": 1.9875009059906006, "Pretrain/Loss (Raw)": 2.2285892963409424, "Pretrain/Step": 16958, "Pretrain/Step Time": 8.500641936436296} +{"Pretrain/Learning Rate": 1.593531630214476e-06, "Pretrain/Loss": 1.9872567653656006, "Pretrain/Loss (Raw)": 2.021653175354004, "Pretrain/Step": 16959, "Pretrain/Step Time": 8.496266931295395} +{"Pretrain/Learning Rate": 1.5920405931765748e-06, "Pretrain/Loss": 1.9850201606750488, "Pretrain/Loss (Raw)": 1.8298473358154297, "Pretrain/Step": 16960, "Pretrain/Step Time": 8.500684028491378} +{"Pretrain/Learning Rate": 1.5905502310906735e-06, "Pretrain/Loss": 1.9860759973526, "Pretrain/Loss (Raw)": 2.0986127853393555, "Pretrain/Step": 16961, "Pretrain/Step Time": 8.498518785461783} +{"Pretrain/Learning Rate": 1.5890605439997596e-06, "Pretrain/Loss": 1.9870057106018066, "Pretrain/Loss (Raw)": 2.10148024559021, "Pretrain/Step": 16962, "Pretrain/Step Time": 8.497677164152265} +{"Pretrain/Learning Rate": 1.587571531946777e-06, "Pretrain/Loss": 1.989391565322876, "Pretrain/Loss (Raw)": 2.215090036392212, "Pretrain/Step": 16963, "Pretrain/Step Time": 8.503224654123187} +{"Pretrain/Learning Rate": 1.5860831949746691e-06, "Pretrain/Loss": 1.9900078773498535, "Pretrain/Loss (Raw)": 2.062448024749756, "Pretrain/Step": 16964, "Pretrain/Step Time": 8.500836787745357} +{"Pretrain/Learning Rate": 1.5845955331263456e-06, "Pretrain/Loss": 1.9900758266448975, "Pretrain/Loss (Raw)": 1.9676421880722046, "Pretrain/Step": 16965, "Pretrain/Step Time": 8.500235801562667} +{"Pretrain/Learning Rate": 1.5831085464447004e-06, "Pretrain/Loss": 1.990686297416687, "Pretrain/Loss (Raw)": 2.070509910583496, "Pretrain/Step": 16966, "Pretrain/Step Time": 8.498508997261524} +{"Pretrain/Learning Rate": 1.5816222349726155e-06, "Pretrain/Loss": 1.9892573356628418, "Pretrain/Loss (Raw)": 1.9914941787719727, "Pretrain/Step": 16967, "Pretrain/Step Time": 8.499628942459822} +{"Pretrain/Learning Rate": 1.5801365987529404e-06, "Pretrain/Loss": 1.9894680976867676, "Pretrain/Loss (Raw)": 1.9153953790664673, "Pretrain/Step": 16968, "Pretrain/Step Time": 8.499504055827856} +{"Pretrain/Learning Rate": 1.578651637828521e-06, "Pretrain/Loss": 1.9895398616790771, "Pretrain/Loss (Raw)": 1.8809963464736938, "Pretrain/Step": 16969, "Pretrain/Step Time": 8.496746718883514} +{"Pretrain/Learning Rate": 1.5771673522421704e-06, "Pretrain/Loss": 1.9901108741760254, "Pretrain/Loss (Raw)": 1.8709837198257446, "Pretrain/Step": 16970, "Pretrain/Step Time": 8.497446751222014} +{"Pretrain/Learning Rate": 1.575683742036685e-06, "Pretrain/Loss": 1.99027681350708, "Pretrain/Loss (Raw)": 2.133807897567749, "Pretrain/Step": 16971, "Pretrain/Step Time": 8.492367772385478} +{"Pretrain/Learning Rate": 1.574200807254847e-06, "Pretrain/Loss": 1.9881739616394043, "Pretrain/Loss (Raw)": 1.7174081802368164, "Pretrain/Step": 16972, "Pretrain/Step Time": 8.493862384930253} +{"Pretrain/Learning Rate": 1.572718547939414e-06, "Pretrain/Loss": 1.9873464107513428, "Pretrain/Loss (Raw)": 1.8828972578048706, "Pretrain/Step": 16973, "Pretrain/Step Time": 8.495130626484752} +{"Pretrain/Learning Rate": 1.571236964133127e-06, "Pretrain/Loss": 1.9880461692810059, "Pretrain/Loss (Raw)": 1.980005145072937, "Pretrain/Step": 16974, "Pretrain/Step Time": 8.492084106430411} +{"Pretrain/Learning Rate": 1.5697560558787072e-06, "Pretrain/Loss": 1.9847455024719238, "Pretrain/Loss (Raw)": 1.9662784337997437, "Pretrain/Step": 16975, "Pretrain/Step Time": 8.492113279178739} +{"Pretrain/Learning Rate": 1.568275823218851e-06, "Pretrain/Loss": 1.986644983291626, "Pretrain/Loss (Raw)": 2.176917552947998, "Pretrain/Step": 16976, "Pretrain/Step Time": 8.485328847542405} +{"Pretrain/Learning Rate": 1.5667962661962465e-06, "Pretrain/Loss": 1.9872227907180786, "Pretrain/Loss (Raw)": 1.9128762483596802, "Pretrain/Step": 16977, "Pretrain/Step Time": 8.485170165076852} +{"Pretrain/Learning Rate": 1.5653173848535486e-06, "Pretrain/Loss": 1.9874858856201172, "Pretrain/Loss (Raw)": 1.9977116584777832, "Pretrain/Step": 16978, "Pretrain/Step Time": 8.488452397286892} +{"Pretrain/Learning Rate": 1.5638391792334062e-06, "Pretrain/Loss": 1.9899415969848633, "Pretrain/Loss (Raw)": 1.9911617040634155, "Pretrain/Step": 16979, "Pretrain/Step Time": 8.489105485379696} +{"Pretrain/Learning Rate": 1.5623616493784382e-06, "Pretrain/Loss": 1.9879562854766846, "Pretrain/Loss (Raw)": 1.9717686176300049, "Pretrain/Step": 16980, "Pretrain/Step Time": 8.487016282975674} +{"Pretrain/Learning Rate": 1.560884795331252e-06, "Pretrain/Loss": 1.98595130443573, "Pretrain/Loss (Raw)": 1.86996591091156, "Pretrain/Step": 16981, "Pretrain/Step Time": 8.48668833822012} +{"Pretrain/Learning Rate": 1.5594086171344308e-06, "Pretrain/Loss": 1.9854233264923096, "Pretrain/Loss (Raw)": 1.987403154373169, "Pretrain/Step": 16982, "Pretrain/Step Time": 8.486474448814988} +{"Pretrain/Learning Rate": 1.5579331148305315e-06, "Pretrain/Loss": 1.9843463897705078, "Pretrain/Loss (Raw)": 1.857837438583374, "Pretrain/Step": 16983, "Pretrain/Step Time": 8.49157015234232} +{"Pretrain/Learning Rate": 1.5564582884621093e-06, "Pretrain/Loss": 1.9832994937896729, "Pretrain/Loss (Raw)": 1.9167944192886353, "Pretrain/Step": 16984, "Pretrain/Step Time": 8.48751663416624} +{"Pretrain/Learning Rate": 1.554984138071683e-06, "Pretrain/Loss": 1.983379602432251, "Pretrain/Loss (Raw)": 1.8709373474121094, "Pretrain/Step": 16985, "Pretrain/Step Time": 8.49054205045104} +{"Pretrain/Learning Rate": 1.5535106637017654e-06, "Pretrain/Loss": 1.9811482429504395, "Pretrain/Loss (Raw)": 1.8359686136245728, "Pretrain/Step": 16986, "Pretrain/Step Time": 8.490783400833607} +{"Pretrain/Learning Rate": 1.552037865394837e-06, "Pretrain/Loss": 1.9818888902664185, "Pretrain/Loss (Raw)": 1.7821675539016724, "Pretrain/Step": 16987, "Pretrain/Step Time": 8.484826328232884} +{"Pretrain/Learning Rate": 1.5505657431933661e-06, "Pretrain/Loss": 1.9822337627410889, "Pretrain/Loss (Raw)": 2.0383923053741455, "Pretrain/Step": 16988, "Pretrain/Step Time": 8.487331617623568} +{"Pretrain/Learning Rate": 1.5490942971398027e-06, "Pretrain/Loss": 1.9836010932922363, "Pretrain/Loss (Raw)": 1.9906294345855713, "Pretrain/Step": 16989, "Pretrain/Step Time": 8.485500827431679} +{"Pretrain/Learning Rate": 1.5476235272765704e-06, "Pretrain/Loss": 1.9856574535369873, "Pretrain/Loss (Raw)": 2.142247438430786, "Pretrain/Step": 16990, "Pretrain/Step Time": 8.487262541428208} +{"Pretrain/Learning Rate": 1.5461534336460859e-06, "Pretrain/Loss": 1.9834327697753906, "Pretrain/Loss (Raw)": 1.8068664073944092, "Pretrain/Step": 16991, "Pretrain/Step Time": 8.493178110569715} +{"Pretrain/Learning Rate": 1.5446840162907316e-06, "Pretrain/Loss": 1.985764741897583, "Pretrain/Loss (Raw)": 2.1336395740509033, "Pretrain/Step": 16992, "Pretrain/Step Time": 8.487904531881213} +{"Pretrain/Learning Rate": 1.5432152752528767e-06, "Pretrain/Loss": 1.987593173980713, "Pretrain/Loss (Raw)": 2.100618362426758, "Pretrain/Step": 16993, "Pretrain/Step Time": 8.490990776568651} +{"Pretrain/Learning Rate": 1.541747210574876e-06, "Pretrain/Loss": 1.987840175628662, "Pretrain/Loss (Raw)": 1.9690556526184082, "Pretrain/Step": 16994, "Pretrain/Step Time": 8.48917543888092} +{"Pretrain/Learning Rate": 1.5402798222990538e-06, "Pretrain/Loss": 1.9865992069244385, "Pretrain/Loss (Raw)": 1.9299858808517456, "Pretrain/Step": 16995, "Pretrain/Step Time": 8.486639047041535} +{"Pretrain/Learning Rate": 1.5388131104677294e-06, "Pretrain/Loss": 1.9867866039276123, "Pretrain/Loss (Raw)": 2.0128555297851562, "Pretrain/Step": 16996, "Pretrain/Step Time": 8.486834082752466} +{"Pretrain/Learning Rate": 1.5373470751231883e-06, "Pretrain/Loss": 1.9871448278427124, "Pretrain/Loss (Raw)": 1.9557784795761108, "Pretrain/Step": 16997, "Pretrain/Step Time": 8.491922510787845} +{"Pretrain/Learning Rate": 1.5358817163077022e-06, "Pretrain/Loss": 1.988577127456665, "Pretrain/Loss (Raw)": 2.080796718597412, "Pretrain/Step": 16998, "Pretrain/Step Time": 8.493559505790472} +{"Pretrain/Learning Rate": 1.5344170340635288e-06, "Pretrain/Loss": 1.9874528646469116, "Pretrain/Loss (Raw)": 2.055656909942627, "Pretrain/Step": 16999, "Pretrain/Step Time": 8.499325217679143} +{"Pretrain/Learning Rate": 1.532953028432893e-06, "Pretrain/Loss": 1.9878818988800049, "Pretrain/Loss (Raw)": 2.20345139503479, "Pretrain/Step": 17000, "Pretrain/Step Time": 8.49409756436944} +{"Pretrain/Learning Rate": 1.5314896994580192e-06, "Pretrain/Loss": 1.983781099319458, "Pretrain/Loss (Raw)": 1.775890588760376, "Pretrain/Step": 17001, "Pretrain/Step Time": 8.498621014878154} +{"Pretrain/Learning Rate": 1.5300270471810958e-06, "Pretrain/Loss": 1.983558177947998, "Pretrain/Loss (Raw)": 1.895887017250061, "Pretrain/Step": 17002, "Pretrain/Step Time": 8.497572982683778} +{"Pretrain/Learning Rate": 1.5285650716442917e-06, "Pretrain/Loss": 1.9848893880844116, "Pretrain/Loss (Raw)": 2.0590107440948486, "Pretrain/Step": 17003, "Pretrain/Step Time": 8.499012731015682} +{"Pretrain/Learning Rate": 1.5271037728897737e-06, "Pretrain/Loss": 1.9851129055023193, "Pretrain/Loss (Raw)": 1.9624558687210083, "Pretrain/Step": 17004, "Pretrain/Step Time": 8.499200077727437} +{"Pretrain/Learning Rate": 1.5256431509596658e-06, "Pretrain/Loss": 1.9846491813659668, "Pretrain/Loss (Raw)": 1.9709174633026123, "Pretrain/Step": 17005, "Pretrain/Step Time": 8.49879902228713} +{"Pretrain/Learning Rate": 1.524183205896093e-06, "Pretrain/Loss": 1.985350489616394, "Pretrain/Loss (Raw)": 2.1911473274230957, "Pretrain/Step": 17006, "Pretrain/Step Time": 8.495918853208423} +{"Pretrain/Learning Rate": 1.5227239377411468e-06, "Pretrain/Loss": 1.9850934743881226, "Pretrain/Loss (Raw)": 1.8047306537628174, "Pretrain/Step": 17007, "Pretrain/Step Time": 8.496686201542616} +{"Pretrain/Learning Rate": 1.5212653465369041e-06, "Pretrain/Loss": 1.9851051568984985, "Pretrain/Loss (Raw)": 1.8675662279129028, "Pretrain/Step": 17008, "Pretrain/Step Time": 8.492398640140891} +{"Pretrain/Learning Rate": 1.5198074323254264e-06, "Pretrain/Loss": 1.985515832901001, "Pretrain/Loss (Raw)": 2.0333704948425293, "Pretrain/Step": 17009, "Pretrain/Step Time": 8.493777129799128} +{"Pretrain/Learning Rate": 1.5183501951487462e-06, "Pretrain/Loss": 1.9807250499725342, "Pretrain/Loss (Raw)": 1.680217981338501, "Pretrain/Step": 17010, "Pretrain/Step Time": 8.500227784737945} +{"Pretrain/Learning Rate": 1.5168936350488856e-06, "Pretrain/Loss": 1.9785321950912476, "Pretrain/Loss (Raw)": 1.8817667961120605, "Pretrain/Step": 17011, "Pretrain/Step Time": 8.496165620163083} +{"Pretrain/Learning Rate": 1.5154377520678442e-06, "Pretrain/Loss": 1.9802629947662354, "Pretrain/Loss (Raw)": 2.0794360637664795, "Pretrain/Step": 17012, "Pretrain/Step Time": 8.496908197179437} +{"Pretrain/Learning Rate": 1.5139825462475998e-06, "Pretrain/Loss": 1.9827296733856201, "Pretrain/Loss (Raw)": 2.116924285888672, "Pretrain/Step": 17013, "Pretrain/Step Time": 8.494642851874232} +{"Pretrain/Learning Rate": 1.5125280176301131e-06, "Pretrain/Loss": 1.9834649562835693, "Pretrain/Loss (Raw)": 2.1053192615509033, "Pretrain/Step": 17014, "Pretrain/Step Time": 8.49311332963407} +{"Pretrain/Learning Rate": 1.5110741662573175e-06, "Pretrain/Loss": 1.9802725315093994, "Pretrain/Loss (Raw)": 1.7072563171386719, "Pretrain/Step": 17015, "Pretrain/Step Time": 8.498867815360427} +{"Pretrain/Learning Rate": 1.5096209921711458e-06, "Pretrain/Loss": 1.9800724983215332, "Pretrain/Loss (Raw)": 1.9034675359725952, "Pretrain/Step": 17016, "Pretrain/Step Time": 8.498540330678225} +{"Pretrain/Learning Rate": 1.5081684954134895e-06, "Pretrain/Loss": 1.981248378753662, "Pretrain/Loss (Raw)": 2.0938849449157715, "Pretrain/Step": 17017, "Pretrain/Step Time": 8.49454427883029} +{"Pretrain/Learning Rate": 1.5067166760262348e-06, "Pretrain/Loss": 1.9827241897583008, "Pretrain/Loss (Raw)": 2.0654046535491943, "Pretrain/Step": 17018, "Pretrain/Step Time": 8.498363170772791} +{"Pretrain/Learning Rate": 1.505265534051245e-06, "Pretrain/Loss": 1.981718897819519, "Pretrain/Loss (Raw)": 1.998062014579773, "Pretrain/Step": 17019, "Pretrain/Step Time": 8.498433781787753} +{"Pretrain/Learning Rate": 1.5038150695303566e-06, "Pretrain/Loss": 1.9855717420578003, "Pretrain/Loss (Raw)": 2.2674152851104736, "Pretrain/Step": 17020, "Pretrain/Step Time": 8.498889552429318} +{"Pretrain/Learning Rate": 1.5023652825054024e-06, "Pretrain/Loss": 1.984894871711731, "Pretrain/Loss (Raw)": 1.9526071548461914, "Pretrain/Step": 17021, "Pretrain/Step Time": 8.499600488692522} +{"Pretrain/Learning Rate": 1.5009161730181742e-06, "Pretrain/Loss": 1.9820647239685059, "Pretrain/Loss (Raw)": 1.7347867488861084, "Pretrain/Step": 17022, "Pretrain/Step Time": 8.497167211025953} +{"Pretrain/Learning Rate": 1.499467741110469e-06, "Pretrain/Loss": 1.9829931259155273, "Pretrain/Loss (Raw)": 1.9501875638961792, "Pretrain/Step": 17023, "Pretrain/Step Time": 8.495897818356752} +{"Pretrain/Learning Rate": 1.4980199868240425e-06, "Pretrain/Loss": 1.9837809801101685, "Pretrain/Loss (Raw)": 1.9939746856689453, "Pretrain/Step": 17024, "Pretrain/Step Time": 8.493168881163001} +{"Pretrain/Learning Rate": 1.4965729102006388e-06, "Pretrain/Loss": 1.984783411026001, "Pretrain/Loss (Raw)": 1.9499393701553345, "Pretrain/Step": 17025, "Pretrain/Step Time": 8.493877355009317} +{"Pretrain/Learning Rate": 1.4951265112819885e-06, "Pretrain/Loss": 1.9835294485092163, "Pretrain/Loss (Raw)": 1.9015060663223267, "Pretrain/Step": 17026, "Pretrain/Step Time": 8.499349953606725} +{"Pretrain/Learning Rate": 1.4936807901097943e-06, "Pretrain/Loss": 1.984997034072876, "Pretrain/Loss (Raw)": 2.2087130546569824, "Pretrain/Step": 17027, "Pretrain/Step Time": 8.504321174696088} +{"Pretrain/Learning Rate": 1.4922357467257452e-06, "Pretrain/Loss": 1.983835220336914, "Pretrain/Loss (Raw)": 1.8194286823272705, "Pretrain/Step": 17028, "Pretrain/Step Time": 8.500299343839288} +{"Pretrain/Learning Rate": 1.490791381171508e-06, "Pretrain/Loss": 1.9840315580368042, "Pretrain/Loss (Raw)": 2.0739846229553223, "Pretrain/Step": 17029, "Pretrain/Step Time": 8.499922025948763} +{"Pretrain/Learning Rate": 1.489347693488724e-06, "Pretrain/Loss": 1.983389139175415, "Pretrain/Loss (Raw)": 2.06662917137146, "Pretrain/Step": 17030, "Pretrain/Step Time": 8.502288458868861} +{"Pretrain/Learning Rate": 1.4879046837190297e-06, "Pretrain/Loss": 1.98219895362854, "Pretrain/Loss (Raw)": 1.93418550491333, "Pretrain/Step": 17031, "Pretrain/Step Time": 8.497640769928694} +{"Pretrain/Learning Rate": 1.486462351904025e-06, "Pretrain/Loss": 1.981885313987732, "Pretrain/Loss (Raw)": 2.0691092014312744, "Pretrain/Step": 17032, "Pretrain/Step Time": 8.501114087179303} +{"Pretrain/Learning Rate": 1.4850206980853071e-06, "Pretrain/Loss": 1.9795715808868408, "Pretrain/Loss (Raw)": 1.836863398551941, "Pretrain/Step": 17033, "Pretrain/Step Time": 8.501250119879842} +{"Pretrain/Learning Rate": 1.4835797223044374e-06, "Pretrain/Loss": 1.9818902015686035, "Pretrain/Loss (Raw)": 2.2156670093536377, "Pretrain/Step": 17034, "Pretrain/Step Time": 8.504214465618134} +{"Pretrain/Learning Rate": 1.4821394246029685e-06, "Pretrain/Loss": 1.9818352460861206, "Pretrain/Loss (Raw)": 2.072866916656494, "Pretrain/Step": 17035, "Pretrain/Step Time": 8.498433880507946} +{"Pretrain/Learning Rate": 1.4806998050224312e-06, "Pretrain/Loss": 1.9798834323883057, "Pretrain/Loss (Raw)": 1.728075385093689, "Pretrain/Step": 17036, "Pretrain/Step Time": 8.501370619982481} +{"Pretrain/Learning Rate": 1.4792608636043315e-06, "Pretrain/Loss": 1.9821228981018066, "Pretrain/Loss (Raw)": 2.2255165576934814, "Pretrain/Step": 17037, "Pretrain/Step Time": 8.497433759272099} +{"Pretrain/Learning Rate": 1.477822600390169e-06, "Pretrain/Loss": 1.9854652881622314, "Pretrain/Loss (Raw)": 2.1100504398345947, "Pretrain/Step": 17038, "Pretrain/Step Time": 8.494795482605696} +{"Pretrain/Learning Rate": 1.4763850154214081e-06, "Pretrain/Loss": 1.985564112663269, "Pretrain/Loss (Raw)": 2.046799898147583, "Pretrain/Step": 17039, "Pretrain/Step Time": 8.495341558009386} +{"Pretrain/Learning Rate": 1.474948108739499e-06, "Pretrain/Loss": 1.9839630126953125, "Pretrain/Loss (Raw)": 1.7820574045181274, "Pretrain/Step": 17040, "Pretrain/Step Time": 8.494073834270239} +{"Pretrain/Learning Rate": 1.4735118803858805e-06, "Pretrain/Loss": 1.9828072786331177, "Pretrain/Loss (Raw)": 2.1095666885375977, "Pretrain/Step": 17041, "Pretrain/Step Time": 8.491980383172631} +{"Pretrain/Learning Rate": 1.4720763304019613e-06, "Pretrain/Loss": 1.9805824756622314, "Pretrain/Loss (Raw)": 1.8366293907165527, "Pretrain/Step": 17042, "Pretrain/Step Time": 8.495838794857264} +{"Pretrain/Learning Rate": 1.4706414588291362e-06, "Pretrain/Loss": 1.9801620244979858, "Pretrain/Loss (Raw)": 1.9487594366073608, "Pretrain/Step": 17043, "Pretrain/Step Time": 8.49462648294866} +{"Pretrain/Learning Rate": 1.4692072657087718e-06, "Pretrain/Loss": 1.9795799255371094, "Pretrain/Loss (Raw)": 1.794409155845642, "Pretrain/Step": 17044, "Pretrain/Step Time": 8.492729099467397} +{"Pretrain/Learning Rate": 1.4677737510822354e-06, "Pretrain/Loss": 1.9773244857788086, "Pretrain/Loss (Raw)": 1.848400354385376, "Pretrain/Step": 17045, "Pretrain/Step Time": 8.495629392564297} +{"Pretrain/Learning Rate": 1.466340914990852e-06, "Pretrain/Loss": 1.9782860279083252, "Pretrain/Loss (Raw)": 2.016105890274048, "Pretrain/Step": 17046, "Pretrain/Step Time": 8.497678279876709} +{"Pretrain/Learning Rate": 1.4649087574759328e-06, "Pretrain/Loss": 1.9785335063934326, "Pretrain/Loss (Raw)": 2.002173900604248, "Pretrain/Step": 17047, "Pretrain/Step Time": 8.496080802753568} +{"Pretrain/Learning Rate": 1.4634772785787842e-06, "Pretrain/Loss": 1.9748618602752686, "Pretrain/Loss (Raw)": 1.5558676719665527, "Pretrain/Step": 17048, "Pretrain/Step Time": 8.493118543177843} +{"Pretrain/Learning Rate": 1.4620464783406728e-06, "Pretrain/Loss": 1.9718124866485596, "Pretrain/Loss (Raw)": 2.0929863452911377, "Pretrain/Step": 17049, "Pretrain/Step Time": 8.495882861316204} +{"Pretrain/Learning Rate": 1.4606163568028603e-06, "Pretrain/Loss": 1.9712064266204834, "Pretrain/Loss (Raw)": 1.9787834882736206, "Pretrain/Step": 17050, "Pretrain/Step Time": 8.496725376695395} +{"Pretrain/Learning Rate": 1.45918691400658e-06, "Pretrain/Loss": 1.969363808631897, "Pretrain/Loss (Raw)": 1.7679911851882935, "Pretrain/Step": 17051, "Pretrain/Step Time": 8.49299655109644} +{"Pretrain/Learning Rate": 1.4577581499930493e-06, "Pretrain/Loss": 1.9677263498306274, "Pretrain/Loss (Raw)": 2.0181076526641846, "Pretrain/Step": 17052, "Pretrain/Step Time": 8.494883393868804} +{"Pretrain/Learning Rate": 1.4563300648034683e-06, "Pretrain/Loss": 1.9666657447814941, "Pretrain/Loss (Raw)": 1.8731017112731934, "Pretrain/Step": 17053, "Pretrain/Step Time": 8.495860485360026} +{"Pretrain/Learning Rate": 1.454902658479007e-06, "Pretrain/Loss": 1.9672720432281494, "Pretrain/Loss (Raw)": 2.064436912536621, "Pretrain/Step": 17054, "Pretrain/Step Time": 8.49452598579228} +{"Pretrain/Learning Rate": 1.4534759310608354e-06, "Pretrain/Loss": 1.9680308103561401, "Pretrain/Loss (Raw)": 1.8971810340881348, "Pretrain/Step": 17055, "Pretrain/Step Time": 8.493988957256079} +{"Pretrain/Learning Rate": 1.452049882590087e-06, "Pretrain/Loss": 1.970171570777893, "Pretrain/Loss (Raw)": 1.940596342086792, "Pretrain/Step": 17056, "Pretrain/Step Time": 8.48725962266326} +{"Pretrain/Learning Rate": 1.4506245131078733e-06, "Pretrain/Loss": 1.9700241088867188, "Pretrain/Loss (Raw)": 1.9470576047897339, "Pretrain/Step": 17057, "Pretrain/Step Time": 8.48757753521204} +{"Pretrain/Learning Rate": 1.449199822655306e-06, "Pretrain/Loss": 1.9702072143554688, "Pretrain/Loss (Raw)": 2.0193681716918945, "Pretrain/Step": 17058, "Pretrain/Step Time": 8.489148169755936} +{"Pretrain/Learning Rate": 1.4477758112734552e-06, "Pretrain/Loss": 1.971629023551941, "Pretrain/Loss (Raw)": 1.8954253196716309, "Pretrain/Step": 17059, "Pretrain/Step Time": 8.490631375461817} +{"Pretrain/Learning Rate": 1.4463524790033906e-06, "Pretrain/Loss": 1.972593069076538, "Pretrain/Loss (Raw)": 1.8206969499588013, "Pretrain/Step": 17060, "Pretrain/Step Time": 8.494524145498872} +{"Pretrain/Learning Rate": 1.4449298258861487e-06, "Pretrain/Loss": 1.9719994068145752, "Pretrain/Loss (Raw)": 2.0767767429351807, "Pretrain/Step": 17061, "Pretrain/Step Time": 8.487674746662378} +{"Pretrain/Learning Rate": 1.4435078519627442e-06, "Pretrain/Loss": 1.9733264446258545, "Pretrain/Loss (Raw)": 2.0893027782440186, "Pretrain/Step": 17062, "Pretrain/Step Time": 8.494154730811715} +{"Pretrain/Learning Rate": 1.4420865572741888e-06, "Pretrain/Loss": 1.974314570426941, "Pretrain/Loss (Raw)": 2.035229444503784, "Pretrain/Step": 17063, "Pretrain/Step Time": 8.490731734782457} +{"Pretrain/Learning Rate": 1.4406659418614577e-06, "Pretrain/Loss": 1.9756746292114258, "Pretrain/Loss (Raw)": 1.9693645238876343, "Pretrain/Step": 17064, "Pretrain/Step Time": 8.492204932495952} +{"Pretrain/Learning Rate": 1.4392460057655183e-06, "Pretrain/Loss": 1.9774500131607056, "Pretrain/Loss (Raw)": 1.9630300998687744, "Pretrain/Step": 17065, "Pretrain/Step Time": 8.49034514091909} +{"Pretrain/Learning Rate": 1.4378267490273128e-06, "Pretrain/Loss": 1.9777636528015137, "Pretrain/Loss (Raw)": 2.046398878097534, "Pretrain/Step": 17066, "Pretrain/Step Time": 8.492847602814436} +{"Pretrain/Learning Rate": 1.4364081716877558e-06, "Pretrain/Loss": 1.9805126190185547, "Pretrain/Loss (Raw)": 2.1753311157226562, "Pretrain/Step": 17067, "Pretrain/Step Time": 8.494262050837278} +{"Pretrain/Learning Rate": 1.4349902737877646e-06, "Pretrain/Loss": 1.9817826747894287, "Pretrain/Loss (Raw)": 2.142526865005493, "Pretrain/Step": 17068, "Pretrain/Step Time": 8.492612617090344} +{"Pretrain/Learning Rate": 1.433573055368212e-06, "Pretrain/Loss": 1.981785774230957, "Pretrain/Loss (Raw)": 2.0114548206329346, "Pretrain/Step": 17069, "Pretrain/Step Time": 8.495706930756569} +{"Pretrain/Learning Rate": 1.4321565164699708e-06, "Pretrain/Loss": 1.9824583530426025, "Pretrain/Loss (Raw)": 2.0491368770599365, "Pretrain/Step": 17070, "Pretrain/Step Time": 8.49550379626453} +{"Pretrain/Learning Rate": 1.4307406571338832e-06, "Pretrain/Loss": 1.9827467203140259, "Pretrain/Loss (Raw)": 1.9102638959884644, "Pretrain/Step": 17071, "Pretrain/Step Time": 8.496779406443238} +{"Pretrain/Learning Rate": 1.4293254774007669e-06, "Pretrain/Loss": 1.9807847738265991, "Pretrain/Loss (Raw)": 1.7334039211273193, "Pretrain/Step": 17072, "Pretrain/Step Time": 8.494821449741721} +{"Pretrain/Learning Rate": 1.4279109773114418e-06, "Pretrain/Loss": 1.9831678867340088, "Pretrain/Loss (Raw)": 2.086256980895996, "Pretrain/Step": 17073, "Pretrain/Step Time": 8.491596480831504} +{"Pretrain/Learning Rate": 1.4264971569066809e-06, "Pretrain/Loss": 1.9825115203857422, "Pretrain/Loss (Raw)": 1.8964828252792358, "Pretrain/Step": 17074, "Pretrain/Step Time": 8.487466871738434} +{"Pretrain/Learning Rate": 1.42508401622726e-06, "Pretrain/Loss": 1.9804713726043701, "Pretrain/Loss (Raw)": 2.093681812286377, "Pretrain/Step": 17075, "Pretrain/Step Time": 8.49405557103455} +{"Pretrain/Learning Rate": 1.4236715553139213e-06, "Pretrain/Loss": 1.9807848930358887, "Pretrain/Loss (Raw)": 2.095245122909546, "Pretrain/Step": 17076, "Pretrain/Step Time": 8.498758498579264} +{"Pretrain/Learning Rate": 1.4222597742073906e-06, "Pretrain/Loss": 1.980630874633789, "Pretrain/Loss (Raw)": 1.9926968812942505, "Pretrain/Step": 17077, "Pretrain/Step Time": 8.50125129148364} +{"Pretrain/Learning Rate": 1.42084867294838e-06, "Pretrain/Loss": 1.982574462890625, "Pretrain/Loss (Raw)": 2.116433620452881, "Pretrain/Step": 17078, "Pretrain/Step Time": 8.504045197740197} +{"Pretrain/Learning Rate": 1.4194382515775734e-06, "Pretrain/Loss": 1.983344554901123, "Pretrain/Loss (Raw)": 2.028616189956665, "Pretrain/Step": 17079, "Pretrain/Step Time": 8.50432744435966} +{"Pretrain/Learning Rate": 1.4180285101356467e-06, "Pretrain/Loss": 1.9805316925048828, "Pretrain/Loss (Raw)": 1.8608967065811157, "Pretrain/Step": 17080, "Pretrain/Step Time": 8.507355263456702} +{"Pretrain/Learning Rate": 1.4166194486632422e-06, "Pretrain/Loss": 1.9804003238677979, "Pretrain/Loss (Raw)": 1.995301365852356, "Pretrain/Step": 17081, "Pretrain/Step Time": 8.501838168129325} +{"Pretrain/Learning Rate": 1.4152110672009861e-06, "Pretrain/Loss": 1.9801621437072754, "Pretrain/Loss (Raw)": 1.9590684175491333, "Pretrain/Step": 17082, "Pretrain/Step Time": 8.506885247305036} +{"Pretrain/Learning Rate": 1.4138033657894984e-06, "Pretrain/Loss": 1.979613184928894, "Pretrain/Loss (Raw)": 1.8940598964691162, "Pretrain/Step": 17083, "Pretrain/Step Time": 8.505207747220993} +{"Pretrain/Learning Rate": 1.4123963444693578e-06, "Pretrain/Loss": 1.9820334911346436, "Pretrain/Loss (Raw)": 2.326542377471924, "Pretrain/Step": 17084, "Pretrain/Step Time": 8.504616921767592} +{"Pretrain/Learning Rate": 1.4109900032811457e-06, "Pretrain/Loss": 1.9812428951263428, "Pretrain/Loss (Raw)": 1.9642268419265747, "Pretrain/Step": 17085, "Pretrain/Step Time": 8.50739235803485} +{"Pretrain/Learning Rate": 1.4095843422654076e-06, "Pretrain/Loss": 1.9797831773757935, "Pretrain/Loss (Raw)": 2.041748046875, "Pretrain/Step": 17086, "Pretrain/Step Time": 8.505499081686139} +{"Pretrain/Learning Rate": 1.4081793614626692e-06, "Pretrain/Loss": 1.9779001474380493, "Pretrain/Loss (Raw)": 1.7806252241134644, "Pretrain/Step": 17087, "Pretrain/Step Time": 8.50789686664939} +{"Pretrain/Learning Rate": 1.4067750609134539e-06, "Pretrain/Loss": 1.9800734519958496, "Pretrain/Loss (Raw)": 2.108035087585449, "Pretrain/Step": 17088, "Pretrain/Step Time": 8.504860125482082} +{"Pretrain/Learning Rate": 1.405371440658243e-06, "Pretrain/Loss": 1.9764975309371948, "Pretrain/Loss (Raw)": 1.6408989429473877, "Pretrain/Step": 17089, "Pretrain/Step Time": 8.505429623648524} +{"Pretrain/Learning Rate": 1.403968500737518e-06, "Pretrain/Loss": 1.9762775897979736, "Pretrain/Loss (Raw)": 2.0733423233032227, "Pretrain/Step": 17090, "Pretrain/Step Time": 8.504437496885657} +{"Pretrain/Learning Rate": 1.4025662411917246e-06, "Pretrain/Loss": 1.9749784469604492, "Pretrain/Loss (Raw)": 2.048798084259033, "Pretrain/Step": 17091, "Pretrain/Step Time": 8.499223291873932} +{"Pretrain/Learning Rate": 1.4011646620612968e-06, "Pretrain/Loss": 1.9728695154190063, "Pretrain/Loss (Raw)": 1.7924977540969849, "Pretrain/Step": 17092, "Pretrain/Step Time": 8.498840456828475} +{"Pretrain/Learning Rate": 1.399763763386655e-06, "Pretrain/Loss": 1.9720795154571533, "Pretrain/Loss (Raw)": 1.8665207624435425, "Pretrain/Step": 17093, "Pretrain/Step Time": 8.503826141357422} +{"Pretrain/Learning Rate": 1.398363545208181e-06, "Pretrain/Loss": 1.970245122909546, "Pretrain/Loss (Raw)": 1.835715651512146, "Pretrain/Step": 17094, "Pretrain/Step Time": 8.503470558673143} +{"Pretrain/Learning Rate": 1.3969640075662622e-06, "Pretrain/Loss": 1.9707419872283936, "Pretrain/Loss (Raw)": 2.05507230758667, "Pretrain/Step": 17095, "Pretrain/Step Time": 8.503350166603923} +{"Pretrain/Learning Rate": 1.3955651505012462e-06, "Pretrain/Loss": 1.972364902496338, "Pretrain/Loss (Raw)": 2.123136520385742, "Pretrain/Step": 17096, "Pretrain/Step Time": 8.502278493717313} +{"Pretrain/Learning Rate": 1.3941669740534708e-06, "Pretrain/Loss": 1.9737348556518555, "Pretrain/Loss (Raw)": 2.056346893310547, "Pretrain/Step": 17097, "Pretrain/Step Time": 8.505558045580983} +{"Pretrain/Learning Rate": 1.3927694782632477e-06, "Pretrain/Loss": 1.9751133918762207, "Pretrain/Loss (Raw)": 2.0474495887756348, "Pretrain/Step": 17098, "Pretrain/Step Time": 8.505363825708628} +{"Pretrain/Learning Rate": 1.39137266317087e-06, "Pretrain/Loss": 1.9719294309616089, "Pretrain/Loss (Raw)": 1.7262563705444336, "Pretrain/Step": 17099, "Pretrain/Step Time": 8.504649112001061} +{"Pretrain/Learning Rate": 1.389976528816625e-06, "Pretrain/Loss": 1.9733176231384277, "Pretrain/Loss (Raw)": 1.8950945138931274, "Pretrain/Step": 17100, "Pretrain/Step Time": 8.505364874377847} +{"Pretrain/Learning Rate": 1.3885810752407579e-06, "Pretrain/Loss": 1.9737565517425537, "Pretrain/Loss (Raw)": 1.9390759468078613, "Pretrain/Step": 17101, "Pretrain/Step Time": 8.504546098411083} +{"Pretrain/Learning Rate": 1.3871863024835147e-06, "Pretrain/Loss": 1.9737942218780518, "Pretrain/Loss (Raw)": 1.9848384857177734, "Pretrain/Step": 17102, "Pretrain/Step Time": 8.506718104705215} +{"Pretrain/Learning Rate": 1.3857922105851073e-06, "Pretrain/Loss": 1.9744681119918823, "Pretrain/Loss (Raw)": 2.0525214672088623, "Pretrain/Step": 17103, "Pretrain/Step Time": 8.503217393532395} +{"Pretrain/Learning Rate": 1.3843987995857316e-06, "Pretrain/Loss": 1.9726550579071045, "Pretrain/Loss (Raw)": 1.944858193397522, "Pretrain/Step": 17104, "Pretrain/Step Time": 8.50389456935227} +{"Pretrain/Learning Rate": 1.383006069525572e-06, "Pretrain/Loss": 1.9748106002807617, "Pretrain/Loss (Raw)": 2.188776969909668, "Pretrain/Step": 17105, "Pretrain/Step Time": 8.499711383134127} +{"Pretrain/Learning Rate": 1.3816140204447798e-06, "Pretrain/Loss": 1.9749490022659302, "Pretrain/Loss (Raw)": 2.015430450439453, "Pretrain/Step": 17106, "Pretrain/Step Time": 8.497571535408497} +{"Pretrain/Learning Rate": 1.3802226523835032e-06, "Pretrain/Loss": 1.9764283895492554, "Pretrain/Loss (Raw)": 2.1805226802825928, "Pretrain/Step": 17107, "Pretrain/Step Time": 8.500986713916063} +{"Pretrain/Learning Rate": 1.3788319653818493e-06, "Pretrain/Loss": 1.976090669631958, "Pretrain/Loss (Raw)": 1.9285494089126587, "Pretrain/Step": 17108, "Pretrain/Step Time": 8.500006791204214} +{"Pretrain/Learning Rate": 1.3774419594799276e-06, "Pretrain/Loss": 1.9760253429412842, "Pretrain/Loss (Raw)": 1.861613154411316, "Pretrain/Step": 17109, "Pretrain/Step Time": 8.501991866156459} +{"Pretrain/Learning Rate": 1.3760526347178142e-06, "Pretrain/Loss": 1.9790563583374023, "Pretrain/Loss (Raw)": 2.3753669261932373, "Pretrain/Step": 17110, "Pretrain/Step Time": 8.500862272456288} +{"Pretrain/Learning Rate": 1.3746639911355692e-06, "Pretrain/Loss": 1.9787747859954834, "Pretrain/Loss (Raw)": 1.8217848539352417, "Pretrain/Step": 17111, "Pretrain/Step Time": 8.498974975198507} +{"Pretrain/Learning Rate": 1.3732760287732321e-06, "Pretrain/Loss": 1.9765613079071045, "Pretrain/Loss (Raw)": 1.6334549188613892, "Pretrain/Step": 17112, "Pretrain/Step Time": 8.501066353172064} +{"Pretrain/Learning Rate": 1.3718887476708241e-06, "Pretrain/Loss": 1.977782964706421, "Pretrain/Loss (Raw)": 2.0273332595825195, "Pretrain/Step": 17113, "Pretrain/Step Time": 8.49948993511498} +{"Pretrain/Learning Rate": 1.3705021478683495e-06, "Pretrain/Loss": 1.979292631149292, "Pretrain/Loss (Raw)": 2.029205083847046, "Pretrain/Step": 17114, "Pretrain/Step Time": 8.49947401881218} +{"Pretrain/Learning Rate": 1.3691162294057896e-06, "Pretrain/Loss": 1.9810383319854736, "Pretrain/Loss (Raw)": 2.0056159496307373, "Pretrain/Step": 17115, "Pretrain/Step Time": 8.501421282067895} +{"Pretrain/Learning Rate": 1.367730992323099e-06, "Pretrain/Loss": 1.9793987274169922, "Pretrain/Loss (Raw)": 1.828511357307434, "Pretrain/Step": 17116, "Pretrain/Step Time": 8.502159714698792} +{"Pretrain/Learning Rate": 1.3663464366602292e-06, "Pretrain/Loss": 1.979682445526123, "Pretrain/Loss (Raw)": 2.0269594192504883, "Pretrain/Step": 17117, "Pretrain/Step Time": 8.503486374393106} +{"Pretrain/Learning Rate": 1.3649625624570977e-06, "Pretrain/Loss": 1.9789639711380005, "Pretrain/Loss (Raw)": 2.0502755641937256, "Pretrain/Step": 17118, "Pretrain/Step Time": 8.49886634759605} +{"Pretrain/Learning Rate": 1.363579369753612e-06, "Pretrain/Loss": 1.9812161922454834, "Pretrain/Loss (Raw)": 2.0951602458953857, "Pretrain/Step": 17119, "Pretrain/Step Time": 8.496248450130224} +{"Pretrain/Learning Rate": 1.362196858589651e-06, "Pretrain/Loss": 1.979724407196045, "Pretrain/Loss (Raw)": 1.9426778554916382, "Pretrain/Step": 17120, "Pretrain/Step Time": 8.497906504198909} +{"Pretrain/Learning Rate": 1.3608150290050775e-06, "Pretrain/Loss": 1.9783748388290405, "Pretrain/Loss (Raw)": 1.9278823137283325, "Pretrain/Step": 17121, "Pretrain/Step Time": 8.491640755906701} +{"Pretrain/Learning Rate": 1.3594338810397428e-06, "Pretrain/Loss": 1.9768967628479004, "Pretrain/Loss (Raw)": 1.7798430919647217, "Pretrain/Step": 17122, "Pretrain/Step Time": 8.494199397042394} +{"Pretrain/Learning Rate": 1.3580534147334623e-06, "Pretrain/Loss": 1.978670597076416, "Pretrain/Loss (Raw)": 2.157043218612671, "Pretrain/Step": 17123, "Pretrain/Step Time": 8.495208997279406} +{"Pretrain/Learning Rate": 1.3566736301260486e-06, "Pretrain/Loss": 1.979112148284912, "Pretrain/Loss (Raw)": 2.0693814754486084, "Pretrain/Step": 17124, "Pretrain/Step Time": 8.490217313170433} +{"Pretrain/Learning Rate": 1.3552945272572809e-06, "Pretrain/Loss": 1.979239821434021, "Pretrain/Loss (Raw)": 1.9721224308013916, "Pretrain/Step": 17125, "Pretrain/Step Time": 8.490058152005076} +{"Pretrain/Learning Rate": 1.3539161061669276e-06, "Pretrain/Loss": 1.9784033298492432, "Pretrain/Loss (Raw)": 1.9737310409545898, "Pretrain/Step": 17126, "Pretrain/Step Time": 8.492506368085742} +{"Pretrain/Learning Rate": 1.3525383668947345e-06, "Pretrain/Loss": 1.978818416595459, "Pretrain/Loss (Raw)": 2.108778953552246, "Pretrain/Step": 17127, "Pretrain/Step Time": 8.482899418100715} +{"Pretrain/Learning Rate": 1.3511613094804255e-06, "Pretrain/Loss": 1.9790575504302979, "Pretrain/Loss (Raw)": 2.234049081802368, "Pretrain/Step": 17128, "Pretrain/Step Time": 8.485367327928543} +{"Pretrain/Learning Rate": 1.3497849339637103e-06, "Pretrain/Loss": 1.9786345958709717, "Pretrain/Loss (Raw)": 1.721785545349121, "Pretrain/Step": 17129, "Pretrain/Step Time": 8.486540811136365} +{"Pretrain/Learning Rate": 1.3484092403842768e-06, "Pretrain/Loss": 1.9798309803009033, "Pretrain/Loss (Raw)": 2.049006938934326, "Pretrain/Step": 17130, "Pretrain/Step Time": 8.48312427289784} +{"Pretrain/Learning Rate": 1.347034228781785e-06, "Pretrain/Loss": 1.9764573574066162, "Pretrain/Loss (Raw)": 1.6271861791610718, "Pretrain/Step": 17131, "Pretrain/Step Time": 8.483757020905614} +{"Pretrain/Learning Rate": 1.345659899195889e-06, "Pretrain/Loss": 1.9769446849822998, "Pretrain/Loss (Raw)": 2.0248351097106934, "Pretrain/Step": 17132, "Pretrain/Step Time": 8.485835624858737} +{"Pretrain/Learning Rate": 1.344286251666213e-06, "Pretrain/Loss": 1.9767452478408813, "Pretrain/Loss (Raw)": 1.945394515991211, "Pretrain/Step": 17133, "Pretrain/Step Time": 8.486795414239168} +{"Pretrain/Learning Rate": 1.3429132862323695e-06, "Pretrain/Loss": 1.976757526397705, "Pretrain/Loss (Raw)": 2.1927003860473633, "Pretrain/Step": 17134, "Pretrain/Step Time": 8.491274815052748} +{"Pretrain/Learning Rate": 1.3415410029339464e-06, "Pretrain/Loss": 1.9786391258239746, "Pretrain/Loss (Raw)": 2.045586109161377, "Pretrain/Step": 17135, "Pretrain/Step Time": 8.489439252763987} +{"Pretrain/Learning Rate": 1.3401694018105038e-06, "Pretrain/Loss": 1.9799256324768066, "Pretrain/Loss (Raw)": 2.0322303771972656, "Pretrain/Step": 17136, "Pretrain/Step Time": 8.4873456209898} +{"Pretrain/Learning Rate": 1.3387984829016016e-06, "Pretrain/Loss": 1.9786601066589355, "Pretrain/Loss (Raw)": 1.8714009523391724, "Pretrain/Step": 17137, "Pretrain/Step Time": 8.484149288386106} +{"Pretrain/Learning Rate": 1.3374282462467636e-06, "Pretrain/Loss": 1.9820644855499268, "Pretrain/Loss (Raw)": 2.115971565246582, "Pretrain/Step": 17138, "Pretrain/Step Time": 8.478675462305546} +{"Pretrain/Learning Rate": 1.3360586918855028e-06, "Pretrain/Loss": 1.9826794862747192, "Pretrain/Loss (Raw)": 1.9604843854904175, "Pretrain/Step": 17139, "Pretrain/Step Time": 8.484421214088798} +{"Pretrain/Learning Rate": 1.3346898198573072e-06, "Pretrain/Loss": 1.9830217361450195, "Pretrain/Loss (Raw)": 2.123241662979126, "Pretrain/Step": 17140, "Pretrain/Step Time": 8.485790129750967} +{"Pretrain/Learning Rate": 1.333321630201645e-06, "Pretrain/Loss": 1.9856863021850586, "Pretrain/Loss (Raw)": 2.457998037338257, "Pretrain/Step": 17141, "Pretrain/Step Time": 8.485680405050516} +{"Pretrain/Learning Rate": 1.3319541229579734e-06, "Pretrain/Loss": 1.9829902648925781, "Pretrain/Loss (Raw)": 1.760212779045105, "Pretrain/Step": 17142, "Pretrain/Step Time": 8.485272858291864} +{"Pretrain/Learning Rate": 1.330587298165714e-06, "Pretrain/Loss": 1.9866259098052979, "Pretrain/Loss (Raw)": 2.172621488571167, "Pretrain/Step": 17143, "Pretrain/Step Time": 8.484996646642685} +{"Pretrain/Learning Rate": 1.329221155864291e-06, "Pretrain/Loss": 1.987363576889038, "Pretrain/Loss (Raw)": 1.997888445854187, "Pretrain/Step": 17144, "Pretrain/Step Time": 8.48583821579814} +{"Pretrain/Learning Rate": 1.327855696093086e-06, "Pretrain/Loss": 1.9866834878921509, "Pretrain/Loss (Raw)": 2.0068399906158447, "Pretrain/Step": 17145, "Pretrain/Step Time": 8.491390563547611} +{"Pretrain/Learning Rate": 1.3264909188914736e-06, "Pretrain/Loss": 1.9859373569488525, "Pretrain/Loss (Raw)": 1.9698874950408936, "Pretrain/Step": 17146, "Pretrain/Step Time": 8.485497133806348} +{"Pretrain/Learning Rate": 1.3251268242988086e-06, "Pretrain/Loss": 1.9873919486999512, "Pretrain/Loss (Raw)": 2.1842570304870605, "Pretrain/Step": 17147, "Pretrain/Step Time": 8.48573224246502} +{"Pretrain/Learning Rate": 1.3237634123544202e-06, "Pretrain/Loss": 1.9867117404937744, "Pretrain/Loss (Raw)": 2.1803557872772217, "Pretrain/Step": 17148, "Pretrain/Step Time": 8.48460478708148} +{"Pretrain/Learning Rate": 1.3224006830976242e-06, "Pretrain/Loss": 1.987060546875, "Pretrain/Loss (Raw)": 1.997245192527771, "Pretrain/Step": 17149, "Pretrain/Step Time": 8.481131428852677} +{"Pretrain/Learning Rate": 1.3210386365677146e-06, "Pretrain/Loss": 1.9928746223449707, "Pretrain/Loss (Raw)": 2.479001045227051, "Pretrain/Step": 17150, "Pretrain/Step Time": 8.48315953090787} +{"Pretrain/Learning Rate": 1.3196772728039596e-06, "Pretrain/Loss": 1.9931286573410034, "Pretrain/Loss (Raw)": 1.982702374458313, "Pretrain/Step": 17151, "Pretrain/Step Time": 8.48358927294612} +{"Pretrain/Learning Rate": 1.3183165918456198e-06, "Pretrain/Loss": 1.9921238422393799, "Pretrain/Loss (Raw)": 1.86534583568573, "Pretrain/Step": 17152, "Pretrain/Step Time": 8.486411113291979} +{"Pretrain/Learning Rate": 1.3169565937319216e-06, "Pretrain/Loss": 1.9921138286590576, "Pretrain/Loss (Raw)": 1.9486751556396484, "Pretrain/Step": 17153, "Pretrain/Step Time": 8.48483681678772} +{"Pretrain/Learning Rate": 1.3155972785020898e-06, "Pretrain/Loss": 1.9905567169189453, "Pretrain/Loss (Raw)": 1.702181100845337, "Pretrain/Step": 17154, "Pretrain/Step Time": 8.480413231998682} +{"Pretrain/Learning Rate": 1.3142386461953148e-06, "Pretrain/Loss": 1.9880642890930176, "Pretrain/Loss (Raw)": 1.8896971940994263, "Pretrain/Step": 17155, "Pretrain/Step Time": 8.472944742068648} +{"Pretrain/Learning Rate": 1.3128806968507684e-06, "Pretrain/Loss": 1.9919452667236328, "Pretrain/Loss (Raw)": 2.316195249557495, "Pretrain/Step": 17156, "Pretrain/Step Time": 8.475373284891248} +{"Pretrain/Learning Rate": 1.3115234305076107e-06, "Pretrain/Loss": 1.990272879600525, "Pretrain/Loss (Raw)": 1.8599015474319458, "Pretrain/Step": 17157, "Pretrain/Step Time": 8.478689080104232} +{"Pretrain/Learning Rate": 1.3101668472049717e-06, "Pretrain/Loss": 1.9895737171173096, "Pretrain/Loss (Raw)": 1.9771393537521362, "Pretrain/Step": 17158, "Pretrain/Step Time": 8.480131074786186} +{"Pretrain/Learning Rate": 1.3088109469819754e-06, "Pretrain/Loss": 1.9876697063446045, "Pretrain/Loss (Raw)": 1.6904698610305786, "Pretrain/Step": 17159, "Pretrain/Step Time": 8.480123301967978} +{"Pretrain/Learning Rate": 1.307455729877713e-06, "Pretrain/Loss": 1.9869861602783203, "Pretrain/Loss (Raw)": 1.9816144704818726, "Pretrain/Step": 17160, "Pretrain/Step Time": 8.479181682690978} +{"Pretrain/Learning Rate": 1.3061011959312613e-06, "Pretrain/Loss": 1.9895497560501099, "Pretrain/Loss (Raw)": 2.165008544921875, "Pretrain/Step": 17161, "Pretrain/Step Time": 8.478341406211257} +{"Pretrain/Learning Rate": 1.304747345181681e-06, "Pretrain/Loss": 1.988293170928955, "Pretrain/Loss (Raw)": 2.0548086166381836, "Pretrain/Step": 17162, "Pretrain/Step Time": 8.475073799490929} +{"Pretrain/Learning Rate": 1.3033941776680047e-06, "Pretrain/Loss": 1.9879229068756104, "Pretrain/Loss (Raw)": 2.0254859924316406, "Pretrain/Step": 17163, "Pretrain/Step Time": 8.48288295418024} +{"Pretrain/Learning Rate": 1.302041693429254e-06, "Pretrain/Loss": 1.989576816558838, "Pretrain/Loss (Raw)": 1.9397730827331543, "Pretrain/Step": 17164, "Pretrain/Step Time": 8.47883171401918} +{"Pretrain/Learning Rate": 1.3006898925044253e-06, "Pretrain/Loss": 1.9881258010864258, "Pretrain/Loss (Raw)": 2.039795398712158, "Pretrain/Step": 17165, "Pretrain/Step Time": 8.480240248143673} +{"Pretrain/Learning Rate": 1.299338774932493e-06, "Pretrain/Loss": 1.9852824211120605, "Pretrain/Loss (Raw)": 1.746095895767212, "Pretrain/Step": 17166, "Pretrain/Step Time": 8.483278499916196} +{"Pretrain/Learning Rate": 1.2979883407524236e-06, "Pretrain/Loss": 1.9853744506835938, "Pretrain/Loss (Raw)": 2.058568000793457, "Pretrain/Step": 17167, "Pretrain/Step Time": 8.481423338875175} +{"Pretrain/Learning Rate": 1.2966385900031463e-06, "Pretrain/Loss": 1.9874637126922607, "Pretrain/Loss (Raw)": 2.049485921859741, "Pretrain/Step": 17168, "Pretrain/Step Time": 8.481962945312262} +{"Pretrain/Learning Rate": 1.2952895227235917e-06, "Pretrain/Loss": 1.9867994785308838, "Pretrain/Loss (Raw)": 2.0245583057403564, "Pretrain/Step": 17169, "Pretrain/Step Time": 8.485255997627974} +{"Pretrain/Learning Rate": 1.2939411389526507e-06, "Pretrain/Loss": 1.9903051853179932, "Pretrain/Loss (Raw)": 2.285353183746338, "Pretrain/Step": 17170, "Pretrain/Step Time": 8.481962757185102} +{"Pretrain/Learning Rate": 1.2925934387292033e-06, "Pretrain/Loss": 1.9893178939819336, "Pretrain/Loss (Raw)": 1.8223884105682373, "Pretrain/Step": 17171, "Pretrain/Step Time": 8.476682526990771} +{"Pretrain/Learning Rate": 1.2912464220921155e-06, "Pretrain/Loss": 1.9902756214141846, "Pretrain/Loss (Raw)": 1.9170002937316895, "Pretrain/Step": 17172, "Pretrain/Step Time": 8.480559665709734} +{"Pretrain/Learning Rate": 1.2899000890802175e-06, "Pretrain/Loss": 1.9902608394622803, "Pretrain/Loss (Raw)": 1.8464945554733276, "Pretrain/Step": 17173, "Pretrain/Step Time": 8.47788431495428} +{"Pretrain/Learning Rate": 1.2885544397323424e-06, "Pretrain/Loss": 1.9891834259033203, "Pretrain/Loss (Raw)": 1.8782052993774414, "Pretrain/Step": 17174, "Pretrain/Step Time": 8.478249426931143} +{"Pretrain/Learning Rate": 1.2872094740872808e-06, "Pretrain/Loss": 1.9893410205841064, "Pretrain/Loss (Raw)": 2.0223429203033447, "Pretrain/Step": 17175, "Pretrain/Step Time": 8.476740933954716} +{"Pretrain/Learning Rate": 1.2858651921838188e-06, "Pretrain/Loss": 1.9923126697540283, "Pretrain/Loss (Raw)": 1.9362343549728394, "Pretrain/Step": 17176, "Pretrain/Step Time": 8.480792032554746} +{"Pretrain/Learning Rate": 1.284521594060717e-06, "Pretrain/Loss": 1.9918129444122314, "Pretrain/Loss (Raw)": 2.0290305614471436, "Pretrain/Step": 17177, "Pretrain/Step Time": 8.478101575747132} +{"Pretrain/Learning Rate": 1.2831786797567135e-06, "Pretrain/Loss": 1.9909300804138184, "Pretrain/Loss (Raw)": 1.865774393081665, "Pretrain/Step": 17178, "Pretrain/Step Time": 8.47785078920424} +{"Pretrain/Learning Rate": 1.2818364493105362e-06, "Pretrain/Loss": 1.9928162097930908, "Pretrain/Loss (Raw)": 2.0094141960144043, "Pretrain/Step": 17179, "Pretrain/Step Time": 8.478274963796139} +{"Pretrain/Learning Rate": 1.2804949027608842e-06, "Pretrain/Loss": 1.994992733001709, "Pretrain/Loss (Raw)": 2.2967076301574707, "Pretrain/Step": 17180, "Pretrain/Step Time": 8.478462563827634} +{"Pretrain/Learning Rate": 1.2791540401464436e-06, "Pretrain/Loss": 1.9972333908081055, "Pretrain/Loss (Raw)": 2.1599082946777344, "Pretrain/Step": 17181, "Pretrain/Step Time": 8.479900810867548} +{"Pretrain/Learning Rate": 1.2778138615058693e-06, "Pretrain/Loss": 1.9935939311981201, "Pretrain/Loss (Raw)": 1.5985736846923828, "Pretrain/Step": 17182, "Pretrain/Step Time": 8.477417098358274} +{"Pretrain/Learning Rate": 1.2764743668778139e-06, "Pretrain/Loss": 1.9952423572540283, "Pretrain/Loss (Raw)": 2.1081998348236084, "Pretrain/Step": 17183, "Pretrain/Step Time": 8.48345790989697} +{"Pretrain/Learning Rate": 1.2751355563008937e-06, "Pretrain/Loss": 1.9949438571929932, "Pretrain/Loss (Raw)": 1.9023656845092773, "Pretrain/Step": 17184, "Pretrain/Step Time": 8.480488985776901} +{"Pretrain/Learning Rate": 1.273797429813714e-06, "Pretrain/Loss": 1.9953229427337646, "Pretrain/Loss (Raw)": 1.9955737590789795, "Pretrain/Step": 17185, "Pretrain/Step Time": 8.481026137247682} +{"Pretrain/Learning Rate": 1.2724599874548604e-06, "Pretrain/Loss": 1.9941825866699219, "Pretrain/Loss (Raw)": 1.8734205961227417, "Pretrain/Step": 17186, "Pretrain/Step Time": 8.47782906703651} +{"Pretrain/Learning Rate": 1.271123229262894e-06, "Pretrain/Loss": 1.9948885440826416, "Pretrain/Loss (Raw)": 1.9857828617095947, "Pretrain/Step": 17187, "Pretrain/Step Time": 8.478086736053228} +{"Pretrain/Learning Rate": 1.2697871552763667e-06, "Pretrain/Loss": 1.9965990781784058, "Pretrain/Loss (Raw)": 2.03964900970459, "Pretrain/Step": 17188, "Pretrain/Step Time": 8.476970333606005} +{"Pretrain/Learning Rate": 1.2684517655337958e-06, "Pretrain/Loss": 1.9969940185546875, "Pretrain/Loss (Raw)": 2.127319574356079, "Pretrain/Step": 17189, "Pretrain/Step Time": 8.479167433455586} +{"Pretrain/Learning Rate": 1.2671170600736859e-06, "Pretrain/Loss": 1.995806097984314, "Pretrain/Loss (Raw)": 1.937241554260254, "Pretrain/Step": 17190, "Pretrain/Step Time": 8.475894467905164} +{"Pretrain/Learning Rate": 1.2657830389345288e-06, "Pretrain/Loss": 1.996015191078186, "Pretrain/Loss (Raw)": 2.0620176792144775, "Pretrain/Step": 17191, "Pretrain/Step Time": 8.474868584424257} +{"Pretrain/Learning Rate": 1.2644497021547824e-06, "Pretrain/Loss": 1.9968210458755493, "Pretrain/Loss (Raw)": 2.0725061893463135, "Pretrain/Step": 17192, "Pretrain/Step Time": 8.47527970187366} +{"Pretrain/Learning Rate": 1.2631170497728995e-06, "Pretrain/Loss": 1.9961717128753662, "Pretrain/Loss (Raw)": 1.8799136877059937, "Pretrain/Step": 17193, "Pretrain/Step Time": 8.476024063304067} +{"Pretrain/Learning Rate": 1.2617850818273019e-06, "Pretrain/Loss": 1.9958839416503906, "Pretrain/Loss (Raw)": 2.0095577239990234, "Pretrain/Step": 17194, "Pretrain/Step Time": 8.478302093222737} +{"Pretrain/Learning Rate": 1.2604537983563952e-06, "Pretrain/Loss": 1.9927256107330322, "Pretrain/Loss (Raw)": 1.7710639238357544, "Pretrain/Step": 17195, "Pretrain/Step Time": 8.477882258594036} +{"Pretrain/Learning Rate": 1.2591231993985708e-06, "Pretrain/Loss": 1.9918463230133057, "Pretrain/Loss (Raw)": 2.0299835205078125, "Pretrain/Step": 17196, "Pretrain/Step Time": 8.476385943591595} +{"Pretrain/Learning Rate": 1.2577932849921897e-06, "Pretrain/Loss": 1.9917505979537964, "Pretrain/Loss (Raw)": 1.9992072582244873, "Pretrain/Step": 17197, "Pretrain/Step Time": 8.473055670037866} +{"Pretrain/Learning Rate": 1.2564640551756047e-06, "Pretrain/Loss": 1.989987850189209, "Pretrain/Loss (Raw)": 1.823501706123352, "Pretrain/Step": 17198, "Pretrain/Step Time": 8.475969042629004} +{"Pretrain/Learning Rate": 1.2551355099871432e-06, "Pretrain/Loss": 1.9908580780029297, "Pretrain/Loss (Raw)": 2.0216596126556396, "Pretrain/Step": 17199, "Pretrain/Step Time": 8.475655898451805} +{"Pretrain/Learning Rate": 1.2538076494651052e-06, "Pretrain/Loss": 1.9944888353347778, "Pretrain/Loss (Raw)": 2.1981334686279297, "Pretrain/Step": 17200, "Pretrain/Step Time": 8.476700222119689} +{"Pretrain/Learning Rate": 1.2524804736477853e-06, "Pretrain/Loss": 1.9949262142181396, "Pretrain/Loss (Raw)": 2.142247438430786, "Pretrain/Step": 17201, "Pretrain/Step Time": 8.477557081729174} +{"Pretrain/Learning Rate": 1.2511539825734497e-06, "Pretrain/Loss": 1.9961752891540527, "Pretrain/Loss (Raw)": 2.0563573837280273, "Pretrain/Step": 17202, "Pretrain/Step Time": 8.481638925150037} +{"Pretrain/Learning Rate": 1.2498281762803489e-06, "Pretrain/Loss": 1.996368408203125, "Pretrain/Loss (Raw)": 2.1184020042419434, "Pretrain/Step": 17203, "Pretrain/Step Time": 8.476529315114021} +{"Pretrain/Learning Rate": 1.24850305480671e-06, "Pretrain/Loss": 1.99474036693573, "Pretrain/Loss (Raw)": 1.8868532180786133, "Pretrain/Step": 17204, "Pretrain/Step Time": 8.470751153305173} +{"Pretrain/Learning Rate": 1.2471786181907392e-06, "Pretrain/Loss": 1.9941928386688232, "Pretrain/Loss (Raw)": 1.9226056337356567, "Pretrain/Step": 17205, "Pretrain/Step Time": 8.4686492215842} +{"Pretrain/Learning Rate": 1.2458548664706305e-06, "Pretrain/Loss": 1.991913914680481, "Pretrain/Loss (Raw)": 1.8247294425964355, "Pretrain/Step": 17206, "Pretrain/Step Time": 8.46709674410522} +{"Pretrain/Learning Rate": 1.2445317996845478e-06, "Pretrain/Loss": 1.9912067651748657, "Pretrain/Loss (Raw)": 1.9381210803985596, "Pretrain/Step": 17207, "Pretrain/Step Time": 8.465075133368373} +{"Pretrain/Learning Rate": 1.2432094178706471e-06, "Pretrain/Loss": 1.9902424812316895, "Pretrain/Loss (Raw)": 1.7374473810195923, "Pretrain/Step": 17208, "Pretrain/Step Time": 8.464532155543566} +{"Pretrain/Learning Rate": 1.241887721067056e-06, "Pretrain/Loss": 1.992771029472351, "Pretrain/Loss (Raw)": 2.3189773559570312, "Pretrain/Step": 17209, "Pretrain/Step Time": 8.467293111607432} +{"Pretrain/Learning Rate": 1.2405667093118827e-06, "Pretrain/Loss": 1.9916865825653076, "Pretrain/Loss (Raw)": 1.8202362060546875, "Pretrain/Step": 17210, "Pretrain/Step Time": 8.46272443048656} +{"Pretrain/Learning Rate": 1.2392463826432193e-06, "Pretrain/Loss": 1.9902262687683105, "Pretrain/Loss (Raw)": 1.707152009010315, "Pretrain/Step": 17211, "Pretrain/Step Time": 8.471821449697018} +{"Pretrain/Learning Rate": 1.2379267410991352e-06, "Pretrain/Loss": 1.9878411293029785, "Pretrain/Loss (Raw)": 2.021232843399048, "Pretrain/Step": 17212, "Pretrain/Step Time": 8.4729218557477} +{"Pretrain/Learning Rate": 1.2366077847176832e-06, "Pretrain/Loss": 1.9887586832046509, "Pretrain/Loss (Raw)": 2.081697940826416, "Pretrain/Step": 17213, "Pretrain/Step Time": 8.470054568722844} +{"Pretrain/Learning Rate": 1.235289513536897e-06, "Pretrain/Loss": 1.9892220497131348, "Pretrain/Loss (Raw)": 2.1010401248931885, "Pretrain/Step": 17214, "Pretrain/Step Time": 8.469232963398099} +{"Pretrain/Learning Rate": 1.2339719275947792e-06, "Pretrain/Loss": 1.9902902841567993, "Pretrain/Loss (Raw)": 1.9173725843429565, "Pretrain/Step": 17215, "Pretrain/Step Time": 8.470861623063684} +{"Pretrain/Learning Rate": 1.2326550269293302e-06, "Pretrain/Loss": 1.9877495765686035, "Pretrain/Loss (Raw)": 1.7828218936920166, "Pretrain/Step": 17216, "Pretrain/Step Time": 8.469232872128487} +{"Pretrain/Learning Rate": 1.2313388115785168e-06, "Pretrain/Loss": 1.9904980659484863, "Pretrain/Loss (Raw)": 1.992708683013916, "Pretrain/Step": 17217, "Pretrain/Step Time": 8.46969479136169} +{"Pretrain/Learning Rate": 1.2300232815802948e-06, "Pretrain/Loss": 1.9907126426696777, "Pretrain/Loss (Raw)": 2.1008048057556152, "Pretrain/Step": 17218, "Pretrain/Step Time": 8.465451154857874} +{"Pretrain/Learning Rate": 1.2287084369725949e-06, "Pretrain/Loss": 1.9908862113952637, "Pretrain/Loss (Raw)": 2.071018934249878, "Pretrain/Step": 17219, "Pretrain/Step Time": 8.463284406810999} +{"Pretrain/Learning Rate": 1.2273942777933255e-06, "Pretrain/Loss": 1.9927411079406738, "Pretrain/Loss (Raw)": 2.0299110412597656, "Pretrain/Step": 17220, "Pretrain/Step Time": 8.464044481515884} +{"Pretrain/Learning Rate": 1.2260808040803873e-06, "Pretrain/Loss": 1.9955158233642578, "Pretrain/Loss (Raw)": 2.2216897010803223, "Pretrain/Step": 17221, "Pretrain/Step Time": 8.46388577669859} +{"Pretrain/Learning Rate": 1.224768015871647e-06, "Pretrain/Loss": 1.9957135915756226, "Pretrain/Loss (Raw)": 1.861031174659729, "Pretrain/Step": 17222, "Pretrain/Step Time": 8.467421537265182} +{"Pretrain/Learning Rate": 1.2234559132049628e-06, "Pretrain/Loss": 1.9948670864105225, "Pretrain/Loss (Raw)": 1.9467284679412842, "Pretrain/Step": 17223, "Pretrain/Step Time": 8.467196486890316} +{"Pretrain/Learning Rate": 1.2221444961181689e-06, "Pretrain/Loss": 1.992945671081543, "Pretrain/Loss (Raw)": 1.8771865367889404, "Pretrain/Step": 17224, "Pretrain/Step Time": 8.467129115015268} +{"Pretrain/Learning Rate": 1.2208337646490709e-06, "Pretrain/Loss": 1.9923357963562012, "Pretrain/Loss (Raw)": 1.9782992601394653, "Pretrain/Step": 17225, "Pretrain/Step Time": 8.46419857442379} +{"Pretrain/Learning Rate": 1.219523718835469e-06, "Pretrain/Loss": 1.9908922910690308, "Pretrain/Loss (Raw)": 1.862668514251709, "Pretrain/Step": 17226, "Pretrain/Step Time": 8.466781312599778} +{"Pretrain/Learning Rate": 1.2182143587151362e-06, "Pretrain/Loss": 1.991369605064392, "Pretrain/Loss (Raw)": 1.7873637676239014, "Pretrain/Step": 17227, "Pretrain/Step Time": 8.469194544479251} +{"Pretrain/Learning Rate": 1.216905684325831e-06, "Pretrain/Loss": 1.9918951988220215, "Pretrain/Loss (Raw)": 1.9623451232910156, "Pretrain/Step": 17228, "Pretrain/Step Time": 8.468034122139215} +{"Pretrain/Learning Rate": 1.215597695705284e-06, "Pretrain/Loss": 1.9911571741104126, "Pretrain/Loss (Raw)": 1.8446394205093384, "Pretrain/Step": 17229, "Pretrain/Step Time": 8.468137606978416} +{"Pretrain/Learning Rate": 1.214290392891204e-06, "Pretrain/Loss": 1.9895813465118408, "Pretrain/Loss (Raw)": 1.7830978631973267, "Pretrain/Step": 17230, "Pretrain/Step Time": 8.467125665396452} +{"Pretrain/Learning Rate": 1.2129837759213004e-06, "Pretrain/Loss": 1.9878031015396118, "Pretrain/Loss (Raw)": 1.8249335289001465, "Pretrain/Step": 17231, "Pretrain/Step Time": 8.470074690878391} +{"Pretrain/Learning Rate": 1.2116778448332338e-06, "Pretrain/Loss": 1.9888513088226318, "Pretrain/Loss (Raw)": 2.079021453857422, "Pretrain/Step": 17232, "Pretrain/Step Time": 8.470929088070989} +{"Pretrain/Learning Rate": 1.2103725996646747e-06, "Pretrain/Loss": 1.9865306615829468, "Pretrain/Loss (Raw)": 1.8917442560195923, "Pretrain/Step": 17233, "Pretrain/Step Time": 8.47223486378789} +{"Pretrain/Learning Rate": 1.2090680404532485e-06, "Pretrain/Loss": 1.9858300685882568, "Pretrain/Loss (Raw)": 1.925732135772705, "Pretrain/Step": 17234, "Pretrain/Step Time": 8.469798404723406} +{"Pretrain/Learning Rate": 1.2077641672365691e-06, "Pretrain/Loss": 1.982654333114624, "Pretrain/Loss (Raw)": 1.7740415334701538, "Pretrain/Step": 17235, "Pretrain/Step Time": 8.467999011278152} +{"Pretrain/Learning Rate": 1.206460980052243e-06, "Pretrain/Loss": 1.9832828044891357, "Pretrain/Loss (Raw)": 2.0089991092681885, "Pretrain/Step": 17236, "Pretrain/Step Time": 8.468439545482397} +{"Pretrain/Learning Rate": 1.2051584789378373e-06, "Pretrain/Loss": 1.984398603439331, "Pretrain/Loss (Raw)": 2.0044233798980713, "Pretrain/Step": 17237, "Pretrain/Step Time": 8.464310728013515} +{"Pretrain/Learning Rate": 1.2038566639309162e-06, "Pretrain/Loss": 1.981612205505371, "Pretrain/Loss (Raw)": 2.018711805343628, "Pretrain/Step": 17238, "Pretrain/Step Time": 8.467938045039773} +{"Pretrain/Learning Rate": 1.202555535069011e-06, "Pretrain/Loss": 1.9856866598129272, "Pretrain/Loss (Raw)": 2.343320846557617, "Pretrain/Step": 17239, "Pretrain/Step Time": 8.467602353543043} +{"Pretrain/Learning Rate": 1.2012550923896387e-06, "Pretrain/Loss": 1.986783742904663, "Pretrain/Loss (Raw)": 1.773881435394287, "Pretrain/Step": 17240, "Pretrain/Step Time": 8.46528392098844} +{"Pretrain/Learning Rate": 1.1999553359303029e-06, "Pretrain/Loss": 1.9874088764190674, "Pretrain/Loss (Raw)": 2.1073594093322754, "Pretrain/Step": 17241, "Pretrain/Step Time": 8.465847309678793} +{"Pretrain/Learning Rate": 1.1986562657284732e-06, "Pretrain/Loss": 1.9921544790267944, "Pretrain/Loss (Raw)": 2.6366279125213623, "Pretrain/Step": 17242, "Pretrain/Step Time": 8.464243104681373} +{"Pretrain/Learning Rate": 1.1973578818216147e-06, "Pretrain/Loss": 1.9918181896209717, "Pretrain/Loss (Raw)": 1.9625804424285889, "Pretrain/Step": 17243, "Pretrain/Step Time": 8.46230274066329} +{"Pretrain/Learning Rate": 1.1960601842471636e-06, "Pretrain/Loss": 1.992325782775879, "Pretrain/Loss (Raw)": 1.893481731414795, "Pretrain/Step": 17244, "Pretrain/Step Time": 8.466922232881188} +{"Pretrain/Learning Rate": 1.1947631730425318e-06, "Pretrain/Loss": 1.9926191568374634, "Pretrain/Loss (Raw)": 2.064497470855713, "Pretrain/Step": 17245, "Pretrain/Step Time": 8.465040734037757} +{"Pretrain/Learning Rate": 1.1934668482451228e-06, "Pretrain/Loss": 1.9934470653533936, "Pretrain/Loss (Raw)": 2.1562421321868896, "Pretrain/Step": 17246, "Pretrain/Step Time": 8.469723016023636} +{"Pretrain/Learning Rate": 1.192171209892315e-06, "Pretrain/Loss": 1.992604374885559, "Pretrain/Loss (Raw)": 1.9873089790344238, "Pretrain/Step": 17247, "Pretrain/Step Time": 8.46427839808166} +{"Pretrain/Learning Rate": 1.19087625802147e-06, "Pretrain/Loss": 1.995658278465271, "Pretrain/Loss (Raw)": 2.3335752487182617, "Pretrain/Step": 17248, "Pretrain/Step Time": 8.466993786394596} +{"Pretrain/Learning Rate": 1.1895819926699191e-06, "Pretrain/Loss": 1.996313452720642, "Pretrain/Loss (Raw)": 2.0117461681365967, "Pretrain/Step": 17249, "Pretrain/Step Time": 8.470950979739428} +{"Pretrain/Learning Rate": 1.188288413874991e-06, "Pretrain/Loss": 1.998366355895996, "Pretrain/Loss (Raw)": 2.042612075805664, "Pretrain/Step": 17250, "Pretrain/Step Time": 8.470364900305867} +{"Pretrain/Learning Rate": 1.1869955216739782e-06, "Pretrain/Loss": 1.996711015701294, "Pretrain/Loss (Raw)": 1.9451781511306763, "Pretrain/Step": 17251, "Pretrain/Step Time": 8.470790471881628} +{"Pretrain/Learning Rate": 1.1857033161041614e-06, "Pretrain/Loss": 1.9969747066497803, "Pretrain/Loss (Raw)": 2.103121042251587, "Pretrain/Step": 17252, "Pretrain/Step Time": 8.474176602438092} +{"Pretrain/Learning Rate": 1.184411797202803e-06, "Pretrain/Loss": 1.9932894706726074, "Pretrain/Loss (Raw)": 1.5004055500030518, "Pretrain/Step": 17253, "Pretrain/Step Time": 8.472502052783966} +{"Pretrain/Learning Rate": 1.1831209650071395e-06, "Pretrain/Loss": 1.9927639961242676, "Pretrain/Loss (Raw)": 1.9064725637435913, "Pretrain/Step": 17254, "Pretrain/Step Time": 8.471553383395076} +{"Pretrain/Learning Rate": 1.1818308195543942e-06, "Pretrain/Loss": 1.9920271635055542, "Pretrain/Loss (Raw)": 2.0144646167755127, "Pretrain/Step": 17255, "Pretrain/Step Time": 8.477893056347966} +{"Pretrain/Learning Rate": 1.1805413608817707e-06, "Pretrain/Loss": 1.9886854887008667, "Pretrain/Loss (Raw)": 1.8063113689422607, "Pretrain/Step": 17256, "Pretrain/Step Time": 8.479660699144006} +{"Pretrain/Learning Rate": 1.1792525890264388e-06, "Pretrain/Loss": 1.98930025100708, "Pretrain/Loss (Raw)": 1.8004770278930664, "Pretrain/Step": 17257, "Pretrain/Step Time": 8.47420715354383} +{"Pretrain/Learning Rate": 1.1779645040255694e-06, "Pretrain/Loss": 1.9887479543685913, "Pretrain/Loss (Raw)": 1.9783093929290771, "Pretrain/Step": 17258, "Pretrain/Step Time": 8.47625626809895} +{"Pretrain/Learning Rate": 1.176677105916299e-06, "Pretrain/Loss": 1.9911134243011475, "Pretrain/Loss (Raw)": 1.9299715757369995, "Pretrain/Step": 17259, "Pretrain/Step Time": 8.475010201334953} +{"Pretrain/Learning Rate": 1.175390394735751e-06, "Pretrain/Loss": 1.989370346069336, "Pretrain/Loss (Raw)": 1.8017070293426514, "Pretrain/Step": 17260, "Pretrain/Step Time": 8.478256715461612} +{"Pretrain/Learning Rate": 1.174104370521026e-06, "Pretrain/Loss": 1.9904091358184814, "Pretrain/Loss (Raw)": 2.0783498287200928, "Pretrain/Step": 17261, "Pretrain/Step Time": 8.477468963712454} +{"Pretrain/Learning Rate": 1.1728190333092025e-06, "Pretrain/Loss": 1.9880900382995605, "Pretrain/Loss (Raw)": 1.8958690166473389, "Pretrain/Step": 17262, "Pretrain/Step Time": 8.47551185823977} +{"Pretrain/Learning Rate": 1.1715343831373487e-06, "Pretrain/Loss": 1.9864088296890259, "Pretrain/Loss (Raw)": 1.8303979635238647, "Pretrain/Step": 17263, "Pretrain/Step Time": 8.477901866659522} +{"Pretrain/Learning Rate": 1.1702504200424986e-06, "Pretrain/Loss": 1.9805090427398682, "Pretrain/Loss (Raw)": 1.277060866355896, "Pretrain/Step": 17264, "Pretrain/Step Time": 8.482305090874434} +{"Pretrain/Learning Rate": 1.1689671440616862e-06, "Pretrain/Loss": 1.9808833599090576, "Pretrain/Loss (Raw)": 1.919316291809082, "Pretrain/Step": 17265, "Pretrain/Step Time": 8.4839085675776} +{"Pretrain/Learning Rate": 1.1676845552319016e-06, "Pretrain/Loss": 1.9798784255981445, "Pretrain/Loss (Raw)": 1.9873322248458862, "Pretrain/Step": 17266, "Pretrain/Step Time": 8.489006305113435} +{"Pretrain/Learning Rate": 1.1664026535901318e-06, "Pretrain/Loss": 1.9794540405273438, "Pretrain/Loss (Raw)": 1.906179428100586, "Pretrain/Step": 17267, "Pretrain/Step Time": 8.483444450423121} +{"Pretrain/Learning Rate": 1.1651214391733445e-06, "Pretrain/Loss": 1.9776543378829956, "Pretrain/Loss (Raw)": 1.8928605318069458, "Pretrain/Step": 17268, "Pretrain/Step Time": 8.478627411648631} +{"Pretrain/Learning Rate": 1.1638409120184712e-06, "Pretrain/Loss": 1.9729667901992798, "Pretrain/Loss (Raw)": 1.8580012321472168, "Pretrain/Step": 17269, "Pretrain/Step Time": 8.484786843881011} +{"Pretrain/Learning Rate": 1.1625610721624464e-06, "Pretrain/Loss": 1.9750288724899292, "Pretrain/Loss (Raw)": 2.0241565704345703, "Pretrain/Step": 17270, "Pretrain/Step Time": 8.48265577852726} +{"Pretrain/Learning Rate": 1.1612819196421653e-06, "Pretrain/Loss": 1.9737718105316162, "Pretrain/Loss (Raw)": 2.0117340087890625, "Pretrain/Step": 17271, "Pretrain/Step Time": 8.487727731466293} +{"Pretrain/Learning Rate": 1.1600034544945154e-06, "Pretrain/Loss": 1.9726630449295044, "Pretrain/Loss (Raw)": 1.8559503555297852, "Pretrain/Step": 17272, "Pretrain/Step Time": 8.484410682693124} +{"Pretrain/Learning Rate": 1.1587256767563642e-06, "Pretrain/Loss": 1.973893642425537, "Pretrain/Loss (Raw)": 2.1643457412719727, "Pretrain/Step": 17273, "Pretrain/Step Time": 8.483623007312417} +{"Pretrain/Learning Rate": 1.1574485864645463e-06, "Pretrain/Loss": 1.9708746671676636, "Pretrain/Loss (Raw)": 1.5834766626358032, "Pretrain/Step": 17274, "Pretrain/Step Time": 8.4849141407758} +{"Pretrain/Learning Rate": 1.156172183655893e-06, "Pretrain/Loss": 1.9696564674377441, "Pretrain/Loss (Raw)": 2.0283188819885254, "Pretrain/Step": 17275, "Pretrain/Step Time": 8.486864693462849} +{"Pretrain/Learning Rate": 1.154896468367203e-06, "Pretrain/Loss": 1.9700171947479248, "Pretrain/Loss (Raw)": 2.2265193462371826, "Pretrain/Step": 17276, "Pretrain/Step Time": 8.486576670780778} +{"Pretrain/Learning Rate": 1.1536214406352664e-06, "Pretrain/Loss": 1.9686431884765625, "Pretrain/Loss (Raw)": 1.8213773965835571, "Pretrain/Step": 17277, "Pretrain/Step Time": 8.489503175020218} +{"Pretrain/Learning Rate": 1.152347100496845e-06, "Pretrain/Loss": 1.965273380279541, "Pretrain/Loss (Raw)": 2.047659397125244, "Pretrain/Step": 17278, "Pretrain/Step Time": 8.485660975798965} +{"Pretrain/Learning Rate": 1.151073447988682e-06, "Pretrain/Loss": 1.9647605419158936, "Pretrain/Loss (Raw)": 1.917066216468811, "Pretrain/Step": 17279, "Pretrain/Step Time": 8.48669876717031} +{"Pretrain/Learning Rate": 1.1498004831475063e-06, "Pretrain/Loss": 1.9657293558120728, "Pretrain/Loss (Raw)": 1.9893600940704346, "Pretrain/Step": 17280, "Pretrain/Step Time": 8.484272714704275} +{"Pretrain/Learning Rate": 1.148528206010016e-06, "Pretrain/Loss": 1.965046763420105, "Pretrain/Loss (Raw)": 1.8613080978393555, "Pretrain/Step": 17281, "Pretrain/Step Time": 8.484709801152349} +{"Pretrain/Learning Rate": 1.1472566166129045e-06, "Pretrain/Loss": 1.9677977561950684, "Pretrain/Loss (Raw)": 2.054314374923706, "Pretrain/Step": 17282, "Pretrain/Step Time": 8.481540258973837} +{"Pretrain/Learning Rate": 1.1459857149928338e-06, "Pretrain/Loss": 1.9682308435440063, "Pretrain/Loss (Raw)": 1.9451239109039307, "Pretrain/Step": 17283, "Pretrain/Step Time": 8.489341532811522} +{"Pretrain/Learning Rate": 1.1447155011864468e-06, "Pretrain/Loss": 1.967079758644104, "Pretrain/Loss (Raw)": 2.1688523292541504, "Pretrain/Step": 17284, "Pretrain/Step Time": 8.486511837691069} +{"Pretrain/Learning Rate": 1.1434459752303728e-06, "Pretrain/Loss": 1.9685227870941162, "Pretrain/Loss (Raw)": 2.044619083404541, "Pretrain/Step": 17285, "Pretrain/Step Time": 8.482963275164366} +{"Pretrain/Learning Rate": 1.1421771371612128e-06, "Pretrain/Loss": 1.9680405855178833, "Pretrain/Loss (Raw)": 1.915406584739685, "Pretrain/Step": 17286, "Pretrain/Step Time": 8.487720429897308} +{"Pretrain/Learning Rate": 1.1409089870155598e-06, "Pretrain/Loss": 1.969738483428955, "Pretrain/Loss (Raw)": 1.9077959060668945, "Pretrain/Step": 17287, "Pretrain/Step Time": 8.492482099682093} +{"Pretrain/Learning Rate": 1.1396415248299791e-06, "Pretrain/Loss": 1.9702210426330566, "Pretrain/Loss (Raw)": 2.043384313583374, "Pretrain/Step": 17288, "Pretrain/Step Time": 8.490223877131939} +{"Pretrain/Learning Rate": 1.1383747506410081e-06, "Pretrain/Loss": 1.968949556350708, "Pretrain/Loss (Raw)": 2.0022716522216797, "Pretrain/Step": 17289, "Pretrain/Step Time": 8.495874045416713} +{"Pretrain/Learning Rate": 1.1371086644851843e-06, "Pretrain/Loss": 1.967725157737732, "Pretrain/Loss (Raw)": 1.8980814218521118, "Pretrain/Step": 17290, "Pretrain/Step Time": 8.497329965233803} +{"Pretrain/Learning Rate": 1.1358432663990087e-06, "Pretrain/Loss": 1.9652063846588135, "Pretrain/Loss (Raw)": 1.7030658721923828, "Pretrain/Step": 17291, "Pretrain/Step Time": 8.490973988547921} +{"Pretrain/Learning Rate": 1.1345785564189692e-06, "Pretrain/Loss": 1.9653569459915161, "Pretrain/Loss (Raw)": 1.959053874015808, "Pretrain/Step": 17292, "Pretrain/Step Time": 8.49997690320015} +{"Pretrain/Learning Rate": 1.1333145345815366e-06, "Pretrain/Loss": 1.964621663093567, "Pretrain/Loss (Raw)": 1.945693850517273, "Pretrain/Step": 17293, "Pretrain/Step Time": 8.497086545452476} +{"Pretrain/Learning Rate": 1.1320512009231481e-06, "Pretrain/Loss": 1.9686856269836426, "Pretrain/Loss (Raw)": 2.2662808895111084, "Pretrain/Step": 17294, "Pretrain/Step Time": 8.494012519717216} +{"Pretrain/Learning Rate": 1.1307885554802416e-06, "Pretrain/Loss": 1.9686319828033447, "Pretrain/Loss (Raw)": 2.0516915321350098, "Pretrain/Step": 17295, "Pretrain/Step Time": 8.49746236950159} +{"Pretrain/Learning Rate": 1.1295265982892184e-06, "Pretrain/Loss": 1.9671940803527832, "Pretrain/Loss (Raw)": 1.8654354810714722, "Pretrain/Step": 17296, "Pretrain/Step Time": 8.49675957299769} +{"Pretrain/Learning Rate": 1.1282653293864687e-06, "Pretrain/Loss": 1.9674890041351318, "Pretrain/Loss (Raw)": 2.0623083114624023, "Pretrain/Step": 17297, "Pretrain/Step Time": 8.494700657203794} +{"Pretrain/Learning Rate": 1.1270047488083634e-06, "Pretrain/Loss": 1.9658329486846924, "Pretrain/Loss (Raw)": 2.0733742713928223, "Pretrain/Step": 17298, "Pretrain/Step Time": 8.49778332002461} +{"Pretrain/Learning Rate": 1.1257448565912404e-06, "Pretrain/Loss": 1.9657541513442993, "Pretrain/Loss (Raw)": 1.8123077154159546, "Pretrain/Step": 17299, "Pretrain/Step Time": 8.501009149476886} +{"Pretrain/Learning Rate": 1.1244856527714397e-06, "Pretrain/Loss": 1.9655897617340088, "Pretrain/Loss (Raw)": 1.8959667682647705, "Pretrain/Step": 17300, "Pretrain/Step Time": 8.500238476321101} +{"Pretrain/Learning Rate": 1.1232271373852604e-06, "Pretrain/Loss": 1.9658026695251465, "Pretrain/Loss (Raw)": 1.8737437725067139, "Pretrain/Step": 17301, "Pretrain/Step Time": 8.499370386824012} +{"Pretrain/Learning Rate": 1.1219693104689954e-06, "Pretrain/Loss": 1.9681799411773682, "Pretrain/Loss (Raw)": 2.182490825653076, "Pretrain/Step": 17302, "Pretrain/Step Time": 8.499557860195637} +{"Pretrain/Learning Rate": 1.1207121720589158e-06, "Pretrain/Loss": 1.9671294689178467, "Pretrain/Loss (Raw)": 1.8878722190856934, "Pretrain/Step": 17303, "Pretrain/Step Time": 8.510304570198059} +{"Pretrain/Learning Rate": 1.119455722191262e-06, "Pretrain/Loss": 1.9682139158248901, "Pretrain/Loss (Raw)": 2.0750441551208496, "Pretrain/Step": 17304, "Pretrain/Step Time": 8.509704070165753} +{"Pretrain/Learning Rate": 1.118199960902272e-06, "Pretrain/Loss": 1.9688160419464111, "Pretrain/Loss (Raw)": 2.1061179637908936, "Pretrain/Step": 17305, "Pretrain/Step Time": 8.507383171468973} +{"Pretrain/Learning Rate": 1.1169448882281469e-06, "Pretrain/Loss": 1.969226598739624, "Pretrain/Loss (Raw)": 1.9183073043823242, "Pretrain/Step": 17306, "Pretrain/Step Time": 8.512317355722189} +{"Pretrain/Learning Rate": 1.1156905042050803e-06, "Pretrain/Loss": 1.9701595306396484, "Pretrain/Loss (Raw)": 2.1288352012634277, "Pretrain/Step": 17307, "Pretrain/Step Time": 8.512577695772052} +{"Pretrain/Learning Rate": 1.114436808869243e-06, "Pretrain/Loss": 1.9668689966201782, "Pretrain/Loss (Raw)": 1.8755213022232056, "Pretrain/Step": 17308, "Pretrain/Step Time": 8.511196747422218} +{"Pretrain/Learning Rate": 1.1131838022567786e-06, "Pretrain/Loss": 1.9656689167022705, "Pretrain/Loss (Raw)": 2.0063068866729736, "Pretrain/Step": 17309, "Pretrain/Step Time": 8.50945657491684} +{"Pretrain/Learning Rate": 1.1119314844038248e-06, "Pretrain/Loss": 1.9690113067626953, "Pretrain/Loss (Raw)": 2.0263895988464355, "Pretrain/Step": 17310, "Pretrain/Step Time": 8.513115288689733} +{"Pretrain/Learning Rate": 1.1106798553464804e-06, "Pretrain/Loss": 1.9680159091949463, "Pretrain/Loss (Raw)": 1.9807991981506348, "Pretrain/Step": 17311, "Pretrain/Step Time": 8.507625538855791} +{"Pretrain/Learning Rate": 1.109428915120847e-06, "Pretrain/Loss": 1.9674630165100098, "Pretrain/Loss (Raw)": 1.8315831422805786, "Pretrain/Step": 17312, "Pretrain/Step Time": 8.513413313776255} +{"Pretrain/Learning Rate": 1.1081786637629849e-06, "Pretrain/Loss": 1.970475435256958, "Pretrain/Loss (Raw)": 2.3811635971069336, "Pretrain/Step": 17313, "Pretrain/Step Time": 8.509116757661104} +{"Pretrain/Learning Rate": 1.106929101308954e-06, "Pretrain/Loss": 1.9732327461242676, "Pretrain/Loss (Raw)": 2.226374387741089, "Pretrain/Step": 17314, "Pretrain/Step Time": 8.510789779946208} +{"Pretrain/Learning Rate": 1.1056802277947753e-06, "Pretrain/Loss": 1.9737236499786377, "Pretrain/Loss (Raw)": 2.0486111640930176, "Pretrain/Step": 17315, "Pretrain/Step Time": 8.508962022140622} +{"Pretrain/Learning Rate": 1.104432043256462e-06, "Pretrain/Loss": 1.97426438331604, "Pretrain/Loss (Raw)": 2.108865737915039, "Pretrain/Step": 17316, "Pretrain/Step Time": 8.504482896998525} +{"Pretrain/Learning Rate": 1.1031845477300073e-06, "Pretrain/Loss": 1.9705562591552734, "Pretrain/Loss (Raw)": 1.6526799201965332, "Pretrain/Step": 17317, "Pretrain/Step Time": 8.508355103433132} +{"Pretrain/Learning Rate": 1.1019377412513771e-06, "Pretrain/Loss": 1.9700260162353516, "Pretrain/Loss (Raw)": 1.8693656921386719, "Pretrain/Step": 17318, "Pretrain/Step Time": 8.5068662147969} +{"Pretrain/Learning Rate": 1.1006916238565285e-06, "Pretrain/Loss": 1.9693188667297363, "Pretrain/Loss (Raw)": 1.9715076684951782, "Pretrain/Step": 17319, "Pretrain/Step Time": 8.5095295291394} +{"Pretrain/Learning Rate": 1.0994461955813911e-06, "Pretrain/Loss": 1.9687749147415161, "Pretrain/Loss (Raw)": 2.0028796195983887, "Pretrain/Step": 17320, "Pretrain/Step Time": 8.507790137082338} +{"Pretrain/Learning Rate": 1.098201456461867e-06, "Pretrain/Loss": 1.9715183973312378, "Pretrain/Loss (Raw)": 2.2310726642608643, "Pretrain/Step": 17321, "Pretrain/Step Time": 8.511978337541223} +{"Pretrain/Learning Rate": 1.0969574065338606e-06, "Pretrain/Loss": 1.972182035446167, "Pretrain/Loss (Raw)": 2.09450626373291, "Pretrain/Step": 17322, "Pretrain/Step Time": 8.50755961239338} +{"Pretrain/Learning Rate": 1.0957140458332322e-06, "Pretrain/Loss": 1.9723176956176758, "Pretrain/Loss (Raw)": 1.7884360551834106, "Pretrain/Step": 17323, "Pretrain/Step Time": 8.514291729778051} +{"Pretrain/Learning Rate": 1.0944713743958418e-06, "Pretrain/Loss": 1.9730950593948364, "Pretrain/Loss (Raw)": 2.1294796466827393, "Pretrain/Step": 17324, "Pretrain/Step Time": 8.517613589763641} +{"Pretrain/Learning Rate": 1.0932293922575165e-06, "Pretrain/Loss": 1.973963737487793, "Pretrain/Loss (Raw)": 2.110405445098877, "Pretrain/Step": 17325, "Pretrain/Step Time": 8.525190483778715} +{"Pretrain/Learning Rate": 1.0919880994540637e-06, "Pretrain/Loss": 1.9755561351776123, "Pretrain/Loss (Raw)": 2.027318239212036, "Pretrain/Step": 17326, "Pretrain/Step Time": 8.519765267148614} +{"Pretrain/Learning Rate": 1.0907474960212854e-06, "Pretrain/Loss": 1.9748646020889282, "Pretrain/Loss (Raw)": 1.933151364326477, "Pretrain/Step": 17327, "Pretrain/Step Time": 8.5228461176157} +{"Pretrain/Learning Rate": 1.0895075819949446e-06, "Pretrain/Loss": 1.9722156524658203, "Pretrain/Loss (Raw)": 1.859057903289795, "Pretrain/Step": 17328, "Pretrain/Step Time": 8.521349182352424} +{"Pretrain/Learning Rate": 1.0882683574107988e-06, "Pretrain/Loss": 1.9691427946090698, "Pretrain/Loss (Raw)": 1.7489197254180908, "Pretrain/Step": 17329, "Pretrain/Step Time": 8.521268183365464} +{"Pretrain/Learning Rate": 1.0870298223045805e-06, "Pretrain/Loss": 1.9680640697479248, "Pretrain/Loss (Raw)": 1.9182825088500977, "Pretrain/Step": 17330, "Pretrain/Step Time": 8.519823711365461} +{"Pretrain/Learning Rate": 1.0857919767119945e-06, "Pretrain/Loss": 1.965553879737854, "Pretrain/Loss (Raw)": 1.7970993518829346, "Pretrain/Step": 17331, "Pretrain/Step Time": 8.521238576620817} +{"Pretrain/Learning Rate": 1.0845548206687429e-06, "Pretrain/Loss": 1.964715838432312, "Pretrain/Loss (Raw)": 1.7795847654342651, "Pretrain/Step": 17332, "Pretrain/Step Time": 8.518070384860039} +{"Pretrain/Learning Rate": 1.0833183542104885e-06, "Pretrain/Loss": 1.9652409553527832, "Pretrain/Loss (Raw)": 1.9898196458816528, "Pretrain/Step": 17333, "Pretrain/Step Time": 8.515754317864776} +{"Pretrain/Learning Rate": 1.0820825773728948e-06, "Pretrain/Loss": 1.9664177894592285, "Pretrain/Loss (Raw)": 1.9753729104995728, "Pretrain/Step": 17334, "Pretrain/Step Time": 8.523003352805972} +{"Pretrain/Learning Rate": 1.080847490191589e-06, "Pretrain/Loss": 1.9676449298858643, "Pretrain/Loss (Raw)": 2.095201015472412, "Pretrain/Step": 17335, "Pretrain/Step Time": 8.524108747020364} +{"Pretrain/Learning Rate": 1.079613092702178e-06, "Pretrain/Loss": 1.968694806098938, "Pretrain/Loss (Raw)": 1.8718197345733643, "Pretrain/Step": 17336, "Pretrain/Step Time": 8.517835838720202} +{"Pretrain/Learning Rate": 1.0783793849402674e-06, "Pretrain/Loss": 1.9651910066604614, "Pretrain/Loss (Raw)": 1.8704919815063477, "Pretrain/Step": 17337, "Pretrain/Step Time": 8.517963018268347} +{"Pretrain/Learning Rate": 1.0771463669414173e-06, "Pretrain/Loss": 1.9665141105651855, "Pretrain/Loss (Raw)": 1.989594578742981, "Pretrain/Step": 17338, "Pretrain/Step Time": 8.518715238198638} +{"Pretrain/Learning Rate": 1.0759140387411937e-06, "Pretrain/Loss": 1.9698681831359863, "Pretrain/Loss (Raw)": 2.1364800930023193, "Pretrain/Step": 17339, "Pretrain/Step Time": 8.511856988072395} +{"Pretrain/Learning Rate": 1.074682400375121e-06, "Pretrain/Loss": 1.968797206878662, "Pretrain/Loss (Raw)": 1.8841311931610107, "Pretrain/Step": 17340, "Pretrain/Step Time": 8.513252457603812} +{"Pretrain/Learning Rate": 1.0734514518787126e-06, "Pretrain/Loss": 1.9686567783355713, "Pretrain/Loss (Raw)": 2.0637407302856445, "Pretrain/Step": 17341, "Pretrain/Step Time": 8.51583425141871} +{"Pretrain/Learning Rate": 1.0722211932874675e-06, "Pretrain/Loss": 1.9677748680114746, "Pretrain/Loss (Raw)": 1.9881545305252075, "Pretrain/Step": 17342, "Pretrain/Step Time": 8.51775280572474} +{"Pretrain/Learning Rate": 1.0709916246368524e-06, "Pretrain/Loss": 1.9684538841247559, "Pretrain/Loss (Raw)": 2.004281997680664, "Pretrain/Step": 17343, "Pretrain/Step Time": 8.515223233029246} +{"Pretrain/Learning Rate": 1.06976274596233e-06, "Pretrain/Loss": 1.968390703201294, "Pretrain/Loss (Raw)": 1.774711012840271, "Pretrain/Step": 17344, "Pretrain/Step Time": 8.515229601413012} +{"Pretrain/Learning Rate": 1.0685345572993278e-06, "Pretrain/Loss": 1.9680733680725098, "Pretrain/Loss (Raw)": 1.9521064758300781, "Pretrain/Step": 17345, "Pretrain/Step Time": 8.51657415740192} +{"Pretrain/Learning Rate": 1.0673070586832563e-06, "Pretrain/Loss": 1.965693473815918, "Pretrain/Loss (Raw)": 1.7961844205856323, "Pretrain/Step": 17346, "Pretrain/Step Time": 8.520352993160486} +{"Pretrain/Learning Rate": 1.0660802501495204e-06, "Pretrain/Loss": 1.9658541679382324, "Pretrain/Loss (Raw)": 2.0915939807891846, "Pretrain/Step": 17347, "Pretrain/Step Time": 8.521640568971634} +{"Pretrain/Learning Rate": 1.0648541317334836e-06, "Pretrain/Loss": 1.964064121246338, "Pretrain/Loss (Raw)": 1.8007752895355225, "Pretrain/Step": 17348, "Pretrain/Step Time": 8.521891120821238} +{"Pretrain/Learning Rate": 1.0636287034705066e-06, "Pretrain/Loss": 1.961984634399414, "Pretrain/Loss (Raw)": 1.9555186033248901, "Pretrain/Step": 17349, "Pretrain/Step Time": 8.516133410856128} +{"Pretrain/Learning Rate": 1.062403965395925e-06, "Pretrain/Loss": 1.962355136871338, "Pretrain/Loss (Raw)": 1.9084445238113403, "Pretrain/Step": 17350, "Pretrain/Step Time": 8.516270760446787} +{"Pretrain/Learning Rate": 1.0611799175450494e-06, "Pretrain/Loss": 1.9632097482681274, "Pretrain/Loss (Raw)": 2.0561318397521973, "Pretrain/Step": 17351, "Pretrain/Step Time": 8.517995808273554} +{"Pretrain/Learning Rate": 1.0599565599531735e-06, "Pretrain/Loss": 1.9647471904754639, "Pretrain/Loss (Raw)": 2.073960781097412, "Pretrain/Step": 17352, "Pretrain/Step Time": 8.519732527434826} +{"Pretrain/Learning Rate": 1.0587338926555724e-06, "Pretrain/Loss": 1.9656331539154053, "Pretrain/Loss (Raw)": 2.0917141437530518, "Pretrain/Step": 17353, "Pretrain/Step Time": 8.521776508539915} +{"Pretrain/Learning Rate": 1.0575119156875036e-06, "Pretrain/Loss": 1.9682056903839111, "Pretrain/Loss (Raw)": 2.1919593811035156, "Pretrain/Step": 17354, "Pretrain/Step Time": 8.520922400057316} +{"Pretrain/Learning Rate": 1.0562906290841973e-06, "Pretrain/Loss": 1.9696005582809448, "Pretrain/Loss (Raw)": 1.9659178256988525, "Pretrain/Step": 17355, "Pretrain/Step Time": 8.518304267898202} +{"Pretrain/Learning Rate": 1.0550700328808755e-06, "Pretrain/Loss": 1.9732298851013184, "Pretrain/Loss (Raw)": 2.426884174346924, "Pretrain/Step": 17356, "Pretrain/Step Time": 8.520582642406225} +{"Pretrain/Learning Rate": 1.0538501271127265e-06, "Pretrain/Loss": 1.9741193056106567, "Pretrain/Loss (Raw)": 1.9584851264953613, "Pretrain/Step": 17357, "Pretrain/Step Time": 8.52425966784358} +{"Pretrain/Learning Rate": 1.052630911814928e-06, "Pretrain/Loss": 1.9772937297821045, "Pretrain/Loss (Raw)": 2.1894233226776123, "Pretrain/Step": 17358, "Pretrain/Step Time": 8.524173013865948} +{"Pretrain/Learning Rate": 1.0514123870226377e-06, "Pretrain/Loss": 1.9772828817367554, "Pretrain/Loss (Raw)": 1.8235515356063843, "Pretrain/Step": 17359, "Pretrain/Step Time": 8.521142888814211} +{"Pretrain/Learning Rate": 1.0501945527709862e-06, "Pretrain/Loss": 1.977736234664917, "Pretrain/Loss (Raw)": 2.137040853500366, "Pretrain/Step": 17360, "Pretrain/Step Time": 8.521251734346151} +{"Pretrain/Learning Rate": 1.0489774090950948e-06, "Pretrain/Loss": 1.9767119884490967, "Pretrain/Loss (Raw)": 1.7606490850448608, "Pretrain/Step": 17361, "Pretrain/Step Time": 8.5222954954952} +{"Pretrain/Learning Rate": 1.0477609560300527e-06, "Pretrain/Loss": 1.976953387260437, "Pretrain/Loss (Raw)": 1.956632137298584, "Pretrain/Step": 17362, "Pretrain/Step Time": 8.524145379662514} +{"Pretrain/Learning Rate": 1.0465451936109371e-06, "Pretrain/Loss": 1.9780888557434082, "Pretrain/Loss (Raw)": 1.919386863708496, "Pretrain/Step": 17363, "Pretrain/Step Time": 8.522059524431825} +{"Pretrain/Learning Rate": 1.045330121872809e-06, "Pretrain/Loss": 1.9781908988952637, "Pretrain/Loss (Raw)": 2.0220489501953125, "Pretrain/Step": 17364, "Pretrain/Step Time": 8.524147855117917} +{"Pretrain/Learning Rate": 1.044115740850693e-06, "Pretrain/Loss": 1.976741075515747, "Pretrain/Loss (Raw)": 1.8188464641571045, "Pretrain/Step": 17365, "Pretrain/Step Time": 8.523047473281622} +{"Pretrain/Learning Rate": 1.0429020505796194e-06, "Pretrain/Loss": 1.9766428470611572, "Pretrain/Loss (Raw)": 2.006147623062134, "Pretrain/Step": 17366, "Pretrain/Step Time": 8.520464660599828} +{"Pretrain/Learning Rate": 1.0416890510945743e-06, "Pretrain/Loss": 1.9733860492706299, "Pretrain/Loss (Raw)": 1.9264450073242188, "Pretrain/Step": 17367, "Pretrain/Step Time": 8.521583614870906} +{"Pretrain/Learning Rate": 1.0404767424305322e-06, "Pretrain/Loss": 1.9738707542419434, "Pretrain/Loss (Raw)": 1.8359211683273315, "Pretrain/Step": 17368, "Pretrain/Step Time": 8.522418264299631} +{"Pretrain/Learning Rate": 1.0392651246224573e-06, "Pretrain/Loss": 1.9728620052337646, "Pretrain/Loss (Raw)": 1.9782227277755737, "Pretrain/Step": 17369, "Pretrain/Step Time": 8.518716553226113} +{"Pretrain/Learning Rate": 1.0380541977052765e-06, "Pretrain/Loss": 1.9677963256835938, "Pretrain/Loss (Raw)": 1.9882491827011108, "Pretrain/Step": 17370, "Pretrain/Step Time": 8.524461826309562} +{"Pretrain/Learning Rate": 1.0368439617139152e-06, "Pretrain/Loss": 1.967395305633545, "Pretrain/Loss (Raw)": 1.9112441539764404, "Pretrain/Step": 17371, "Pretrain/Step Time": 8.527142256498337} +{"Pretrain/Learning Rate": 1.0356344166832648e-06, "Pretrain/Loss": 1.9658222198486328, "Pretrain/Loss (Raw)": 1.6921241283416748, "Pretrain/Step": 17372, "Pretrain/Step Time": 8.523887734860182} +{"Pretrain/Learning Rate": 1.0344255626482002e-06, "Pretrain/Loss": 1.9653918743133545, "Pretrain/Loss (Raw)": 2.0094101428985596, "Pretrain/Step": 17373, "Pretrain/Step Time": 8.52239990234375} +{"Pretrain/Learning Rate": 1.0332173996435824e-06, "Pretrain/Loss": 1.9638316631317139, "Pretrain/Loss (Raw)": 1.9565390348434448, "Pretrain/Step": 17374, "Pretrain/Step Time": 8.521759880706668} +{"Pretrain/Learning Rate": 1.0320099277042416e-06, "Pretrain/Loss": 1.9651720523834229, "Pretrain/Loss (Raw)": 2.158877372741699, "Pretrain/Step": 17375, "Pretrain/Step Time": 8.527692575007677} +{"Pretrain/Learning Rate": 1.030803146865003e-06, "Pretrain/Loss": 1.9609098434448242, "Pretrain/Loss (Raw)": 1.788017988204956, "Pretrain/Step": 17376, "Pretrain/Step Time": 8.52434371970594} +{"Pretrain/Learning Rate": 1.0295970571606555e-06, "Pretrain/Loss": 1.962281584739685, "Pretrain/Loss (Raw)": 2.1873059272766113, "Pretrain/Step": 17377, "Pretrain/Step Time": 8.519760789349675} +{"Pretrain/Learning Rate": 1.0283916586259796e-06, "Pretrain/Loss": 1.9601147174835205, "Pretrain/Loss (Raw)": 1.7652682065963745, "Pretrain/Step": 17378, "Pretrain/Step Time": 8.520231317728758} +{"Pretrain/Learning Rate": 1.0271869512957334e-06, "Pretrain/Loss": 1.9617387056350708, "Pretrain/Loss (Raw)": 2.153047800064087, "Pretrain/Step": 17379, "Pretrain/Step Time": 8.522545598447323} +{"Pretrain/Learning Rate": 1.0259829352046474e-06, "Pretrain/Loss": 1.9614951610565186, "Pretrain/Loss (Raw)": 2.0719571113586426, "Pretrain/Step": 17380, "Pretrain/Step Time": 8.523079551756382} +{"Pretrain/Learning Rate": 1.024779610387447e-06, "Pretrain/Loss": 1.964059829711914, "Pretrain/Loss (Raw)": 1.8286664485931396, "Pretrain/Step": 17381, "Pretrain/Step Time": 8.51929622143507} +{"Pretrain/Learning Rate": 1.0235769768788206e-06, "Pretrain/Loss": 1.9650160074234009, "Pretrain/Loss (Raw)": 2.028864860534668, "Pretrain/Step": 17382, "Pretrain/Step Time": 8.516491021960974} +{"Pretrain/Learning Rate": 1.022375034713452e-06, "Pretrain/Loss": 1.9645878076553345, "Pretrain/Loss (Raw)": 1.9596617221832275, "Pretrain/Step": 17383, "Pretrain/Step Time": 8.51811420917511} +{"Pretrain/Learning Rate": 1.0211737839259994e-06, "Pretrain/Loss": 1.9628827571868896, "Pretrain/Loss (Raw)": 1.5880756378173828, "Pretrain/Step": 17384, "Pretrain/Step Time": 8.515989154577255} +{"Pretrain/Learning Rate": 1.0199732245510907e-06, "Pretrain/Loss": 1.9651527404785156, "Pretrain/Loss (Raw)": 2.0910117626190186, "Pretrain/Step": 17385, "Pretrain/Step Time": 8.51326317153871} +{"Pretrain/Learning Rate": 1.0187733566233538e-06, "Pretrain/Loss": 1.96488618850708, "Pretrain/Loss (Raw)": 1.9442073106765747, "Pretrain/Step": 17386, "Pretrain/Step Time": 8.51317210122943} +{"Pretrain/Learning Rate": 1.0175741801773803e-06, "Pretrain/Loss": 1.9673571586608887, "Pretrain/Loss (Raw)": 2.2462432384490967, "Pretrain/Step": 17387, "Pretrain/Step Time": 8.518028751015663} +{"Pretrain/Learning Rate": 1.0163756952477482e-06, "Pretrain/Loss": 1.9685087203979492, "Pretrain/Loss (Raw)": 1.9491225481033325, "Pretrain/Step": 17388, "Pretrain/Step Time": 8.509508496150374} +{"Pretrain/Learning Rate": 1.0151779018690188e-06, "Pretrain/Loss": 1.9669544696807861, "Pretrain/Loss (Raw)": 1.8793755769729614, "Pretrain/Step": 17389, "Pretrain/Step Time": 8.511323764920235} +{"Pretrain/Learning Rate": 1.0139808000757228e-06, "Pretrain/Loss": 1.9702205657958984, "Pretrain/Loss (Raw)": 2.313931465148926, "Pretrain/Step": 17390, "Pretrain/Step Time": 8.513143640011549} +{"Pretrain/Learning Rate": 1.0127843899023826e-06, "Pretrain/Loss": 1.9727171659469604, "Pretrain/Loss (Raw)": 2.1499788761138916, "Pretrain/Step": 17391, "Pretrain/Step Time": 8.51087386906147} +{"Pretrain/Learning Rate": 1.0115886713834928e-06, "Pretrain/Loss": 1.9760258197784424, "Pretrain/Loss (Raw)": 1.7005808353424072, "Pretrain/Step": 17392, "Pretrain/Step Time": 8.511114589869976} +{"Pretrain/Learning Rate": 1.0103936445535368e-06, "Pretrain/Loss": 1.976379632949829, "Pretrain/Loss (Raw)": 1.9645791053771973, "Pretrain/Step": 17393, "Pretrain/Step Time": 8.508726321160793} +{"Pretrain/Learning Rate": 1.0091993094469648e-06, "Pretrain/Loss": 1.9769272804260254, "Pretrain/Loss (Raw)": 2.057446002960205, "Pretrain/Step": 17394, "Pretrain/Step Time": 8.504695734009147} +{"Pretrain/Learning Rate": 1.008005666098219e-06, "Pretrain/Loss": 1.9789406061172485, "Pretrain/Loss (Raw)": 2.16387677192688, "Pretrain/Step": 17395, "Pretrain/Step Time": 8.505132036283612} +{"Pretrain/Learning Rate": 1.0068127145417189e-06, "Pretrain/Loss": 1.979306936264038, "Pretrain/Loss (Raw)": 1.9397698640823364, "Pretrain/Step": 17396, "Pretrain/Step Time": 8.505408672615886} +{"Pretrain/Learning Rate": 1.0056204548118563e-06, "Pretrain/Loss": 1.9805047512054443, "Pretrain/Loss (Raw)": 2.0113003253936768, "Pretrain/Step": 17397, "Pretrain/Step Time": 8.496562784537673} +{"Pretrain/Learning Rate": 1.004428886943018e-06, "Pretrain/Loss": 1.9813048839569092, "Pretrain/Loss (Raw)": 2.1265923976898193, "Pretrain/Step": 17398, "Pretrain/Step Time": 8.506912959739566} +{"Pretrain/Learning Rate": 1.0032380109695537e-06, "Pretrain/Loss": 1.9817360639572144, "Pretrain/Loss (Raw)": 2.066910743713379, "Pretrain/Step": 17399, "Pretrain/Step Time": 8.50326825864613} +{"Pretrain/Learning Rate": 1.0020478269258032e-06, "Pretrain/Loss": 1.9806597232818604, "Pretrain/Loss (Raw)": 1.7181766033172607, "Pretrain/Step": 17400, "Pretrain/Step Time": 8.505926111713052} +{"Pretrain/Learning Rate": 1.0008583348460915e-06, "Pretrain/Loss": 1.9793288707733154, "Pretrain/Loss (Raw)": 1.9939990043640137, "Pretrain/Step": 17401, "Pretrain/Step Time": 8.501504238694906} +{"Pretrain/Learning Rate": 9.996695347647051e-07, "Pretrain/Loss": 1.981431245803833, "Pretrain/Loss (Raw)": 1.852584719657898, "Pretrain/Step": 17402, "Pretrain/Step Time": 8.501513365656137} +{"Pretrain/Learning Rate": 9.984814267159332e-07, "Pretrain/Loss": 1.9821335077285767, "Pretrain/Loss (Raw)": 2.118201971054077, "Pretrain/Step": 17403, "Pretrain/Step Time": 8.501815520226955} +{"Pretrain/Learning Rate": 9.972940107340288e-07, "Pretrain/Loss": 1.9789785146713257, "Pretrain/Loss (Raw)": 1.8226940631866455, "Pretrain/Step": 17404, "Pretrain/Step Time": 8.5049120914191} +{"Pretrain/Learning Rate": 9.96107286853229e-07, "Pretrain/Loss": 1.9825342893600464, "Pretrain/Loss (Raw)": 2.276500940322876, "Pretrain/Step": 17405, "Pretrain/Step Time": 8.50706964917481} +{"Pretrain/Learning Rate": 9.949212551077558e-07, "Pretrain/Loss": 1.9844077825546265, "Pretrain/Loss (Raw)": 2.2874722480773926, "Pretrain/Step": 17406, "Pretrain/Step Time": 8.506938848644495} +{"Pretrain/Learning Rate": 9.937359155318017e-07, "Pretrain/Loss": 1.9829344749450684, "Pretrain/Loss (Raw)": 1.7284917831420898, "Pretrain/Step": 17407, "Pretrain/Step Time": 8.50968343950808} +{"Pretrain/Learning Rate": 9.925512681595527e-07, "Pretrain/Loss": 1.983092188835144, "Pretrain/Loss (Raw)": 2.009549379348755, "Pretrain/Step": 17408, "Pretrain/Step Time": 8.512528419494629} +{"Pretrain/Learning Rate": 9.913673130251654e-07, "Pretrain/Loss": 1.9835569858551025, "Pretrain/Loss (Raw)": 1.9207994937896729, "Pretrain/Step": 17409, "Pretrain/Step Time": 8.512511467561126} +{"Pretrain/Learning Rate": 9.901840501627735e-07, "Pretrain/Loss": 1.9830923080444336, "Pretrain/Loss (Raw)": 1.9948195219039917, "Pretrain/Step": 17410, "Pretrain/Step Time": 8.520771948620677} +{"Pretrain/Learning Rate": 9.890014796064995e-07, "Pretrain/Loss": 1.9828470945358276, "Pretrain/Loss (Raw)": 1.9137420654296875, "Pretrain/Step": 17411, "Pretrain/Step Time": 8.514767682179809} +{"Pretrain/Learning Rate": 9.878196013904383e-07, "Pretrain/Loss": 1.9824191331863403, "Pretrain/Loss (Raw)": 2.1140754222869873, "Pretrain/Step": 17412, "Pretrain/Step Time": 8.51522258669138} +{"Pretrain/Learning Rate": 9.86638415548677e-07, "Pretrain/Loss": 1.9805786609649658, "Pretrain/Loss (Raw)": 1.8090311288833618, "Pretrain/Step": 17413, "Pretrain/Step Time": 8.517269112169743} +{"Pretrain/Learning Rate": 9.854579221152682e-07, "Pretrain/Loss": 1.9798431396484375, "Pretrain/Loss (Raw)": 1.8212740421295166, "Pretrain/Step": 17414, "Pretrain/Step Time": 8.506802985444665} +{"Pretrain/Learning Rate": 9.842781211242464e-07, "Pretrain/Loss": 1.9812641143798828, "Pretrain/Loss (Raw)": 2.089665651321411, "Pretrain/Step": 17415, "Pretrain/Step Time": 8.505021309480071} +{"Pretrain/Learning Rate": 9.830990126096394e-07, "Pretrain/Loss": 1.9808597564697266, "Pretrain/Loss (Raw)": 1.9916340112686157, "Pretrain/Step": 17416, "Pretrain/Step Time": 8.508346889168024} +{"Pretrain/Learning Rate": 9.819205966054374e-07, "Pretrain/Loss": 1.9813809394836426, "Pretrain/Loss (Raw)": 2.0689942836761475, "Pretrain/Step": 17417, "Pretrain/Step Time": 8.508135778829455} +{"Pretrain/Learning Rate": 9.807428731456263e-07, "Pretrain/Loss": 1.9834225177764893, "Pretrain/Loss (Raw)": 2.159391164779663, "Pretrain/Step": 17418, "Pretrain/Step Time": 8.50609152391553} +{"Pretrain/Learning Rate": 9.79565842264163e-07, "Pretrain/Loss": 1.9850496053695679, "Pretrain/Loss (Raw)": 1.9113376140594482, "Pretrain/Step": 17419, "Pretrain/Step Time": 8.506278686225414} +{"Pretrain/Learning Rate": 9.783895039949837e-07, "Pretrain/Loss": 1.9838958978652954, "Pretrain/Loss (Raw)": 1.8113806247711182, "Pretrain/Step": 17420, "Pretrain/Step Time": 8.504481742158532} +{"Pretrain/Learning Rate": 9.772138583720086e-07, "Pretrain/Loss": 1.9858450889587402, "Pretrain/Loss (Raw)": 2.1951794624328613, "Pretrain/Step": 17421, "Pretrain/Step Time": 8.50907988473773} +{"Pretrain/Learning Rate": 9.760389054291357e-07, "Pretrain/Loss": 1.9829373359680176, "Pretrain/Loss (Raw)": 1.8940993547439575, "Pretrain/Step": 17422, "Pretrain/Step Time": 8.507936213165522} +{"Pretrain/Learning Rate": 9.748646452002491e-07, "Pretrain/Loss": 1.9824161529541016, "Pretrain/Loss (Raw)": 1.9849703311920166, "Pretrain/Step": 17423, "Pretrain/Step Time": 8.507115460932255} +{"Pretrain/Learning Rate": 9.736910777192021e-07, "Pretrain/Loss": 1.9838086366653442, "Pretrain/Loss (Raw)": 2.043679714202881, "Pretrain/Step": 17424, "Pretrain/Step Time": 8.510011214762926} +{"Pretrain/Learning Rate": 9.725182030198344e-07, "Pretrain/Loss": 1.9843909740447998, "Pretrain/Loss (Raw)": 2.1368367671966553, "Pretrain/Step": 17425, "Pretrain/Step Time": 8.515561439096928} +{"Pretrain/Learning Rate": 9.71346021135966e-07, "Pretrain/Loss": 1.9817755222320557, "Pretrain/Loss (Raw)": 1.7386101484298706, "Pretrain/Step": 17426, "Pretrain/Step Time": 8.511770758777857} +{"Pretrain/Learning Rate": 9.70174532101395e-07, "Pretrain/Loss": 1.9810945987701416, "Pretrain/Loss (Raw)": 1.7251431941986084, "Pretrain/Step": 17427, "Pretrain/Step Time": 8.506414011120796} +{"Pretrain/Learning Rate": 9.690037359499054e-07, "Pretrain/Loss": 1.9796584844589233, "Pretrain/Loss (Raw)": 1.7121407985687256, "Pretrain/Step": 17428, "Pretrain/Step Time": 8.508104870095849} +{"Pretrain/Learning Rate": 9.67833632715251e-07, "Pretrain/Loss": 1.9789702892303467, "Pretrain/Loss (Raw)": 1.7856552600860596, "Pretrain/Step": 17429, "Pretrain/Step Time": 8.510649153962731} +{"Pretrain/Learning Rate": 9.666642224311684e-07, "Pretrain/Loss": 1.978158712387085, "Pretrain/Loss (Raw)": 2.0786142349243164, "Pretrain/Step": 17430, "Pretrain/Step Time": 8.508355233818293} +{"Pretrain/Learning Rate": 9.654955051313863e-07, "Pretrain/Loss": 1.9780244827270508, "Pretrain/Loss (Raw)": 1.8706945180892944, "Pretrain/Step": 17431, "Pretrain/Step Time": 8.501351660117507} +{"Pretrain/Learning Rate": 9.643274808495916e-07, "Pretrain/Loss": 1.9788894653320312, "Pretrain/Loss (Raw)": 2.1857588291168213, "Pretrain/Step": 17432, "Pretrain/Step Time": 8.504049086943269} +{"Pretrain/Learning Rate": 9.631601496194743e-07, "Pretrain/Loss": 1.9783685207366943, "Pretrain/Loss (Raw)": 2.0394318103790283, "Pretrain/Step": 17433, "Pretrain/Step Time": 8.505789250135422} +{"Pretrain/Learning Rate": 9.619935114746903e-07, "Pretrain/Loss": 1.9797664880752563, "Pretrain/Loss (Raw)": 2.097249746322632, "Pretrain/Step": 17434, "Pretrain/Step Time": 8.500936696305871} +{"Pretrain/Learning Rate": 9.608275664488769e-07, "Pretrain/Loss": 1.9782755374908447, "Pretrain/Loss (Raw)": 1.9379870891571045, "Pretrain/Step": 17435, "Pretrain/Step Time": 8.503445506095886} +{"Pretrain/Learning Rate": 9.596623145756544e-07, "Pretrain/Loss": 1.9807054996490479, "Pretrain/Loss (Raw)": 2.1865663528442383, "Pretrain/Step": 17436, "Pretrain/Step Time": 8.502768162637949} +{"Pretrain/Learning Rate": 9.584977558886183e-07, "Pretrain/Loss": 1.986054539680481, "Pretrain/Loss (Raw)": 2.6909677982330322, "Pretrain/Step": 17437, "Pretrain/Step Time": 8.502234436571598} +{"Pretrain/Learning Rate": 9.573338904213553e-07, "Pretrain/Loss": 1.985818862915039, "Pretrain/Loss (Raw)": 1.9962337017059326, "Pretrain/Step": 17438, "Pretrain/Step Time": 8.50399916805327} +{"Pretrain/Learning Rate": 9.561707182074165e-07, "Pretrain/Loss": 1.9864381551742554, "Pretrain/Loss (Raw)": 2.060075521469116, "Pretrain/Step": 17439, "Pretrain/Step Time": 8.50160824880004} +{"Pretrain/Learning Rate": 9.5500823928035e-07, "Pretrain/Loss": 1.988037347793579, "Pretrain/Loss (Raw)": 2.0362679958343506, "Pretrain/Step": 17440, "Pretrain/Step Time": 8.50015527382493} +{"Pretrain/Learning Rate": 9.538464536736651e-07, "Pretrain/Loss": 1.9850218296051025, "Pretrain/Loss (Raw)": 1.9951940774917603, "Pretrain/Step": 17441, "Pretrain/Step Time": 8.504666971042752} +{"Pretrain/Learning Rate": 9.526853614208713e-07, "Pretrain/Loss": 1.9828524589538574, "Pretrain/Loss (Raw)": 1.9486812353134155, "Pretrain/Step": 17442, "Pretrain/Step Time": 8.505954103544354} +{"Pretrain/Learning Rate": 9.515249625554418e-07, "Pretrain/Loss": 1.982462763786316, "Pretrain/Loss (Raw)": 1.998731255531311, "Pretrain/Step": 17443, "Pretrain/Step Time": 8.506518786773086} +{"Pretrain/Learning Rate": 9.503652571108329e-07, "Pretrain/Loss": 1.9837340116500854, "Pretrain/Loss (Raw)": 2.271580457687378, "Pretrain/Step": 17444, "Pretrain/Step Time": 8.50682265125215} +{"Pretrain/Learning Rate": 9.49206245120493e-07, "Pretrain/Loss": 1.9873290061950684, "Pretrain/Loss (Raw)": 2.112851858139038, "Pretrain/Step": 17445, "Pretrain/Step Time": 8.503107761964202} +{"Pretrain/Learning Rate": 9.480479266178316e-07, "Pretrain/Loss": 1.9912383556365967, "Pretrain/Loss (Raw)": 2.369751214981079, "Pretrain/Step": 17446, "Pretrain/Step Time": 8.505231406539679} +{"Pretrain/Learning Rate": 9.468903016362551e-07, "Pretrain/Loss": 1.991284966468811, "Pretrain/Loss (Raw)": 1.9774972200393677, "Pretrain/Step": 17447, "Pretrain/Step Time": 8.507533127442002} +{"Pretrain/Learning Rate": 9.457333702091425e-07, "Pretrain/Loss": 1.991400122642517, "Pretrain/Loss (Raw)": 2.017606258392334, "Pretrain/Step": 17448, "Pretrain/Step Time": 8.506521252915263} +{"Pretrain/Learning Rate": 9.445771323698477e-07, "Pretrain/Loss": 1.9904717206954956, "Pretrain/Loss (Raw)": 2.112241744995117, "Pretrain/Step": 17449, "Pretrain/Step Time": 8.503322089090943} +{"Pretrain/Learning Rate": 9.434215881517161e-07, "Pretrain/Loss": 1.990450382232666, "Pretrain/Loss (Raw)": 2.0917632579803467, "Pretrain/Step": 17450, "Pretrain/Step Time": 8.506768541410565} +{"Pretrain/Learning Rate": 9.4226673758806e-07, "Pretrain/Loss": 1.9927160739898682, "Pretrain/Loss (Raw)": 2.0784425735473633, "Pretrain/Step": 17451, "Pretrain/Step Time": 8.501350844278932} +{"Pretrain/Learning Rate": 9.411125807121862e-07, "Pretrain/Loss": 1.9923919439315796, "Pretrain/Loss (Raw)": 2.088005304336548, "Pretrain/Step": 17452, "Pretrain/Step Time": 8.498459154739976} +{"Pretrain/Learning Rate": 9.399591175573735e-07, "Pretrain/Loss": 1.9913188219070435, "Pretrain/Loss (Raw)": 1.9730420112609863, "Pretrain/Step": 17453, "Pretrain/Step Time": 8.495236909016967} +{"Pretrain/Learning Rate": 9.388063481568732e-07, "Pretrain/Loss": 1.9919167757034302, "Pretrain/Loss (Raw)": 2.1038472652435303, "Pretrain/Step": 17454, "Pretrain/Step Time": 8.502156622707844} +{"Pretrain/Learning Rate": 9.376542725439336e-07, "Pretrain/Loss": 1.993283748626709, "Pretrain/Loss (Raw)": 2.1081247329711914, "Pretrain/Step": 17455, "Pretrain/Step Time": 8.498672608286142} +{"Pretrain/Learning Rate": 9.365028907517642e-07, "Pretrain/Loss": 1.9941866397857666, "Pretrain/Loss (Raw)": 1.9746192693710327, "Pretrain/Step": 17456, "Pretrain/Step Time": 8.499321773648262} +{"Pretrain/Learning Rate": 9.353522028135775e-07, "Pretrain/Loss": 2.000279426574707, "Pretrain/Loss (Raw)": 2.5288257598876953, "Pretrain/Step": 17457, "Pretrain/Step Time": 8.500120522454381} +{"Pretrain/Learning Rate": 9.34202208762544e-07, "Pretrain/Loss": 2.0019631385803223, "Pretrain/Loss (Raw)": 2.1337904930114746, "Pretrain/Step": 17458, "Pretrain/Step Time": 8.50272424146533} +{"Pretrain/Learning Rate": 9.330529086318207e-07, "Pretrain/Loss": 2.0015645027160645, "Pretrain/Loss (Raw)": 1.7460569143295288, "Pretrain/Step": 17459, "Pretrain/Step Time": 8.501228528097272} +{"Pretrain/Learning Rate": 9.319043024545532e-07, "Pretrain/Loss": 2.0040876865386963, "Pretrain/Loss (Raw)": 2.1025633811950684, "Pretrain/Step": 17460, "Pretrain/Step Time": 8.500058459118009} +{"Pretrain/Learning Rate": 9.307563902638566e-07, "Pretrain/Loss": 2.003976345062256, "Pretrain/Loss (Raw)": 1.9755594730377197, "Pretrain/Step": 17461, "Pretrain/Step Time": 8.501909658312798} +{"Pretrain/Learning Rate": 9.296091720928351e-07, "Pretrain/Loss": 2.003887176513672, "Pretrain/Loss (Raw)": 1.9639778137207031, "Pretrain/Step": 17462, "Pretrain/Step Time": 8.491215908899903} +{"Pretrain/Learning Rate": 9.284626479745651e-07, "Pretrain/Loss": 2.0040087699890137, "Pretrain/Loss (Raw)": 2.1107425689697266, "Pretrain/Step": 17463, "Pretrain/Step Time": 8.491031849756837} +{"Pretrain/Learning Rate": 9.273168179421004e-07, "Pretrain/Loss": 2.0061514377593994, "Pretrain/Loss (Raw)": 2.1460909843444824, "Pretrain/Step": 17464, "Pretrain/Step Time": 8.492729322984815} +{"Pretrain/Learning Rate": 9.2617168202849e-07, "Pretrain/Loss": 2.0065956115722656, "Pretrain/Loss (Raw)": 1.9273686408996582, "Pretrain/Step": 17465, "Pretrain/Step Time": 8.495902482420206} +{"Pretrain/Learning Rate": 9.250272402667431e-07, "Pretrain/Loss": 2.004657030105591, "Pretrain/Loss (Raw)": 1.74143385887146, "Pretrain/Step": 17466, "Pretrain/Step Time": 8.498927541077137} +{"Pretrain/Learning Rate": 9.238834926898698e-07, "Pretrain/Loss": 2.003279209136963, "Pretrain/Loss (Raw)": 1.9601339101791382, "Pretrain/Step": 17467, "Pretrain/Step Time": 8.499612607061863} +{"Pretrain/Learning Rate": 9.227404393308408e-07, "Pretrain/Loss": 2.0031003952026367, "Pretrain/Loss (Raw)": 1.861226201057434, "Pretrain/Step": 17468, "Pretrain/Step Time": 8.497496154159307} +{"Pretrain/Learning Rate": 9.215980802226159e-07, "Pretrain/Loss": 1.9996646642684937, "Pretrain/Loss (Raw)": 1.6239796876907349, "Pretrain/Step": 17469, "Pretrain/Step Time": 8.49412571452558} +{"Pretrain/Learning Rate": 9.204564153981382e-07, "Pretrain/Loss": 2.001477003097534, "Pretrain/Loss (Raw)": 2.22011399269104, "Pretrain/Step": 17470, "Pretrain/Step Time": 8.500482553616166} +{"Pretrain/Learning Rate": 9.193154448903229e-07, "Pretrain/Loss": 2.000196933746338, "Pretrain/Loss (Raw)": 1.8404288291931152, "Pretrain/Step": 17471, "Pretrain/Step Time": 8.500904727727175} +{"Pretrain/Learning Rate": 9.181751687320745e-07, "Pretrain/Loss": 2.0000498294830322, "Pretrain/Loss (Raw)": 1.7558892965316772, "Pretrain/Step": 17472, "Pretrain/Step Time": 8.507156321778893} +{"Pretrain/Learning Rate": 9.170355869562692e-07, "Pretrain/Loss": 1.9999717473983765, "Pretrain/Loss (Raw)": 1.9421203136444092, "Pretrain/Step": 17473, "Pretrain/Step Time": 8.506517881527543} +{"Pretrain/Learning Rate": 9.158966995957613e-07, "Pretrain/Loss": 2.0018134117126465, "Pretrain/Loss (Raw)": 2.0319108963012695, "Pretrain/Step": 17474, "Pretrain/Step Time": 8.506549624726176} +{"Pretrain/Learning Rate": 9.147585066833942e-07, "Pretrain/Loss": 2.0008506774902344, "Pretrain/Loss (Raw)": 1.9683839082717896, "Pretrain/Step": 17475, "Pretrain/Step Time": 8.504995729774237} +{"Pretrain/Learning Rate": 9.136210082519858e-07, "Pretrain/Loss": 2.002946615219116, "Pretrain/Loss (Raw)": 2.0690536499023438, "Pretrain/Step": 17476, "Pretrain/Step Time": 8.502320246770978} +{"Pretrain/Learning Rate": 9.124842043343407e-07, "Pretrain/Loss": 2.004467248916626, "Pretrain/Loss (Raw)": 2.1501524448394775, "Pretrain/Step": 17477, "Pretrain/Step Time": 8.500022741034627} +{"Pretrain/Learning Rate": 9.113480949632325e-07, "Pretrain/Loss": 2.0050108432769775, "Pretrain/Loss (Raw)": 1.9780147075653076, "Pretrain/Step": 17478, "Pretrain/Step Time": 8.499111516401172} +{"Pretrain/Learning Rate": 9.102126801714156e-07, "Pretrain/Loss": 2.00409197807312, "Pretrain/Loss (Raw)": 1.938520073890686, "Pretrain/Step": 17479, "Pretrain/Step Time": 8.497446300461888} +{"Pretrain/Learning Rate": 9.090779599916361e-07, "Pretrain/Loss": 2.0020995140075684, "Pretrain/Loss (Raw)": 1.8189276456832886, "Pretrain/Step": 17480, "Pretrain/Step Time": 8.497227679938078} +{"Pretrain/Learning Rate": 9.079439344566092e-07, "Pretrain/Loss": 2.001518726348877, "Pretrain/Loss (Raw)": 2.017367362976074, "Pretrain/Step": 17481, "Pretrain/Step Time": 8.498246535658836} +{"Pretrain/Learning Rate": 9.068106035990398e-07, "Pretrain/Loss": 2.000458240509033, "Pretrain/Loss (Raw)": 2.056230306625366, "Pretrain/Step": 17482, "Pretrain/Step Time": 8.499254131689668} +{"Pretrain/Learning Rate": 9.056779674516014e-07, "Pretrain/Loss": 1.9995198249816895, "Pretrain/Loss (Raw)": 1.8458038568496704, "Pretrain/Step": 17483, "Pretrain/Step Time": 8.49865536019206} +{"Pretrain/Learning Rate": 9.045460260469485e-07, "Pretrain/Loss": 1.996457576751709, "Pretrain/Loss (Raw)": 2.0348851680755615, "Pretrain/Step": 17484, "Pretrain/Step Time": 8.498904867097735} +{"Pretrain/Learning Rate": 9.0341477941773e-07, "Pretrain/Loss": 1.9966455698013306, "Pretrain/Loss (Raw)": 1.9825613498687744, "Pretrain/Step": 17485, "Pretrain/Step Time": 8.497110242024064} +{"Pretrain/Learning Rate": 9.022842275965532e-07, "Pretrain/Loss": 1.9939794540405273, "Pretrain/Loss (Raw)": 1.848166823387146, "Pretrain/Step": 17486, "Pretrain/Step Time": 8.498151617124677} +{"Pretrain/Learning Rate": 9.01154370616028e-07, "Pretrain/Loss": 1.9957501888275146, "Pretrain/Loss (Raw)": 2.0502023696899414, "Pretrain/Step": 17487, "Pretrain/Step Time": 8.497607534751296} +{"Pretrain/Learning Rate": 9.000252085087285e-07, "Pretrain/Loss": 1.991180419921875, "Pretrain/Loss (Raw)": 1.5521161556243896, "Pretrain/Step": 17488, "Pretrain/Step Time": 8.499825730919838} +{"Pretrain/Learning Rate": 8.988967413072091e-07, "Pretrain/Loss": 1.9946821928024292, "Pretrain/Loss (Raw)": 2.208879232406616, "Pretrain/Step": 17489, "Pretrain/Step Time": 8.496208069846034} +{"Pretrain/Learning Rate": 8.977689690440161e-07, "Pretrain/Loss": 1.996567964553833, "Pretrain/Loss (Raw)": 2.1980133056640625, "Pretrain/Step": 17490, "Pretrain/Step Time": 8.49642888456583} +{"Pretrain/Learning Rate": 8.966418917516595e-07, "Pretrain/Loss": 1.9975179433822632, "Pretrain/Loss (Raw)": 2.0409796237945557, "Pretrain/Step": 17491, "Pretrain/Step Time": 8.498269757255912} +{"Pretrain/Learning Rate": 8.955155094626439e-07, "Pretrain/Loss": 1.995265007019043, "Pretrain/Loss (Raw)": 1.7336602210998535, "Pretrain/Step": 17492, "Pretrain/Step Time": 8.494784969836473} +{"Pretrain/Learning Rate": 8.943898222094488e-07, "Pretrain/Loss": 1.9955565929412842, "Pretrain/Loss (Raw)": 1.8561785221099854, "Pretrain/Step": 17493, "Pretrain/Step Time": 8.494631113484502} +{"Pretrain/Learning Rate": 8.932648300245261e-07, "Pretrain/Loss": 1.9968693256378174, "Pretrain/Loss (Raw)": 2.174180030822754, "Pretrain/Step": 17494, "Pretrain/Step Time": 8.493582049384713} +{"Pretrain/Learning Rate": 8.921405329403193e-07, "Pretrain/Loss": 1.9972031116485596, "Pretrain/Loss (Raw)": 1.969164252281189, "Pretrain/Step": 17495, "Pretrain/Step Time": 8.491092095151544} +{"Pretrain/Learning Rate": 8.910169309892441e-07, "Pretrain/Loss": 1.998483657836914, "Pretrain/Loss (Raw)": 1.9998224973678589, "Pretrain/Step": 17496, "Pretrain/Step Time": 8.491450371220708} +{"Pretrain/Learning Rate": 8.898940242037024e-07, "Pretrain/Loss": 1.9990787506103516, "Pretrain/Loss (Raw)": 2.054405450820923, "Pretrain/Step": 17497, "Pretrain/Step Time": 8.493520207703114} +{"Pretrain/Learning Rate": 8.88771812616071e-07, "Pretrain/Loss": 1.9979016780853271, "Pretrain/Loss (Raw)": 1.8375810384750366, "Pretrain/Step": 17498, "Pretrain/Step Time": 8.493450677022338} +{"Pretrain/Learning Rate": 8.876502962587019e-07, "Pretrain/Loss": 1.9997460842132568, "Pretrain/Loss (Raw)": 2.1473259925842285, "Pretrain/Step": 17499, "Pretrain/Step Time": 8.4937873352319} +{"Pretrain/Learning Rate": 8.865294751639442e-07, "Pretrain/Loss": 2.0031681060791016, "Pretrain/Loss (Raw)": 2.130145788192749, "Pretrain/Step": 17500, "Pretrain/Step Time": 8.48729656636715} +{"Pretrain/Learning Rate": 8.854093493641052e-07, "Pretrain/Loss": 2.0021674633026123, "Pretrain/Loss (Raw)": 1.8813215494155884, "Pretrain/Step": 17501, "Pretrain/Step Time": 8.491978937759995} +{"Pretrain/Learning Rate": 8.842899188914899e-07, "Pretrain/Loss": 2.002826690673828, "Pretrain/Loss (Raw)": 2.0409419536590576, "Pretrain/Step": 17502, "Pretrain/Step Time": 8.493342030793428} +{"Pretrain/Learning Rate": 8.831711837783751e-07, "Pretrain/Loss": 2.0001792907714844, "Pretrain/Loss (Raw)": 1.8200058937072754, "Pretrain/Step": 17503, "Pretrain/Step Time": 8.487769177183509} +{"Pretrain/Learning Rate": 8.820531440570184e-07, "Pretrain/Loss": 2.002741575241089, "Pretrain/Loss (Raw)": 2.115973711013794, "Pretrain/Step": 17504, "Pretrain/Step Time": 8.496196035295725} +{"Pretrain/Learning Rate": 8.809357997596551e-07, "Pretrain/Loss": 1.9996694326400757, "Pretrain/Loss (Raw)": 1.7940768003463745, "Pretrain/Step": 17505, "Pretrain/Step Time": 8.501785838976502} +{"Pretrain/Learning Rate": 8.798191509185067e-07, "Pretrain/Loss": 1.9998421669006348, "Pretrain/Loss (Raw)": 1.7873835563659668, "Pretrain/Step": 17506, "Pretrain/Step Time": 8.499959198758006} +{"Pretrain/Learning Rate": 8.787031975657694e-07, "Pretrain/Loss": 1.999330759048462, "Pretrain/Loss (Raw)": 2.0875940322875977, "Pretrain/Step": 17507, "Pretrain/Step Time": 8.50027934834361} +{"Pretrain/Learning Rate": 8.775879397336206e-07, "Pretrain/Loss": 1.9983830451965332, "Pretrain/Loss (Raw)": 1.950626254081726, "Pretrain/Step": 17508, "Pretrain/Step Time": 8.501627700403333} +{"Pretrain/Learning Rate": 8.764733774542178e-07, "Pretrain/Loss": 1.9982703924179077, "Pretrain/Loss (Raw)": 1.8142465353012085, "Pretrain/Step": 17509, "Pretrain/Step Time": 8.499011117964983} +{"Pretrain/Learning Rate": 8.753595107597018e-07, "Pretrain/Loss": 1.9981536865234375, "Pretrain/Loss (Raw)": 2.013929843902588, "Pretrain/Step": 17510, "Pretrain/Step Time": 8.502493634819984} +{"Pretrain/Learning Rate": 8.742463396821832e-07, "Pretrain/Loss": 1.998822569847107, "Pretrain/Loss (Raw)": 2.0452966690063477, "Pretrain/Step": 17511, "Pretrain/Step Time": 8.495316814631224} +{"Pretrain/Learning Rate": 8.731338642537667e-07, "Pretrain/Loss": 2.002096652984619, "Pretrain/Loss (Raw)": 2.007148265838623, "Pretrain/Step": 17512, "Pretrain/Step Time": 8.492703460156918} +{"Pretrain/Learning Rate": 8.720220845065269e-07, "Pretrain/Loss": 2.001024007797241, "Pretrain/Loss (Raw)": 1.9537020921707153, "Pretrain/Step": 17513, "Pretrain/Step Time": 8.499778548255563} +{"Pretrain/Learning Rate": 8.709110004725212e-07, "Pretrain/Loss": 2.0026845932006836, "Pretrain/Loss (Raw)": 2.1567797660827637, "Pretrain/Step": 17514, "Pretrain/Step Time": 8.499662039801478} +{"Pretrain/Learning Rate": 8.698006121837882e-07, "Pretrain/Loss": 2.000333786010742, "Pretrain/Loss (Raw)": 1.945340633392334, "Pretrain/Step": 17515, "Pretrain/Step Time": 8.49949192814529} +{"Pretrain/Learning Rate": 8.686909196723408e-07, "Pretrain/Loss": 1.999324917793274, "Pretrain/Loss (Raw)": 1.8199782371520996, "Pretrain/Step": 17516, "Pretrain/Step Time": 8.503363028168678} +{"Pretrain/Learning Rate": 8.675819229701815e-07, "Pretrain/Loss": 2.001091718673706, "Pretrain/Loss (Raw)": 2.105529546737671, "Pretrain/Step": 17517, "Pretrain/Step Time": 8.50116421468556} +{"Pretrain/Learning Rate": 8.664736221092845e-07, "Pretrain/Loss": 1.9989898204803467, "Pretrain/Loss (Raw)": 2.044910430908203, "Pretrain/Step": 17518, "Pretrain/Step Time": 8.498575735837221} +{"Pretrain/Learning Rate": 8.653660171216105e-07, "Pretrain/Loss": 1.997295618057251, "Pretrain/Loss (Raw)": 1.933099389076233, "Pretrain/Step": 17519, "Pretrain/Step Time": 8.504152836278081} +{"Pretrain/Learning Rate": 8.642591080390893e-07, "Pretrain/Loss": 2.000725269317627, "Pretrain/Loss (Raw)": 2.1395633220672607, "Pretrain/Step": 17520, "Pretrain/Step Time": 8.500499803572893} +{"Pretrain/Learning Rate": 8.631528948936429e-07, "Pretrain/Loss": 2.0009231567382812, "Pretrain/Loss (Raw)": 1.989932656288147, "Pretrain/Step": 17521, "Pretrain/Step Time": 8.50270982272923} +{"Pretrain/Learning Rate": 8.620473777171706e-07, "Pretrain/Loss": 2.000309467315674, "Pretrain/Loss (Raw)": 1.9788678884506226, "Pretrain/Step": 17522, "Pretrain/Step Time": 8.503165453672409} +{"Pretrain/Learning Rate": 8.609425565415413e-07, "Pretrain/Loss": 1.9968862533569336, "Pretrain/Loss (Raw)": 1.7257338762283325, "Pretrain/Step": 17523, "Pretrain/Step Time": 8.503524096682668} +{"Pretrain/Learning Rate": 8.598384313986186e-07, "Pretrain/Loss": 1.9955533742904663, "Pretrain/Loss (Raw)": 1.7691500186920166, "Pretrain/Step": 17524, "Pretrain/Step Time": 8.509287431836128} +{"Pretrain/Learning Rate": 8.58735002320235e-07, "Pretrain/Loss": 1.9947723150253296, "Pretrain/Loss (Raw)": 1.9113134145736694, "Pretrain/Step": 17525, "Pretrain/Step Time": 8.510162366554141} +{"Pretrain/Learning Rate": 8.576322693382127e-07, "Pretrain/Loss": 1.9947447776794434, "Pretrain/Loss (Raw)": 2.123075246810913, "Pretrain/Step": 17526, "Pretrain/Step Time": 8.502901822328568} +{"Pretrain/Learning Rate": 8.565302324843455e-07, "Pretrain/Loss": 1.993584156036377, "Pretrain/Loss (Raw)": 1.9183692932128906, "Pretrain/Step": 17527, "Pretrain/Step Time": 8.5010397862643} +{"Pretrain/Learning Rate": 8.554288917904052e-07, "Pretrain/Loss": 1.9965851306915283, "Pretrain/Loss (Raw)": 2.1022958755493164, "Pretrain/Step": 17528, "Pretrain/Step Time": 8.501497033983469} +{"Pretrain/Learning Rate": 8.543282472881526e-07, "Pretrain/Loss": 1.9969717264175415, "Pretrain/Loss (Raw)": 2.0434722900390625, "Pretrain/Step": 17529, "Pretrain/Step Time": 8.504654794931412} +{"Pretrain/Learning Rate": 8.532282990093232e-07, "Pretrain/Loss": 1.9973859786987305, "Pretrain/Loss (Raw)": 1.9056153297424316, "Pretrain/Step": 17530, "Pretrain/Step Time": 8.509874731302261} +{"Pretrain/Learning Rate": 8.521290469856363e-07, "Pretrain/Loss": 1.996769905090332, "Pretrain/Loss (Raw)": 2.0393383502960205, "Pretrain/Step": 17531, "Pretrain/Step Time": 8.509905979037285} +{"Pretrain/Learning Rate": 8.510304912487832e-07, "Pretrain/Loss": 1.9981666803359985, "Pretrain/Loss (Raw)": 2.0014841556549072, "Pretrain/Step": 17532, "Pretrain/Step Time": 8.507412631064653} +{"Pretrain/Learning Rate": 8.499326318304413e-07, "Pretrain/Loss": 1.9971208572387695, "Pretrain/Loss (Raw)": 2.142642021179199, "Pretrain/Step": 17533, "Pretrain/Step Time": 8.505228346213698} +{"Pretrain/Learning Rate": 8.488354687622685e-07, "Pretrain/Loss": 1.994652509689331, "Pretrain/Loss (Raw)": 1.971510648727417, "Pretrain/Step": 17534, "Pretrain/Step Time": 8.5102657712996} +{"Pretrain/Learning Rate": 8.477390020758979e-07, "Pretrain/Loss": 1.9967259168624878, "Pretrain/Loss (Raw)": 1.9938971996307373, "Pretrain/Step": 17535, "Pretrain/Step Time": 8.510148959234357} +{"Pretrain/Learning Rate": 8.466432318029488e-07, "Pretrain/Loss": 1.9972293376922607, "Pretrain/Loss (Raw)": 2.073991298675537, "Pretrain/Step": 17536, "Pretrain/Step Time": 8.5080203153193} +{"Pretrain/Learning Rate": 8.455481579750179e-07, "Pretrain/Loss": 1.9983651638031006, "Pretrain/Loss (Raw)": 2.066183090209961, "Pretrain/Step": 17537, "Pretrain/Step Time": 8.511311274021864} +{"Pretrain/Learning Rate": 8.444537806236719e-07, "Pretrain/Loss": 1.9965990781784058, "Pretrain/Loss (Raw)": 1.7687604427337646, "Pretrain/Step": 17538, "Pretrain/Step Time": 8.503422744572163} +{"Pretrain/Learning Rate": 8.43360099780477e-07, "Pretrain/Loss": 1.9955307245254517, "Pretrain/Loss (Raw)": 1.7770025730133057, "Pretrain/Step": 17539, "Pretrain/Step Time": 8.504393685609102} +{"Pretrain/Learning Rate": 8.422671154769607e-07, "Pretrain/Loss": 1.994276762008667, "Pretrain/Loss (Raw)": 1.9535466432571411, "Pretrain/Step": 17540, "Pretrain/Step Time": 8.510377548635006} +{"Pretrain/Learning Rate": 8.411748277446451e-07, "Pretrain/Loss": 1.9946879148483276, "Pretrain/Loss (Raw)": 1.8616664409637451, "Pretrain/Step": 17541, "Pretrain/Step Time": 8.505844160914421} +{"Pretrain/Learning Rate": 8.400832366150218e-07, "Pretrain/Loss": 1.9941675662994385, "Pretrain/Loss (Raw)": 1.7546719312667847, "Pretrain/Step": 17542, "Pretrain/Step Time": 8.507415628060699} +{"Pretrain/Learning Rate": 8.389923421195656e-07, "Pretrain/Loss": 1.9923491477966309, "Pretrain/Loss (Raw)": 1.8569071292877197, "Pretrain/Step": 17543, "Pretrain/Step Time": 8.503199718892574} +{"Pretrain/Learning Rate": 8.379021442897345e-07, "Pretrain/Loss": 1.992148756980896, "Pretrain/Loss (Raw)": 1.9659849405288696, "Pretrain/Step": 17544, "Pretrain/Step Time": 8.502079734578729} +{"Pretrain/Learning Rate": 8.368126431569589e-07, "Pretrain/Loss": 1.9891903400421143, "Pretrain/Loss (Raw)": 1.6903208494186401, "Pretrain/Step": 17545, "Pretrain/Step Time": 8.497366858646274} +{"Pretrain/Learning Rate": 8.357238387526612e-07, "Pretrain/Loss": 1.986051321029663, "Pretrain/Loss (Raw)": 1.7575947046279907, "Pretrain/Step": 17546, "Pretrain/Step Time": 8.504787605255842} +{"Pretrain/Learning Rate": 8.346357311082298e-07, "Pretrain/Loss": 1.9856594800949097, "Pretrain/Loss (Raw)": 1.8611761331558228, "Pretrain/Step": 17547, "Pretrain/Step Time": 8.505472423508763} +{"Pretrain/Learning Rate": 8.335483202550398e-07, "Pretrain/Loss": 1.9866032600402832, "Pretrain/Loss (Raw)": 1.9321911334991455, "Pretrain/Step": 17548, "Pretrain/Step Time": 8.497315756976604} +{"Pretrain/Learning Rate": 8.324616062244522e-07, "Pretrain/Loss": 1.9845365285873413, "Pretrain/Loss (Raw)": 1.9306401014328003, "Pretrain/Step": 17549, "Pretrain/Step Time": 8.497525272890925} +{"Pretrain/Learning Rate": 8.31375589047792e-07, "Pretrain/Loss": 1.985112190246582, "Pretrain/Loss (Raw)": 1.9677799940109253, "Pretrain/Step": 17550, "Pretrain/Step Time": 8.498219953849912} +{"Pretrain/Learning Rate": 8.302902687563812e-07, "Pretrain/Loss": 1.985992670059204, "Pretrain/Loss (Raw)": 2.0976760387420654, "Pretrain/Step": 17551, "Pretrain/Step Time": 8.49893887527287} +{"Pretrain/Learning Rate": 8.292056453815144e-07, "Pretrain/Loss": 1.9861531257629395, "Pretrain/Loss (Raw)": 2.0642218589782715, "Pretrain/Step": 17552, "Pretrain/Step Time": 8.49573447369039} +{"Pretrain/Learning Rate": 8.28121718954461e-07, "Pretrain/Loss": 1.984755516052246, "Pretrain/Loss (Raw)": 1.9579405784606934, "Pretrain/Step": 17553, "Pretrain/Step Time": 8.497245939448476} +{"Pretrain/Learning Rate": 8.270384895064793e-07, "Pretrain/Loss": 1.9864649772644043, "Pretrain/Loss (Raw)": 1.9574155807495117, "Pretrain/Step": 17554, "Pretrain/Step Time": 8.499331764876842} +{"Pretrain/Learning Rate": 8.259559570687969e-07, "Pretrain/Loss": 1.9866905212402344, "Pretrain/Loss (Raw)": 1.7540152072906494, "Pretrain/Step": 17555, "Pretrain/Step Time": 8.50131257250905} +{"Pretrain/Learning Rate": 8.248741216726391e-07, "Pretrain/Loss": 1.9875481128692627, "Pretrain/Loss (Raw)": 1.821906566619873, "Pretrain/Step": 17556, "Pretrain/Step Time": 8.49709340929985} +{"Pretrain/Learning Rate": 8.23792983349192e-07, "Pretrain/Loss": 1.988746166229248, "Pretrain/Loss (Raw)": 1.939005970954895, "Pretrain/Step": 17557, "Pretrain/Step Time": 8.498902447521687} +{"Pretrain/Learning Rate": 8.227125421296277e-07, "Pretrain/Loss": 1.9879138469696045, "Pretrain/Loss (Raw)": 1.9720816612243652, "Pretrain/Step": 17558, "Pretrain/Step Time": 8.497153420001268} +{"Pretrain/Learning Rate": 8.216327980451078e-07, "Pretrain/Loss": 1.9895424842834473, "Pretrain/Loss (Raw)": 2.0791797637939453, "Pretrain/Step": 17559, "Pretrain/Step Time": 8.493122534826398} +{"Pretrain/Learning Rate": 8.205537511267597e-07, "Pretrain/Loss": 1.9888858795166016, "Pretrain/Loss (Raw)": 2.101685047149658, "Pretrain/Step": 17560, "Pretrain/Step Time": 8.49100505746901} +{"Pretrain/Learning Rate": 8.194754014057005e-07, "Pretrain/Loss": 1.9885237216949463, "Pretrain/Loss (Raw)": 1.9930793046951294, "Pretrain/Step": 17561, "Pretrain/Step Time": 8.4884074293077} +{"Pretrain/Learning Rate": 8.18397748913019e-07, "Pretrain/Loss": 1.9880784749984741, "Pretrain/Loss (Raw)": 2.0402584075927734, "Pretrain/Step": 17562, "Pretrain/Step Time": 8.488917047157884} +{"Pretrain/Learning Rate": 8.173207936797933e-07, "Pretrain/Loss": 1.990485429763794, "Pretrain/Loss (Raw)": 2.246079444885254, "Pretrain/Step": 17563, "Pretrain/Step Time": 8.492064760997891} +{"Pretrain/Learning Rate": 8.162445357370735e-07, "Pretrain/Loss": 1.9878312349319458, "Pretrain/Loss (Raw)": 1.846840739250183, "Pretrain/Step": 17564, "Pretrain/Step Time": 8.489744704216719} +{"Pretrain/Learning Rate": 8.151689751158931e-07, "Pretrain/Loss": 1.982710599899292, "Pretrain/Loss (Raw)": 2.035513401031494, "Pretrain/Step": 17565, "Pretrain/Step Time": 8.492808245122433} +{"Pretrain/Learning Rate": 8.140941118472717e-07, "Pretrain/Loss": 1.9817237854003906, "Pretrain/Loss (Raw)": 1.8699291944503784, "Pretrain/Step": 17566, "Pretrain/Step Time": 8.490423848852515} +{"Pretrain/Learning Rate": 8.130199459621929e-07, "Pretrain/Loss": 1.9811278581619263, "Pretrain/Loss (Raw)": 1.9837863445281982, "Pretrain/Step": 17567, "Pretrain/Step Time": 8.49317061714828} +{"Pretrain/Learning Rate": 8.119464774916318e-07, "Pretrain/Loss": 1.982544183731079, "Pretrain/Loss (Raw)": 2.217562437057495, "Pretrain/Step": 17568, "Pretrain/Step Time": 8.496133280918002} +{"Pretrain/Learning Rate": 8.108737064665444e-07, "Pretrain/Loss": 1.9801506996154785, "Pretrain/Loss (Raw)": 1.6888302564620972, "Pretrain/Step": 17569, "Pretrain/Step Time": 8.495673218742013} +{"Pretrain/Learning Rate": 8.098016329178615e-07, "Pretrain/Loss": 1.9790488481521606, "Pretrain/Loss (Raw)": 1.8076441287994385, "Pretrain/Step": 17570, "Pretrain/Step Time": 8.493518074974418} +{"Pretrain/Learning Rate": 8.087302568764943e-07, "Pretrain/Loss": 1.980183482170105, "Pretrain/Loss (Raw)": 2.1439616680145264, "Pretrain/Step": 17571, "Pretrain/Step Time": 8.494443353265524} +{"Pretrain/Learning Rate": 8.076595783733404e-07, "Pretrain/Loss": 1.9779322147369385, "Pretrain/Loss (Raw)": 1.983424186706543, "Pretrain/Step": 17572, "Pretrain/Step Time": 8.494535863399506} +{"Pretrain/Learning Rate": 8.065895974392612e-07, "Pretrain/Loss": 1.9781383275985718, "Pretrain/Loss (Raw)": 2.139233112335205, "Pretrain/Step": 17573, "Pretrain/Step Time": 8.495577601715922} +{"Pretrain/Learning Rate": 8.05520314105121e-07, "Pretrain/Loss": 1.9750818014144897, "Pretrain/Loss (Raw)": 1.9785091876983643, "Pretrain/Step": 17574, "Pretrain/Step Time": 8.492588652297854} +{"Pretrain/Learning Rate": 8.04451728401745e-07, "Pretrain/Loss": 1.974785327911377, "Pretrain/Loss (Raw)": 1.9395536184310913, "Pretrain/Step": 17575, "Pretrain/Step Time": 8.492338698357344} +{"Pretrain/Learning Rate": 8.033838403599475e-07, "Pretrain/Loss": 1.9749345779418945, "Pretrain/Loss (Raw)": 2.0366969108581543, "Pretrain/Step": 17576, "Pretrain/Step Time": 8.49081789702177} +{"Pretrain/Learning Rate": 8.02316650010515e-07, "Pretrain/Loss": 1.9744365215301514, "Pretrain/Loss (Raw)": 2.048497200012207, "Pretrain/Step": 17577, "Pretrain/Step Time": 8.490414151921868} +{"Pretrain/Learning Rate": 8.012501573842313e-07, "Pretrain/Loss": 1.9726121425628662, "Pretrain/Loss (Raw)": 1.8582446575164795, "Pretrain/Step": 17578, "Pretrain/Step Time": 8.485447818413377} +{"Pretrain/Learning Rate": 8.001843625118354e-07, "Pretrain/Loss": 1.9727213382720947, "Pretrain/Loss (Raw)": 2.0924222469329834, "Pretrain/Step": 17579, "Pretrain/Step Time": 8.483201062306762} +{"Pretrain/Learning Rate": 7.991192654240642e-07, "Pretrain/Loss": 1.9720165729522705, "Pretrain/Loss (Raw)": 1.9977957010269165, "Pretrain/Step": 17580, "Pretrain/Step Time": 8.486297907307744} +{"Pretrain/Learning Rate": 7.980548661516291e-07, "Pretrain/Loss": 1.9721753597259521, "Pretrain/Loss (Raw)": 1.9933723211288452, "Pretrain/Step": 17581, "Pretrain/Step Time": 8.485011389479041} +{"Pretrain/Learning Rate": 7.969911647252193e-07, "Pretrain/Loss": 1.97003972530365, "Pretrain/Loss (Raw)": 1.8304784297943115, "Pretrain/Step": 17582, "Pretrain/Step Time": 8.481637425720692} +{"Pretrain/Learning Rate": 7.959281611755104e-07, "Pretrain/Loss": 1.9684938192367554, "Pretrain/Loss (Raw)": 1.9102520942687988, "Pretrain/Step": 17583, "Pretrain/Step Time": 8.479653907939792} +{"Pretrain/Learning Rate": 7.948658555331473e-07, "Pretrain/Loss": 1.9692755937576294, "Pretrain/Loss (Raw)": 2.0746824741363525, "Pretrain/Step": 17584, "Pretrain/Step Time": 8.480116637423635} +{"Pretrain/Learning Rate": 7.938042478287638e-07, "Pretrain/Loss": 1.9645845890045166, "Pretrain/Loss (Raw)": 1.9283736944198608, "Pretrain/Step": 17585, "Pretrain/Step Time": 8.485368199646473} +{"Pretrain/Learning Rate": 7.927433380929744e-07, "Pretrain/Loss": 1.9622254371643066, "Pretrain/Loss (Raw)": 1.8318201303482056, "Pretrain/Step": 17586, "Pretrain/Step Time": 8.484542399644852} +{"Pretrain/Learning Rate": 7.916831263563601e-07, "Pretrain/Loss": 1.9635778665542603, "Pretrain/Loss (Raw)": 1.9191697835922241, "Pretrain/Step": 17587, "Pretrain/Step Time": 8.483959404751658} +{"Pretrain/Learning Rate": 7.90623612649502e-07, "Pretrain/Loss": 1.9635326862335205, "Pretrain/Loss (Raw)": 2.0967743396759033, "Pretrain/Step": 17588, "Pretrain/Step Time": 8.489408953115344} +{"Pretrain/Learning Rate": 7.895647970029452e-07, "Pretrain/Loss": 1.963778018951416, "Pretrain/Loss (Raw)": 2.0069823265075684, "Pretrain/Step": 17589, "Pretrain/Step Time": 8.487592339515686} +{"Pretrain/Learning Rate": 7.885066794472151e-07, "Pretrain/Loss": 1.9633195400238037, "Pretrain/Loss (Raw)": 1.9052722454071045, "Pretrain/Step": 17590, "Pretrain/Step Time": 8.49285987764597} +{"Pretrain/Learning Rate": 7.87449260012832e-07, "Pretrain/Loss": 1.9635462760925293, "Pretrain/Loss (Raw)": 2.1397693157196045, "Pretrain/Step": 17591, "Pretrain/Step Time": 8.49481039866805} +{"Pretrain/Learning Rate": 7.863925387302767e-07, "Pretrain/Loss": 1.9645392894744873, "Pretrain/Loss (Raw)": 2.2731869220733643, "Pretrain/Step": 17592, "Pretrain/Step Time": 8.497227843850851} +{"Pretrain/Learning Rate": 7.85336515630028e-07, "Pretrain/Loss": 1.9639594554901123, "Pretrain/Loss (Raw)": 1.8531725406646729, "Pretrain/Step": 17593, "Pretrain/Step Time": 8.490360740572214} +{"Pretrain/Learning Rate": 7.842811907425279e-07, "Pretrain/Loss": 1.9657083749771118, "Pretrain/Loss (Raw)": 1.9652891159057617, "Pretrain/Step": 17594, "Pretrain/Step Time": 8.48791828006506} +{"Pretrain/Learning Rate": 7.832265640982078e-07, "Pretrain/Loss": 1.9637069702148438, "Pretrain/Loss (Raw)": 1.7039402723312378, "Pretrain/Step": 17595, "Pretrain/Step Time": 8.485647713765502} +{"Pretrain/Learning Rate": 7.821726357274822e-07, "Pretrain/Loss": 1.9661626815795898, "Pretrain/Loss (Raw)": 2.1755764484405518, "Pretrain/Step": 17596, "Pretrain/Step Time": 8.485520727932453} +{"Pretrain/Learning Rate": 7.811194056607296e-07, "Pretrain/Loss": 1.9701365232467651, "Pretrain/Loss (Raw)": 2.132626533508301, "Pretrain/Step": 17597, "Pretrain/Step Time": 8.483675956726074} +{"Pretrain/Learning Rate": 7.800668739283312e-07, "Pretrain/Loss": 1.969620704650879, "Pretrain/Loss (Raw)": 2.1540799140930176, "Pretrain/Step": 17598, "Pretrain/Step Time": 8.481134220957756} +{"Pretrain/Learning Rate": 7.790150405606295e-07, "Pretrain/Loss": 1.9709868431091309, "Pretrain/Loss (Raw)": 2.015305519104004, "Pretrain/Step": 17599, "Pretrain/Step Time": 8.480160368606448} +{"Pretrain/Learning Rate": 7.779639055879528e-07, "Pretrain/Loss": 1.9722996950149536, "Pretrain/Loss (Raw)": 1.9239228963851929, "Pretrain/Step": 17600, "Pretrain/Step Time": 8.47964408993721} +{"Pretrain/Learning Rate": 7.769134690406132e-07, "Pretrain/Loss": 1.9719094038009644, "Pretrain/Loss (Raw)": 1.8921715021133423, "Pretrain/Step": 17601, "Pretrain/Step Time": 8.478415105491877} +{"Pretrain/Learning Rate": 7.758637309488975e-07, "Pretrain/Loss": 1.9705862998962402, "Pretrain/Loss (Raw)": 1.8625636100769043, "Pretrain/Step": 17602, "Pretrain/Step Time": 8.484524175524712} +{"Pretrain/Learning Rate": 7.74814691343076e-07, "Pretrain/Loss": 1.9703075885772705, "Pretrain/Loss (Raw)": 1.932695746421814, "Pretrain/Step": 17603, "Pretrain/Step Time": 8.485938869416714} +{"Pretrain/Learning Rate": 7.73766350253391e-07, "Pretrain/Loss": 1.969572901725769, "Pretrain/Loss (Raw)": 1.975009560585022, "Pretrain/Step": 17604, "Pretrain/Step Time": 8.486777182668447} +{"Pretrain/Learning Rate": 7.727187077100767e-07, "Pretrain/Loss": 1.967194676399231, "Pretrain/Loss (Raw)": 1.845748782157898, "Pretrain/Step": 17605, "Pretrain/Step Time": 8.488772159442306} +{"Pretrain/Learning Rate": 7.716717637433396e-07, "Pretrain/Loss": 1.9661667346954346, "Pretrain/Loss (Raw)": 1.846442699432373, "Pretrain/Step": 17606, "Pretrain/Step Time": 8.486017223447561} +{"Pretrain/Learning Rate": 7.706255183833666e-07, "Pretrain/Loss": 1.9684308767318726, "Pretrain/Loss (Raw)": 2.228327751159668, "Pretrain/Step": 17607, "Pretrain/Step Time": 8.486849468201399} +{"Pretrain/Learning Rate": 7.69579971660328e-07, "Pretrain/Loss": 1.9699089527130127, "Pretrain/Loss (Raw)": 2.00812029838562, "Pretrain/Step": 17608, "Pretrain/Step Time": 8.485434409230947} +{"Pretrain/Learning Rate": 7.685351236043664e-07, "Pretrain/Loss": 1.9702794551849365, "Pretrain/Loss (Raw)": 2.0647940635681152, "Pretrain/Step": 17609, "Pretrain/Step Time": 8.481227047741413} +{"Pretrain/Learning Rate": 7.674909742456132e-07, "Pretrain/Loss": 1.9702727794647217, "Pretrain/Loss (Raw)": 2.0553743839263916, "Pretrain/Step": 17610, "Pretrain/Step Time": 8.478103578090668} +{"Pretrain/Learning Rate": 7.664475236141777e-07, "Pretrain/Loss": 1.9716368913650513, "Pretrain/Loss (Raw)": 2.0203988552093506, "Pretrain/Step": 17611, "Pretrain/Step Time": 8.478241479024291} +{"Pretrain/Learning Rate": 7.654047717401414e-07, "Pretrain/Loss": 1.9712891578674316, "Pretrain/Loss (Raw)": 1.990392804145813, "Pretrain/Step": 17612, "Pretrain/Step Time": 8.47535334713757} +{"Pretrain/Learning Rate": 7.643627186535773e-07, "Pretrain/Loss": 1.9733803272247314, "Pretrain/Loss (Raw)": 2.250209331512451, "Pretrain/Step": 17613, "Pretrain/Step Time": 8.470739040523767} +{"Pretrain/Learning Rate": 7.633213643845255e-07, "Pretrain/Loss": 1.974384069442749, "Pretrain/Loss (Raw)": 1.9766708612442017, "Pretrain/Step": 17614, "Pretrain/Step Time": 8.475325614213943} +{"Pretrain/Learning Rate": 7.622807089630201e-07, "Pretrain/Loss": 1.96674382686615, "Pretrain/Loss (Raw)": 1.072226881980896, "Pretrain/Step": 17615, "Pretrain/Step Time": 8.483465045690536} +{"Pretrain/Learning Rate": 7.612407524190624e-07, "Pretrain/Loss": 1.9725356101989746, "Pretrain/Loss (Raw)": 2.293463706970215, "Pretrain/Step": 17616, "Pretrain/Step Time": 8.478509899228811} +{"Pretrain/Learning Rate": 7.602014947826391e-07, "Pretrain/Loss": 1.9713947772979736, "Pretrain/Loss (Raw)": 2.0628585815429688, "Pretrain/Step": 17617, "Pretrain/Step Time": 8.483028726652265} +{"Pretrain/Learning Rate": 7.591629360837183e-07, "Pretrain/Loss": 1.968916416168213, "Pretrain/Loss (Raw)": 1.880788803100586, "Pretrain/Step": 17618, "Pretrain/Step Time": 8.482376059517264} +{"Pretrain/Learning Rate": 7.581250763522451e-07, "Pretrain/Loss": 1.9681007862091064, "Pretrain/Loss (Raw)": 1.9365673065185547, "Pretrain/Step": 17619, "Pretrain/Step Time": 8.483094688504934} +{"Pretrain/Learning Rate": 7.570879156181488e-07, "Pretrain/Loss": 1.970029354095459, "Pretrain/Loss (Raw)": 1.9805374145507812, "Pretrain/Step": 17620, "Pretrain/Step Time": 8.484141813591123} +{"Pretrain/Learning Rate": 7.560514539113328e-07, "Pretrain/Loss": 1.9710757732391357, "Pretrain/Loss (Raw)": 1.9901071786880493, "Pretrain/Step": 17621, "Pretrain/Step Time": 8.48868852108717} +{"Pretrain/Learning Rate": 7.550156912616763e-07, "Pretrain/Loss": 1.9693812131881714, "Pretrain/Loss (Raw)": 1.9572829008102417, "Pretrain/Step": 17622, "Pretrain/Step Time": 8.489580128341913} +{"Pretrain/Learning Rate": 7.539806276990552e-07, "Pretrain/Loss": 1.9704782962799072, "Pretrain/Loss (Raw)": 2.1095786094665527, "Pretrain/Step": 17623, "Pretrain/Step Time": 8.49301796220243} +{"Pretrain/Learning Rate": 7.529462632533097e-07, "Pretrain/Loss": 1.971390724182129, "Pretrain/Loss (Raw)": 2.11661958694458, "Pretrain/Step": 17624, "Pretrain/Step Time": 8.490319032222033} +{"Pretrain/Learning Rate": 7.519125979542657e-07, "Pretrain/Loss": 1.9691269397735596, "Pretrain/Loss (Raw)": 1.7646403312683105, "Pretrain/Step": 17625, "Pretrain/Step Time": 8.493481822311878} +{"Pretrain/Learning Rate": 7.508796318317301e-07, "Pretrain/Loss": 1.970636010169983, "Pretrain/Loss (Raw)": 2.0307581424713135, "Pretrain/Step": 17626, "Pretrain/Step Time": 8.489843053743243} +{"Pretrain/Learning Rate": 7.498473649154819e-07, "Pretrain/Loss": 1.9682962894439697, "Pretrain/Loss (Raw)": 1.8478378057479858, "Pretrain/Step": 17627, "Pretrain/Step Time": 8.490069029852748} +{"Pretrain/Learning Rate": 7.488157972352916e-07, "Pretrain/Loss": 1.966057538986206, "Pretrain/Loss (Raw)": 1.8435827493667603, "Pretrain/Step": 17628, "Pretrain/Step Time": 8.492270516231656} +{"Pretrain/Learning Rate": 7.477849288208994e-07, "Pretrain/Loss": 1.96809983253479, "Pretrain/Loss (Raw)": 2.1427299976348877, "Pretrain/Step": 17629, "Pretrain/Step Time": 8.490898175165057} +{"Pretrain/Learning Rate": 7.467547597020369e-07, "Pretrain/Loss": 1.9670230150222778, "Pretrain/Loss (Raw)": 1.9031152725219727, "Pretrain/Step": 17630, "Pretrain/Step Time": 8.490421671420336} +{"Pretrain/Learning Rate": 7.457252899084028e-07, "Pretrain/Loss": 1.9722869396209717, "Pretrain/Loss (Raw)": 2.493772268295288, "Pretrain/Step": 17631, "Pretrain/Step Time": 8.496009899303317} +{"Pretrain/Learning Rate": 7.446965194696786e-07, "Pretrain/Loss": 1.9706788063049316, "Pretrain/Loss (Raw)": 1.9101516008377075, "Pretrain/Step": 17632, "Pretrain/Step Time": 8.486794190481305} +{"Pretrain/Learning Rate": 7.436684484155326e-07, "Pretrain/Loss": 1.9726316928863525, "Pretrain/Loss (Raw)": 2.044043779373169, "Pretrain/Step": 17633, "Pretrain/Step Time": 8.487033421173692} +{"Pretrain/Learning Rate": 7.426410767756048e-07, "Pretrain/Loss": 1.974491834640503, "Pretrain/Loss (Raw)": 2.0254788398742676, "Pretrain/Step": 17634, "Pretrain/Step Time": 8.486064162105322} +{"Pretrain/Learning Rate": 7.41614404579527e-07, "Pretrain/Loss": 1.9742164611816406, "Pretrain/Loss (Raw)": 2.052333354949951, "Pretrain/Step": 17635, "Pretrain/Step Time": 8.483221320435405} +{"Pretrain/Learning Rate": 7.405884318568951e-07, "Pretrain/Loss": 1.9746774435043335, "Pretrain/Loss (Raw)": 2.009648323059082, "Pretrain/Step": 17636, "Pretrain/Step Time": 8.478895073756576} +{"Pretrain/Learning Rate": 7.395631586372908e-07, "Pretrain/Loss": 1.9775352478027344, "Pretrain/Loss (Raw)": 2.1800382137298584, "Pretrain/Step": 17637, "Pretrain/Step Time": 8.484991123899817} +{"Pretrain/Learning Rate": 7.385385849502823e-07, "Pretrain/Loss": 1.9766050577163696, "Pretrain/Loss (Raw)": 1.894877314567566, "Pretrain/Step": 17638, "Pretrain/Step Time": 8.486857775598764} +{"Pretrain/Learning Rate": 7.375147108254099e-07, "Pretrain/Loss": 1.9771875143051147, "Pretrain/Loss (Raw)": 2.119837999343872, "Pretrain/Step": 17639, "Pretrain/Step Time": 8.489062516018748} +{"Pretrain/Learning Rate": 7.36491536292197e-07, "Pretrain/Loss": 1.9759129285812378, "Pretrain/Loss (Raw)": 1.8440070152282715, "Pretrain/Step": 17640, "Pretrain/Step Time": 8.49350686557591} +{"Pretrain/Learning Rate": 7.35469061380148e-07, "Pretrain/Loss": 1.9770973920822144, "Pretrain/Loss (Raw)": 2.105314254760742, "Pretrain/Step": 17641, "Pretrain/Step Time": 8.491557482630014} +{"Pretrain/Learning Rate": 7.344472861187418e-07, "Pretrain/Loss": 1.9758397340774536, "Pretrain/Loss (Raw)": 1.9958078861236572, "Pretrain/Step": 17642, "Pretrain/Step Time": 8.490931021049619} +{"Pretrain/Learning Rate": 7.334262105374412e-07, "Pretrain/Loss": 1.9773112535476685, "Pretrain/Loss (Raw)": 2.133687973022461, "Pretrain/Step": 17643, "Pretrain/Step Time": 8.487411867827177} +{"Pretrain/Learning Rate": 7.324058346656893e-07, "Pretrain/Loss": 1.977337121963501, "Pretrain/Loss (Raw)": 1.8232895135879517, "Pretrain/Step": 17644, "Pretrain/Step Time": 8.484701812267303} +{"Pretrain/Learning Rate": 7.313861585329096e-07, "Pretrain/Loss": 1.9770550727844238, "Pretrain/Loss (Raw)": 2.069438934326172, "Pretrain/Step": 17645, "Pretrain/Step Time": 8.4882742613554} +{"Pretrain/Learning Rate": 7.303671821684982e-07, "Pretrain/Loss": 1.9768306016921997, "Pretrain/Loss (Raw)": 2.0161688327789307, "Pretrain/Step": 17646, "Pretrain/Step Time": 8.487099574878812} +{"Pretrain/Learning Rate": 7.293489056018426e-07, "Pretrain/Loss": 1.9759045839309692, "Pretrain/Loss (Raw)": 1.8145580291748047, "Pretrain/Step": 17647, "Pretrain/Step Time": 8.48543494567275} +{"Pretrain/Learning Rate": 7.283313288623028e-07, "Pretrain/Loss": 1.9749246835708618, "Pretrain/Loss (Raw)": 2.014139413833618, "Pretrain/Step": 17648, "Pretrain/Step Time": 8.484879363328218} +{"Pretrain/Learning Rate": 7.273144519792135e-07, "Pretrain/Loss": 1.974953532218933, "Pretrain/Loss (Raw)": 1.9936318397521973, "Pretrain/Step": 17649, "Pretrain/Step Time": 8.486324168741703} +{"Pretrain/Learning Rate": 7.26298274981907e-07, "Pretrain/Loss": 1.9751675128936768, "Pretrain/Loss (Raw)": 2.0062577724456787, "Pretrain/Step": 17650, "Pretrain/Step Time": 8.485641665756702} +{"Pretrain/Learning Rate": 7.252827978996734e-07, "Pretrain/Loss": 1.9774556159973145, "Pretrain/Loss (Raw)": 2.018594980239868, "Pretrain/Step": 17651, "Pretrain/Step Time": 8.488443803042173} +{"Pretrain/Learning Rate": 7.242680207618008e-07, "Pretrain/Loss": 1.9792816638946533, "Pretrain/Loss (Raw)": 2.002902030944824, "Pretrain/Step": 17652, "Pretrain/Step Time": 8.481673622503877} +{"Pretrain/Learning Rate": 7.232539435975461e-07, "Pretrain/Loss": 1.980344533920288, "Pretrain/Loss (Raw)": 2.0473453998565674, "Pretrain/Step": 17653, "Pretrain/Step Time": 8.487154809758067} +{"Pretrain/Learning Rate": 7.22240566436147e-07, "Pretrain/Loss": 1.9799268245697021, "Pretrain/Loss (Raw)": 2.0696308612823486, "Pretrain/Step": 17654, "Pretrain/Step Time": 8.485009154304862} +{"Pretrain/Learning Rate": 7.212278893068303e-07, "Pretrain/Loss": 1.9812977313995361, "Pretrain/Loss (Raw)": 2.093839406967163, "Pretrain/Step": 17655, "Pretrain/Step Time": 8.486765637993813} +{"Pretrain/Learning Rate": 7.202159122387892e-07, "Pretrain/Loss": 1.9802396297454834, "Pretrain/Loss (Raw)": 1.966849446296692, "Pretrain/Step": 17656, "Pretrain/Step Time": 8.49015792645514} +{"Pretrain/Learning Rate": 7.192046352612087e-07, "Pretrain/Loss": 1.9811925888061523, "Pretrain/Loss (Raw)": 2.1654422283172607, "Pretrain/Step": 17657, "Pretrain/Step Time": 8.48970784433186} +{"Pretrain/Learning Rate": 7.181940584032459e-07, "Pretrain/Loss": 1.9822667837142944, "Pretrain/Loss (Raw)": 2.043121337890625, "Pretrain/Step": 17658, "Pretrain/Step Time": 8.483582805842161} +{"Pretrain/Learning Rate": 7.171841816940361e-07, "Pretrain/Loss": 1.9817577600479126, "Pretrain/Loss (Raw)": 1.9741779565811157, "Pretrain/Step": 17659, "Pretrain/Step Time": 8.481104291975498} +{"Pretrain/Learning Rate": 7.161750051627059e-07, "Pretrain/Loss": 1.981386423110962, "Pretrain/Loss (Raw)": 1.9539583921432495, "Pretrain/Step": 17660, "Pretrain/Step Time": 8.47996368817985} +{"Pretrain/Learning Rate": 7.151665288383486e-07, "Pretrain/Loss": 1.9806643724441528, "Pretrain/Loss (Raw)": 2.050229549407959, "Pretrain/Step": 17661, "Pretrain/Step Time": 8.480003608390689} +{"Pretrain/Learning Rate": 7.141587527500465e-07, "Pretrain/Loss": 1.980128288269043, "Pretrain/Loss (Raw)": 1.9028915166854858, "Pretrain/Step": 17662, "Pretrain/Step Time": 8.483648395165801} +{"Pretrain/Learning Rate": 7.131516769268542e-07, "Pretrain/Loss": 1.9800639152526855, "Pretrain/Loss (Raw)": 1.9856338500976562, "Pretrain/Step": 17663, "Pretrain/Step Time": 8.479922514408827} +{"Pretrain/Learning Rate": 7.121453013978124e-07, "Pretrain/Loss": 1.9805060625076294, "Pretrain/Loss (Raw)": 2.1306023597717285, "Pretrain/Step": 17664, "Pretrain/Step Time": 8.47831598110497} +{"Pretrain/Learning Rate": 7.111396261919423e-07, "Pretrain/Loss": 1.9792163372039795, "Pretrain/Loss (Raw)": 1.9010988473892212, "Pretrain/Step": 17665, "Pretrain/Step Time": 8.477156534790993} +{"Pretrain/Learning Rate": 7.101346513382318e-07, "Pretrain/Loss": 1.9790247678756714, "Pretrain/Loss (Raw)": 1.744231939315796, "Pretrain/Step": 17666, "Pretrain/Step Time": 8.481042373925447} +{"Pretrain/Learning Rate": 7.091303768656715e-07, "Pretrain/Loss": 1.9798851013183594, "Pretrain/Loss (Raw)": 1.8871322870254517, "Pretrain/Step": 17667, "Pretrain/Step Time": 8.480182904750109} +{"Pretrain/Learning Rate": 7.081268028032135e-07, "Pretrain/Loss": 1.9787356853485107, "Pretrain/Loss (Raw)": 1.8064072132110596, "Pretrain/Step": 17668, "Pretrain/Step Time": 8.478139977902174} +{"Pretrain/Learning Rate": 7.071239291797899e-07, "Pretrain/Loss": 1.979154348373413, "Pretrain/Loss (Raw)": 1.9152802228927612, "Pretrain/Step": 17669, "Pretrain/Step Time": 8.480549419298768} +{"Pretrain/Learning Rate": 7.061217560243249e-07, "Pretrain/Loss": 1.980538249015808, "Pretrain/Loss (Raw)": 1.9318007230758667, "Pretrain/Step": 17670, "Pretrain/Step Time": 8.479827431961894} +{"Pretrain/Learning Rate": 7.051202833657122e-07, "Pretrain/Loss": 1.9807627201080322, "Pretrain/Loss (Raw)": 1.8856204748153687, "Pretrain/Step": 17671, "Pretrain/Step Time": 8.483484137803316} +{"Pretrain/Learning Rate": 7.041195112328286e-07, "Pretrain/Loss": 1.9801380634307861, "Pretrain/Loss (Raw)": 1.886047124862671, "Pretrain/Step": 17672, "Pretrain/Step Time": 8.48634022846818} +{"Pretrain/Learning Rate": 7.031194396545343e-07, "Pretrain/Loss": 1.9835257530212402, "Pretrain/Loss (Raw)": 2.123939037322998, "Pretrain/Step": 17673, "Pretrain/Step Time": 8.483551682904363} +{"Pretrain/Learning Rate": 7.021200686596591e-07, "Pretrain/Loss": 1.9847941398620605, "Pretrain/Loss (Raw)": 1.9199522733688354, "Pretrain/Step": 17674, "Pretrain/Step Time": 8.483221063390374} +{"Pretrain/Learning Rate": 7.011213982770271e-07, "Pretrain/Loss": 1.9856042861938477, "Pretrain/Loss (Raw)": 1.9648597240447998, "Pretrain/Step": 17675, "Pretrain/Step Time": 8.483636708930135} +{"Pretrain/Learning Rate": 7.001234285354263e-07, "Pretrain/Loss": 1.986416220664978, "Pretrain/Loss (Raw)": 2.0361275672912598, "Pretrain/Step": 17676, "Pretrain/Step Time": 8.486307878047228} +{"Pretrain/Learning Rate": 6.991261594636366e-07, "Pretrain/Loss": 1.9876631498336792, "Pretrain/Loss (Raw)": 2.0902562141418457, "Pretrain/Step": 17677, "Pretrain/Step Time": 8.484237873926759} +{"Pretrain/Learning Rate": 6.981295910904156e-07, "Pretrain/Loss": 1.9879662990570068, "Pretrain/Loss (Raw)": 2.0065767765045166, "Pretrain/Step": 17678, "Pretrain/Step Time": 8.489543518051505} +{"Pretrain/Learning Rate": 6.97133723444493e-07, "Pretrain/Loss": 1.985970139503479, "Pretrain/Loss (Raw)": 1.842155933380127, "Pretrain/Step": 17679, "Pretrain/Step Time": 8.485662188380957} +{"Pretrain/Learning Rate": 6.961385565545903e-07, "Pretrain/Loss": 1.986761450767517, "Pretrain/Loss (Raw)": 2.1655209064483643, "Pretrain/Step": 17680, "Pretrain/Step Time": 8.490979939699173} +{"Pretrain/Learning Rate": 6.951440904493955e-07, "Pretrain/Loss": 1.9851744174957275, "Pretrain/Loss (Raw)": 1.754788875579834, "Pretrain/Step": 17681, "Pretrain/Step Time": 8.485332902520895} +{"Pretrain/Learning Rate": 6.941503251575915e-07, "Pretrain/Loss": 1.985014796257019, "Pretrain/Loss (Raw)": 1.9369980096817017, "Pretrain/Step": 17682, "Pretrain/Step Time": 8.485738204792142} +{"Pretrain/Learning Rate": 6.931572607078274e-07, "Pretrain/Loss": 1.9866564273834229, "Pretrain/Loss (Raw)": 1.9641449451446533, "Pretrain/Step": 17683, "Pretrain/Step Time": 8.486940544098616} +{"Pretrain/Learning Rate": 6.921648971287359e-07, "Pretrain/Loss": 1.9895460605621338, "Pretrain/Loss (Raw)": 2.191781759262085, "Pretrain/Step": 17684, "Pretrain/Step Time": 8.485191715881228} +{"Pretrain/Learning Rate": 6.911732344489358e-07, "Pretrain/Loss": 1.989585518836975, "Pretrain/Loss (Raw)": 1.9440574645996094, "Pretrain/Step": 17685, "Pretrain/Step Time": 8.485578851774335} +{"Pretrain/Learning Rate": 6.90182272697018e-07, "Pretrain/Loss": 1.9898402690887451, "Pretrain/Loss (Raw)": 2.0046982765197754, "Pretrain/Step": 17686, "Pretrain/Step Time": 8.490051753818989} +{"Pretrain/Learning Rate": 6.891920119015571e-07, "Pretrain/Loss": 1.9892351627349854, "Pretrain/Loss (Raw)": 2.0017147064208984, "Pretrain/Step": 17687, "Pretrain/Step Time": 8.490444488823414} +{"Pretrain/Learning Rate": 6.882024520911051e-07, "Pretrain/Loss": 1.9882087707519531, "Pretrain/Loss (Raw)": 1.9703017473220825, "Pretrain/Step": 17688, "Pretrain/Step Time": 8.492856344208121} +{"Pretrain/Learning Rate": 6.872135932942003e-07, "Pretrain/Loss": 1.987213373184204, "Pretrain/Loss (Raw)": 1.8656634092330933, "Pretrain/Step": 17689, "Pretrain/Step Time": 8.49362614005804} +{"Pretrain/Learning Rate": 6.862254355393505e-07, "Pretrain/Loss": 1.9866361618041992, "Pretrain/Loss (Raw)": 1.966367244720459, "Pretrain/Step": 17690, "Pretrain/Step Time": 8.492251740768552} +{"Pretrain/Learning Rate": 6.852379788550495e-07, "Pretrain/Loss": 1.9839141368865967, "Pretrain/Loss (Raw)": 1.8976798057556152, "Pretrain/Step": 17691, "Pretrain/Step Time": 8.486147547140718} +{"Pretrain/Learning Rate": 6.842512232697718e-07, "Pretrain/Loss": 1.984398365020752, "Pretrain/Loss (Raw)": 1.9088164567947388, "Pretrain/Step": 17692, "Pretrain/Step Time": 8.48846511170268} +{"Pretrain/Learning Rate": 6.83265168811964e-07, "Pretrain/Loss": 1.9845874309539795, "Pretrain/Loss (Raw)": 2.0597124099731445, "Pretrain/Step": 17693, "Pretrain/Step Time": 8.484079020097852} +{"Pretrain/Learning Rate": 6.822798155100673e-07, "Pretrain/Loss": 1.9852784872055054, "Pretrain/Loss (Raw)": 1.9583910703659058, "Pretrain/Step": 17694, "Pretrain/Step Time": 8.481790715828538} +{"Pretrain/Learning Rate": 6.812951633924896e-07, "Pretrain/Loss": 1.985426425933838, "Pretrain/Loss (Raw)": 2.0027127265930176, "Pretrain/Step": 17695, "Pretrain/Step Time": 8.483505567535758} +{"Pretrain/Learning Rate": 6.803112124876221e-07, "Pretrain/Loss": 1.9842312335968018, "Pretrain/Loss (Raw)": 2.06457781791687, "Pretrain/Step": 17696, "Pretrain/Step Time": 8.48106811568141} +{"Pretrain/Learning Rate": 6.793279628238364e-07, "Pretrain/Loss": 1.9851856231689453, "Pretrain/Loss (Raw)": 1.8110008239746094, "Pretrain/Step": 17697, "Pretrain/Step Time": 8.4839478880167} +{"Pretrain/Learning Rate": 6.783454144294793e-07, "Pretrain/Loss": 1.9867221117019653, "Pretrain/Loss (Raw)": 2.00431752204895, "Pretrain/Step": 17698, "Pretrain/Step Time": 8.481259299442172} +{"Pretrain/Learning Rate": 6.77363567332892e-07, "Pretrain/Loss": 1.984006404876709, "Pretrain/Loss (Raw)": 1.7963581085205078, "Pretrain/Step": 17699, "Pretrain/Step Time": 8.487018287181854} +{"Pretrain/Learning Rate": 6.763824215623799e-07, "Pretrain/Loss": 1.9851477146148682, "Pretrain/Loss (Raw)": 2.1294877529144287, "Pretrain/Step": 17700, "Pretrain/Step Time": 8.487586913630366} +{"Pretrain/Learning Rate": 6.754019771462311e-07, "Pretrain/Loss": 1.9852360486984253, "Pretrain/Loss (Raw)": 2.1505515575408936, "Pretrain/Step": 17701, "Pretrain/Step Time": 8.487337758764625} +{"Pretrain/Learning Rate": 6.744222341127204e-07, "Pretrain/Loss": 1.9840866327285767, "Pretrain/Loss (Raw)": 1.8313862085342407, "Pretrain/Step": 17702, "Pretrain/Step Time": 8.489523345604539} +{"Pretrain/Learning Rate": 6.73443192490092e-07, "Pretrain/Loss": 1.9836993217468262, "Pretrain/Loss (Raw)": 1.8899840116500854, "Pretrain/Step": 17703, "Pretrain/Step Time": 8.485994849354029} +{"Pretrain/Learning Rate": 6.724648523065841e-07, "Pretrain/Loss": 1.982280969619751, "Pretrain/Loss (Raw)": 1.8551276922225952, "Pretrain/Step": 17704, "Pretrain/Step Time": 8.487577557563782} +{"Pretrain/Learning Rate": 6.714872135904049e-07, "Pretrain/Loss": 1.9829962253570557, "Pretrain/Loss (Raw)": 2.1400673389434814, "Pretrain/Step": 17705, "Pretrain/Step Time": 8.49035631492734} +{"Pretrain/Learning Rate": 6.705102763697346e-07, "Pretrain/Loss": 1.9833179712295532, "Pretrain/Loss (Raw)": 1.899411678314209, "Pretrain/Step": 17706, "Pretrain/Step Time": 8.489841114729643} +{"Pretrain/Learning Rate": 6.695340406727563e-07, "Pretrain/Loss": 1.9825128316879272, "Pretrain/Loss (Raw)": 1.989376425743103, "Pretrain/Step": 17707, "Pretrain/Step Time": 8.492400193586946} +{"Pretrain/Learning Rate": 6.685585065276057e-07, "Pretrain/Loss": 1.9814327955245972, "Pretrain/Loss (Raw)": 1.8595460653305054, "Pretrain/Step": 17708, "Pretrain/Step Time": 8.489619133993983} +{"Pretrain/Learning Rate": 6.675836739624214e-07, "Pretrain/Loss": 1.982386827468872, "Pretrain/Loss (Raw)": 2.1155052185058594, "Pretrain/Step": 17709, "Pretrain/Step Time": 8.486630447208881} +{"Pretrain/Learning Rate": 6.66609543005306e-07, "Pretrain/Loss": 1.9871752262115479, "Pretrain/Loss (Raw)": 2.4433844089508057, "Pretrain/Step": 17710, "Pretrain/Step Time": 8.489357441663742} +{"Pretrain/Learning Rate": 6.656361136843537e-07, "Pretrain/Loss": 1.987829327583313, "Pretrain/Loss (Raw)": 1.9939625263214111, "Pretrain/Step": 17711, "Pretrain/Step Time": 8.490686129778624} +{"Pretrain/Learning Rate": 6.646633860276308e-07, "Pretrain/Loss": 1.9874498844146729, "Pretrain/Loss (Raw)": 2.026130199432373, "Pretrain/Step": 17712, "Pretrain/Step Time": 8.490720834583044} +{"Pretrain/Learning Rate": 6.636913600631789e-07, "Pretrain/Loss": 1.987173080444336, "Pretrain/Loss (Raw)": 1.8929436206817627, "Pretrain/Step": 17713, "Pretrain/Step Time": 8.488795636221766} +{"Pretrain/Learning Rate": 6.627200358190367e-07, "Pretrain/Loss": 1.987046241760254, "Pretrain/Loss (Raw)": 1.8155850172042847, "Pretrain/Step": 17714, "Pretrain/Step Time": 8.48855729214847} +{"Pretrain/Learning Rate": 6.617494133231983e-07, "Pretrain/Loss": 1.98703932762146, "Pretrain/Loss (Raw)": 1.918267011642456, "Pretrain/Step": 17715, "Pretrain/Step Time": 8.48835949972272} +{"Pretrain/Learning Rate": 6.607794926036637e-07, "Pretrain/Loss": 1.9870208501815796, "Pretrain/Loss (Raw)": 2.0944154262542725, "Pretrain/Step": 17716, "Pretrain/Step Time": 8.4890580996871} +{"Pretrain/Learning Rate": 6.598102736883937e-07, "Pretrain/Loss": 1.9876071214675903, "Pretrain/Loss (Raw)": 2.0820271968841553, "Pretrain/Step": 17717, "Pretrain/Step Time": 8.490415336564183} +{"Pretrain/Learning Rate": 6.588417566053356e-07, "Pretrain/Loss": 1.989061713218689, "Pretrain/Loss (Raw)": 2.0914604663848877, "Pretrain/Step": 17718, "Pretrain/Step Time": 8.488426642492414} +{"Pretrain/Learning Rate": 6.578739413824142e-07, "Pretrain/Loss": 1.9862325191497803, "Pretrain/Loss (Raw)": 1.7776414155960083, "Pretrain/Step": 17719, "Pretrain/Step Time": 8.485576841980219} +{"Pretrain/Learning Rate": 6.569068280475377e-07, "Pretrain/Loss": 1.9841208457946777, "Pretrain/Loss (Raw)": 2.0028743743896484, "Pretrain/Step": 17720, "Pretrain/Step Time": 8.484162088483572} +{"Pretrain/Learning Rate": 6.559404166285948e-07, "Pretrain/Loss": 1.9855902194976807, "Pretrain/Loss (Raw)": 2.041269540786743, "Pretrain/Step": 17721, "Pretrain/Step Time": 8.484432186931372} +{"Pretrain/Learning Rate": 6.549747071534468e-07, "Pretrain/Loss": 1.9868656396865845, "Pretrain/Loss (Raw)": 2.128526449203491, "Pretrain/Step": 17722, "Pretrain/Step Time": 8.484933633357286} +{"Pretrain/Learning Rate": 6.540096996499406e-07, "Pretrain/Loss": 1.9881491661071777, "Pretrain/Loss (Raw)": 1.8682408332824707, "Pretrain/Step": 17723, "Pretrain/Step Time": 8.489127954468131} +{"Pretrain/Learning Rate": 6.530453941459041e-07, "Pretrain/Loss": 1.9848867654800415, "Pretrain/Loss (Raw)": 1.7579888105392456, "Pretrain/Step": 17724, "Pretrain/Step Time": 8.486768877133727} +{"Pretrain/Learning Rate": 6.520817906691374e-07, "Pretrain/Loss": 1.9831527471542358, "Pretrain/Loss (Raw)": 1.9106749296188354, "Pretrain/Step": 17725, "Pretrain/Step Time": 8.489710535854101} +{"Pretrain/Learning Rate": 6.51118889247429e-07, "Pretrain/Loss": 1.9818735122680664, "Pretrain/Loss (Raw)": 1.9903327226638794, "Pretrain/Step": 17726, "Pretrain/Step Time": 8.486533131450415} +{"Pretrain/Learning Rate": 6.501566899085432e-07, "Pretrain/Loss": 1.980865240097046, "Pretrain/Loss (Raw)": 1.8862406015396118, "Pretrain/Step": 17727, "Pretrain/Step Time": 8.48511160351336} +{"Pretrain/Learning Rate": 6.491951926802214e-07, "Pretrain/Loss": 1.9828088283538818, "Pretrain/Loss (Raw)": 2.172711133956909, "Pretrain/Step": 17728, "Pretrain/Step Time": 8.487395640462637} +{"Pretrain/Learning Rate": 6.482343975901944e-07, "Pretrain/Loss": 1.9871317148208618, "Pretrain/Loss (Raw)": 2.4455111026763916, "Pretrain/Step": 17729, "Pretrain/Step Time": 8.487382778897882} +{"Pretrain/Learning Rate": 6.472743046661567e-07, "Pretrain/Loss": 1.988943099975586, "Pretrain/Loss (Raw)": 2.0944154262542725, "Pretrain/Step": 17730, "Pretrain/Step Time": 8.480229306966066} +{"Pretrain/Learning Rate": 6.463149139358027e-07, "Pretrain/Loss": 1.9896962642669678, "Pretrain/Loss (Raw)": 2.0290939807891846, "Pretrain/Step": 17731, "Pretrain/Step Time": 8.48070034198463} +{"Pretrain/Learning Rate": 6.453562254267853e-07, "Pretrain/Loss": 1.9894362688064575, "Pretrain/Loss (Raw)": 1.941738247871399, "Pretrain/Step": 17732, "Pretrain/Step Time": 8.481195135042071} +{"Pretrain/Learning Rate": 6.443982391667547e-07, "Pretrain/Loss": 1.9911279678344727, "Pretrain/Loss (Raw)": 2.062270402908325, "Pretrain/Step": 17733, "Pretrain/Step Time": 8.482620351016521} +{"Pretrain/Learning Rate": 6.434409551833304e-07, "Pretrain/Loss": 1.9920765161514282, "Pretrain/Loss (Raw)": 1.9678725004196167, "Pretrain/Step": 17734, "Pretrain/Step Time": 8.480339648202062} +{"Pretrain/Learning Rate": 6.424843735041153e-07, "Pretrain/Loss": 1.99053955078125, "Pretrain/Loss (Raw)": 2.031592845916748, "Pretrain/Step": 17735, "Pretrain/Step Time": 8.478847881779075} +{"Pretrain/Learning Rate": 6.415284941566929e-07, "Pretrain/Loss": 1.9911906719207764, "Pretrain/Loss (Raw)": 2.0914804935455322, "Pretrain/Step": 17736, "Pretrain/Step Time": 8.480413554236293} +{"Pretrain/Learning Rate": 6.405733171686246e-07, "Pretrain/Loss": 1.990031361579895, "Pretrain/Loss (Raw)": 1.9163877964019775, "Pretrain/Step": 17737, "Pretrain/Step Time": 8.48257865011692} +{"Pretrain/Learning Rate": 6.396188425674521e-07, "Pretrain/Loss": 1.9893834590911865, "Pretrain/Loss (Raw)": 1.9724396467208862, "Pretrain/Step": 17738, "Pretrain/Step Time": 8.485176607966423} +{"Pretrain/Learning Rate": 6.386650703806978e-07, "Pretrain/Loss": 1.9884872436523438, "Pretrain/Loss (Raw)": 1.9056857824325562, "Pretrain/Step": 17739, "Pretrain/Step Time": 8.484194679185748} +{"Pretrain/Learning Rate": 6.377120006358622e-07, "Pretrain/Loss": 1.9887019395828247, "Pretrain/Loss (Raw)": 2.017866849899292, "Pretrain/Step": 17740, "Pretrain/Step Time": 8.487926833331585} +{"Pretrain/Learning Rate": 6.367596333604287e-07, "Pretrain/Loss": 1.9860029220581055, "Pretrain/Loss (Raw)": 1.9047507047653198, "Pretrain/Step": 17741, "Pretrain/Step Time": 8.489701267331839} +{"Pretrain/Learning Rate": 6.358079685818557e-07, "Pretrain/Loss": 1.9870190620422363, "Pretrain/Loss (Raw)": 2.106733560562134, "Pretrain/Step": 17742, "Pretrain/Step Time": 8.484787434339523} +{"Pretrain/Learning Rate": 6.3485700632758e-07, "Pretrain/Loss": 1.9948915243148804, "Pretrain/Loss (Raw)": 2.0798914432525635, "Pretrain/Step": 17743, "Pretrain/Step Time": 8.478092392906547} +{"Pretrain/Learning Rate": 6.339067466250321e-07, "Pretrain/Loss": 1.9928081035614014, "Pretrain/Loss (Raw)": 2.026787519454956, "Pretrain/Step": 17744, "Pretrain/Step Time": 8.479281513020396} +{"Pretrain/Learning Rate": 6.329571895016012e-07, "Pretrain/Loss": 1.992331862449646, "Pretrain/Loss (Raw)": 2.001901388168335, "Pretrain/Step": 17745, "Pretrain/Step Time": 8.482250031083822} +{"Pretrain/Learning Rate": 6.320083349846768e-07, "Pretrain/Loss": 1.9936212301254272, "Pretrain/Loss (Raw)": 2.0458173751831055, "Pretrain/Step": 17746, "Pretrain/Step Time": 8.483329519629478} +{"Pretrain/Learning Rate": 6.310601831016116e-07, "Pretrain/Loss": 1.9949673414230347, "Pretrain/Loss (Raw)": 2.108873128890991, "Pretrain/Step": 17747, "Pretrain/Step Time": 8.483227603137493} +{"Pretrain/Learning Rate": 6.301127338797452e-07, "Pretrain/Loss": 1.9945441484451294, "Pretrain/Loss (Raw)": 1.9263750314712524, "Pretrain/Step": 17748, "Pretrain/Step Time": 8.48290659673512} +{"Pretrain/Learning Rate": 6.291659873464001e-07, "Pretrain/Loss": 1.99503493309021, "Pretrain/Loss (Raw)": 2.052919387817383, "Pretrain/Step": 17749, "Pretrain/Step Time": 8.48060180619359} +{"Pretrain/Learning Rate": 6.282199435288738e-07, "Pretrain/Loss": 1.9953402280807495, "Pretrain/Loss (Raw)": 1.9963606595993042, "Pretrain/Step": 17750, "Pretrain/Step Time": 8.481674442067742} +{"Pretrain/Learning Rate": 6.272746024544446e-07, "Pretrain/Loss": 1.9944751262664795, "Pretrain/Loss (Raw)": 1.9988510608673096, "Pretrain/Step": 17751, "Pretrain/Step Time": 8.477739240974188} +{"Pretrain/Learning Rate": 6.263299641503711e-07, "Pretrain/Loss": 1.9940308332443237, "Pretrain/Loss (Raw)": 2.0597593784332275, "Pretrain/Step": 17752, "Pretrain/Step Time": 8.47883745841682} +{"Pretrain/Learning Rate": 6.253860286438872e-07, "Pretrain/Loss": 1.9959673881530762, "Pretrain/Loss (Raw)": 2.012519121170044, "Pretrain/Step": 17753, "Pretrain/Step Time": 8.477166390046477} +{"Pretrain/Learning Rate": 6.244427959622184e-07, "Pretrain/Loss": 1.9958730936050415, "Pretrain/Loss (Raw)": 2.018681049346924, "Pretrain/Step": 17754, "Pretrain/Step Time": 8.47551547549665} +{"Pretrain/Learning Rate": 6.235002661325568e-07, "Pretrain/Loss": 1.997164011001587, "Pretrain/Loss (Raw)": 2.0130727291107178, "Pretrain/Step": 17755, "Pretrain/Step Time": 8.478381739929318} +{"Pretrain/Learning Rate": 6.225584391820804e-07, "Pretrain/Loss": 2.001037120819092, "Pretrain/Loss (Raw)": 2.3393404483795166, "Pretrain/Step": 17756, "Pretrain/Step Time": 8.479619385674596} +{"Pretrain/Learning Rate": 6.216173151379456e-07, "Pretrain/Loss": 2.0006332397460938, "Pretrain/Loss (Raw)": 2.091026544570923, "Pretrain/Step": 17757, "Pretrain/Step Time": 8.48091634362936} +{"Pretrain/Learning Rate": 6.206768940272917e-07, "Pretrain/Loss": 2.0024425983428955, "Pretrain/Loss (Raw)": 2.134735345840454, "Pretrain/Step": 17758, "Pretrain/Step Time": 8.476620372384787} +{"Pretrain/Learning Rate": 6.19737175877233e-07, "Pretrain/Loss": 1.9992733001708984, "Pretrain/Loss (Raw)": 2.088087797164917, "Pretrain/Step": 17759, "Pretrain/Step Time": 8.476682558655739} +{"Pretrain/Learning Rate": 6.187981607148618e-07, "Pretrain/Loss": 2.000760555267334, "Pretrain/Loss (Raw)": 2.1005146503448486, "Pretrain/Step": 17760, "Pretrain/Step Time": 8.47694467753172} +{"Pretrain/Learning Rate": 6.178598485672621e-07, "Pretrain/Loss": 1.998372197151184, "Pretrain/Loss (Raw)": 1.7383418083190918, "Pretrain/Step": 17761, "Pretrain/Step Time": 8.478899898007512} +{"Pretrain/Learning Rate": 6.169222394614871e-07, "Pretrain/Loss": 1.9988739490509033, "Pretrain/Loss (Raw)": 2.0897011756896973, "Pretrain/Step": 17762, "Pretrain/Step Time": 8.481603851541877} +{"Pretrain/Learning Rate": 6.159853334245652e-07, "Pretrain/Loss": 1.9984149932861328, "Pretrain/Loss (Raw)": 1.9935847520828247, "Pretrain/Step": 17763, "Pretrain/Step Time": 8.481778260320425} +{"Pretrain/Learning Rate": 6.15049130483522e-07, "Pretrain/Loss": 1.9978082180023193, "Pretrain/Loss (Raw)": 1.931978464126587, "Pretrain/Step": 17764, "Pretrain/Step Time": 8.484205015003681} +{"Pretrain/Learning Rate": 6.141136306653417e-07, "Pretrain/Loss": 1.9954578876495361, "Pretrain/Loss (Raw)": 1.8792061805725098, "Pretrain/Step": 17765, "Pretrain/Step Time": 8.478504717350006} +{"Pretrain/Learning Rate": 6.13178833997008e-07, "Pretrain/Loss": 1.9981396198272705, "Pretrain/Loss (Raw)": 2.2381389141082764, "Pretrain/Step": 17766, "Pretrain/Step Time": 8.484199164435267} +{"Pretrain/Learning Rate": 6.122447405054687e-07, "Pretrain/Loss": 1.9978973865509033, "Pretrain/Loss (Raw)": 2.088813304901123, "Pretrain/Step": 17767, "Pretrain/Step Time": 8.484882060438395} +{"Pretrain/Learning Rate": 6.11311350217661e-07, "Pretrain/Loss": 1.999516248703003, "Pretrain/Loss (Raw)": 2.051240921020508, "Pretrain/Step": 17768, "Pretrain/Step Time": 8.48192205093801} +{"Pretrain/Learning Rate": 6.103786631604991e-07, "Pretrain/Loss": 1.998734474182129, "Pretrain/Loss (Raw)": 2.0052521228790283, "Pretrain/Step": 17769, "Pretrain/Step Time": 8.480450298637152} +{"Pretrain/Learning Rate": 6.094466793608727e-07, "Pretrain/Loss": 1.99747633934021, "Pretrain/Loss (Raw)": 1.8347482681274414, "Pretrain/Step": 17770, "Pretrain/Step Time": 8.482620246708393} +{"Pretrain/Learning Rate": 6.085153988456577e-07, "Pretrain/Loss": 1.995713472366333, "Pretrain/Loss (Raw)": 1.9080419540405273, "Pretrain/Step": 17771, "Pretrain/Step Time": 8.484203750267625} +{"Pretrain/Learning Rate": 6.075848216417074e-07, "Pretrain/Loss": 1.9971263408660889, "Pretrain/Loss (Raw)": 2.0041677951812744, "Pretrain/Step": 17772, "Pretrain/Step Time": 8.486488409340382} +{"Pretrain/Learning Rate": 6.066549477758504e-07, "Pretrain/Loss": 1.9963836669921875, "Pretrain/Loss (Raw)": 1.9743502140045166, "Pretrain/Step": 17773, "Pretrain/Step Time": 8.487412314862013} +{"Pretrain/Learning Rate": 6.057257772749042e-07, "Pretrain/Loss": 1.9964921474456787, "Pretrain/Loss (Raw)": 2.0300490856170654, "Pretrain/Step": 17774, "Pretrain/Step Time": 8.48842934332788} +{"Pretrain/Learning Rate": 6.047973101656585e-07, "Pretrain/Loss": 1.9980807304382324, "Pretrain/Loss (Raw)": 2.0179030895233154, "Pretrain/Step": 17775, "Pretrain/Step Time": 8.487303745001554} +{"Pretrain/Learning Rate": 6.038695464748833e-07, "Pretrain/Loss": 1.9985060691833496, "Pretrain/Loss (Raw)": 2.0685861110687256, "Pretrain/Step": 17776, "Pretrain/Step Time": 8.486510215327144} +{"Pretrain/Learning Rate": 6.029424862293326e-07, "Pretrain/Loss": 1.9983717203140259, "Pretrain/Loss (Raw)": 1.9764302968978882, "Pretrain/Step": 17777, "Pretrain/Step Time": 8.482751248404384} +{"Pretrain/Learning Rate": 6.020161294557375e-07, "Pretrain/Loss": 1.998430848121643, "Pretrain/Loss (Raw)": 2.0138323307037354, "Pretrain/Step": 17778, "Pretrain/Step Time": 8.490485155954957} +{"Pretrain/Learning Rate": 6.010904761808045e-07, "Pretrain/Loss": 1.9981579780578613, "Pretrain/Loss (Raw)": 1.9836748838424683, "Pretrain/Step": 17779, "Pretrain/Step Time": 8.489806909114122} +{"Pretrain/Learning Rate": 6.001655264312289e-07, "Pretrain/Loss": 1.9968292713165283, "Pretrain/Loss (Raw)": 1.8328274488449097, "Pretrain/Step": 17780, "Pretrain/Step Time": 8.493036607280374} +{"Pretrain/Learning Rate": 5.992412802336838e-07, "Pretrain/Loss": 1.993756890296936, "Pretrain/Loss (Raw)": 1.6540777683258057, "Pretrain/Step": 17781, "Pretrain/Step Time": 8.489740498363972} +{"Pretrain/Learning Rate": 5.983177376148091e-07, "Pretrain/Loss": 1.9928128719329834, "Pretrain/Loss (Raw)": 1.9488013982772827, "Pretrain/Step": 17782, "Pretrain/Step Time": 8.493126323446631} +{"Pretrain/Learning Rate": 5.973948986012445e-07, "Pretrain/Loss": 1.9944651126861572, "Pretrain/Loss (Raw)": 2.305318593978882, "Pretrain/Step": 17783, "Pretrain/Step Time": 8.494139321148396} +{"Pretrain/Learning Rate": 5.96472763219591e-07, "Pretrain/Loss": 1.9933052062988281, "Pretrain/Loss (Raw)": 1.8183691501617432, "Pretrain/Step": 17784, "Pretrain/Step Time": 8.48854129575193} +{"Pretrain/Learning Rate": 5.955513314964467e-07, "Pretrain/Loss": 1.9907714128494263, "Pretrain/Loss (Raw)": 1.8411238193511963, "Pretrain/Step": 17785, "Pretrain/Step Time": 8.491461185738444} +{"Pretrain/Learning Rate": 5.946306034583737e-07, "Pretrain/Loss": 1.991392731666565, "Pretrain/Loss (Raw)": 2.122654914855957, "Pretrain/Step": 17786, "Pretrain/Step Time": 8.49254721403122} +{"Pretrain/Learning Rate": 5.937105791319203e-07, "Pretrain/Loss": 1.9908427000045776, "Pretrain/Loss (Raw)": 1.9037725925445557, "Pretrain/Step": 17787, "Pretrain/Step Time": 8.496460961177945} +{"Pretrain/Learning Rate": 5.927912585436207e-07, "Pretrain/Loss": 1.9903879165649414, "Pretrain/Loss (Raw)": 1.8957583904266357, "Pretrain/Step": 17788, "Pretrain/Step Time": 8.496028643101454} +{"Pretrain/Learning Rate": 5.918726417199761e-07, "Pretrain/Loss": 1.9896444082260132, "Pretrain/Loss (Raw)": 1.9550360441207886, "Pretrain/Step": 17789, "Pretrain/Step Time": 8.494960937649012} +{"Pretrain/Learning Rate": 5.909547286874817e-07, "Pretrain/Loss": 1.9922926425933838, "Pretrain/Loss (Raw)": 2.241868495941162, "Pretrain/Step": 17790, "Pretrain/Step Time": 8.486798526719213} +{"Pretrain/Learning Rate": 5.900375194725971e-07, "Pretrain/Loss": 1.9913040399551392, "Pretrain/Loss (Raw)": 1.8591002225875854, "Pretrain/Step": 17791, "Pretrain/Step Time": 8.493994181975722} +{"Pretrain/Learning Rate": 5.891210141017733e-07, "Pretrain/Loss": 1.9905072450637817, "Pretrain/Loss (Raw)": 2.028607130050659, "Pretrain/Step": 17792, "Pretrain/Step Time": 8.491925990208983} +{"Pretrain/Learning Rate": 5.882052126014365e-07, "Pretrain/Loss": 1.99208402633667, "Pretrain/Loss (Raw)": 2.1029229164123535, "Pretrain/Step": 17793, "Pretrain/Step Time": 8.49164311401546} +{"Pretrain/Learning Rate": 5.872901149979932e-07, "Pretrain/Loss": 1.9958858489990234, "Pretrain/Loss (Raw)": 2.2308707237243652, "Pretrain/Step": 17794, "Pretrain/Step Time": 8.491158686578274} +{"Pretrain/Learning Rate": 5.863757213178306e-07, "Pretrain/Loss": 1.9965234994888306, "Pretrain/Loss (Raw)": 1.9687570333480835, "Pretrain/Step": 17795, "Pretrain/Step Time": 8.494137518107891} +{"Pretrain/Learning Rate": 5.854620315873139e-07, "Pretrain/Loss": 1.9971837997436523, "Pretrain/Loss (Raw)": 1.8909269571304321, "Pretrain/Step": 17796, "Pretrain/Step Time": 8.495196543633938} +{"Pretrain/Learning Rate": 5.845490458327856e-07, "Pretrain/Loss": 1.9976414442062378, "Pretrain/Loss (Raw)": 1.973859429359436, "Pretrain/Step": 17797, "Pretrain/Step Time": 8.493116760626435} +{"Pretrain/Learning Rate": 5.836367640805751e-07, "Pretrain/Loss": 1.9999480247497559, "Pretrain/Loss (Raw)": 2.2270307540893555, "Pretrain/Step": 17798, "Pretrain/Step Time": 8.499963976442814} +{"Pretrain/Learning Rate": 5.82725186356986e-07, "Pretrain/Loss": 2.000488758087158, "Pretrain/Loss (Raw)": 1.9548333883285522, "Pretrain/Step": 17799, "Pretrain/Step Time": 8.506248496472836} +{"Pretrain/Learning Rate": 5.81814312688303e-07, "Pretrain/Loss": 2.0018768310546875, "Pretrain/Loss (Raw)": 2.0637311935424805, "Pretrain/Step": 17800, "Pretrain/Step Time": 8.500457994639874} +{"Pretrain/Learning Rate": 5.809041431007939e-07, "Pretrain/Loss": 2.0013651847839355, "Pretrain/Loss (Raw)": 2.058424949645996, "Pretrain/Step": 17801, "Pretrain/Step Time": 8.50220924243331} +{"Pretrain/Learning Rate": 5.799946776206933e-07, "Pretrain/Loss": 2.0015811920166016, "Pretrain/Loss (Raw)": 1.94762122631073, "Pretrain/Step": 17802, "Pretrain/Step Time": 8.499403702095151} +{"Pretrain/Learning Rate": 5.790859162742357e-07, "Pretrain/Loss": 2.002495765686035, "Pretrain/Loss (Raw)": 2.081939458847046, "Pretrain/Step": 17803, "Pretrain/Step Time": 8.500441869720817} +{"Pretrain/Learning Rate": 5.781778590876197e-07, "Pretrain/Loss": 2.0026426315307617, "Pretrain/Loss (Raw)": 2.054903745651245, "Pretrain/Step": 17804, "Pretrain/Step Time": 8.501091266050935} +{"Pretrain/Learning Rate": 5.77270506087027e-07, "Pretrain/Loss": 1.9997470378875732, "Pretrain/Loss (Raw)": 1.719626545906067, "Pretrain/Step": 17805, "Pretrain/Step Time": 8.498837359249592} +{"Pretrain/Learning Rate": 5.763638572986258e-07, "Pretrain/Loss": 2.0003790855407715, "Pretrain/Loss (Raw)": 2.087501287460327, "Pretrain/Step": 17806, "Pretrain/Step Time": 8.496034344658256} +{"Pretrain/Learning Rate": 5.754579127485505e-07, "Pretrain/Loss": 2.0004167556762695, "Pretrain/Loss (Raw)": 1.8469690084457397, "Pretrain/Step": 17807, "Pretrain/Step Time": 8.498415675014257} +{"Pretrain/Learning Rate": 5.74552672462933e-07, "Pretrain/Loss": 1.9975597858428955, "Pretrain/Loss (Raw)": 1.7998089790344238, "Pretrain/Step": 17808, "Pretrain/Step Time": 8.498242016881704} +{"Pretrain/Learning Rate": 5.736481364678664e-07, "Pretrain/Loss": 1.9996941089630127, "Pretrain/Loss (Raw)": 2.0279924869537354, "Pretrain/Step": 17809, "Pretrain/Step Time": 8.494902856647968} +{"Pretrain/Learning Rate": 5.727443047894382e-07, "Pretrain/Loss": 2.000385046005249, "Pretrain/Loss (Raw)": 2.0254297256469727, "Pretrain/Step": 17810, "Pretrain/Step Time": 8.491221856325865} +{"Pretrain/Learning Rate": 5.718411774537081e-07, "Pretrain/Loss": 1.999428629875183, "Pretrain/Loss (Raw)": 1.8417333364486694, "Pretrain/Step": 17811, "Pretrain/Step Time": 8.492682930082083} +{"Pretrain/Learning Rate": 5.709387544867162e-07, "Pretrain/Loss": 1.9965012073516846, "Pretrain/Loss (Raw)": 1.817068338394165, "Pretrain/Step": 17812, "Pretrain/Step Time": 8.499766876921058} +{"Pretrain/Learning Rate": 5.700370359144836e-07, "Pretrain/Loss": 1.9946430921554565, "Pretrain/Loss (Raw)": 1.7062186002731323, "Pretrain/Step": 17813, "Pretrain/Step Time": 8.495347423478961} +{"Pretrain/Learning Rate": 5.691360217630115e-07, "Pretrain/Loss": 1.9971275329589844, "Pretrain/Loss (Raw)": 2.322706699371338, "Pretrain/Step": 17814, "Pretrain/Step Time": 8.496101627126336} +{"Pretrain/Learning Rate": 5.682357120582793e-07, "Pretrain/Loss": 1.9953625202178955, "Pretrain/Loss (Raw)": 1.7757891416549683, "Pretrain/Step": 17815, "Pretrain/Step Time": 8.500684957951307} +{"Pretrain/Learning Rate": 5.673361068262495e-07, "Pretrain/Loss": 1.9963645935058594, "Pretrain/Loss (Raw)": 2.098572015762329, "Pretrain/Step": 17816, "Pretrain/Step Time": 8.494992451742291} +{"Pretrain/Learning Rate": 5.664372060928569e-07, "Pretrain/Loss": 1.9951505661010742, "Pretrain/Loss (Raw)": 1.7102630138397217, "Pretrain/Step": 17817, "Pretrain/Step Time": 8.498542031273246} +{"Pretrain/Learning Rate": 5.655390098840224e-07, "Pretrain/Loss": 1.9963321685791016, "Pretrain/Loss (Raw)": 2.117602586746216, "Pretrain/Step": 17818, "Pretrain/Step Time": 8.498934160917997} +{"Pretrain/Learning Rate": 5.646415182256448e-07, "Pretrain/Loss": 1.9968321323394775, "Pretrain/Loss (Raw)": 1.9616801738739014, "Pretrain/Step": 17819, "Pretrain/Step Time": 8.500473376363516} +{"Pretrain/Learning Rate": 5.637447311436061e-07, "Pretrain/Loss": 1.9971983432769775, "Pretrain/Loss (Raw)": 1.9557061195373535, "Pretrain/Step": 17820, "Pretrain/Step Time": 8.49845253303647} +{"Pretrain/Learning Rate": 5.628486486637608e-07, "Pretrain/Loss": 1.9961214065551758, "Pretrain/Loss (Raw)": 1.9218651056289673, "Pretrain/Step": 17821, "Pretrain/Step Time": 8.498958442360163} +{"Pretrain/Learning Rate": 5.619532708119463e-07, "Pretrain/Loss": 1.995644450187683, "Pretrain/Loss (Raw)": 1.897342324256897, "Pretrain/Step": 17822, "Pretrain/Step Time": 8.49815796688199} +{"Pretrain/Learning Rate": 5.610585976139838e-07, "Pretrain/Loss": 1.9978713989257812, "Pretrain/Loss (Raw)": 2.28775954246521, "Pretrain/Step": 17823, "Pretrain/Step Time": 8.496010635048151} +{"Pretrain/Learning Rate": 5.601646290956664e-07, "Pretrain/Loss": 1.9950263500213623, "Pretrain/Loss (Raw)": 1.7003995180130005, "Pretrain/Step": 17824, "Pretrain/Step Time": 8.495681054890156} +{"Pretrain/Learning Rate": 5.592713652827736e-07, "Pretrain/Loss": 1.9964208602905273, "Pretrain/Loss (Raw)": 1.9895011186599731, "Pretrain/Step": 17825, "Pretrain/Step Time": 8.492289448156953} +{"Pretrain/Learning Rate": 5.583788062010626e-07, "Pretrain/Loss": 1.9954007863998413, "Pretrain/Loss (Raw)": 1.8737468719482422, "Pretrain/Step": 17826, "Pretrain/Step Time": 8.494215406477451} +{"Pretrain/Learning Rate": 5.574869518762654e-07, "Pretrain/Loss": 1.9974098205566406, "Pretrain/Loss (Raw)": 2.0535197257995605, "Pretrain/Step": 17827, "Pretrain/Step Time": 8.483256377279758} +{"Pretrain/Learning Rate": 5.565958023341034e-07, "Pretrain/Loss": 1.9979876279830933, "Pretrain/Loss (Raw)": 2.203428268432617, "Pretrain/Step": 17828, "Pretrain/Step Time": 8.49144921079278} +{"Pretrain/Learning Rate": 5.557053576002668e-07, "Pretrain/Loss": 1.995632529258728, "Pretrain/Loss (Raw)": 1.8491090536117554, "Pretrain/Step": 17829, "Pretrain/Step Time": 8.491062553599477} +{"Pretrain/Learning Rate": 5.548156177004382e-07, "Pretrain/Loss": 1.9953131675720215, "Pretrain/Loss (Raw)": 1.7905080318450928, "Pretrain/Step": 17830, "Pretrain/Step Time": 8.490839866921306} +{"Pretrain/Learning Rate": 5.53926582660269e-07, "Pretrain/Loss": 1.9959229230880737, "Pretrain/Loss (Raw)": 1.9680402278900146, "Pretrain/Step": 17831, "Pretrain/Step Time": 8.4928806014359} +{"Pretrain/Learning Rate": 5.53038252505389e-07, "Pretrain/Loss": 1.9975346326828003, "Pretrain/Loss (Raw)": 2.0614118576049805, "Pretrain/Step": 17832, "Pretrain/Step Time": 8.493532521650195} +{"Pretrain/Learning Rate": 5.521506272614218e-07, "Pretrain/Loss": 1.9959561824798584, "Pretrain/Loss (Raw)": 1.93804132938385, "Pretrain/Step": 17833, "Pretrain/Step Time": 8.490016942843795} +{"Pretrain/Learning Rate": 5.512637069539528e-07, "Pretrain/Loss": 1.998403549194336, "Pretrain/Loss (Raw)": 2.212671995162964, "Pretrain/Step": 17834, "Pretrain/Step Time": 8.491063257679343} +{"Pretrain/Learning Rate": 5.503774916085613e-07, "Pretrain/Loss": 1.99833345413208, "Pretrain/Loss (Raw)": 1.9804219007492065, "Pretrain/Step": 17835, "Pretrain/Step Time": 8.490753984078765} +{"Pretrain/Learning Rate": 5.494919812507993e-07, "Pretrain/Loss": 1.9990955591201782, "Pretrain/Loss (Raw)": 1.957071304321289, "Pretrain/Step": 17836, "Pretrain/Step Time": 8.495550379157066} +{"Pretrain/Learning Rate": 5.48607175906199e-07, "Pretrain/Loss": 1.9982134103775024, "Pretrain/Loss (Raw)": 2.002591609954834, "Pretrain/Step": 17837, "Pretrain/Step Time": 8.496645517647266} +{"Pretrain/Learning Rate": 5.477230756002732e-07, "Pretrain/Loss": 1.9906082153320312, "Pretrain/Loss (Raw)": 1.4699254035949707, "Pretrain/Step": 17838, "Pretrain/Step Time": 8.494765752926469} +{"Pretrain/Learning Rate": 5.468396803585157e-07, "Pretrain/Loss": 1.9871933460235596, "Pretrain/Loss (Raw)": 1.5568588972091675, "Pretrain/Step": 17839, "Pretrain/Step Time": 8.493683094158769} +{"Pretrain/Learning Rate": 5.459569902063977e-07, "Pretrain/Loss": 1.988813042640686, "Pretrain/Loss (Raw)": 2.233445167541504, "Pretrain/Step": 17840, "Pretrain/Step Time": 8.493566336110234} +{"Pretrain/Learning Rate": 5.45075005169371e-07, "Pretrain/Loss": 1.9905152320861816, "Pretrain/Loss (Raw)": 2.11082124710083, "Pretrain/Step": 17841, "Pretrain/Step Time": 8.489638824015856} +{"Pretrain/Learning Rate": 5.441937252728651e-07, "Pretrain/Loss": 1.989919900894165, "Pretrain/Loss (Raw)": 1.739395260810852, "Pretrain/Step": 17842, "Pretrain/Step Time": 8.48526668176055} +{"Pretrain/Learning Rate": 5.433131505422961e-07, "Pretrain/Loss": 1.9895331859588623, "Pretrain/Loss (Raw)": 1.8687660694122314, "Pretrain/Step": 17843, "Pretrain/Step Time": 8.490843627601862} +{"Pretrain/Learning Rate": 5.424332810030491e-07, "Pretrain/Loss": 1.9897441864013672, "Pretrain/Loss (Raw)": 2.1214094161987305, "Pretrain/Step": 17844, "Pretrain/Step Time": 8.49156635813415} +{"Pretrain/Learning Rate": 5.415541166804983e-07, "Pretrain/Loss": 1.9893743991851807, "Pretrain/Loss (Raw)": 2.0346992015838623, "Pretrain/Step": 17845, "Pretrain/Step Time": 8.49099395237863} +{"Pretrain/Learning Rate": 5.406756575999899e-07, "Pretrain/Loss": 1.9873651266098022, "Pretrain/Loss (Raw)": 1.8342883586883545, "Pretrain/Step": 17846, "Pretrain/Step Time": 8.490043818950653} +{"Pretrain/Learning Rate": 5.397979037868594e-07, "Pretrain/Loss": 1.9909913539886475, "Pretrain/Loss (Raw)": 2.241779327392578, "Pretrain/Step": 17847, "Pretrain/Step Time": 8.491171972826123} +{"Pretrain/Learning Rate": 5.389208552664115e-07, "Pretrain/Loss": 1.9895399808883667, "Pretrain/Loss (Raw)": 1.8170909881591797, "Pretrain/Step": 17848, "Pretrain/Step Time": 8.492889514192939} +{"Pretrain/Learning Rate": 5.380445120639371e-07, "Pretrain/Loss": 1.9890626668930054, "Pretrain/Loss (Raw)": 1.9801815748214722, "Pretrain/Step": 17849, "Pretrain/Step Time": 8.494556065648794} +{"Pretrain/Learning Rate": 5.371688742047049e-07, "Pretrain/Loss": 1.9889240264892578, "Pretrain/Loss (Raw)": 2.1107912063598633, "Pretrain/Step": 17850, "Pretrain/Step Time": 8.490620588883758} +{"Pretrain/Learning Rate": 5.362939417139612e-07, "Pretrain/Loss": 1.9891937971115112, "Pretrain/Loss (Raw)": 1.9027745723724365, "Pretrain/Step": 17851, "Pretrain/Step Time": 8.487068308517337} +{"Pretrain/Learning Rate": 5.354197146169387e-07, "Pretrain/Loss": 1.9898678064346313, "Pretrain/Loss (Raw)": 1.8442440032958984, "Pretrain/Step": 17852, "Pretrain/Step Time": 8.49015386775136} +{"Pretrain/Learning Rate": 5.345461929388423e-07, "Pretrain/Loss": 1.991136908531189, "Pretrain/Loss (Raw)": 2.0731208324432373, "Pretrain/Step": 17853, "Pretrain/Step Time": 8.48763252608478} +{"Pretrain/Learning Rate": 5.336733767048602e-07, "Pretrain/Loss": 1.9913996458053589, "Pretrain/Loss (Raw)": 2.0239877700805664, "Pretrain/Step": 17854, "Pretrain/Step Time": 8.485549127683043} +{"Pretrain/Learning Rate": 5.328012659401582e-07, "Pretrain/Loss": 1.9916176795959473, "Pretrain/Loss (Raw)": 1.9141381978988647, "Pretrain/Step": 17855, "Pretrain/Step Time": 8.488919325172901} +{"Pretrain/Learning Rate": 5.319298606698803e-07, "Pretrain/Loss": 1.9898430109024048, "Pretrain/Loss (Raw)": 1.9455504417419434, "Pretrain/Step": 17856, "Pretrain/Step Time": 8.481307245790958} +{"Pretrain/Learning Rate": 5.310591609191589e-07, "Pretrain/Loss": 1.986545443534851, "Pretrain/Loss (Raw)": 2.023430585861206, "Pretrain/Step": 17857, "Pretrain/Step Time": 8.484306573867798} +{"Pretrain/Learning Rate": 5.301891667130937e-07, "Pretrain/Loss": 1.9859318733215332, "Pretrain/Loss (Raw)": 2.0158801078796387, "Pretrain/Step": 17858, "Pretrain/Step Time": 8.482707764953375} +{"Pretrain/Learning Rate": 5.293198780767783e-07, "Pretrain/Loss": 1.984236717224121, "Pretrain/Loss (Raw)": 1.8121156692504883, "Pretrain/Step": 17859, "Pretrain/Step Time": 8.486638074740767} +{"Pretrain/Learning Rate": 5.284512950352705e-07, "Pretrain/Loss": 1.9834294319152832, "Pretrain/Loss (Raw)": 1.8383976221084595, "Pretrain/Step": 17860, "Pretrain/Step Time": 8.484912576153874} +{"Pretrain/Learning Rate": 5.275834176136196e-07, "Pretrain/Loss": 1.9829260110855103, "Pretrain/Loss (Raw)": 1.9978325366973877, "Pretrain/Step": 17861, "Pretrain/Step Time": 8.483884781599045} +{"Pretrain/Learning Rate": 5.267162458368474e-07, "Pretrain/Loss": 1.9847617149353027, "Pretrain/Loss (Raw)": 2.202862024307251, "Pretrain/Step": 17862, "Pretrain/Step Time": 8.49076490290463} +{"Pretrain/Learning Rate": 5.258497797299616e-07, "Pretrain/Loss": 1.9827768802642822, "Pretrain/Loss (Raw)": 1.777520775794983, "Pretrain/Step": 17863, "Pretrain/Step Time": 8.493062885478139} +{"Pretrain/Learning Rate": 5.249840193179423e-07, "Pretrain/Loss": 1.9821321964263916, "Pretrain/Loss (Raw)": 2.0089480876922607, "Pretrain/Step": 17864, "Pretrain/Step Time": 8.490434654057026} +{"Pretrain/Learning Rate": 5.241189646257583e-07, "Pretrain/Loss": 1.9831863641738892, "Pretrain/Loss (Raw)": 2.05133318901062, "Pretrain/Step": 17865, "Pretrain/Step Time": 8.490568928420544} +{"Pretrain/Learning Rate": 5.232546156783452e-07, "Pretrain/Loss": 1.984037160873413, "Pretrain/Loss (Raw)": 2.0813300609588623, "Pretrain/Step": 17866, "Pretrain/Step Time": 8.492481106892228} +{"Pretrain/Learning Rate": 5.223909725006331e-07, "Pretrain/Loss": 1.9843119382858276, "Pretrain/Loss (Raw)": 1.9408546686172485, "Pretrain/Step": 17867, "Pretrain/Step Time": 8.495157973840833} +{"Pretrain/Learning Rate": 5.215280351175216e-07, "Pretrain/Loss": 1.9842890501022339, "Pretrain/Loss (Raw)": 2.014946222305298, "Pretrain/Step": 17868, "Pretrain/Step Time": 8.489923214539886} +{"Pretrain/Learning Rate": 5.206658035538936e-07, "Pretrain/Loss": 1.9838489294052124, "Pretrain/Loss (Raw)": 1.8484221696853638, "Pretrain/Step": 17869, "Pretrain/Step Time": 8.492958268150687} +{"Pretrain/Learning Rate": 5.198042778346097e-07, "Pretrain/Loss": 1.9832555055618286, "Pretrain/Loss (Raw)": 2.0307793617248535, "Pretrain/Step": 17870, "Pretrain/Step Time": 8.491920676082373} +{"Pretrain/Learning Rate": 5.18943457984511e-07, "Pretrain/Loss": 1.9827463626861572, "Pretrain/Loss (Raw)": 2.0147206783294678, "Pretrain/Step": 17871, "Pretrain/Step Time": 8.494401194155216} +{"Pretrain/Learning Rate": 5.180833440284194e-07, "Pretrain/Loss": 1.982417106628418, "Pretrain/Loss (Raw)": 1.9846410751342773, "Pretrain/Step": 17872, "Pretrain/Step Time": 8.490887980908155} +{"Pretrain/Learning Rate": 5.172239359911374e-07, "Pretrain/Loss": 1.9833914041519165, "Pretrain/Loss (Raw)": 2.1266019344329834, "Pretrain/Step": 17873, "Pretrain/Step Time": 8.489410541951656} +{"Pretrain/Learning Rate": 5.163652338974423e-07, "Pretrain/Loss": 1.9830645322799683, "Pretrain/Loss (Raw)": 2.0039875507354736, "Pretrain/Step": 17874, "Pretrain/Step Time": 8.494077542796731} +{"Pretrain/Learning Rate": 5.155072377721005e-07, "Pretrain/Loss": 1.9825475215911865, "Pretrain/Loss (Raw)": 2.0426876544952393, "Pretrain/Step": 17875, "Pretrain/Step Time": 8.492751840502024} +{"Pretrain/Learning Rate": 5.14649947639842e-07, "Pretrain/Loss": 1.9833984375, "Pretrain/Loss (Raw)": 2.0353024005889893, "Pretrain/Step": 17876, "Pretrain/Step Time": 8.495013387873769} +{"Pretrain/Learning Rate": 5.137933635253917e-07, "Pretrain/Loss": 1.9811428785324097, "Pretrain/Loss (Raw)": 1.7642048597335815, "Pretrain/Step": 17877, "Pretrain/Step Time": 8.493196863681078} +{"Pretrain/Learning Rate": 5.129374854534492e-07, "Pretrain/Loss": 1.9799840450286865, "Pretrain/Loss (Raw)": 1.848031997680664, "Pretrain/Step": 17878, "Pretrain/Step Time": 8.490856235846877} +{"Pretrain/Learning Rate": 5.120823134486918e-07, "Pretrain/Loss": 1.9786584377288818, "Pretrain/Loss (Raw)": 1.8291559219360352, "Pretrain/Step": 17879, "Pretrain/Step Time": 8.493816707283258} +{"Pretrain/Learning Rate": 5.112278475357807e-07, "Pretrain/Loss": 1.9786068201065063, "Pretrain/Loss (Raw)": 2.0531692504882812, "Pretrain/Step": 17880, "Pretrain/Step Time": 8.496300116181374} +{"Pretrain/Learning Rate": 5.103740877393459e-07, "Pretrain/Loss": 1.977412223815918, "Pretrain/Loss (Raw)": 1.859605073928833, "Pretrain/Step": 17881, "Pretrain/Step Time": 8.49388487264514} +{"Pretrain/Learning Rate": 5.095210340840151e-07, "Pretrain/Loss": 1.9774317741394043, "Pretrain/Loss (Raw)": 2.0211782455444336, "Pretrain/Step": 17882, "Pretrain/Step Time": 8.495869655162096} +{"Pretrain/Learning Rate": 5.086686865943768e-07, "Pretrain/Loss": 1.976210355758667, "Pretrain/Loss (Raw)": 1.856724500656128, "Pretrain/Step": 17883, "Pretrain/Step Time": 8.497492205351591} +{"Pretrain/Learning Rate": 5.078170452950143e-07, "Pretrain/Loss": 1.9730360507965088, "Pretrain/Loss (Raw)": 1.9330390691757202, "Pretrain/Step": 17884, "Pretrain/Step Time": 8.49564703181386} +{"Pretrain/Learning Rate": 5.069661102104828e-07, "Pretrain/Loss": 1.9708688259124756, "Pretrain/Loss (Raw)": 1.813639521598816, "Pretrain/Step": 17885, "Pretrain/Step Time": 8.492760501801968} +{"Pretrain/Learning Rate": 5.061158813653127e-07, "Pretrain/Loss": 1.9698799848556519, "Pretrain/Loss (Raw)": 2.0081515312194824, "Pretrain/Step": 17886, "Pretrain/Step Time": 8.496602484956384} +{"Pretrain/Learning Rate": 5.052663587840289e-07, "Pretrain/Loss": 1.9697265625, "Pretrain/Loss (Raw)": 2.068451404571533, "Pretrain/Step": 17887, "Pretrain/Step Time": 8.492885621264577} +{"Pretrain/Learning Rate": 5.044175424911174e-07, "Pretrain/Loss": 1.9697880744934082, "Pretrain/Loss (Raw)": 2.1083931922912598, "Pretrain/Step": 17888, "Pretrain/Step Time": 8.495670409873128} +{"Pretrain/Learning Rate": 5.035694325110613e-07, "Pretrain/Loss": 1.9716534614562988, "Pretrain/Loss (Raw)": 1.9770864248275757, "Pretrain/Step": 17889, "Pretrain/Step Time": 8.493380956351757} +{"Pretrain/Learning Rate": 5.027220288683105e-07, "Pretrain/Loss": 1.9703640937805176, "Pretrain/Loss (Raw)": 1.9246777296066284, "Pretrain/Step": 17890, "Pretrain/Step Time": 8.491588285192847} +{"Pretrain/Learning Rate": 5.018753315872981e-07, "Pretrain/Loss": 1.9717081785202026, "Pretrain/Loss (Raw)": 2.1656250953674316, "Pretrain/Step": 17891, "Pretrain/Step Time": 8.496613174676895} +{"Pretrain/Learning Rate": 5.010293406924438e-07, "Pretrain/Loss": 1.971400499343872, "Pretrain/Loss (Raw)": 1.8925962448120117, "Pretrain/Step": 17892, "Pretrain/Step Time": 8.49645853228867} +{"Pretrain/Learning Rate": 5.001840562081362e-07, "Pretrain/Loss": 1.971482753753662, "Pretrain/Loss (Raw)": 1.8897415399551392, "Pretrain/Step": 17893, "Pretrain/Step Time": 8.497791238129139} +{"Pretrain/Learning Rate": 4.993394781587529e-07, "Pretrain/Loss": 1.9692630767822266, "Pretrain/Loss (Raw)": 1.9540088176727295, "Pretrain/Step": 17894, "Pretrain/Step Time": 8.489709487184882} +{"Pretrain/Learning Rate": 4.984956065686414e-07, "Pretrain/Loss": 1.9683842658996582, "Pretrain/Loss (Raw)": 1.9763199090957642, "Pretrain/Step": 17895, "Pretrain/Step Time": 8.489225907251239} +{"Pretrain/Learning Rate": 4.976524414621375e-07, "Pretrain/Loss": 1.9686862230300903, "Pretrain/Loss (Raw)": 2.0899059772491455, "Pretrain/Step": 17896, "Pretrain/Step Time": 8.491967948153615} +{"Pretrain/Learning Rate": 4.968099828635525e-07, "Pretrain/Loss": 1.967836856842041, "Pretrain/Loss (Raw)": 1.8965160846710205, "Pretrain/Step": 17897, "Pretrain/Step Time": 8.492850631475449} +{"Pretrain/Learning Rate": 4.959682307971753e-07, "Pretrain/Loss": 1.967747449874878, "Pretrain/Loss (Raw)": 1.8233195543289185, "Pretrain/Step": 17898, "Pretrain/Step Time": 8.493603114038706} +{"Pretrain/Learning Rate": 4.951271852872835e-07, "Pretrain/Loss": 1.9683133363723755, "Pretrain/Loss (Raw)": 1.9804699420928955, "Pretrain/Step": 17899, "Pretrain/Step Time": 8.49245966784656} +{"Pretrain/Learning Rate": 4.942868463581246e-07, "Pretrain/Loss": 1.9677865505218506, "Pretrain/Loss (Raw)": 1.9367483854293823, "Pretrain/Step": 17900, "Pretrain/Step Time": 8.490486718714237} +{"Pretrain/Learning Rate": 4.934472140339264e-07, "Pretrain/Loss": 1.9685170650482178, "Pretrain/Loss (Raw)": 2.0678482055664062, "Pretrain/Step": 17901, "Pretrain/Step Time": 8.48702254332602} +{"Pretrain/Learning Rate": 4.926082883389027e-07, "Pretrain/Loss": 1.968059778213501, "Pretrain/Loss (Raw)": 1.9715327024459839, "Pretrain/Step": 17902, "Pretrain/Step Time": 8.484874442219734} +{"Pretrain/Learning Rate": 4.917700692972427e-07, "Pretrain/Loss": 1.9694082736968994, "Pretrain/Loss (Raw)": 2.1904938220977783, "Pretrain/Step": 17903, "Pretrain/Step Time": 8.483072204515338} +{"Pretrain/Learning Rate": 4.909325569331158e-07, "Pretrain/Loss": 1.9713740348815918, "Pretrain/Loss (Raw)": 2.32021427154541, "Pretrain/Step": 17904, "Pretrain/Step Time": 8.486619714647532} +{"Pretrain/Learning Rate": 4.900957512706722e-07, "Pretrain/Loss": 1.9729666709899902, "Pretrain/Loss (Raw)": 2.180264949798584, "Pretrain/Step": 17905, "Pretrain/Step Time": 8.486058447510004} +{"Pretrain/Learning Rate": 4.892596523340343e-07, "Pretrain/Loss": 1.9704340696334839, "Pretrain/Loss (Raw)": 1.689664602279663, "Pretrain/Step": 17906, "Pretrain/Step Time": 8.477849025279284} +{"Pretrain/Learning Rate": 4.884242601473216e-07, "Pretrain/Loss": 1.9707436561584473, "Pretrain/Loss (Raw)": 2.023306131362915, "Pretrain/Step": 17907, "Pretrain/Step Time": 8.48121690377593} +{"Pretrain/Learning Rate": 4.875895747346121e-07, "Pretrain/Loss": 1.972151517868042, "Pretrain/Loss (Raw)": 2.0130457878112793, "Pretrain/Step": 17908, "Pretrain/Step Time": 8.48193884268403} +{"Pretrain/Learning Rate": 4.867555961199782e-07, "Pretrain/Loss": 1.9768178462982178, "Pretrain/Loss (Raw)": 2.251368284225464, "Pretrain/Step": 17909, "Pretrain/Step Time": 8.484409151598811} +{"Pretrain/Learning Rate": 4.859223243274647e-07, "Pretrain/Loss": 1.9793765544891357, "Pretrain/Loss (Raw)": 2.276304006576538, "Pretrain/Step": 17910, "Pretrain/Step Time": 8.481475587934256} +{"Pretrain/Learning Rate": 4.850897593811021e-07, "Pretrain/Loss": 1.9752578735351562, "Pretrain/Loss (Raw)": 1.7781368494033813, "Pretrain/Step": 17911, "Pretrain/Step Time": 8.47713641449809} +{"Pretrain/Learning Rate": 4.842579013048937e-07, "Pretrain/Loss": 1.9770588874816895, "Pretrain/Loss (Raw)": 2.048887252807617, "Pretrain/Step": 17912, "Pretrain/Step Time": 8.47802328504622} +{"Pretrain/Learning Rate": 4.834267501228229e-07, "Pretrain/Loss": 1.9785213470458984, "Pretrain/Loss (Raw)": 2.0283305644989014, "Pretrain/Step": 17913, "Pretrain/Step Time": 8.478268668055534} +{"Pretrain/Learning Rate": 4.82596305858865e-07, "Pretrain/Loss": 1.9769649505615234, "Pretrain/Loss (Raw)": 1.9234411716461182, "Pretrain/Step": 17914, "Pretrain/Step Time": 8.48065884783864} +{"Pretrain/Learning Rate": 4.817665685369538e-07, "Pretrain/Loss": 1.976900339126587, "Pretrain/Loss (Raw)": 1.8954976797103882, "Pretrain/Step": 17915, "Pretrain/Step Time": 8.475750673562288} +{"Pretrain/Learning Rate": 4.8093753818102e-07, "Pretrain/Loss": 1.9787266254425049, "Pretrain/Loss (Raw)": 2.129506826400757, "Pretrain/Step": 17916, "Pretrain/Step Time": 8.478071747347713} +{"Pretrain/Learning Rate": 4.801092148149722e-07, "Pretrain/Loss": 1.979715347290039, "Pretrain/Loss (Raw)": 2.0815958976745605, "Pretrain/Step": 17917, "Pretrain/Step Time": 8.479237293824553} +{"Pretrain/Learning Rate": 4.79281598462683e-07, "Pretrain/Loss": 1.9775145053863525, "Pretrain/Loss (Raw)": 1.960166573524475, "Pretrain/Step": 17918, "Pretrain/Step Time": 8.47943838313222} +{"Pretrain/Learning Rate": 4.784546891480279e-07, "Pretrain/Loss": 1.979443073272705, "Pretrain/Loss (Raw)": 2.105957269668579, "Pretrain/Step": 17919, "Pretrain/Step Time": 8.479575810953975} +{"Pretrain/Learning Rate": 4.776284868948433e-07, "Pretrain/Loss": 1.9782994985580444, "Pretrain/Loss (Raw)": 1.8822427988052368, "Pretrain/Step": 17920, "Pretrain/Step Time": 8.479296183213592} +{"Pretrain/Learning Rate": 4.768029917269545e-07, "Pretrain/Loss": 1.9769337177276611, "Pretrain/Loss (Raw)": 1.9280949831008911, "Pretrain/Step": 17921, "Pretrain/Step Time": 8.481508953496814} +{"Pretrain/Learning Rate": 4.7597820366816484e-07, "Pretrain/Loss": 1.9758515357971191, "Pretrain/Loss (Raw)": 2.092350959777832, "Pretrain/Step": 17922, "Pretrain/Step Time": 8.478082878515124} +{"Pretrain/Learning Rate": 4.7515412274225236e-07, "Pretrain/Loss": 1.9759305715560913, "Pretrain/Loss (Raw)": 1.9788655042648315, "Pretrain/Step": 17923, "Pretrain/Step Time": 8.481576349586248} +{"Pretrain/Learning Rate": 4.7433074897298426e-07, "Pretrain/Loss": 1.9754613637924194, "Pretrain/Loss (Raw)": 1.8308706283569336, "Pretrain/Step": 17924, "Pretrain/Step Time": 8.475659932941198} +{"Pretrain/Learning Rate": 4.7350808238409703e-07, "Pretrain/Loss": 1.9748789072036743, "Pretrain/Loss (Raw)": 1.8993040323257446, "Pretrain/Step": 17925, "Pretrain/Step Time": 8.481746315956116} +{"Pretrain/Learning Rate": 4.7268612299931623e-07, "Pretrain/Loss": 1.9718061685562134, "Pretrain/Loss (Raw)": 1.8337253332138062, "Pretrain/Step": 17926, "Pretrain/Step Time": 8.478516744449735} +{"Pretrain/Learning Rate": 4.718648708423423e-07, "Pretrain/Loss": 1.9718425273895264, "Pretrain/Loss (Raw)": 1.9594781398773193, "Pretrain/Step": 17927, "Pretrain/Step Time": 8.466735571622849} +{"Pretrain/Learning Rate": 4.7104432593685077e-07, "Pretrain/Loss": 1.9747400283813477, "Pretrain/Loss (Raw)": 2.434610605239868, "Pretrain/Step": 17928, "Pretrain/Step Time": 8.475784312933683} +{"Pretrain/Learning Rate": 4.7022448830650603e-07, "Pretrain/Loss": 1.9736822843551636, "Pretrain/Loss (Raw)": 1.9230409860610962, "Pretrain/Step": 17929, "Pretrain/Step Time": 8.475393710657954} +{"Pretrain/Learning Rate": 4.694053579749447e-07, "Pretrain/Loss": 1.972319483757019, "Pretrain/Loss (Raw)": 1.7731828689575195, "Pretrain/Step": 17930, "Pretrain/Step Time": 8.472400575876236} +{"Pretrain/Learning Rate": 4.6858693496578674e-07, "Pretrain/Loss": 1.9731475114822388, "Pretrain/Loss (Raw)": 2.187932014465332, "Pretrain/Step": 17931, "Pretrain/Step Time": 8.471766743808985} +{"Pretrain/Learning Rate": 4.6776921930263284e-07, "Pretrain/Loss": 1.972449541091919, "Pretrain/Loss (Raw)": 1.9655535221099854, "Pretrain/Step": 17932, "Pretrain/Step Time": 8.477073434740305} +{"Pretrain/Learning Rate": 4.6695221100905574e-07, "Pretrain/Loss": 1.9734410047531128, "Pretrain/Loss (Raw)": 1.8465399742126465, "Pretrain/Step": 17933, "Pretrain/Step Time": 8.476671442389488} +{"Pretrain/Learning Rate": 4.661359101086199e-07, "Pretrain/Loss": 1.9732885360717773, "Pretrain/Loss (Raw)": 2.067988872528076, "Pretrain/Step": 17934, "Pretrain/Step Time": 8.476461699232459} +{"Pretrain/Learning Rate": 4.653203166248593e-07, "Pretrain/Loss": 1.9751592874526978, "Pretrain/Loss (Raw)": 2.086411714553833, "Pretrain/Step": 17935, "Pretrain/Step Time": 8.474334383383393} +{"Pretrain/Learning Rate": 4.6450543058129125e-07, "Pretrain/Loss": 1.975629210472107, "Pretrain/Loss (Raw)": 1.8599729537963867, "Pretrain/Step": 17936, "Pretrain/Step Time": 8.472308550029993} +{"Pretrain/Learning Rate": 4.636912520014164e-07, "Pretrain/Loss": 1.9757537841796875, "Pretrain/Loss (Raw)": 2.0439229011535645, "Pretrain/Step": 17937, "Pretrain/Step Time": 8.47372056543827} +{"Pretrain/Learning Rate": 4.628777809087048e-07, "Pretrain/Loss": 1.976515531539917, "Pretrain/Loss (Raw)": 2.1229403018951416, "Pretrain/Step": 17938, "Pretrain/Step Time": 8.481242360547185} +{"Pretrain/Learning Rate": 4.6206501732661277e-07, "Pretrain/Loss": 1.9771463871002197, "Pretrain/Loss (Raw)": 1.922474980354309, "Pretrain/Step": 17939, "Pretrain/Step Time": 8.478388626128435} +{"Pretrain/Learning Rate": 4.6125296127857984e-07, "Pretrain/Loss": 1.9777624607086182, "Pretrain/Loss (Raw)": 1.8959373235702515, "Pretrain/Step": 17940, "Pretrain/Step Time": 8.47261449880898} +{"Pretrain/Learning Rate": 4.6044161278801787e-07, "Pretrain/Loss": 1.9786579608917236, "Pretrain/Loss (Raw)": 1.8208346366882324, "Pretrain/Step": 17941, "Pretrain/Step Time": 8.481814647093415} +{"Pretrain/Learning Rate": 4.5963097187832205e-07, "Pretrain/Loss": 1.975205659866333, "Pretrain/Loss (Raw)": 1.880812168121338, "Pretrain/Step": 17942, "Pretrain/Step Time": 8.479999657720327} +{"Pretrain/Learning Rate": 4.5882103857287086e-07, "Pretrain/Loss": 1.9765809774398804, "Pretrain/Loss (Raw)": 1.9518355131149292, "Pretrain/Step": 17943, "Pretrain/Step Time": 8.475947257131338} +{"Pretrain/Learning Rate": 4.5801181289501225e-07, "Pretrain/Loss": 1.976517915725708, "Pretrain/Loss (Raw)": 2.090500593185425, "Pretrain/Step": 17944, "Pretrain/Step Time": 8.480315400287509} +{"Pretrain/Learning Rate": 4.572032948680804e-07, "Pretrain/Loss": 1.9782915115356445, "Pretrain/Loss (Raw)": 1.937278389930725, "Pretrain/Step": 17945, "Pretrain/Step Time": 8.477122073993087} +{"Pretrain/Learning Rate": 4.5639548451539283e-07, "Pretrain/Loss": 1.9760332107543945, "Pretrain/Loss (Raw)": 1.828546404838562, "Pretrain/Step": 17946, "Pretrain/Step Time": 8.479377079755068} +{"Pretrain/Learning Rate": 4.5558838186023636e-07, "Pretrain/Loss": 1.9764432907104492, "Pretrain/Loss (Raw)": 2.0141589641571045, "Pretrain/Step": 17947, "Pretrain/Step Time": 8.478126371279359} +{"Pretrain/Learning Rate": 4.547819869258896e-07, "Pretrain/Loss": 1.9742244482040405, "Pretrain/Loss (Raw)": 1.6717146635055542, "Pretrain/Step": 17948, "Pretrain/Step Time": 8.481422875076532} +{"Pretrain/Learning Rate": 4.5397629973560064e-07, "Pretrain/Loss": 1.9746304750442505, "Pretrain/Loss (Raw)": 1.9738308191299438, "Pretrain/Step": 17949, "Pretrain/Step Time": 8.48415040411055} +{"Pretrain/Learning Rate": 4.5317132031259814e-07, "Pretrain/Loss": 1.9762799739837646, "Pretrain/Loss (Raw)": 2.108477830886841, "Pretrain/Step": 17950, "Pretrain/Step Time": 8.48553579673171} +{"Pretrain/Learning Rate": 4.523670486800996e-07, "Pretrain/Loss": 1.9720232486724854, "Pretrain/Loss (Raw)": 1.7428865432739258, "Pretrain/Step": 17951, "Pretrain/Step Time": 8.487066712230444} +{"Pretrain/Learning Rate": 4.515634848612893e-07, "Pretrain/Loss": 1.9743807315826416, "Pretrain/Loss (Raw)": 2.002164125442505, "Pretrain/Step": 17952, "Pretrain/Step Time": 8.485146651044488} +{"Pretrain/Learning Rate": 4.507606288793431e-07, "Pretrain/Loss": 1.97505521774292, "Pretrain/Loss (Raw)": 2.0758368968963623, "Pretrain/Step": 17953, "Pretrain/Step Time": 8.48467037640512} +{"Pretrain/Learning Rate": 4.499584807574064e-07, "Pretrain/Loss": 1.9762523174285889, "Pretrain/Loss (Raw)": 2.0269861221313477, "Pretrain/Step": 17954, "Pretrain/Step Time": 8.485359605401754} +{"Pretrain/Learning Rate": 4.4915704051861073e-07, "Pretrain/Loss": 1.9749488830566406, "Pretrain/Loss (Raw)": 1.8866581916809082, "Pretrain/Step": 17955, "Pretrain/Step Time": 8.490744607523084} +{"Pretrain/Learning Rate": 4.483563081860653e-07, "Pretrain/Loss": 1.9736052751541138, "Pretrain/Loss (Raw)": 2.031463146209717, "Pretrain/Step": 17956, "Pretrain/Step Time": 8.4844921939075} +{"Pretrain/Learning Rate": 4.475562837828573e-07, "Pretrain/Loss": 1.9752986431121826, "Pretrain/Loss (Raw)": 2.0658605098724365, "Pretrain/Step": 17957, "Pretrain/Step Time": 8.488580510020256} +{"Pretrain/Learning Rate": 4.4675696733205705e-07, "Pretrain/Loss": 1.9776362180709839, "Pretrain/Loss (Raw)": 2.089719295501709, "Pretrain/Step": 17958, "Pretrain/Step Time": 8.486329857259989} +{"Pretrain/Learning Rate": 4.459583588567101e-07, "Pretrain/Loss": 1.9773786067962646, "Pretrain/Loss (Raw)": 1.9350590705871582, "Pretrain/Step": 17959, "Pretrain/Step Time": 8.488086028024554} +{"Pretrain/Learning Rate": 4.451604583798424e-07, "Pretrain/Loss": 1.977897047996521, "Pretrain/Loss (Raw)": 2.1277780532836914, "Pretrain/Step": 17960, "Pretrain/Step Time": 8.486194908618927} +{"Pretrain/Learning Rate": 4.4436326592446343e-07, "Pretrain/Loss": 1.977583885192871, "Pretrain/Loss (Raw)": 1.897952675819397, "Pretrain/Step": 17961, "Pretrain/Step Time": 8.487573567777872} +{"Pretrain/Learning Rate": 4.4356678151355747e-07, "Pretrain/Loss": 1.9751653671264648, "Pretrain/Loss (Raw)": 1.9031105041503906, "Pretrain/Step": 17962, "Pretrain/Step Time": 8.485433736816049} +{"Pretrain/Learning Rate": 4.4277100517009785e-07, "Pretrain/Loss": 1.974928379058838, "Pretrain/Loss (Raw)": 1.9500747919082642, "Pretrain/Step": 17963, "Pretrain/Step Time": 8.488149967044592} +{"Pretrain/Learning Rate": 4.4197593691702176e-07, "Pretrain/Loss": 1.9742944240570068, "Pretrain/Loss (Raw)": 1.8759323358535767, "Pretrain/Step": 17964, "Pretrain/Step Time": 8.484649650752544} +{"Pretrain/Learning Rate": 4.4118157677725536e-07, "Pretrain/Loss": 1.973414659500122, "Pretrain/Loss (Raw)": 1.8899869918823242, "Pretrain/Step": 17965, "Pretrain/Step Time": 8.483856601640582} +{"Pretrain/Learning Rate": 4.4038792477370803e-07, "Pretrain/Loss": 1.9773774147033691, "Pretrain/Loss (Raw)": 1.9771531820297241, "Pretrain/Step": 17966, "Pretrain/Step Time": 8.484702728688717} +{"Pretrain/Learning Rate": 4.3959498092925877e-07, "Pretrain/Loss": 1.9806443452835083, "Pretrain/Loss (Raw)": 1.975006103515625, "Pretrain/Step": 17967, "Pretrain/Step Time": 8.485245607793331} +{"Pretrain/Learning Rate": 4.3880274526677535e-07, "Pretrain/Loss": 1.9770246744155884, "Pretrain/Loss (Raw)": 1.7701363563537598, "Pretrain/Step": 17968, "Pretrain/Step Time": 8.485023498535156} +{"Pretrain/Learning Rate": 4.380112178091006e-07, "Pretrain/Loss": 1.9765393733978271, "Pretrain/Loss (Raw)": 2.0487194061279297, "Pretrain/Step": 17969, "Pretrain/Step Time": 8.48638223670423} +{"Pretrain/Learning Rate": 4.3722039857905794e-07, "Pretrain/Loss": 1.9778772592544556, "Pretrain/Loss (Raw)": 1.910642147064209, "Pretrain/Step": 17970, "Pretrain/Step Time": 8.488903855904937} +{"Pretrain/Learning Rate": 4.364302875994486e-07, "Pretrain/Loss": 1.9795572757720947, "Pretrain/Loss (Raw)": 2.0838024616241455, "Pretrain/Step": 17971, "Pretrain/Step Time": 8.486205957829952} +{"Pretrain/Learning Rate": 4.3564088489305434e-07, "Pretrain/Loss": 1.9772275686264038, "Pretrain/Loss (Raw)": 1.8231971263885498, "Pretrain/Step": 17972, "Pretrain/Step Time": 8.479350186884403} +{"Pretrain/Learning Rate": 4.3485219048264304e-07, "Pretrain/Loss": 1.9759405851364136, "Pretrain/Loss (Raw)": 1.8699724674224854, "Pretrain/Step": 17973, "Pretrain/Step Time": 8.479345181956887} +{"Pretrain/Learning Rate": 4.340642043909493e-07, "Pretrain/Loss": 1.9761265516281128, "Pretrain/Loss (Raw)": 1.8580944538116455, "Pretrain/Step": 17974, "Pretrain/Step Time": 8.484615312889218} +{"Pretrain/Learning Rate": 4.3327692664069386e-07, "Pretrain/Loss": 1.972977876663208, "Pretrain/Loss (Raw)": 1.8387397527694702, "Pretrain/Step": 17975, "Pretrain/Step Time": 8.484513206407428} +{"Pretrain/Learning Rate": 4.324903572545808e-07, "Pretrain/Loss": 1.9746896028518677, "Pretrain/Loss (Raw)": 2.0361945629119873, "Pretrain/Step": 17976, "Pretrain/Step Time": 8.48552636988461} +{"Pretrain/Learning Rate": 4.317044962552891e-07, "Pretrain/Loss": 1.9743494987487793, "Pretrain/Loss (Raw)": 1.9366395473480225, "Pretrain/Step": 17977, "Pretrain/Step Time": 8.484775725752115} +{"Pretrain/Learning Rate": 4.309193436654813e-07, "Pretrain/Loss": 1.9727137088775635, "Pretrain/Loss (Raw)": 1.9014219045639038, "Pretrain/Step": 17978, "Pretrain/Step Time": 8.488342637196183} +{"Pretrain/Learning Rate": 4.3013489950779195e-07, "Pretrain/Loss": 1.9741686582565308, "Pretrain/Loss (Raw)": 2.089010000228882, "Pretrain/Step": 17979, "Pretrain/Step Time": 8.490068471059203} +{"Pretrain/Learning Rate": 4.293511638048447e-07, "Pretrain/Loss": 1.9760555028915405, "Pretrain/Loss (Raw)": 2.085756540298462, "Pretrain/Step": 17980, "Pretrain/Step Time": 8.485743397846818} +{"Pretrain/Learning Rate": 4.285681365792327e-07, "Pretrain/Loss": 1.9734280109405518, "Pretrain/Loss (Raw)": 1.7367969751358032, "Pretrain/Step": 17981, "Pretrain/Step Time": 8.491751929745078} +{"Pretrain/Learning Rate": 4.2778581785353765e-07, "Pretrain/Loss": 1.9715633392333984, "Pretrain/Loss (Raw)": 1.7853317260742188, "Pretrain/Step": 17982, "Pretrain/Step Time": 8.492182502523065} +{"Pretrain/Learning Rate": 4.270042076503167e-07, "Pretrain/Loss": 1.973751187324524, "Pretrain/Loss (Raw)": 2.194154977798462, "Pretrain/Step": 17983, "Pretrain/Step Time": 8.49610149860382} +{"Pretrain/Learning Rate": 4.262233059921045e-07, "Pretrain/Loss": 1.9741145372390747, "Pretrain/Loss (Raw)": 1.992066740989685, "Pretrain/Step": 17984, "Pretrain/Step Time": 8.49267009831965} +{"Pretrain/Learning Rate": 4.254431129014247e-07, "Pretrain/Loss": 1.9761379957199097, "Pretrain/Loss (Raw)": 2.282440185546875, "Pretrain/Step": 17985, "Pretrain/Step Time": 8.49083348363638} +{"Pretrain/Learning Rate": 4.246636284007649e-07, "Pretrain/Loss": 1.977487325668335, "Pretrain/Loss (Raw)": 2.188589572906494, "Pretrain/Step": 17986, "Pretrain/Step Time": 8.49255239032209} +{"Pretrain/Learning Rate": 4.2388485251260436e-07, "Pretrain/Loss": 1.978217601776123, "Pretrain/Loss (Raw)": 1.905595302581787, "Pretrain/Step": 17987, "Pretrain/Step Time": 8.488523192703724} +{"Pretrain/Learning Rate": 4.2310678525940285e-07, "Pretrain/Loss": 1.9809834957122803, "Pretrain/Loss (Raw)": 2.19242262840271, "Pretrain/Step": 17988, "Pretrain/Step Time": 8.487467214465141} +{"Pretrain/Learning Rate": 4.2232942666358687e-07, "Pretrain/Loss": 1.9798784255981445, "Pretrain/Loss (Raw)": 1.8563919067382812, "Pretrain/Step": 17989, "Pretrain/Step Time": 8.490185517817736} +{"Pretrain/Learning Rate": 4.215527767475802e-07, "Pretrain/Loss": 1.9773365259170532, "Pretrain/Loss (Raw)": 1.877501130104065, "Pretrain/Step": 17990, "Pretrain/Step Time": 8.483817420899868} +{"Pretrain/Learning Rate": 4.2077683553377046e-07, "Pretrain/Loss": 1.9798126220703125, "Pretrain/Loss (Raw)": 2.0944435596466064, "Pretrain/Step": 17991, "Pretrain/Step Time": 8.482177635654807} +{"Pretrain/Learning Rate": 4.200016030445314e-07, "Pretrain/Loss": 1.978502869606018, "Pretrain/Loss (Raw)": 1.8413134813308716, "Pretrain/Step": 17992, "Pretrain/Step Time": 8.491508416831493} +{"Pretrain/Learning Rate": 4.192270793022229e-07, "Pretrain/Loss": 1.9785284996032715, "Pretrain/Loss (Raw)": 2.0546085834503174, "Pretrain/Step": 17993, "Pretrain/Step Time": 8.491415355354548} +{"Pretrain/Learning Rate": 4.184532643291689e-07, "Pretrain/Loss": 1.9782085418701172, "Pretrain/Loss (Raw)": 2.0403733253479004, "Pretrain/Step": 17994, "Pretrain/Step Time": 8.486444149166346} +{"Pretrain/Learning Rate": 4.1768015814769026e-07, "Pretrain/Loss": 1.9788923263549805, "Pretrain/Loss (Raw)": 2.0283920764923096, "Pretrain/Step": 17995, "Pretrain/Step Time": 8.490010125562549} +{"Pretrain/Learning Rate": 4.16907760780072e-07, "Pretrain/Loss": 1.9791834354400635, "Pretrain/Loss (Raw)": 2.052213430404663, "Pretrain/Step": 17996, "Pretrain/Step Time": 8.490394566208124} +{"Pretrain/Learning Rate": 4.16136072248588e-07, "Pretrain/Loss": 1.9805982112884521, "Pretrain/Loss (Raw)": 2.029510259628296, "Pretrain/Step": 17997, "Pretrain/Step Time": 8.488853059709072} +{"Pretrain/Learning Rate": 4.153650925754926e-07, "Pretrain/Loss": 1.9792430400848389, "Pretrain/Loss (Raw)": 1.8573142290115356, "Pretrain/Step": 17998, "Pretrain/Step Time": 8.48954988643527} +{"Pretrain/Learning Rate": 4.145948217830098e-07, "Pretrain/Loss": 1.978068232536316, "Pretrain/Loss (Raw)": 1.86434006690979, "Pretrain/Step": 17999, "Pretrain/Step Time": 8.490175297483802} +{"Pretrain/Learning Rate": 4.1382525989335787e-07, "Pretrain/Loss": 1.977778673171997, "Pretrain/Loss (Raw)": 1.947572946548462, "Pretrain/Step": 18000, "Pretrain/Step Time": 8.494654148817062} +{"Pretrain/Learning Rate": 4.130564069287218e-07, "Pretrain/Loss": 1.9756299257278442, "Pretrain/Loss (Raw)": 1.8515619039535522, "Pretrain/Step": 18001, "Pretrain/Step Time": 8.491900024935603} +{"Pretrain/Learning Rate": 4.122882629112701e-07, "Pretrain/Loss": 1.9736340045928955, "Pretrain/Loss (Raw)": 1.748511791229248, "Pretrain/Step": 18002, "Pretrain/Step Time": 8.490084180608392} +{"Pretrain/Learning Rate": 4.1152082786315437e-07, "Pretrain/Loss": 1.9726176261901855, "Pretrain/Loss (Raw)": 1.912599802017212, "Pretrain/Step": 18003, "Pretrain/Step Time": 8.490609999746084} +{"Pretrain/Learning Rate": 4.1075410180649866e-07, "Pretrain/Loss": 1.9722329378128052, "Pretrain/Loss (Raw)": 1.9860610961914062, "Pretrain/Step": 18004, "Pretrain/Step Time": 8.48780963383615} +{"Pretrain/Learning Rate": 4.0998808476341853e-07, "Pretrain/Loss": 1.9776298999786377, "Pretrain/Loss (Raw)": 2.455021381378174, "Pretrain/Step": 18005, "Pretrain/Step Time": 8.488842802122235} +{"Pretrain/Learning Rate": 4.092227767559964e-07, "Pretrain/Loss": 1.9798541069030762, "Pretrain/Loss (Raw)": 2.1327366828918457, "Pretrain/Step": 18006, "Pretrain/Step Time": 8.48794156499207} +{"Pretrain/Learning Rate": 4.084581778062979e-07, "Pretrain/Loss": 1.9805525541305542, "Pretrain/Loss (Raw)": 1.9185357093811035, "Pretrain/Step": 18007, "Pretrain/Step Time": 8.489609755575657} +{"Pretrain/Learning Rate": 4.076942879363721e-07, "Pretrain/Loss": 1.9795141220092773, "Pretrain/Loss (Raw)": 1.9202519655227661, "Pretrain/Step": 18008, "Pretrain/Step Time": 8.494971996173263} +{"Pretrain/Learning Rate": 4.069311071682458e-07, "Pretrain/Loss": 1.980867624282837, "Pretrain/Loss (Raw)": 2.0328691005706787, "Pretrain/Step": 18009, "Pretrain/Step Time": 8.49399584531784} +{"Pretrain/Learning Rate": 4.061686355239236e-07, "Pretrain/Loss": 1.9795055389404297, "Pretrain/Loss (Raw)": 1.8468139171600342, "Pretrain/Step": 18010, "Pretrain/Step Time": 8.496956562623382} +{"Pretrain/Learning Rate": 4.054068730253935e-07, "Pretrain/Loss": 1.9794036149978638, "Pretrain/Loss (Raw)": 1.8436884880065918, "Pretrain/Step": 18011, "Pretrain/Step Time": 8.495467143133283} +{"Pretrain/Learning Rate": 4.0464581969461566e-07, "Pretrain/Loss": 1.979434847831726, "Pretrain/Loss (Raw)": 1.9370357990264893, "Pretrain/Step": 18012, "Pretrain/Step Time": 8.494790755212307} +{"Pretrain/Learning Rate": 4.038854755535393e-07, "Pretrain/Loss": 1.9812848567962646, "Pretrain/Loss (Raw)": 2.0504462718963623, "Pretrain/Step": 18013, "Pretrain/Step Time": 8.49374781921506} +{"Pretrain/Learning Rate": 4.031258406240829e-07, "Pretrain/Loss": 1.9806113243103027, "Pretrain/Loss (Raw)": 1.921939730644226, "Pretrain/Step": 18014, "Pretrain/Step Time": 8.49475659802556} +{"Pretrain/Learning Rate": 4.023669149281567e-07, "Pretrain/Loss": 1.9811828136444092, "Pretrain/Loss (Raw)": 2.141606330871582, "Pretrain/Step": 18015, "Pretrain/Step Time": 8.49479472078383} +{"Pretrain/Learning Rate": 4.016086984876377e-07, "Pretrain/Loss": 1.9820821285247803, "Pretrain/Loss (Raw)": 2.223487377166748, "Pretrain/Step": 18016, "Pretrain/Step Time": 8.496098756790161} +{"Pretrain/Learning Rate": 4.0085119132439173e-07, "Pretrain/Loss": 1.9815139770507812, "Pretrain/Loss (Raw)": 1.9043707847595215, "Pretrain/Step": 18017, "Pretrain/Step Time": 8.495662407949567} +{"Pretrain/Learning Rate": 4.0009439346026244e-07, "Pretrain/Loss": 1.980552315711975, "Pretrain/Loss (Raw)": 1.8015837669372559, "Pretrain/Step": 18018, "Pretrain/Step Time": 8.496829468756914} +{"Pretrain/Learning Rate": 3.993383049170657e-07, "Pretrain/Loss": 1.9793190956115723, "Pretrain/Loss (Raw)": 2.0077641010284424, "Pretrain/Step": 18019, "Pretrain/Step Time": 8.49151218868792} +{"Pretrain/Learning Rate": 3.98582925716609e-07, "Pretrain/Loss": 1.9820771217346191, "Pretrain/Loss (Raw)": 2.245647668838501, "Pretrain/Step": 18020, "Pretrain/Step Time": 8.489974373951554} +{"Pretrain/Learning Rate": 3.978282558806723e-07, "Pretrain/Loss": 1.9840443134307861, "Pretrain/Loss (Raw)": 2.1415231227874756, "Pretrain/Step": 18021, "Pretrain/Step Time": 8.488793114200234} +{"Pretrain/Learning Rate": 3.9707429543101304e-07, "Pretrain/Loss": 1.9857394695281982, "Pretrain/Loss (Raw)": 2.171006202697754, "Pretrain/Step": 18022, "Pretrain/Step Time": 8.490243377164006} +{"Pretrain/Learning Rate": 3.963210443893722e-07, "Pretrain/Loss": 1.9864126443862915, "Pretrain/Loss (Raw)": 2.0624725818634033, "Pretrain/Step": 18023, "Pretrain/Step Time": 8.493830302730203} +{"Pretrain/Learning Rate": 3.9556850277746857e-07, "Pretrain/Loss": 1.985508680343628, "Pretrain/Loss (Raw)": 1.9742053747177124, "Pretrain/Step": 18024, "Pretrain/Step Time": 8.490342834964395} +{"Pretrain/Learning Rate": 3.9481667061700424e-07, "Pretrain/Loss": 1.9872033596038818, "Pretrain/Loss (Raw)": 2.113431215286255, "Pretrain/Step": 18025, "Pretrain/Step Time": 8.49048338830471} +{"Pretrain/Learning Rate": 3.9406554792965347e-07, "Pretrain/Loss": 1.9880428314208984, "Pretrain/Loss (Raw)": 1.9307767152786255, "Pretrain/Step": 18026, "Pretrain/Step Time": 8.489544231444597} +{"Pretrain/Learning Rate": 3.933151347370795e-07, "Pretrain/Loss": 1.9890493154525757, "Pretrain/Loss (Raw)": 2.10929012298584, "Pretrain/Step": 18027, "Pretrain/Step Time": 8.495233999565244} +{"Pretrain/Learning Rate": 3.9256543106091503e-07, "Pretrain/Loss": 1.9897677898406982, "Pretrain/Loss (Raw)": 2.0287046432495117, "Pretrain/Step": 18028, "Pretrain/Step Time": 8.495384553447366} +{"Pretrain/Learning Rate": 3.9181643692277893e-07, "Pretrain/Loss": 1.9894729852676392, "Pretrain/Loss (Raw)": 2.030121326446533, "Pretrain/Step": 18029, "Pretrain/Step Time": 8.496370127424598} +{"Pretrain/Learning Rate": 3.9106815234427055e-07, "Pretrain/Loss": 1.9900290966033936, "Pretrain/Loss (Raw)": 2.042710065841675, "Pretrain/Step": 18030, "Pretrain/Step Time": 8.497823294252157} +{"Pretrain/Learning Rate": 3.9032057734696147e-07, "Pretrain/Loss": 1.992098331451416, "Pretrain/Loss (Raw)": 2.455355644226074, "Pretrain/Step": 18031, "Pretrain/Step Time": 8.498721968382597} +{"Pretrain/Learning Rate": 3.8957371195240954e-07, "Pretrain/Loss": 1.9896031618118286, "Pretrain/Loss (Raw)": 2.000837802886963, "Pretrain/Step": 18032, "Pretrain/Step Time": 8.49573753029108} +{"Pretrain/Learning Rate": 3.8882755618215306e-07, "Pretrain/Loss": 1.9863879680633545, "Pretrain/Loss (Raw)": 1.7687289714813232, "Pretrain/Step": 18033, "Pretrain/Step Time": 8.498715000227094} +{"Pretrain/Learning Rate": 3.880821100577026e-07, "Pretrain/Loss": 1.988081693649292, "Pretrain/Loss (Raw)": 1.9064539670944214, "Pretrain/Step": 18034, "Pretrain/Step Time": 8.499142181128263} +{"Pretrain/Learning Rate": 3.8733737360055475e-07, "Pretrain/Loss": 1.9888232946395874, "Pretrain/Loss (Raw)": 2.1182310581207275, "Pretrain/Step": 18035, "Pretrain/Step Time": 8.497172128409147} +{"Pretrain/Learning Rate": 3.865933468321814e-07, "Pretrain/Loss": 1.9920636415481567, "Pretrain/Loss (Raw)": 2.427816867828369, "Pretrain/Step": 18036, "Pretrain/Step Time": 8.49734602496028} +{"Pretrain/Learning Rate": 3.858500297740375e-07, "Pretrain/Loss": 1.9902493953704834, "Pretrain/Loss (Raw)": 2.0191426277160645, "Pretrain/Step": 18037, "Pretrain/Step Time": 8.492344638332725} +{"Pretrain/Learning Rate": 3.851074224475587e-07, "Pretrain/Loss": 1.9883885383605957, "Pretrain/Loss (Raw)": 2.0381205081939697, "Pretrain/Step": 18038, "Pretrain/Step Time": 8.495459357276559} +{"Pretrain/Learning Rate": 3.843655248741529e-07, "Pretrain/Loss": 1.9885897636413574, "Pretrain/Loss (Raw)": 1.8038748502731323, "Pretrain/Step": 18039, "Pretrain/Step Time": 8.49710737913847} +{"Pretrain/Learning Rate": 3.8362433707521684e-07, "Pretrain/Loss": 1.989664912223816, "Pretrain/Loss (Raw)": 2.186521530151367, "Pretrain/Step": 18040, "Pretrain/Step Time": 8.497729817405343} +{"Pretrain/Learning Rate": 3.828838590721168e-07, "Pretrain/Loss": 1.98826003074646, "Pretrain/Loss (Raw)": 1.8484952449798584, "Pretrain/Step": 18041, "Pretrain/Step Time": 8.492843590676785} +{"Pretrain/Learning Rate": 3.821440908862078e-07, "Pretrain/Loss": 1.9883391857147217, "Pretrain/Loss (Raw)": 1.933593511581421, "Pretrain/Step": 18042, "Pretrain/Step Time": 8.492060646414757} +{"Pretrain/Learning Rate": 3.814050325388174e-07, "Pretrain/Loss": 1.9866235256195068, "Pretrain/Loss (Raw)": 1.6758707761764526, "Pretrain/Step": 18043, "Pretrain/Step Time": 8.49800437875092} +{"Pretrain/Learning Rate": 3.806666840512618e-07, "Pretrain/Loss": 1.9858530759811401, "Pretrain/Loss (Raw)": 2.030888795852661, "Pretrain/Step": 18044, "Pretrain/Step Time": 8.493735868483782} +{"Pretrain/Learning Rate": 3.799290454448268e-07, "Pretrain/Loss": 1.9856390953063965, "Pretrain/Loss (Raw)": 2.054196834564209, "Pretrain/Step": 18045, "Pretrain/Step Time": 8.495491379871964} +{"Pretrain/Learning Rate": 3.791921167407786e-07, "Pretrain/Loss": 1.9865003824234009, "Pretrain/Loss (Raw)": 2.070422887802124, "Pretrain/Step": 18046, "Pretrain/Step Time": 8.496390026062727} +{"Pretrain/Learning Rate": 3.784558979603697e-07, "Pretrain/Loss": 1.9845763444900513, "Pretrain/Loss (Raw)": 1.8596771955490112, "Pretrain/Step": 18047, "Pretrain/Step Time": 8.489641573280096} +{"Pretrain/Learning Rate": 3.777203891248277e-07, "Pretrain/Loss": 1.9862984418869019, "Pretrain/Loss (Raw)": 2.1026806831359863, "Pretrain/Step": 18048, "Pretrain/Step Time": 8.49222813732922} +{"Pretrain/Learning Rate": 3.7698559025536316e-07, "Pretrain/Loss": 1.9903188943862915, "Pretrain/Loss (Raw)": 2.442702054977417, "Pretrain/Step": 18049, "Pretrain/Step Time": 8.49136881902814} +{"Pretrain/Learning Rate": 3.762515013731621e-07, "Pretrain/Loss": 1.9880127906799316, "Pretrain/Loss (Raw)": 1.7971760034561157, "Pretrain/Step": 18050, "Pretrain/Step Time": 8.495381383225322} +{"Pretrain/Learning Rate": 3.7551812249938535e-07, "Pretrain/Loss": 1.9873080253601074, "Pretrain/Loss (Raw)": 1.8886598348617554, "Pretrain/Step": 18051, "Pretrain/Step Time": 8.48863179795444} +{"Pretrain/Learning Rate": 3.7478545365518814e-07, "Pretrain/Loss": 1.9878239631652832, "Pretrain/Loss (Raw)": 1.8969017267227173, "Pretrain/Step": 18052, "Pretrain/Step Time": 8.49829781614244} +{"Pretrain/Learning Rate": 3.740534948616897e-07, "Pretrain/Loss": 1.9882614612579346, "Pretrain/Loss (Raw)": 1.9553042650222778, "Pretrain/Step": 18053, "Pretrain/Step Time": 8.491706233471632} +{"Pretrain/Learning Rate": 3.7332224614000375e-07, "Pretrain/Loss": 1.9885941743850708, "Pretrain/Loss (Raw)": 1.8763165473937988, "Pretrain/Step": 18054, "Pretrain/Step Time": 8.488598862662911} +{"Pretrain/Learning Rate": 3.7259170751120786e-07, "Pretrain/Loss": 1.9897992610931396, "Pretrain/Loss (Raw)": 2.113725185394287, "Pretrain/Step": 18055, "Pretrain/Step Time": 8.490638852119446} +{"Pretrain/Learning Rate": 3.7186187899636573e-07, "Pretrain/Loss": 1.9865740537643433, "Pretrain/Loss (Raw)": 2.021796464920044, "Pretrain/Step": 18056, "Pretrain/Step Time": 8.484859408810735} +{"Pretrain/Learning Rate": 3.7113276061652714e-07, "Pretrain/Loss": 1.9880549907684326, "Pretrain/Loss (Raw)": 2.112582206726074, "Pretrain/Step": 18057, "Pretrain/Step Time": 8.485912064090371} +{"Pretrain/Learning Rate": 3.704043523927114e-07, "Pretrain/Loss": 1.9886393547058105, "Pretrain/Loss (Raw)": 1.8479974269866943, "Pretrain/Step": 18058, "Pretrain/Step Time": 8.488773854449391} +{"Pretrain/Learning Rate": 3.696766543459268e-07, "Pretrain/Loss": 1.9884943962097168, "Pretrain/Loss (Raw)": 2.169370174407959, "Pretrain/Step": 18059, "Pretrain/Step Time": 8.492836942896247} +{"Pretrain/Learning Rate": 3.689496664971509e-07, "Pretrain/Loss": 1.9878926277160645, "Pretrain/Loss (Raw)": 1.8885287046432495, "Pretrain/Step": 18060, "Pretrain/Step Time": 8.486330267041922} +{"Pretrain/Learning Rate": 3.6822338886734756e-07, "Pretrain/Loss": 1.9911590814590454, "Pretrain/Loss (Raw)": 2.2646358013153076, "Pretrain/Step": 18061, "Pretrain/Step Time": 8.486630676314235} +{"Pretrain/Learning Rate": 3.6749782147745824e-07, "Pretrain/Loss": 1.9914307594299316, "Pretrain/Loss (Raw)": 2.1027731895446777, "Pretrain/Step": 18062, "Pretrain/Step Time": 8.485482923686504} +{"Pretrain/Learning Rate": 3.6677296434840524e-07, "Pretrain/Loss": 1.988662838935852, "Pretrain/Loss (Raw)": 1.7321206331253052, "Pretrain/Step": 18063, "Pretrain/Step Time": 8.483754990622401} +{"Pretrain/Learning Rate": 3.6604881750108846e-07, "Pretrain/Loss": 1.9903517961502075, "Pretrain/Loss (Raw)": 2.0761561393737793, "Pretrain/Step": 18064, "Pretrain/Step Time": 8.484535770490766} +{"Pretrain/Learning Rate": 3.6532538095638837e-07, "Pretrain/Loss": 1.9913183450698853, "Pretrain/Loss (Raw)": 2.167640209197998, "Pretrain/Step": 18065, "Pretrain/Step Time": 8.487448364496231} +{"Pretrain/Learning Rate": 3.646026547351633e-07, "Pretrain/Loss": 1.9902069568634033, "Pretrain/Loss (Raw)": 1.98067307472229, "Pretrain/Step": 18066, "Pretrain/Step Time": 8.485787767916918} +{"Pretrain/Learning Rate": 3.6388063885825495e-07, "Pretrain/Loss": 1.9929282665252686, "Pretrain/Loss (Raw)": 2.270812511444092, "Pretrain/Step": 18067, "Pretrain/Step Time": 8.486208567395806} +{"Pretrain/Learning Rate": 3.6315933334648e-07, "Pretrain/Loss": 1.9938938617706299, "Pretrain/Loss (Raw)": 2.0195329189300537, "Pretrain/Step": 18068, "Pretrain/Step Time": 8.490259138867259} +{"Pretrain/Learning Rate": 3.6243873822063846e-07, "Pretrain/Loss": 1.9960023164749146, "Pretrain/Loss (Raw)": 2.090702772140503, "Pretrain/Step": 18069, "Pretrain/Step Time": 8.483023466542363} +{"Pretrain/Learning Rate": 3.6171885350150815e-07, "Pretrain/Loss": 1.9981095790863037, "Pretrain/Loss (Raw)": 2.150559902191162, "Pretrain/Step": 18070, "Pretrain/Step Time": 8.480527495965362} +{"Pretrain/Learning Rate": 3.609996792098447e-07, "Pretrain/Loss": 1.9990465641021729, "Pretrain/Loss (Raw)": 2.0717484951019287, "Pretrain/Step": 18071, "Pretrain/Step Time": 8.481958830729127} +{"Pretrain/Learning Rate": 3.602812153663898e-07, "Pretrain/Loss": 1.9962642192840576, "Pretrain/Loss (Raw)": 1.734381079673767, "Pretrain/Step": 18072, "Pretrain/Step Time": 8.485282871872187} +{"Pretrain/Learning Rate": 3.59563461991852e-07, "Pretrain/Loss": 1.9956594705581665, "Pretrain/Loss (Raw)": 1.8598699569702148, "Pretrain/Step": 18073, "Pretrain/Step Time": 8.48646811582148} +{"Pretrain/Learning Rate": 3.588464191069313e-07, "Pretrain/Loss": 1.995192050933838, "Pretrain/Loss (Raw)": 1.7686967849731445, "Pretrain/Step": 18074, "Pretrain/Step Time": 8.480441737920046} +{"Pretrain/Learning Rate": 3.5813008673230566e-07, "Pretrain/Loss": 1.9948463439941406, "Pretrain/Loss (Raw)": 1.9699201583862305, "Pretrain/Step": 18075, "Pretrain/Step Time": 8.487602891400456} +{"Pretrain/Learning Rate": 3.574144648886252e-07, "Pretrain/Loss": 1.9951733350753784, "Pretrain/Loss (Raw)": 1.7135790586471558, "Pretrain/Step": 18076, "Pretrain/Step Time": 8.48807317391038} +{"Pretrain/Learning Rate": 3.5669955359652897e-07, "Pretrain/Loss": 1.9958081245422363, "Pretrain/Loss (Raw)": 2.0550730228424072, "Pretrain/Step": 18077, "Pretrain/Step Time": 8.483572801575065} +{"Pretrain/Learning Rate": 3.5598535287662825e-07, "Pretrain/Loss": 1.9956371784210205, "Pretrain/Loss (Raw)": 2.0866026878356934, "Pretrain/Step": 18078, "Pretrain/Step Time": 8.481100330129266} +{"Pretrain/Learning Rate": 3.5527186274951776e-07, "Pretrain/Loss": 1.9982763528823853, "Pretrain/Loss (Raw)": 2.0807065963745117, "Pretrain/Step": 18079, "Pretrain/Step Time": 8.480195559561253} +{"Pretrain/Learning Rate": 3.545590832357698e-07, "Pretrain/Loss": 1.9965226650238037, "Pretrain/Loss (Raw)": 1.7776864767074585, "Pretrain/Step": 18080, "Pretrain/Step Time": 8.481513669714332} +{"Pretrain/Learning Rate": 3.538470143559319e-07, "Pretrain/Loss": 1.9958351850509644, "Pretrain/Loss (Raw)": 1.9878501892089844, "Pretrain/Step": 18081, "Pretrain/Step Time": 8.480339469388127} +{"Pretrain/Learning Rate": 3.53135656130546e-07, "Pretrain/Loss": 1.9938294887542725, "Pretrain/Loss (Raw)": 1.7702399492263794, "Pretrain/Step": 18082, "Pretrain/Step Time": 8.479307366535068} +{"Pretrain/Learning Rate": 3.5242500858011787e-07, "Pretrain/Loss": 1.995121717453003, "Pretrain/Loss (Raw)": 2.052062749862671, "Pretrain/Step": 18083, "Pretrain/Step Time": 8.47689220122993} +{"Pretrain/Learning Rate": 3.517150717251394e-07, "Pretrain/Loss": 1.9936108589172363, "Pretrain/Loss (Raw)": 1.8380745649337769, "Pretrain/Step": 18084, "Pretrain/Step Time": 8.47688259370625} +{"Pretrain/Learning Rate": 3.510058455860804e-07, "Pretrain/Loss": 1.993010401725769, "Pretrain/Loss (Raw)": 1.9890012741088867, "Pretrain/Step": 18085, "Pretrain/Step Time": 8.471466610208154} +{"Pretrain/Learning Rate": 3.502973301833884e-07, "Pretrain/Loss": 1.9899752140045166, "Pretrain/Loss (Raw)": 1.701216697692871, "Pretrain/Step": 18086, "Pretrain/Step Time": 8.472443411126733} +{"Pretrain/Learning Rate": 3.495895255374998e-07, "Pretrain/Loss": 1.9875354766845703, "Pretrain/Loss (Raw)": 1.6227667331695557, "Pretrain/Step": 18087, "Pretrain/Step Time": 8.472932521253824} +{"Pretrain/Learning Rate": 3.488824316688177e-07, "Pretrain/Loss": 1.9890961647033691, "Pretrain/Loss (Raw)": 2.3275694847106934, "Pretrain/Step": 18088, "Pretrain/Step Time": 8.476483933627605} +{"Pretrain/Learning Rate": 3.481760485977342e-07, "Pretrain/Loss": 1.9906094074249268, "Pretrain/Loss (Raw)": 2.091649293899536, "Pretrain/Step": 18089, "Pretrain/Step Time": 8.477860121056437} +{"Pretrain/Learning Rate": 3.474703763446163e-07, "Pretrain/Loss": 1.9911205768585205, "Pretrain/Loss (Raw)": 1.968530535697937, "Pretrain/Step": 18090, "Pretrain/Step Time": 8.48254399932921} +{"Pretrain/Learning Rate": 3.4676541492981164e-07, "Pretrain/Loss": 1.9907941818237305, "Pretrain/Loss (Raw)": 1.908294677734375, "Pretrain/Step": 18091, "Pretrain/Step Time": 8.479872604832053} +{"Pretrain/Learning Rate": 3.4606116437364556e-07, "Pretrain/Loss": 1.990422248840332, "Pretrain/Loss (Raw)": 1.828322172164917, "Pretrain/Step": 18092, "Pretrain/Step Time": 8.476641213521361} +{"Pretrain/Learning Rate": 3.4535762469642406e-07, "Pretrain/Loss": 1.9876338243484497, "Pretrain/Loss (Raw)": 1.5330731868743896, "Pretrain/Step": 18093, "Pretrain/Step Time": 8.48201278038323} +{"Pretrain/Learning Rate": 3.446547959184393e-07, "Pretrain/Loss": 1.9872326850891113, "Pretrain/Loss (Raw)": 1.9257925748825073, "Pretrain/Step": 18094, "Pretrain/Step Time": 8.479086792096496} +{"Pretrain/Learning Rate": 3.4395267805995e-07, "Pretrain/Loss": 1.9851436614990234, "Pretrain/Loss (Raw)": 1.707615852355957, "Pretrain/Step": 18095, "Pretrain/Step Time": 8.479501416906714} +{"Pretrain/Learning Rate": 3.432512711412039e-07, "Pretrain/Loss": 1.9861489534378052, "Pretrain/Loss (Raw)": 1.8988341093063354, "Pretrain/Step": 18096, "Pretrain/Step Time": 8.480037655681372} +{"Pretrain/Learning Rate": 3.425505751824265e-07, "Pretrain/Loss": 1.9854453802108765, "Pretrain/Loss (Raw)": 1.9586514234542847, "Pretrain/Step": 18097, "Pretrain/Step Time": 8.478951279073954} +{"Pretrain/Learning Rate": 3.418505902038183e-07, "Pretrain/Loss": 1.9795600175857544, "Pretrain/Loss (Raw)": 1.1573151350021362, "Pretrain/Step": 18098, "Pretrain/Step Time": 8.480451185256243} +{"Pretrain/Learning Rate": 3.411513162255686e-07, "Pretrain/Loss": 1.9809198379516602, "Pretrain/Loss (Raw)": 2.2578511238098145, "Pretrain/Step": 18099, "Pretrain/Step Time": 8.479071389883757} +{"Pretrain/Learning Rate": 3.404527532678364e-07, "Pretrain/Loss": 1.9811010360717773, "Pretrain/Loss (Raw)": 1.8464019298553467, "Pretrain/Step": 18100, "Pretrain/Step Time": 8.484616242349148} +{"Pretrain/Learning Rate": 3.397549013507639e-07, "Pretrain/Loss": 1.9830098152160645, "Pretrain/Loss (Raw)": 2.1143031120300293, "Pretrain/Step": 18101, "Pretrain/Step Time": 8.483725998550653} +{"Pretrain/Learning Rate": 3.390577604944767e-07, "Pretrain/Loss": 1.9837733507156372, "Pretrain/Loss (Raw)": 1.9558128118515015, "Pretrain/Step": 18102, "Pretrain/Step Time": 8.480799093842506} +{"Pretrain/Learning Rate": 3.383613307190725e-07, "Pretrain/Loss": 1.9859356880187988, "Pretrain/Loss (Raw)": 2.115525007247925, "Pretrain/Step": 18103, "Pretrain/Step Time": 8.482897827401757} +{"Pretrain/Learning Rate": 3.376656120446353e-07, "Pretrain/Loss": 1.9852232933044434, "Pretrain/Loss (Raw)": 1.9450069665908813, "Pretrain/Step": 18104, "Pretrain/Step Time": 8.478365696966648} +{"Pretrain/Learning Rate": 3.369706044912241e-07, "Pretrain/Loss": 1.984490156173706, "Pretrain/Loss (Raw)": 1.8428151607513428, "Pretrain/Step": 18105, "Pretrain/Step Time": 8.476894117891788} +{"Pretrain/Learning Rate": 3.362763080788811e-07, "Pretrain/Loss": 1.98698091506958, "Pretrain/Loss (Raw)": 2.2202260494232178, "Pretrain/Step": 18106, "Pretrain/Step Time": 8.474346788600087} +{"Pretrain/Learning Rate": 3.355827228276182e-07, "Pretrain/Loss": 1.9845844507217407, "Pretrain/Loss (Raw)": 1.7822617292404175, "Pretrain/Step": 18107, "Pretrain/Step Time": 8.479084545746446} +{"Pretrain/Learning Rate": 3.348898487574442e-07, "Pretrain/Loss": 1.981873869895935, "Pretrain/Loss (Raw)": 1.7387940883636475, "Pretrain/Step": 18108, "Pretrain/Step Time": 8.483512377366424} +{"Pretrain/Learning Rate": 3.34197685888335e-07, "Pretrain/Loss": 1.9836969375610352, "Pretrain/Loss (Raw)": 1.9701682329177856, "Pretrain/Step": 18109, "Pretrain/Step Time": 8.477996557950974} +{"Pretrain/Learning Rate": 3.33506234240244e-07, "Pretrain/Loss": 1.9858343601226807, "Pretrain/Loss (Raw)": 2.0589029788970947, "Pretrain/Step": 18110, "Pretrain/Step Time": 8.480167197063565} +{"Pretrain/Learning Rate": 3.328154938331135e-07, "Pretrain/Loss": 1.9867548942565918, "Pretrain/Loss (Raw)": 2.311994791030884, "Pretrain/Step": 18111, "Pretrain/Step Time": 8.474781872704625} +{"Pretrain/Learning Rate": 3.3212546468685823e-07, "Pretrain/Loss": 1.9870072603225708, "Pretrain/Loss (Raw)": 2.024367332458496, "Pretrain/Step": 18112, "Pretrain/Step Time": 8.475541640073061} +{"Pretrain/Learning Rate": 3.314361468213789e-07, "Pretrain/Loss": 1.984527826309204, "Pretrain/Loss (Raw)": 1.965076208114624, "Pretrain/Step": 18113, "Pretrain/Step Time": 8.477753780782223} +{"Pretrain/Learning Rate": 3.3074754025654573e-07, "Pretrain/Loss": 1.983191967010498, "Pretrain/Loss (Raw)": 2.0175952911376953, "Pretrain/Step": 18114, "Pretrain/Step Time": 8.474853178486228} +{"Pretrain/Learning Rate": 3.300596450122151e-07, "Pretrain/Loss": 1.9838082790374756, "Pretrain/Loss (Raw)": 1.9844721555709839, "Pretrain/Step": 18115, "Pretrain/Step Time": 8.476460326462984} +{"Pretrain/Learning Rate": 3.2937246110822384e-07, "Pretrain/Loss": 1.9821908473968506, "Pretrain/Loss (Raw)": 1.985399603843689, "Pretrain/Step": 18116, "Pretrain/Step Time": 8.4751334823668} +{"Pretrain/Learning Rate": 3.286859885643867e-07, "Pretrain/Loss": 1.9819167852401733, "Pretrain/Loss (Raw)": 1.8213181495666504, "Pretrain/Step": 18117, "Pretrain/Step Time": 8.47480701841414} +{"Pretrain/Learning Rate": 3.280002274004962e-07, "Pretrain/Loss": 1.9818342924118042, "Pretrain/Loss (Raw)": 1.8669346570968628, "Pretrain/Step": 18118, "Pretrain/Step Time": 8.47704116255045} +{"Pretrain/Learning Rate": 3.273151776363281e-07, "Pretrain/Loss": 1.9814704656600952, "Pretrain/Loss (Raw)": 2.0478694438934326, "Pretrain/Step": 18119, "Pretrain/Step Time": 8.484934261068702} +{"Pretrain/Learning Rate": 3.266308392916334e-07, "Pretrain/Loss": 1.9828534126281738, "Pretrain/Loss (Raw)": 2.0183420181274414, "Pretrain/Step": 18120, "Pretrain/Step Time": 8.474822772666812} +{"Pretrain/Learning Rate": 3.259472123861462e-07, "Pretrain/Loss": 1.9809222221374512, "Pretrain/Loss (Raw)": 1.8074250221252441, "Pretrain/Step": 18121, "Pretrain/Step Time": 8.474119184538722} +{"Pretrain/Learning Rate": 3.2526429693957305e-07, "Pretrain/Loss": 1.9827638864517212, "Pretrain/Loss (Raw)": 2.276085138320923, "Pretrain/Step": 18122, "Pretrain/Step Time": 8.473343346267939} +{"Pretrain/Learning Rate": 3.2458209297161204e-07, "Pretrain/Loss": 1.9810141324996948, "Pretrain/Loss (Raw)": 1.8044320344924927, "Pretrain/Step": 18123, "Pretrain/Step Time": 8.46878581121564} +{"Pretrain/Learning Rate": 3.239006005019307e-07, "Pretrain/Loss": 1.9790034294128418, "Pretrain/Loss (Raw)": 1.7948386669158936, "Pretrain/Step": 18124, "Pretrain/Step Time": 8.471181694418192} +{"Pretrain/Learning Rate": 3.232198195501801e-07, "Pretrain/Loss": 1.9787373542785645, "Pretrain/Loss (Raw)": 1.9954578876495361, "Pretrain/Step": 18125, "Pretrain/Step Time": 8.47293472290039} +{"Pretrain/Learning Rate": 3.225397501359917e-07, "Pretrain/Loss": 1.9811111688613892, "Pretrain/Loss (Raw)": 2.1611523628234863, "Pretrain/Step": 18126, "Pretrain/Step Time": 8.470892988145351} +{"Pretrain/Learning Rate": 3.2186039227896923e-07, "Pretrain/Loss": 1.9828202724456787, "Pretrain/Loss (Raw)": 2.0831048488616943, "Pretrain/Step": 18127, "Pretrain/Step Time": 8.470896802842617} +{"Pretrain/Learning Rate": 3.211817459987082e-07, "Pretrain/Loss": 1.9824857711791992, "Pretrain/Loss (Raw)": 1.9047725200653076, "Pretrain/Step": 18128, "Pretrain/Step Time": 8.4675707872957} +{"Pretrain/Learning Rate": 3.2050381131477624e-07, "Pretrain/Loss": 1.983566164970398, "Pretrain/Loss (Raw)": 1.9898468255996704, "Pretrain/Step": 18129, "Pretrain/Step Time": 8.468981593847275} +{"Pretrain/Learning Rate": 3.198265882467133e-07, "Pretrain/Loss": 1.9851447343826294, "Pretrain/Loss (Raw)": 1.9505711793899536, "Pretrain/Step": 18130, "Pretrain/Step Time": 8.465195780619979} +{"Pretrain/Learning Rate": 3.1915007681405653e-07, "Pretrain/Loss": 1.9855962991714478, "Pretrain/Loss (Raw)": 1.9703965187072754, "Pretrain/Step": 18131, "Pretrain/Step Time": 8.465979866683483} +{"Pretrain/Learning Rate": 3.184742770363069e-07, "Pretrain/Loss": 1.9842066764831543, "Pretrain/Loss (Raw)": 1.8082010746002197, "Pretrain/Step": 18132, "Pretrain/Step Time": 8.465064369142056} +{"Pretrain/Learning Rate": 3.1779918893295456e-07, "Pretrain/Loss": 1.9807994365692139, "Pretrain/Loss (Raw)": 2.018871545791626, "Pretrain/Step": 18133, "Pretrain/Step Time": 8.462289718911052} +{"Pretrain/Learning Rate": 3.171248125234616e-07, "Pretrain/Loss": 1.9812045097351074, "Pretrain/Loss (Raw)": 2.1845905780792236, "Pretrain/Step": 18134, "Pretrain/Step Time": 8.464552540332079} +{"Pretrain/Learning Rate": 3.164511478272708e-07, "Pretrain/Loss": 1.9808021783828735, "Pretrain/Loss (Raw)": 1.8670469522476196, "Pretrain/Step": 18135, "Pretrain/Step Time": 8.464814715087414} +{"Pretrain/Learning Rate": 3.157781948638139e-07, "Pretrain/Loss": 1.9794507026672363, "Pretrain/Loss (Raw)": 1.7472511529922485, "Pretrain/Step": 18136, "Pretrain/Step Time": 8.457914421334863} +{"Pretrain/Learning Rate": 3.15105953652492e-07, "Pretrain/Loss": 1.9783296585083008, "Pretrain/Loss (Raw)": 1.8893811702728271, "Pretrain/Step": 18137, "Pretrain/Step Time": 8.458914753049612} +{"Pretrain/Learning Rate": 3.1443442421268674e-07, "Pretrain/Loss": 1.9768781661987305, "Pretrain/Loss (Raw)": 1.6610172986984253, "Pretrain/Step": 18138, "Pretrain/Step Time": 8.45606986247003} +{"Pretrain/Learning Rate": 3.1376360656376335e-07, "Pretrain/Loss": 1.978575587272644, "Pretrain/Loss (Raw)": 2.06097149848938, "Pretrain/Step": 18139, "Pretrain/Step Time": 8.452608592808247} +{"Pretrain/Learning Rate": 3.1309350072506184e-07, "Pretrain/Loss": 1.9798412322998047, "Pretrain/Loss (Raw)": 2.0990519523620605, "Pretrain/Step": 18140, "Pretrain/Step Time": 8.455494482070208} +{"Pretrain/Learning Rate": 3.124241067159084e-07, "Pretrain/Loss": 1.9769476652145386, "Pretrain/Loss (Raw)": 1.6800442934036255, "Pretrain/Step": 18141, "Pretrain/Step Time": 8.460858387872577} +{"Pretrain/Learning Rate": 3.1175542455560147e-07, "Pretrain/Loss": 1.9761383533477783, "Pretrain/Loss (Raw)": 1.8183417320251465, "Pretrain/Step": 18142, "Pretrain/Step Time": 8.459442555904388} +{"Pretrain/Learning Rate": 3.110874542634229e-07, "Pretrain/Loss": 1.9748117923736572, "Pretrain/Loss (Raw)": 1.9718129634857178, "Pretrain/Step": 18143, "Pretrain/Step Time": 8.45953095331788} +{"Pretrain/Learning Rate": 3.1042019585863504e-07, "Pretrain/Loss": 1.9753705263137817, "Pretrain/Loss (Raw)": 2.2950079441070557, "Pretrain/Step": 18144, "Pretrain/Step Time": 8.459788938984275} +{"Pretrain/Learning Rate": 3.097536493604725e-07, "Pretrain/Loss": 1.975034236907959, "Pretrain/Loss (Raw)": 1.8613245487213135, "Pretrain/Step": 18145, "Pretrain/Step Time": 8.457296278327703} +{"Pretrain/Learning Rate": 3.0908781478815874e-07, "Pretrain/Loss": 1.9770705699920654, "Pretrain/Loss (Raw)": 2.0622215270996094, "Pretrain/Step": 18146, "Pretrain/Step Time": 8.4595030490309} +{"Pretrain/Learning Rate": 3.0842269216089235e-07, "Pretrain/Loss": 1.9769550561904907, "Pretrain/Loss (Raw)": 1.993005394935608, "Pretrain/Step": 18147, "Pretrain/Step Time": 8.456550892442465} +{"Pretrain/Learning Rate": 3.0775828149785246e-07, "Pretrain/Loss": 1.9755761623382568, "Pretrain/Loss (Raw)": 2.069148540496826, "Pretrain/Step": 18148, "Pretrain/Step Time": 8.459767956286669} +{"Pretrain/Learning Rate": 3.0709458281819315e-07, "Pretrain/Loss": 1.9746136665344238, "Pretrain/Loss (Raw)": 2.0182995796203613, "Pretrain/Step": 18149, "Pretrain/Step Time": 8.462086960673332} +{"Pretrain/Learning Rate": 3.0643159614105464e-07, "Pretrain/Loss": 1.97332763671875, "Pretrain/Loss (Raw)": 2.006408214569092, "Pretrain/Step": 18150, "Pretrain/Step Time": 8.457708850502968} +{"Pretrain/Learning Rate": 3.0576932148555506e-07, "Pretrain/Loss": 1.9732751846313477, "Pretrain/Loss (Raw)": 2.055757761001587, "Pretrain/Step": 18151, "Pretrain/Step Time": 8.456012964248657} +{"Pretrain/Learning Rate": 3.0510775887078733e-07, "Pretrain/Loss": 1.9744129180908203, "Pretrain/Loss (Raw)": 2.1198229789733887, "Pretrain/Step": 18152, "Pretrain/Step Time": 8.460121234878898} +{"Pretrain/Learning Rate": 3.044469083158308e-07, "Pretrain/Loss": 1.971815824508667, "Pretrain/Loss (Raw)": 1.7810195684432983, "Pretrain/Step": 18153, "Pretrain/Step Time": 8.457320541143417} +{"Pretrain/Learning Rate": 3.0378676983973674e-07, "Pretrain/Loss": 1.9711860418319702, "Pretrain/Loss (Raw)": 1.8501633405685425, "Pretrain/Step": 18154, "Pretrain/Step Time": 8.458196554332972} +{"Pretrain/Learning Rate": 3.0312734346154003e-07, "Pretrain/Loss": 1.9700409173965454, "Pretrain/Loss (Raw)": 1.9627190828323364, "Pretrain/Step": 18155, "Pretrain/Step Time": 8.450729565694928} +{"Pretrain/Learning Rate": 3.0246862920025874e-07, "Pretrain/Loss": 1.9692771434783936, "Pretrain/Loss (Raw)": 1.930942416191101, "Pretrain/Step": 18156, "Pretrain/Step Time": 8.454051399603486} +{"Pretrain/Learning Rate": 3.018106270748833e-07, "Pretrain/Loss": 1.9667015075683594, "Pretrain/Loss (Raw)": 1.7004413604736328, "Pretrain/Step": 18157, "Pretrain/Step Time": 8.455215469002724} +{"Pretrain/Learning Rate": 3.0115333710438734e-07, "Pretrain/Loss": 1.9655652046203613, "Pretrain/Loss (Raw)": 1.8972465991973877, "Pretrain/Step": 18158, "Pretrain/Step Time": 8.459737412631512} +{"Pretrain/Learning Rate": 3.004967593077224e-07, "Pretrain/Loss": 1.958642601966858, "Pretrain/Loss (Raw)": 1.5692732334136963, "Pretrain/Step": 18159, "Pretrain/Step Time": 8.458164151757956} +{"Pretrain/Learning Rate": 2.998408937038205e-07, "Pretrain/Loss": 1.9609909057617188, "Pretrain/Loss (Raw)": 2.301403760910034, "Pretrain/Step": 18160, "Pretrain/Step Time": 8.457188187167048} +{"Pretrain/Learning Rate": 2.991857403115972e-07, "Pretrain/Loss": 1.9620875120162964, "Pretrain/Loss (Raw)": 1.9091132879257202, "Pretrain/Step": 18161, "Pretrain/Step Time": 8.456510731950402} +{"Pretrain/Learning Rate": 2.985312991499373e-07, "Pretrain/Loss": 1.9635432958602905, "Pretrain/Loss (Raw)": 2.0927863121032715, "Pretrain/Step": 18162, "Pretrain/Step Time": 8.458190267905593} +{"Pretrain/Learning Rate": 2.9787757023771455e-07, "Pretrain/Loss": 1.9635041952133179, "Pretrain/Loss (Raw)": 2.1132349967956543, "Pretrain/Step": 18163, "Pretrain/Step Time": 8.454881085082889} +{"Pretrain/Learning Rate": 2.9722455359378064e-07, "Pretrain/Loss": 1.9599335193634033, "Pretrain/Loss (Raw)": 1.9707577228546143, "Pretrain/Step": 18164, "Pretrain/Step Time": 8.451107285916805} +{"Pretrain/Learning Rate": 2.9657224923695934e-07, "Pretrain/Loss": 1.9591283798217773, "Pretrain/Loss (Raw)": 1.9160895347595215, "Pretrain/Step": 18165, "Pretrain/Step Time": 8.455250417813659} +{"Pretrain/Learning Rate": 2.959206571860634e-07, "Pretrain/Loss": 1.9588193893432617, "Pretrain/Loss (Raw)": 1.9985729455947876, "Pretrain/Step": 18166, "Pretrain/Step Time": 8.455144630745053} +{"Pretrain/Learning Rate": 2.952697774598806e-07, "Pretrain/Loss": 1.9603962898254395, "Pretrain/Loss (Raw)": 2.005709171295166, "Pretrain/Step": 18167, "Pretrain/Step Time": 8.455274168401957} +{"Pretrain/Learning Rate": 2.946196100771792e-07, "Pretrain/Loss": 1.9598429203033447, "Pretrain/Loss (Raw)": 2.115689516067505, "Pretrain/Step": 18168, "Pretrain/Step Time": 8.456428932026029} +{"Pretrain/Learning Rate": 2.9397015505670257e-07, "Pretrain/Loss": 1.9608521461486816, "Pretrain/Loss (Raw)": 1.977683424949646, "Pretrain/Step": 18169, "Pretrain/Step Time": 8.458855122327805} +{"Pretrain/Learning Rate": 2.9332141241718016e-07, "Pretrain/Loss": 1.9606508016586304, "Pretrain/Loss (Raw)": 1.9078260660171509, "Pretrain/Step": 18170, "Pretrain/Step Time": 8.456165835261345} +{"Pretrain/Learning Rate": 2.926733821773192e-07, "Pretrain/Loss": 1.9626895189285278, "Pretrain/Loss (Raw)": 1.9368274211883545, "Pretrain/Step": 18171, "Pretrain/Step Time": 8.451459184288979} +{"Pretrain/Learning Rate": 2.9202606435580203e-07, "Pretrain/Loss": 1.9626438617706299, "Pretrain/Loss (Raw)": 2.0250425338745117, "Pretrain/Step": 18172, "Pretrain/Step Time": 8.454932207241654} +{"Pretrain/Learning Rate": 2.913794589712998e-07, "Pretrain/Loss": 1.9634371995925903, "Pretrain/Loss (Raw)": 2.155745506286621, "Pretrain/Step": 18173, "Pretrain/Step Time": 8.453016240149736} +{"Pretrain/Learning Rate": 2.907335660424476e-07, "Pretrain/Loss": 1.961777687072754, "Pretrain/Loss (Raw)": 1.8580052852630615, "Pretrain/Step": 18174, "Pretrain/Step Time": 8.452663889154792} +{"Pretrain/Learning Rate": 2.90088385587875e-07, "Pretrain/Loss": 1.9611177444458008, "Pretrain/Loss (Raw)": 1.7752023935317993, "Pretrain/Step": 18175, "Pretrain/Step Time": 8.461010184139013} +{"Pretrain/Learning Rate": 2.894439176261865e-07, "Pretrain/Loss": 1.9603018760681152, "Pretrain/Loss (Raw)": 1.9982482194900513, "Pretrain/Step": 18176, "Pretrain/Step Time": 8.45984023064375} +{"Pretrain/Learning Rate": 2.888001621759617e-07, "Pretrain/Loss": 1.9556735754013062, "Pretrain/Loss (Raw)": 1.8502744436264038, "Pretrain/Step": 18177, "Pretrain/Step Time": 8.458684390410781} +{"Pretrain/Learning Rate": 2.881571192557636e-07, "Pretrain/Loss": 1.9554712772369385, "Pretrain/Loss (Raw)": 1.7712819576263428, "Pretrain/Step": 18178, "Pretrain/Step Time": 8.4594467561692} +{"Pretrain/Learning Rate": 2.8751478888413285e-07, "Pretrain/Loss": 1.9553587436676025, "Pretrain/Loss (Raw)": 1.874250054359436, "Pretrain/Step": 18179, "Pretrain/Step Time": 8.45821082778275} +{"Pretrain/Learning Rate": 2.8687317107959356e-07, "Pretrain/Loss": 1.9559974670410156, "Pretrain/Loss (Raw)": 1.9786773920059204, "Pretrain/Step": 18180, "Pretrain/Step Time": 8.451012236997485} +{"Pretrain/Learning Rate": 2.8623226586064757e-07, "Pretrain/Loss": 1.957390546798706, "Pretrain/Loss (Raw)": 2.133599281311035, "Pretrain/Step": 18181, "Pretrain/Step Time": 8.453171011060476} +{"Pretrain/Learning Rate": 2.85592073245769e-07, "Pretrain/Loss": 1.9589539766311646, "Pretrain/Loss (Raw)": 2.076460123062134, "Pretrain/Step": 18182, "Pretrain/Step Time": 8.452359838411212} +{"Pretrain/Learning Rate": 2.849525932534208e-07, "Pretrain/Loss": 1.957977294921875, "Pretrain/Loss (Raw)": 1.9886953830718994, "Pretrain/Step": 18183, "Pretrain/Step Time": 8.455442782491446} +{"Pretrain/Learning Rate": 2.8431382590204116e-07, "Pretrain/Loss": 1.9548158645629883, "Pretrain/Loss (Raw)": 1.6171263456344604, "Pretrain/Step": 18184, "Pretrain/Step Time": 8.457981321960688} +{"Pretrain/Learning Rate": 2.836757712100485e-07, "Pretrain/Loss": 1.952624797821045, "Pretrain/Loss (Raw)": 1.8321439027786255, "Pretrain/Step": 18185, "Pretrain/Step Time": 8.456749249249697} +{"Pretrain/Learning Rate": 2.830384291958421e-07, "Pretrain/Loss": 1.9531182050704956, "Pretrain/Loss (Raw)": 1.911149501800537, "Pretrain/Step": 18186, "Pretrain/Step Time": 8.458458252251148} +{"Pretrain/Learning Rate": 2.8240179987779893e-07, "Pretrain/Loss": 1.951192855834961, "Pretrain/Loss (Raw)": 1.9229135513305664, "Pretrain/Step": 18187, "Pretrain/Step Time": 8.453791568055749} +{"Pretrain/Learning Rate": 2.8176588327427367e-07, "Pretrain/Loss": 1.9528818130493164, "Pretrain/Loss (Raw)": 2.1047239303588867, "Pretrain/Step": 18188, "Pretrain/Step Time": 8.456835810095072} +{"Pretrain/Learning Rate": 2.811306794036045e-07, "Pretrain/Loss": 1.9494601488113403, "Pretrain/Loss (Raw)": 1.826656699180603, "Pretrain/Step": 18189, "Pretrain/Step Time": 8.4592562969774} +{"Pretrain/Learning Rate": 2.8049618828411004e-07, "Pretrain/Loss": 1.9500728845596313, "Pretrain/Loss (Raw)": 2.1812081336975098, "Pretrain/Step": 18190, "Pretrain/Step Time": 8.462701624259353} +{"Pretrain/Learning Rate": 2.798624099340785e-07, "Pretrain/Loss": 1.9501256942749023, "Pretrain/Loss (Raw)": 1.7388769388198853, "Pretrain/Step": 18191, "Pretrain/Step Time": 8.465555554255843} +{"Pretrain/Learning Rate": 2.7922934437178695e-07, "Pretrain/Loss": 1.950764536857605, "Pretrain/Loss (Raw)": 2.1579337120056152, "Pretrain/Step": 18192, "Pretrain/Step Time": 8.462693352252245} +{"Pretrain/Learning Rate": 2.785969916154929e-07, "Pretrain/Loss": 1.947108507156372, "Pretrain/Loss (Raw)": 1.6996591091156006, "Pretrain/Step": 18193, "Pretrain/Step Time": 8.458918239921331} +{"Pretrain/Learning Rate": 2.779653516834235e-07, "Pretrain/Loss": 1.9479091167449951, "Pretrain/Loss (Raw)": 2.083164930343628, "Pretrain/Step": 18194, "Pretrain/Step Time": 8.462107451632619} +{"Pretrain/Learning Rate": 2.7733442459379754e-07, "Pretrain/Loss": 1.9443817138671875, "Pretrain/Loss (Raw)": 1.8193081617355347, "Pretrain/Step": 18195, "Pretrain/Step Time": 8.462592834606767} +{"Pretrain/Learning Rate": 2.76704210364806e-07, "Pretrain/Loss": 1.9451016187667847, "Pretrain/Loss (Raw)": 2.1116738319396973, "Pretrain/Step": 18196, "Pretrain/Step Time": 8.458564227446914} +{"Pretrain/Learning Rate": 2.760747090146176e-07, "Pretrain/Loss": 1.942276954650879, "Pretrain/Loss (Raw)": 1.7291345596313477, "Pretrain/Step": 18197, "Pretrain/Step Time": 8.459271194413304} +{"Pretrain/Learning Rate": 2.754459205613874e-07, "Pretrain/Loss": 1.9408122301101685, "Pretrain/Loss (Raw)": 1.9630898237228394, "Pretrain/Step": 18198, "Pretrain/Step Time": 8.462871596217155} +{"Pretrain/Learning Rate": 2.7481784502324246e-07, "Pretrain/Loss": 1.9405460357666016, "Pretrain/Loss (Raw)": 2.0376744270324707, "Pretrain/Step": 18199, "Pretrain/Step Time": 8.458408389240503} +{"Pretrain/Learning Rate": 2.741904824182989e-07, "Pretrain/Loss": 1.9406428337097168, "Pretrain/Loss (Raw)": 1.7467632293701172, "Pretrain/Step": 18200, "Pretrain/Step Time": 8.461376948282123} +{"Pretrain/Learning Rate": 2.735638327646367e-07, "Pretrain/Loss": 1.9413073062896729, "Pretrain/Loss (Raw)": 1.9449234008789062, "Pretrain/Step": 18201, "Pretrain/Step Time": 8.459628500044346} +{"Pretrain/Learning Rate": 2.7293789608033583e-07, "Pretrain/Loss": 1.9446356296539307, "Pretrain/Loss (Raw)": 2.194720983505249, "Pretrain/Step": 18202, "Pretrain/Step Time": 8.464615438133478} +{"Pretrain/Learning Rate": 2.723126723834374e-07, "Pretrain/Loss": 1.9449156522750854, "Pretrain/Loss (Raw)": 2.005765438079834, "Pretrain/Step": 18203, "Pretrain/Step Time": 8.456671563908458} +{"Pretrain/Learning Rate": 2.7168816169196866e-07, "Pretrain/Loss": 1.9492623805999756, "Pretrain/Loss (Raw)": 2.269955635070801, "Pretrain/Step": 18204, "Pretrain/Step Time": 8.458598148077726} +{"Pretrain/Learning Rate": 2.7106436402394297e-07, "Pretrain/Loss": 1.9495728015899658, "Pretrain/Loss (Raw)": 2.0948047637939453, "Pretrain/Step": 18205, "Pretrain/Step Time": 8.461053056642413} +{"Pretrain/Learning Rate": 2.704412793973404e-07, "Pretrain/Loss": 1.9459948539733887, "Pretrain/Loss (Raw)": 1.628639817237854, "Pretrain/Step": 18206, "Pretrain/Step Time": 8.46682464517653} +{"Pretrain/Learning Rate": 2.6981890783013276e-07, "Pretrain/Loss": 1.946649432182312, "Pretrain/Loss (Raw)": 2.164491653442383, "Pretrain/Step": 18207, "Pretrain/Step Time": 8.467753492295742} +{"Pretrain/Learning Rate": 2.6919724934026116e-07, "Pretrain/Loss": 1.9493086338043213, "Pretrain/Loss (Raw)": 2.118053436279297, "Pretrain/Step": 18208, "Pretrain/Step Time": 8.472284965217113} +{"Pretrain/Learning Rate": 2.685763039456529e-07, "Pretrain/Loss": 1.9503083229064941, "Pretrain/Loss (Raw)": 2.1158041954040527, "Pretrain/Step": 18209, "Pretrain/Step Time": 8.4730841293931} +{"Pretrain/Learning Rate": 2.67956071664216e-07, "Pretrain/Loss": 1.9514331817626953, "Pretrain/Loss (Raw)": 1.9142239093780518, "Pretrain/Step": 18210, "Pretrain/Step Time": 8.472770491614938} +{"Pretrain/Learning Rate": 2.673365525138277e-07, "Pretrain/Loss": 1.950959324836731, "Pretrain/Loss (Raw)": 1.991416573524475, "Pretrain/Step": 18211, "Pretrain/Step Time": 8.47516748122871} +{"Pretrain/Learning Rate": 2.6671774651235437e-07, "Pretrain/Loss": 1.9521666765213013, "Pretrain/Loss (Raw)": 1.9926248788833618, "Pretrain/Step": 18212, "Pretrain/Step Time": 8.477581355720758} +{"Pretrain/Learning Rate": 2.6609965367764e-07, "Pretrain/Loss": 1.951151728630066, "Pretrain/Loss (Raw)": 1.8590744733810425, "Pretrain/Step": 18213, "Pretrain/Step Time": 8.477219996973872} +{"Pretrain/Learning Rate": 2.6548227402750645e-07, "Pretrain/Loss": 1.9593091011047363, "Pretrain/Loss (Raw)": 2.745365858078003, "Pretrain/Step": 18214, "Pretrain/Step Time": 8.478359945118427} +{"Pretrain/Learning Rate": 2.648656075797534e-07, "Pretrain/Loss": 1.9618122577667236, "Pretrain/Loss (Raw)": 1.9431769847869873, "Pretrain/Step": 18215, "Pretrain/Step Time": 8.473363790661097} +{"Pretrain/Learning Rate": 2.6424965435216386e-07, "Pretrain/Loss": 1.9585000276565552, "Pretrain/Loss (Raw)": 1.9036078453063965, "Pretrain/Step": 18216, "Pretrain/Step Time": 8.472754361107945} +{"Pretrain/Learning Rate": 2.6363441436249856e-07, "Pretrain/Loss": 1.9578514099121094, "Pretrain/Loss (Raw)": 2.0086188316345215, "Pretrain/Step": 18217, "Pretrain/Step Time": 8.470869340002537} +{"Pretrain/Learning Rate": 2.6301988762849617e-07, "Pretrain/Loss": 1.9570708274841309, "Pretrain/Loss (Raw)": 1.8686225414276123, "Pretrain/Step": 18218, "Pretrain/Step Time": 8.472058292478323} +{"Pretrain/Learning Rate": 2.624060741678785e-07, "Pretrain/Loss": 1.9580259323120117, "Pretrain/Loss (Raw)": 2.0305466651916504, "Pretrain/Step": 18219, "Pretrain/Step Time": 8.470769617706537} +{"Pretrain/Learning Rate": 2.617929739983427e-07, "Pretrain/Loss": 1.9593963623046875, "Pretrain/Loss (Raw)": 2.0037429332733154, "Pretrain/Step": 18220, "Pretrain/Step Time": 8.472117021679878} +{"Pretrain/Learning Rate": 2.611805871375633e-07, "Pretrain/Loss": 1.9640257358551025, "Pretrain/Loss (Raw)": 2.1256182193756104, "Pretrain/Step": 18221, "Pretrain/Step Time": 8.468609431758523} +{"Pretrain/Learning Rate": 2.605689136032069e-07, "Pretrain/Loss": 1.9643281698226929, "Pretrain/Loss (Raw)": 1.9645112752914429, "Pretrain/Step": 18222, "Pretrain/Step Time": 8.469731200486422} +{"Pretrain/Learning Rate": 2.599579534129037e-07, "Pretrain/Loss": 1.9665932655334473, "Pretrain/Loss (Raw)": 1.9975560903549194, "Pretrain/Step": 18223, "Pretrain/Step Time": 8.473777685314417} +{"Pretrain/Learning Rate": 2.593477065842703e-07, "Pretrain/Loss": 1.9663355350494385, "Pretrain/Loss (Raw)": 1.8658301830291748, "Pretrain/Step": 18224, "Pretrain/Step Time": 8.474780566990376} +{"Pretrain/Learning Rate": 2.587381731349092e-07, "Pretrain/Loss": 1.9667134284973145, "Pretrain/Loss (Raw)": 2.007007598876953, "Pretrain/Step": 18225, "Pretrain/Step Time": 8.474835464730859} +{"Pretrain/Learning Rate": 2.5812935308238696e-07, "Pretrain/Loss": 1.9723931550979614, "Pretrain/Loss (Raw)": 1.8843364715576172, "Pretrain/Step": 18226, "Pretrain/Step Time": 8.475549617782235} +{"Pretrain/Learning Rate": 2.575212464442672e-07, "Pretrain/Loss": 1.96983802318573, "Pretrain/Loss (Raw)": 1.9307879209518433, "Pretrain/Step": 18227, "Pretrain/Step Time": 8.472628820687532} +{"Pretrain/Learning Rate": 2.569138532380777e-07, "Pretrain/Loss": 1.9699151515960693, "Pretrain/Loss (Raw)": 1.8562923669815063, "Pretrain/Step": 18228, "Pretrain/Step Time": 8.470840848982334} +{"Pretrain/Learning Rate": 2.5630717348133215e-07, "Pretrain/Loss": 1.9691267013549805, "Pretrain/Loss (Raw)": 2.01336407661438, "Pretrain/Step": 18229, "Pretrain/Step Time": 8.473954822868109} +{"Pretrain/Learning Rate": 2.5570120719153043e-07, "Pretrain/Loss": 1.9702510833740234, "Pretrain/Loss (Raw)": 2.099730968475342, "Pretrain/Step": 18230, "Pretrain/Step Time": 8.471521887928247} +{"Pretrain/Learning Rate": 2.550959543861364e-07, "Pretrain/Loss": 1.9687575101852417, "Pretrain/Loss (Raw)": 1.9243570566177368, "Pretrain/Step": 18231, "Pretrain/Step Time": 8.469018381088972} +{"Pretrain/Learning Rate": 2.544914150826111e-07, "Pretrain/Loss": 1.9674224853515625, "Pretrain/Loss (Raw)": 1.7741315364837646, "Pretrain/Step": 18232, "Pretrain/Step Time": 8.469144051894546} +{"Pretrain/Learning Rate": 2.538875892983794e-07, "Pretrain/Loss": 1.9719610214233398, "Pretrain/Loss (Raw)": 2.4237258434295654, "Pretrain/Step": 18233, "Pretrain/Step Time": 8.473142487928271} +{"Pretrain/Learning Rate": 2.5328447705085246e-07, "Pretrain/Loss": 1.970352053642273, "Pretrain/Loss (Raw)": 2.014292001724243, "Pretrain/Step": 18234, "Pretrain/Step Time": 8.479735990986228} +{"Pretrain/Learning Rate": 2.5268207835742464e-07, "Pretrain/Loss": 1.9717408418655396, "Pretrain/Loss (Raw)": 1.9600300788879395, "Pretrain/Step": 18235, "Pretrain/Step Time": 8.47395258396864} +{"Pretrain/Learning Rate": 2.5208039323546263e-07, "Pretrain/Loss": 1.9730348587036133, "Pretrain/Loss (Raw)": 1.9044321775436401, "Pretrain/Step": 18236, "Pretrain/Step Time": 8.473537910729647} +{"Pretrain/Learning Rate": 2.514794217023164e-07, "Pretrain/Loss": 1.9734699726104736, "Pretrain/Loss (Raw)": 2.025855779647827, "Pretrain/Step": 18237, "Pretrain/Step Time": 8.473475156351924} +{"Pretrain/Learning Rate": 2.5087916377531664e-07, "Pretrain/Loss": 1.9727299213409424, "Pretrain/Loss (Raw)": 1.9641673564910889, "Pretrain/Step": 18238, "Pretrain/Step Time": 8.473142962902784} +{"Pretrain/Learning Rate": 2.5027961947176605e-07, "Pretrain/Loss": 1.9686286449432373, "Pretrain/Loss (Raw)": 1.7870548963546753, "Pretrain/Step": 18239, "Pretrain/Step Time": 8.475311106070876} +{"Pretrain/Learning Rate": 2.496807888089564e-07, "Pretrain/Loss": 1.9685786962509155, "Pretrain/Loss (Raw)": 2.017957925796509, "Pretrain/Step": 18240, "Pretrain/Step Time": 8.476024858653545} +{"Pretrain/Learning Rate": 2.490826718041517e-07, "Pretrain/Loss": 1.969287633895874, "Pretrain/Loss (Raw)": 2.0558111667633057, "Pretrain/Step": 18241, "Pretrain/Step Time": 8.48116903938353} +{"Pretrain/Learning Rate": 2.4848526847460194e-07, "Pretrain/Loss": 1.9677225351333618, "Pretrain/Loss (Raw)": 1.81727135181427, "Pretrain/Step": 18242, "Pretrain/Step Time": 8.483059089630842} +{"Pretrain/Learning Rate": 2.4788857883752956e-07, "Pretrain/Loss": 1.968498706817627, "Pretrain/Loss (Raw)": 2.0838215351104736, "Pretrain/Step": 18243, "Pretrain/Step Time": 8.483329776674509} +{"Pretrain/Learning Rate": 2.47292602910143e-07, "Pretrain/Loss": 1.9676929712295532, "Pretrain/Loss (Raw)": 1.8822617530822754, "Pretrain/Step": 18244, "Pretrain/Step Time": 8.483961997553706} +{"Pretrain/Learning Rate": 2.4669734070962567e-07, "Pretrain/Loss": 1.9675474166870117, "Pretrain/Loss (Raw)": 1.802701711654663, "Pretrain/Step": 18245, "Pretrain/Step Time": 8.480259438976645} +{"Pretrain/Learning Rate": 2.4610279225313614e-07, "Pretrain/Loss": 1.9687649011611938, "Pretrain/Loss (Raw)": 2.0227603912353516, "Pretrain/Step": 18246, "Pretrain/Step Time": 8.484129842370749} +{"Pretrain/Learning Rate": 2.4550895755782457e-07, "Pretrain/Loss": 1.9678146839141846, "Pretrain/Loss (Raw)": 1.9262405633926392, "Pretrain/Step": 18247, "Pretrain/Step Time": 8.476084044203162} +{"Pretrain/Learning Rate": 2.4491583664081053e-07, "Pretrain/Loss": 1.96677827835083, "Pretrain/Loss (Raw)": 1.8856884241104126, "Pretrain/Step": 18248, "Pretrain/Step Time": 8.47492858581245} +{"Pretrain/Learning Rate": 2.4432342951919986e-07, "Pretrain/Loss": 1.9703426361083984, "Pretrain/Loss (Raw)": 2.263664960861206, "Pretrain/Step": 18249, "Pretrain/Step Time": 8.474160173907876} +{"Pretrain/Learning Rate": 2.437317362100705e-07, "Pretrain/Loss": 1.967724323272705, "Pretrain/Loss (Raw)": 1.9409291744232178, "Pretrain/Step": 18250, "Pretrain/Step Time": 8.478125670924783} +{"Pretrain/Learning Rate": 2.431407567304811e-07, "Pretrain/Loss": 1.9698870182037354, "Pretrain/Loss (Raw)": 2.0812716484069824, "Pretrain/Step": 18251, "Pretrain/Step Time": 8.477814195677638} +{"Pretrain/Learning Rate": 2.425504910974791e-07, "Pretrain/Loss": 1.9725542068481445, "Pretrain/Loss (Raw)": 2.136225700378418, "Pretrain/Step": 18252, "Pretrain/Step Time": 8.480906644836068} +{"Pretrain/Learning Rate": 2.419609393280786e-07, "Pretrain/Loss": 1.973984956741333, "Pretrain/Loss (Raw)": 2.178600311279297, "Pretrain/Step": 18253, "Pretrain/Step Time": 8.477362211793661} +{"Pretrain/Learning Rate": 2.4137210143928277e-07, "Pretrain/Loss": 1.9724125862121582, "Pretrain/Loss (Raw)": 1.9598851203918457, "Pretrain/Step": 18254, "Pretrain/Step Time": 8.480543037876487} +{"Pretrain/Learning Rate": 2.4078397744806967e-07, "Pretrain/Loss": 1.9730713367462158, "Pretrain/Loss (Raw)": 2.1674277782440186, "Pretrain/Step": 18255, "Pretrain/Step Time": 8.478448450565338} +{"Pretrain/Learning Rate": 2.401965673713952e-07, "Pretrain/Loss": 1.9739899635314941, "Pretrain/Loss (Raw)": 2.0223476886749268, "Pretrain/Step": 18256, "Pretrain/Step Time": 8.481766698881984} +{"Pretrain/Learning Rate": 2.396098712261985e-07, "Pretrain/Loss": 1.9737635850906372, "Pretrain/Loss (Raw)": 1.9608808755874634, "Pretrain/Step": 18257, "Pretrain/Step Time": 8.483670571818948} +{"Pretrain/Learning Rate": 2.390238890293939e-07, "Pretrain/Loss": 1.9731690883636475, "Pretrain/Loss (Raw)": 1.8744654655456543, "Pretrain/Step": 18258, "Pretrain/Step Time": 8.483140155673027} +{"Pretrain/Learning Rate": 2.384386207978817e-07, "Pretrain/Loss": 1.9716107845306396, "Pretrain/Loss (Raw)": 1.7709370851516724, "Pretrain/Step": 18259, "Pretrain/Step Time": 8.481677945703268} +{"Pretrain/Learning Rate": 2.3785406654853738e-07, "Pretrain/Loss": 1.9745392799377441, "Pretrain/Loss (Raw)": 2.1830437183380127, "Pretrain/Step": 18260, "Pretrain/Step Time": 8.484484078362584} +{"Pretrain/Learning Rate": 2.3727022629821405e-07, "Pretrain/Loss": 1.9735559225082397, "Pretrain/Loss (Raw)": 1.8930168151855469, "Pretrain/Step": 18261, "Pretrain/Step Time": 8.485102087259293} +{"Pretrain/Learning Rate": 2.3668710006374828e-07, "Pretrain/Loss": 1.9743821620941162, "Pretrain/Loss (Raw)": 2.290358543395996, "Pretrain/Step": 18262, "Pretrain/Step Time": 8.48497305624187} +{"Pretrain/Learning Rate": 2.3610468786194884e-07, "Pretrain/Loss": 1.9759411811828613, "Pretrain/Loss (Raw)": 2.066581964492798, "Pretrain/Step": 18263, "Pretrain/Step Time": 8.480950314551592} +{"Pretrain/Learning Rate": 2.3552298970961895e-07, "Pretrain/Loss": 1.9761924743652344, "Pretrain/Loss (Raw)": 1.7794238328933716, "Pretrain/Step": 18264, "Pretrain/Step Time": 8.480309568345547} +{"Pretrain/Learning Rate": 2.3494200562352298e-07, "Pretrain/Loss": 1.97784423828125, "Pretrain/Loss (Raw)": 2.10080623626709, "Pretrain/Step": 18265, "Pretrain/Step Time": 8.482927115634084} +{"Pretrain/Learning Rate": 2.343617356204142e-07, "Pretrain/Loss": 1.9814661741256714, "Pretrain/Loss (Raw)": 2.1246182918548584, "Pretrain/Step": 18266, "Pretrain/Step Time": 8.481974771246314} +{"Pretrain/Learning Rate": 2.337821797170292e-07, "Pretrain/Loss": 1.980944037437439, "Pretrain/Loss (Raw)": 1.9941478967666626, "Pretrain/Step": 18267, "Pretrain/Step Time": 8.488278113305569} +{"Pretrain/Learning Rate": 2.332033379300741e-07, "Pretrain/Loss": 1.980257272720337, "Pretrain/Loss (Raw)": 2.0111494064331055, "Pretrain/Step": 18268, "Pretrain/Step Time": 8.488227495923638} +{"Pretrain/Learning Rate": 2.3262521027624384e-07, "Pretrain/Loss": 1.9823272228240967, "Pretrain/Loss (Raw)": 1.944984793663025, "Pretrain/Step": 18269, "Pretrain/Step Time": 8.483946982771158} +{"Pretrain/Learning Rate": 2.320477967722029e-07, "Pretrain/Loss": 1.9829556941986084, "Pretrain/Loss (Raw)": 1.898804783821106, "Pretrain/Step": 18270, "Pretrain/Step Time": 8.482537906616926} +{"Pretrain/Learning Rate": 2.314710974346046e-07, "Pretrain/Loss": 1.9827680587768555, "Pretrain/Loss (Raw)": 1.9477803707122803, "Pretrain/Step": 18271, "Pretrain/Step Time": 8.482175894081593} +{"Pretrain/Learning Rate": 2.308951122800773e-07, "Pretrain/Loss": 1.9810278415679932, "Pretrain/Loss (Raw)": 2.072255849838257, "Pretrain/Step": 18272, "Pretrain/Step Time": 8.48330063931644} +{"Pretrain/Learning Rate": 2.303198413252272e-07, "Pretrain/Loss": 1.9817661046981812, "Pretrain/Loss (Raw)": 1.9558284282684326, "Pretrain/Step": 18273, "Pretrain/Step Time": 8.484782570973039} +{"Pretrain/Learning Rate": 2.297452845866438e-07, "Pretrain/Loss": 1.980069637298584, "Pretrain/Loss (Raw)": 1.8450696468353271, "Pretrain/Step": 18274, "Pretrain/Step Time": 8.487102722749114} +{"Pretrain/Learning Rate": 2.2917144208089437e-07, "Pretrain/Loss": 1.9805811643600464, "Pretrain/Loss (Raw)": 2.058485507965088, "Pretrain/Step": 18275, "Pretrain/Step Time": 8.487982405349612} +{"Pretrain/Learning Rate": 2.2859831382452402e-07, "Pretrain/Loss": 1.9815192222595215, "Pretrain/Loss (Raw)": 2.189229726791382, "Pretrain/Step": 18276, "Pretrain/Step Time": 8.487760724499822} +{"Pretrain/Learning Rate": 2.2802589983405565e-07, "Pretrain/Loss": 1.9796092510223389, "Pretrain/Loss (Raw)": 1.7738195657730103, "Pretrain/Step": 18277, "Pretrain/Step Time": 8.48464652709663} +{"Pretrain/Learning Rate": 2.2745420012599827e-07, "Pretrain/Loss": 1.9793798923492432, "Pretrain/Loss (Raw)": 1.9770557880401611, "Pretrain/Step": 18278, "Pretrain/Step Time": 8.489988535642624} +{"Pretrain/Learning Rate": 2.268832147168387e-07, "Pretrain/Loss": 1.9779354333877563, "Pretrain/Loss (Raw)": 1.8708535432815552, "Pretrain/Step": 18279, "Pretrain/Step Time": 8.488511864095926} +{"Pretrain/Learning Rate": 2.2631294362303323e-07, "Pretrain/Loss": 1.9761312007904053, "Pretrain/Loss (Raw)": 1.8888872861862183, "Pretrain/Step": 18280, "Pretrain/Step Time": 8.490866189822555} +{"Pretrain/Learning Rate": 2.2574338686103258e-07, "Pretrain/Loss": 1.9785304069519043, "Pretrain/Loss (Raw)": 2.0881128311157227, "Pretrain/Step": 18281, "Pretrain/Step Time": 8.491137705743313} +{"Pretrain/Learning Rate": 2.2517454444725694e-07, "Pretrain/Loss": 1.9802584648132324, "Pretrain/Loss (Raw)": 2.071345806121826, "Pretrain/Step": 18282, "Pretrain/Step Time": 8.490377526730299} +{"Pretrain/Learning Rate": 2.246064163981071e-07, "Pretrain/Loss": 1.980644702911377, "Pretrain/Loss (Raw)": 2.0121614933013916, "Pretrain/Step": 18283, "Pretrain/Step Time": 8.49046130105853} +{"Pretrain/Learning Rate": 2.2403900272996436e-07, "Pretrain/Loss": 1.9804894924163818, "Pretrain/Loss (Raw)": 1.9110894203186035, "Pretrain/Step": 18284, "Pretrain/Step Time": 8.491750748828053} +{"Pretrain/Learning Rate": 2.2347230345919347e-07, "Pretrain/Loss": 1.982398271560669, "Pretrain/Loss (Raw)": 1.944760799407959, "Pretrain/Step": 18285, "Pretrain/Step Time": 8.491789262741804} +{"Pretrain/Learning Rate": 2.229063186021313e-07, "Pretrain/Loss": 1.9835350513458252, "Pretrain/Loss (Raw)": 2.042745590209961, "Pretrain/Step": 18286, "Pretrain/Step Time": 8.488187531009316} +{"Pretrain/Learning Rate": 2.2234104817510093e-07, "Pretrain/Loss": 1.9875129461288452, "Pretrain/Loss (Raw)": 2.078442335128784, "Pretrain/Step": 18287, "Pretrain/Step Time": 8.49029184319079} +{"Pretrain/Learning Rate": 2.2177649219439488e-07, "Pretrain/Loss": 1.9872727394104004, "Pretrain/Loss (Raw)": 2.270671844482422, "Pretrain/Step": 18288, "Pretrain/Step Time": 8.48902047611773} +{"Pretrain/Learning Rate": 2.2121265067630015e-07, "Pretrain/Loss": 1.9874827861785889, "Pretrain/Loss (Raw)": 1.9359824657440186, "Pretrain/Step": 18289, "Pretrain/Step Time": 8.492694482207298} +{"Pretrain/Learning Rate": 2.2064952363706759e-07, "Pretrain/Loss": 1.9871615171432495, "Pretrain/Loss (Raw)": 2.051669120788574, "Pretrain/Step": 18290, "Pretrain/Step Time": 8.493080958724022} +{"Pretrain/Learning Rate": 2.2008711109293977e-07, "Pretrain/Loss": 1.9876971244812012, "Pretrain/Loss (Raw)": 2.1817853450775146, "Pretrain/Step": 18291, "Pretrain/Step Time": 8.492636278271675} +{"Pretrain/Learning Rate": 2.1952541306013152e-07, "Pretrain/Loss": 1.987080693244934, "Pretrain/Loss (Raw)": 1.8918718099594116, "Pretrain/Step": 18292, "Pretrain/Step Time": 8.495706314221025} +{"Pretrain/Learning Rate": 2.189644295548382e-07, "Pretrain/Loss": 1.9871935844421387, "Pretrain/Loss (Raw)": 1.9305421113967896, "Pretrain/Step": 18293, "Pretrain/Step Time": 8.494599718600512} +{"Pretrain/Learning Rate": 2.1840416059323575e-07, "Pretrain/Loss": 1.9874541759490967, "Pretrain/Loss (Raw)": 2.0319175720214844, "Pretrain/Step": 18294, "Pretrain/Step Time": 8.492809120565653} +{"Pretrain/Learning Rate": 2.1784460619148072e-07, "Pretrain/Loss": 1.9878312349319458, "Pretrain/Loss (Raw)": 2.0539705753326416, "Pretrain/Step": 18295, "Pretrain/Step Time": 8.494050066918135} +{"Pretrain/Learning Rate": 2.1728576636570462e-07, "Pretrain/Loss": 1.9869836568832397, "Pretrain/Loss (Raw)": 2.007207155227661, "Pretrain/Step": 18296, "Pretrain/Step Time": 8.489705776795745} +{"Pretrain/Learning Rate": 2.1672764113202515e-07, "Pretrain/Loss": 1.987944483757019, "Pretrain/Loss (Raw)": 2.100661277770996, "Pretrain/Step": 18297, "Pretrain/Step Time": 8.489905735477805} +{"Pretrain/Learning Rate": 2.161702305065294e-07, "Pretrain/Loss": 1.9862964153289795, "Pretrain/Loss (Raw)": 1.6968790292739868, "Pretrain/Step": 18298, "Pretrain/Step Time": 8.492993095889688} +{"Pretrain/Learning Rate": 2.156135345052962e-07, "Pretrain/Loss": 1.9862124919891357, "Pretrain/Loss (Raw)": 1.9260672330856323, "Pretrain/Step": 18299, "Pretrain/Step Time": 8.494906600564718} +{"Pretrain/Learning Rate": 2.1505755314437381e-07, "Pretrain/Loss": 1.9869155883789062, "Pretrain/Loss (Raw)": 2.1150548458099365, "Pretrain/Step": 18300, "Pretrain/Step Time": 8.497137870639563} +{"Pretrain/Learning Rate": 2.1450228643979663e-07, "Pretrain/Loss": 1.9845871925354004, "Pretrain/Loss (Raw)": 1.857704997062683, "Pretrain/Step": 18301, "Pretrain/Step Time": 8.495167875662446} +{"Pretrain/Learning Rate": 2.139477344075713e-07, "Pretrain/Loss": 1.9854481220245361, "Pretrain/Loss (Raw)": 1.9682115316390991, "Pretrain/Step": 18302, "Pretrain/Step Time": 8.500130370259285} +{"Pretrain/Learning Rate": 2.133938970636906e-07, "Pretrain/Loss": 1.9870660305023193, "Pretrain/Loss (Raw)": 1.9822965860366821, "Pretrain/Step": 18303, "Pretrain/Step Time": 8.491852015256882} +{"Pretrain/Learning Rate": 2.128407744241251e-07, "Pretrain/Loss": 1.986022710800171, "Pretrain/Loss (Raw)": 1.864707112312317, "Pretrain/Step": 18304, "Pretrain/Step Time": 8.496055155992508} +{"Pretrain/Learning Rate": 2.122883665048203e-07, "Pretrain/Loss": 1.9871717691421509, "Pretrain/Loss (Raw)": 1.9973385334014893, "Pretrain/Step": 18305, "Pretrain/Step Time": 8.492279658094049} +{"Pretrain/Learning Rate": 2.1173667332170522e-07, "Pretrain/Loss": 1.988370418548584, "Pretrain/Loss (Raw)": 1.924712061882019, "Pretrain/Step": 18306, "Pretrain/Step Time": 8.49386196397245} +{"Pretrain/Learning Rate": 2.1118569489069207e-07, "Pretrain/Loss": 1.9889123439788818, "Pretrain/Loss (Raw)": 1.9436064958572388, "Pretrain/Step": 18307, "Pretrain/Step Time": 8.502244809642434} +{"Pretrain/Learning Rate": 2.1063543122765983e-07, "Pretrain/Loss": 1.9892120361328125, "Pretrain/Loss (Raw)": 2.0170507431030273, "Pretrain/Step": 18308, "Pretrain/Step Time": 8.503440294414759} +{"Pretrain/Learning Rate": 2.100858823484847e-07, "Pretrain/Loss": 1.9883861541748047, "Pretrain/Loss (Raw)": 2.027880907058716, "Pretrain/Step": 18309, "Pretrain/Step Time": 8.502577425912023} +{"Pretrain/Learning Rate": 2.09537048269004e-07, "Pretrain/Loss": 1.9877452850341797, "Pretrain/Loss (Raw)": 1.994437336921692, "Pretrain/Step": 18310, "Pretrain/Step Time": 8.502083119004965} +{"Pretrain/Learning Rate": 2.0898892900504673e-07, "Pretrain/Loss": 1.9870556592941284, "Pretrain/Loss (Raw)": 1.9004203081130981, "Pretrain/Step": 18311, "Pretrain/Step Time": 8.503221752122045} +{"Pretrain/Learning Rate": 2.0844152457241695e-07, "Pretrain/Loss": 1.9904365539550781, "Pretrain/Loss (Raw)": 2.049880266189575, "Pretrain/Step": 18312, "Pretrain/Step Time": 8.497150449082255} +{"Pretrain/Learning Rate": 2.078948349868992e-07, "Pretrain/Loss": 1.9922624826431274, "Pretrain/Loss (Raw)": 2.065868854522705, "Pretrain/Step": 18313, "Pretrain/Step Time": 8.4987120218575} +{"Pretrain/Learning Rate": 2.073488602642587e-07, "Pretrain/Loss": 1.99380362033844, "Pretrain/Loss (Raw)": 2.1084015369415283, "Pretrain/Step": 18314, "Pretrain/Step Time": 8.496440198272467} +{"Pretrain/Learning Rate": 2.0680360042023283e-07, "Pretrain/Loss": 1.9938361644744873, "Pretrain/Loss (Raw)": 1.9270869493484497, "Pretrain/Step": 18315, "Pretrain/Step Time": 8.499268922954798} +{"Pretrain/Learning Rate": 2.0625905547055069e-07, "Pretrain/Loss": 1.9931483268737793, "Pretrain/Loss (Raw)": 2.0166797637939453, "Pretrain/Step": 18316, "Pretrain/Step Time": 8.498493248596787} +{"Pretrain/Learning Rate": 2.0571522543090526e-07, "Pretrain/Loss": 1.9944863319396973, "Pretrain/Loss (Raw)": 1.997916340827942, "Pretrain/Step": 18317, "Pretrain/Step Time": 8.498294621706009} +{"Pretrain/Learning Rate": 2.051721103169868e-07, "Pretrain/Loss": 1.992809772491455, "Pretrain/Loss (Raw)": 1.9666047096252441, "Pretrain/Step": 18318, "Pretrain/Step Time": 8.493640473112464} +{"Pretrain/Learning Rate": 2.0462971014444943e-07, "Pretrain/Loss": 1.9955781698226929, "Pretrain/Loss (Raw)": 2.0932459831237793, "Pretrain/Step": 18319, "Pretrain/Step Time": 8.49560314975679} +{"Pretrain/Learning Rate": 2.040880249289362e-07, "Pretrain/Loss": 1.9950189590454102, "Pretrain/Loss (Raw)": 2.0863640308380127, "Pretrain/Step": 18320, "Pretrain/Step Time": 8.49516779743135} +{"Pretrain/Learning Rate": 2.0354705468606516e-07, "Pretrain/Loss": 1.9971622228622437, "Pretrain/Loss (Raw)": 1.973987102508545, "Pretrain/Step": 18321, "Pretrain/Step Time": 8.495094522833824} +{"Pretrain/Learning Rate": 2.0300679943143218e-07, "Pretrain/Loss": 1.9957741498947144, "Pretrain/Loss (Raw)": 1.9054762125015259, "Pretrain/Step": 18322, "Pretrain/Step Time": 8.489243481308222} +{"Pretrain/Learning Rate": 2.0246725918061926e-07, "Pretrain/Loss": 1.9972814321517944, "Pretrain/Loss (Raw)": 2.0122463703155518, "Pretrain/Step": 18323, "Pretrain/Step Time": 8.492541084066033} +{"Pretrain/Learning Rate": 2.0192843394918058e-07, "Pretrain/Loss": 1.9951748847961426, "Pretrain/Loss (Raw)": 1.8420425653457642, "Pretrain/Step": 18324, "Pretrain/Step Time": 8.49374627880752} +{"Pretrain/Learning Rate": 2.0139032375265377e-07, "Pretrain/Loss": 1.9966163635253906, "Pretrain/Loss (Raw)": 1.9136329889297485, "Pretrain/Step": 18325, "Pretrain/Step Time": 8.492431782186031} +{"Pretrain/Learning Rate": 2.0085292860655691e-07, "Pretrain/Loss": 1.9978814125061035, "Pretrain/Loss (Raw)": 2.125014305114746, "Pretrain/Step": 18326, "Pretrain/Step Time": 8.492012551054358} +{"Pretrain/Learning Rate": 2.0031624852638042e-07, "Pretrain/Loss": 1.9975284337997437, "Pretrain/Loss (Raw)": 1.992505669593811, "Pretrain/Step": 18327, "Pretrain/Step Time": 8.495109679177403} +{"Pretrain/Learning Rate": 1.9978028352760637e-07, "Pretrain/Loss": 1.999624252319336, "Pretrain/Loss (Raw)": 2.015031099319458, "Pretrain/Step": 18328, "Pretrain/Step Time": 8.489493289962411} +{"Pretrain/Learning Rate": 1.992450336256807e-07, "Pretrain/Loss": 2.0000104904174805, "Pretrain/Loss (Raw)": 1.9943819046020508, "Pretrain/Step": 18329, "Pretrain/Step Time": 8.488210942596197} +{"Pretrain/Learning Rate": 1.9871049883604388e-07, "Pretrain/Loss": 1.998025894165039, "Pretrain/Loss (Raw)": 1.9406697750091553, "Pretrain/Step": 18330, "Pretrain/Step Time": 8.487450290471315} +{"Pretrain/Learning Rate": 1.9817667917410576e-07, "Pretrain/Loss": 1.9984793663024902, "Pretrain/Loss (Raw)": 2.0638091564178467, "Pretrain/Step": 18331, "Pretrain/Step Time": 8.492075545713305} +{"Pretrain/Learning Rate": 1.9764357465525684e-07, "Pretrain/Loss": 1.995863914489746, "Pretrain/Loss (Raw)": 1.9351681470870972, "Pretrain/Step": 18332, "Pretrain/Step Time": 8.488497393205762} +{"Pretrain/Learning Rate": 1.9711118529487372e-07, "Pretrain/Loss": 1.994943618774414, "Pretrain/Loss (Raw)": 1.9770258665084839, "Pretrain/Step": 18333, "Pretrain/Step Time": 8.48677964694798} +{"Pretrain/Learning Rate": 1.9657951110830518e-07, "Pretrain/Loss": 1.9975135326385498, "Pretrain/Loss (Raw)": 1.95757257938385, "Pretrain/Step": 18334, "Pretrain/Step Time": 8.482579253613949} +{"Pretrain/Learning Rate": 1.960485521108779e-07, "Pretrain/Loss": 1.9962489604949951, "Pretrain/Loss (Raw)": 2.0026321411132812, "Pretrain/Step": 18335, "Pretrain/Step Time": 8.482380909845233} +{"Pretrain/Learning Rate": 1.955183083179074e-07, "Pretrain/Loss": 1.9942729473114014, "Pretrain/Loss (Raw)": 1.8651297092437744, "Pretrain/Step": 18336, "Pretrain/Step Time": 8.479220159351826} +{"Pretrain/Learning Rate": 1.9498877974467867e-07, "Pretrain/Loss": 1.9935868978500366, "Pretrain/Loss (Raw)": 2.0279886722564697, "Pretrain/Step": 18337, "Pretrain/Step Time": 8.480409117415547} +{"Pretrain/Learning Rate": 1.9445996640646559e-07, "Pretrain/Loss": 1.995553731918335, "Pretrain/Loss (Raw)": 2.1659634113311768, "Pretrain/Step": 18338, "Pretrain/Step Time": 8.479894423857331} +{"Pretrain/Learning Rate": 1.9393186831850873e-07, "Pretrain/Loss": 1.9952168464660645, "Pretrain/Loss (Raw)": 1.9483002424240112, "Pretrain/Step": 18339, "Pretrain/Step Time": 8.480985410511494} +{"Pretrain/Learning Rate": 1.934044854960404e-07, "Pretrain/Loss": 1.9965009689331055, "Pretrain/Loss (Raw)": 2.157017469406128, "Pretrain/Step": 18340, "Pretrain/Step Time": 8.480981983244419} +{"Pretrain/Learning Rate": 1.9287781795426786e-07, "Pretrain/Loss": 1.997565746307373, "Pretrain/Loss (Raw)": 1.9953432083129883, "Pretrain/Step": 18341, "Pretrain/Step Time": 8.480249498039484} +{"Pretrain/Learning Rate": 1.9235186570837338e-07, "Pretrain/Loss": 1.9905576705932617, "Pretrain/Loss (Raw)": 1.848341703414917, "Pretrain/Step": 18342, "Pretrain/Step Time": 8.481877254322171} +{"Pretrain/Learning Rate": 1.9182662877352543e-07, "Pretrain/Loss": 1.9896093606948853, "Pretrain/Loss (Raw)": 1.821790099143982, "Pretrain/Step": 18343, "Pretrain/Step Time": 8.483916252851486} +{"Pretrain/Learning Rate": 1.913021071648702e-07, "Pretrain/Loss": 1.9913990497589111, "Pretrain/Loss (Raw)": 2.132697582244873, "Pretrain/Step": 18344, "Pretrain/Step Time": 8.483674123883247} +{"Pretrain/Learning Rate": 1.9077830089752614e-07, "Pretrain/Loss": 1.9913766384124756, "Pretrain/Loss (Raw)": 2.0057501792907715, "Pretrain/Step": 18345, "Pretrain/Step Time": 8.482193604111671} +{"Pretrain/Learning Rate": 1.902552099866034e-07, "Pretrain/Loss": 1.9923335313796997, "Pretrain/Loss (Raw)": 1.9911006689071655, "Pretrain/Step": 18346, "Pretrain/Step Time": 8.481539750471711} +{"Pretrain/Learning Rate": 1.8973283444717882e-07, "Pretrain/Loss": 1.9926296472549438, "Pretrain/Loss (Raw)": 2.0684316158294678, "Pretrain/Step": 18347, "Pretrain/Step Time": 8.478779688477516} +{"Pretrain/Learning Rate": 1.892111742943209e-07, "Pretrain/Loss": 1.9935195446014404, "Pretrain/Loss (Raw)": 2.1176769733428955, "Pretrain/Step": 18348, "Pretrain/Step Time": 8.482774257659912} +{"Pretrain/Learning Rate": 1.886902295430676e-07, "Pretrain/Loss": 1.9935429096221924, "Pretrain/Loss (Raw)": 2.1285812854766846, "Pretrain/Step": 18349, "Pretrain/Step Time": 8.48148800060153} +{"Pretrain/Learning Rate": 1.8817000020843744e-07, "Pretrain/Loss": 1.9934096336364746, "Pretrain/Loss (Raw)": 1.9474766254425049, "Pretrain/Step": 18350, "Pretrain/Step Time": 8.480924425646663} +{"Pretrain/Learning Rate": 1.8765048630543792e-07, "Pretrain/Loss": 1.9945765733718872, "Pretrain/Loss (Raw)": 2.1469063758850098, "Pretrain/Step": 18351, "Pretrain/Step Time": 8.475696939975023} +{"Pretrain/Learning Rate": 1.871316878490431e-07, "Pretrain/Loss": 1.9954441785812378, "Pretrain/Loss (Raw)": 1.9768939018249512, "Pretrain/Step": 18352, "Pretrain/Step Time": 8.478866383433342} +{"Pretrain/Learning Rate": 1.8661360485421608e-07, "Pretrain/Loss": 1.9957493543624878, "Pretrain/Loss (Raw)": 2.0460562705993652, "Pretrain/Step": 18353, "Pretrain/Step Time": 8.47915687598288} +{"Pretrain/Learning Rate": 1.860962373358921e-07, "Pretrain/Loss": 1.9959145784378052, "Pretrain/Loss (Raw)": 1.9054867029190063, "Pretrain/Step": 18354, "Pretrain/Step Time": 8.475952964276075} +{"Pretrain/Learning Rate": 1.8557958530899256e-07, "Pretrain/Loss": 1.9951510429382324, "Pretrain/Loss (Raw)": 1.8330583572387695, "Pretrain/Step": 18355, "Pretrain/Step Time": 8.479864183813334} +{"Pretrain/Learning Rate": 1.8506364878841108e-07, "Pretrain/Loss": 1.9965779781341553, "Pretrain/Loss (Raw)": 2.038949728012085, "Pretrain/Step": 18356, "Pretrain/Step Time": 8.478391060605645} +{"Pretrain/Learning Rate": 1.845484277890247e-07, "Pretrain/Loss": 1.9969730377197266, "Pretrain/Loss (Raw)": 2.06394100189209, "Pretrain/Step": 18357, "Pretrain/Step Time": 8.48063525930047} +{"Pretrain/Learning Rate": 1.8403392232569094e-07, "Pretrain/Loss": 1.9962427616119385, "Pretrain/Loss (Raw)": 2.0062568187713623, "Pretrain/Step": 18358, "Pretrain/Step Time": 8.479126827791333} +{"Pretrain/Learning Rate": 1.8352013241324794e-07, "Pretrain/Loss": 1.9965163469314575, "Pretrain/Loss (Raw)": 1.9593722820281982, "Pretrain/Step": 18359, "Pretrain/Step Time": 8.480032585561275} +{"Pretrain/Learning Rate": 1.830070580665033e-07, "Pretrain/Loss": 1.99785578250885, "Pretrain/Loss (Raw)": 1.9455735683441162, "Pretrain/Step": 18360, "Pretrain/Step Time": 8.48037737980485} +{"Pretrain/Learning Rate": 1.8249469930025909e-07, "Pretrain/Loss": 1.995227575302124, "Pretrain/Loss (Raw)": 2.0873000621795654, "Pretrain/Step": 18361, "Pretrain/Step Time": 8.480927884578705} +{"Pretrain/Learning Rate": 1.8198305612928125e-07, "Pretrain/Loss": 1.9930994510650635, "Pretrain/Loss (Raw)": 1.7418924570083618, "Pretrain/Step": 18362, "Pretrain/Step Time": 8.478768859058619} +{"Pretrain/Learning Rate": 1.814721285683302e-07, "Pretrain/Loss": 1.9913805723190308, "Pretrain/Loss (Raw)": 1.7400155067443848, "Pretrain/Step": 18363, "Pretrain/Step Time": 8.480392338708043} +{"Pretrain/Learning Rate": 1.8096191663213025e-07, "Pretrain/Loss": 1.9905121326446533, "Pretrain/Loss (Raw)": 1.7932943105697632, "Pretrain/Step": 18364, "Pretrain/Step Time": 8.478017587214708} +{"Pretrain/Learning Rate": 1.8045242033540021e-07, "Pretrain/Loss": 1.989119291305542, "Pretrain/Loss (Raw)": 1.8475576639175415, "Pretrain/Step": 18365, "Pretrain/Step Time": 8.48105176910758} +{"Pretrain/Learning Rate": 1.7994363969282835e-07, "Pretrain/Loss": 1.9916284084320068, "Pretrain/Loss (Raw)": 2.2853317260742188, "Pretrain/Step": 18366, "Pretrain/Step Time": 8.477003356441855} +{"Pretrain/Learning Rate": 1.7943557471908344e-07, "Pretrain/Loss": 1.9928607940673828, "Pretrain/Loss (Raw)": 1.94481360912323, "Pretrain/Step": 18367, "Pretrain/Step Time": 8.478781968355179} +{"Pretrain/Learning Rate": 1.789282254288177e-07, "Pretrain/Loss": 1.991591453552246, "Pretrain/Loss (Raw)": 1.8554723262786865, "Pretrain/Step": 18368, "Pretrain/Step Time": 8.482129365205765} +{"Pretrain/Learning Rate": 1.7842159183665553e-07, "Pretrain/Loss": 1.9928337335586548, "Pretrain/Loss (Raw)": 2.214823007583618, "Pretrain/Step": 18369, "Pretrain/Step Time": 8.479029688984156} +{"Pretrain/Learning Rate": 1.7791567395721298e-07, "Pretrain/Loss": 1.995233178138733, "Pretrain/Loss (Raw)": 2.124389886856079, "Pretrain/Step": 18370, "Pretrain/Step Time": 8.478705037385225} +{"Pretrain/Learning Rate": 1.774104718050701e-07, "Pretrain/Loss": 1.9937419891357422, "Pretrain/Loss (Raw)": 1.892959475517273, "Pretrain/Step": 18371, "Pretrain/Step Time": 8.47654528170824} +{"Pretrain/Learning Rate": 1.7690598539479852e-07, "Pretrain/Loss": 1.9958703517913818, "Pretrain/Loss (Raw)": 2.154698133468628, "Pretrain/Step": 18372, "Pretrain/Step Time": 8.480030708014965} +{"Pretrain/Learning Rate": 1.7640221474094498e-07, "Pretrain/Loss": 1.9955859184265137, "Pretrain/Loss (Raw)": 1.766283631324768, "Pretrain/Step": 18373, "Pretrain/Step Time": 8.484543876722455} +{"Pretrain/Learning Rate": 1.758991598580312e-07, "Pretrain/Loss": 1.996282696723938, "Pretrain/Loss (Raw)": 2.111964464187622, "Pretrain/Step": 18374, "Pretrain/Step Time": 8.476623862981796} +{"Pretrain/Learning Rate": 1.7539682076056775e-07, "Pretrain/Loss": 1.9975048303604126, "Pretrain/Loss (Raw)": 2.0826668739318848, "Pretrain/Step": 18375, "Pretrain/Step Time": 8.479669068008661} +{"Pretrain/Learning Rate": 1.748951974630375e-07, "Pretrain/Loss": 1.996922254562378, "Pretrain/Loss (Raw)": 1.8111189603805542, "Pretrain/Step": 18376, "Pretrain/Step Time": 8.484281713142991} +{"Pretrain/Learning Rate": 1.7439428997990114e-07, "Pretrain/Loss": 1.9951269626617432, "Pretrain/Loss (Raw)": 2.033856153488159, "Pretrain/Step": 18377, "Pretrain/Step Time": 8.486362632364035} +{"Pretrain/Learning Rate": 1.7389409832560822e-07, "Pretrain/Loss": 1.9959197044372559, "Pretrain/Loss (Raw)": 2.0424063205718994, "Pretrain/Step": 18378, "Pretrain/Step Time": 8.48377106897533} +{"Pretrain/Learning Rate": 1.7339462251457218e-07, "Pretrain/Loss": 1.9959965944290161, "Pretrain/Loss (Raw)": 2.091109037399292, "Pretrain/Step": 18379, "Pretrain/Step Time": 8.489570759236813} +{"Pretrain/Learning Rate": 1.728958625612065e-07, "Pretrain/Loss": 1.9942436218261719, "Pretrain/Loss (Raw)": 1.9118434190750122, "Pretrain/Step": 18380, "Pretrain/Step Time": 8.48624755255878} +{"Pretrain/Learning Rate": 1.72397818479883e-07, "Pretrain/Loss": 1.9929816722869873, "Pretrain/Loss (Raw)": 2.0170695781707764, "Pretrain/Step": 18381, "Pretrain/Step Time": 8.488315548747778} +{"Pretrain/Learning Rate": 1.7190049028496523e-07, "Pretrain/Loss": 1.9919393062591553, "Pretrain/Loss (Raw)": 1.8264832496643066, "Pretrain/Step": 18382, "Pretrain/Step Time": 8.487769458442926} +{"Pretrain/Learning Rate": 1.7140387799079728e-07, "Pretrain/Loss": 1.9917113780975342, "Pretrain/Loss (Raw)": 2.138252019882202, "Pretrain/Step": 18383, "Pretrain/Step Time": 8.486764807254076} +{"Pretrain/Learning Rate": 1.7090798161169265e-07, "Pretrain/Loss": 1.9914672374725342, "Pretrain/Loss (Raw)": 1.9910811185836792, "Pretrain/Step": 18384, "Pretrain/Step Time": 8.486742928624153} +{"Pretrain/Learning Rate": 1.7041280116195656e-07, "Pretrain/Loss": 1.9946635961532593, "Pretrain/Loss (Raw)": 2.3700289726257324, "Pretrain/Step": 18385, "Pretrain/Step Time": 8.486476620659232} +{"Pretrain/Learning Rate": 1.69918336655861e-07, "Pretrain/Loss": 1.9956259727478027, "Pretrain/Loss (Raw)": 1.9976428747177124, "Pretrain/Step": 18386, "Pretrain/Step Time": 8.487668253481388} +{"Pretrain/Learning Rate": 1.694245881076667e-07, "Pretrain/Loss": 1.9972703456878662, "Pretrain/Loss (Raw)": 1.9814176559448242, "Pretrain/Step": 18387, "Pretrain/Step Time": 8.491411259397864} +{"Pretrain/Learning Rate": 1.6893155553160954e-07, "Pretrain/Loss": 1.9964945316314697, "Pretrain/Loss (Raw)": 2.0837345123291016, "Pretrain/Step": 18388, "Pretrain/Step Time": 8.491427570581436} +{"Pretrain/Learning Rate": 1.6843923894190594e-07, "Pretrain/Loss": 1.99663245677948, "Pretrain/Loss (Raw)": 1.9106643199920654, "Pretrain/Step": 18389, "Pretrain/Step Time": 8.497934887185693} +{"Pretrain/Learning Rate": 1.6794763835275563e-07, "Pretrain/Loss": 1.9927297830581665, "Pretrain/Loss (Raw)": 1.7908273935317993, "Pretrain/Step": 18390, "Pretrain/Step Time": 8.49663851223886} +{"Pretrain/Learning Rate": 1.6745675377832504e-07, "Pretrain/Loss": 1.9920531511306763, "Pretrain/Loss (Raw)": 1.9799734354019165, "Pretrain/Step": 18391, "Pretrain/Step Time": 8.49701145105064} +{"Pretrain/Learning Rate": 1.6696658523277508e-07, "Pretrain/Loss": 1.9916422367095947, "Pretrain/Loss (Raw)": 1.7267998456954956, "Pretrain/Step": 18392, "Pretrain/Step Time": 8.500577479600906} +{"Pretrain/Learning Rate": 1.6647713273023612e-07, "Pretrain/Loss": 1.9908006191253662, "Pretrain/Loss (Raw)": 1.9930979013442993, "Pretrain/Step": 18393, "Pretrain/Step Time": 8.499552568420768} +{"Pretrain/Learning Rate": 1.6598839628482465e-07, "Pretrain/Loss": 1.9897973537445068, "Pretrain/Loss (Raw)": 1.9962067604064941, "Pretrain/Step": 18394, "Pretrain/Step Time": 8.497445318847895} +{"Pretrain/Learning Rate": 1.655003759106294e-07, "Pretrain/Loss": 1.9904322624206543, "Pretrain/Loss (Raw)": 2.075424909591675, "Pretrain/Step": 18395, "Pretrain/Step Time": 8.491580059751868} +{"Pretrain/Learning Rate": 1.650130716217252e-07, "Pretrain/Loss": 1.9912892580032349, "Pretrain/Loss (Raw)": 2.120828628540039, "Pretrain/Step": 18396, "Pretrain/Step Time": 8.490355912595987} +{"Pretrain/Learning Rate": 1.6452648343215915e-07, "Pretrain/Loss": 1.9905599355697632, "Pretrain/Loss (Raw)": 1.8516356945037842, "Pretrain/Step": 18397, "Pretrain/Step Time": 8.492847878485918} +{"Pretrain/Learning Rate": 1.6404061135596726e-07, "Pretrain/Loss": 1.98960280418396, "Pretrain/Loss (Raw)": 1.7763034105300903, "Pretrain/Step": 18398, "Pretrain/Step Time": 8.499896191060543} +{"Pretrain/Learning Rate": 1.6355545540715221e-07, "Pretrain/Loss": 1.9902622699737549, "Pretrain/Loss (Raw)": 2.032188653945923, "Pretrain/Step": 18399, "Pretrain/Step Time": 8.498172670602798} +{"Pretrain/Learning Rate": 1.6307101559971115e-07, "Pretrain/Loss": 1.98908269405365, "Pretrain/Loss (Raw)": 1.9212546348571777, "Pretrain/Step": 18400, "Pretrain/Step Time": 8.49447568319738} +{"Pretrain/Learning Rate": 1.6258729194760514e-07, "Pretrain/Loss": 1.9881861209869385, "Pretrain/Loss (Raw)": 1.841084599494934, "Pretrain/Step": 18401, "Pretrain/Step Time": 8.495569420978427} +{"Pretrain/Learning Rate": 1.6210428446478686e-07, "Pretrain/Loss": 1.9906023740768433, "Pretrain/Loss (Raw)": 2.154345989227295, "Pretrain/Step": 18402, "Pretrain/Step Time": 8.488205349072814} +{"Pretrain/Learning Rate": 1.6162199316518412e-07, "Pretrain/Loss": 1.98897123336792, "Pretrain/Loss (Raw)": 1.8496942520141602, "Pretrain/Step": 18403, "Pretrain/Step Time": 8.493825696408749} +{"Pretrain/Learning Rate": 1.6114041806269686e-07, "Pretrain/Loss": 1.9857196807861328, "Pretrain/Loss (Raw)": 1.7730352878570557, "Pretrain/Step": 18404, "Pretrain/Step Time": 8.49456311762333} +{"Pretrain/Learning Rate": 1.6065955917121956e-07, "Pretrain/Loss": 1.9902997016906738, "Pretrain/Loss (Raw)": 2.3600547313690186, "Pretrain/Step": 18405, "Pretrain/Step Time": 8.500824496150017} +{"Pretrain/Learning Rate": 1.6017941650461056e-07, "Pretrain/Loss": 1.993851661682129, "Pretrain/Loss (Raw)": 2.431720018386841, "Pretrain/Step": 18406, "Pretrain/Step Time": 8.500791201367974} +{"Pretrain/Learning Rate": 1.596999900767171e-07, "Pretrain/Loss": 1.9950083494186401, "Pretrain/Loss (Raw)": 2.0189075469970703, "Pretrain/Step": 18407, "Pretrain/Step Time": 8.497028993442655} +{"Pretrain/Learning Rate": 1.5922127990136426e-07, "Pretrain/Loss": 1.9958380460739136, "Pretrain/Loss (Raw)": 1.9950644969940186, "Pretrain/Step": 18408, "Pretrain/Step Time": 8.49167506955564} +{"Pretrain/Learning Rate": 1.5874328599235488e-07, "Pretrain/Loss": 1.9924167394638062, "Pretrain/Loss (Raw)": 1.6502065658569336, "Pretrain/Step": 18409, "Pretrain/Step Time": 8.496249612420797} +{"Pretrain/Learning Rate": 1.5826600836346962e-07, "Pretrain/Loss": 1.9918851852416992, "Pretrain/Loss (Raw)": 2.0032942295074463, "Pretrain/Step": 18410, "Pretrain/Step Time": 8.492980848997831} +{"Pretrain/Learning Rate": 1.5778944702846964e-07, "Pretrain/Loss": 1.9922271966934204, "Pretrain/Loss (Raw)": 2.0559446811676025, "Pretrain/Step": 18411, "Pretrain/Step Time": 8.494406331330538} +{"Pretrain/Learning Rate": 1.5731360200110235e-07, "Pretrain/Loss": 1.9914288520812988, "Pretrain/Loss (Raw)": 1.8089118003845215, "Pretrain/Step": 18412, "Pretrain/Step Time": 8.492175228893757} +{"Pretrain/Learning Rate": 1.568384732950845e-07, "Pretrain/Loss": 1.9914970397949219, "Pretrain/Loss (Raw)": 1.9534860849380493, "Pretrain/Step": 18413, "Pretrain/Step Time": 8.490818439051509} +{"Pretrain/Learning Rate": 1.563640609241135e-07, "Pretrain/Loss": 1.98941969871521, "Pretrain/Loss (Raw)": 1.77683424949646, "Pretrain/Step": 18414, "Pretrain/Step Time": 8.491694737225771} +{"Pretrain/Learning Rate": 1.558903649018728e-07, "Pretrain/Loss": 1.988248348236084, "Pretrain/Loss (Raw)": 1.9285277128219604, "Pretrain/Step": 18415, "Pretrain/Step Time": 8.492284398525953} +{"Pretrain/Learning Rate": 1.554173852420182e-07, "Pretrain/Loss": 1.9854460954666138, "Pretrain/Loss (Raw)": 1.911971092224121, "Pretrain/Step": 18416, "Pretrain/Step Time": 8.492123670876026} +{"Pretrain/Learning Rate": 1.5494512195818877e-07, "Pretrain/Loss": 1.98570716381073, "Pretrain/Loss (Raw)": 1.9694044589996338, "Pretrain/Step": 18417, "Pretrain/Step Time": 8.488258155062795} +{"Pretrain/Learning Rate": 1.5447357506400417e-07, "Pretrain/Loss": 1.9860726594924927, "Pretrain/Loss (Raw)": 2.0984461307525635, "Pretrain/Step": 18418, "Pretrain/Step Time": 8.485616805031896} +{"Pretrain/Learning Rate": 1.540027445730563e-07, "Pretrain/Loss": 1.9836028814315796, "Pretrain/Loss (Raw)": 1.8656471967697144, "Pretrain/Step": 18419, "Pretrain/Step Time": 8.493285657837987} +{"Pretrain/Learning Rate": 1.5353263049892597e-07, "Pretrain/Loss": 1.983752727508545, "Pretrain/Loss (Raw)": 1.911054253578186, "Pretrain/Step": 18420, "Pretrain/Step Time": 8.494746198877692} +{"Pretrain/Learning Rate": 1.530632328551662e-07, "Pretrain/Loss": 1.9837589263916016, "Pretrain/Loss (Raw)": 1.9313361644744873, "Pretrain/Step": 18421, "Pretrain/Step Time": 8.49664450250566} +{"Pretrain/Learning Rate": 1.5259455165531068e-07, "Pretrain/Loss": 1.9844045639038086, "Pretrain/Loss (Raw)": 2.114558696746826, "Pretrain/Step": 18422, "Pretrain/Step Time": 8.494798947125673} +{"Pretrain/Learning Rate": 1.5212658691287907e-07, "Pretrain/Loss": 1.9851891994476318, "Pretrain/Loss (Raw)": 2.154419183731079, "Pretrain/Step": 18423, "Pretrain/Step Time": 8.490672174841166} +{"Pretrain/Learning Rate": 1.5165933864135784e-07, "Pretrain/Loss": 1.984983205795288, "Pretrain/Loss (Raw)": 1.980824589729309, "Pretrain/Step": 18424, "Pretrain/Step Time": 8.494650358334184} +{"Pretrain/Learning Rate": 1.5119280685422233e-07, "Pretrain/Loss": 1.9840362071990967, "Pretrain/Loss (Raw)": 1.9794459342956543, "Pretrain/Step": 18425, "Pretrain/Step Time": 8.49303761869669} +{"Pretrain/Learning Rate": 1.5072699156492565e-07, "Pretrain/Loss": 1.9864232540130615, "Pretrain/Loss (Raw)": 2.0024349689483643, "Pretrain/Step": 18426, "Pretrain/Step Time": 8.493592169135809} +{"Pretrain/Learning Rate": 1.5026189278689872e-07, "Pretrain/Loss": 1.9831364154815674, "Pretrain/Loss (Raw)": 1.5053448677062988, "Pretrain/Step": 18427, "Pretrain/Step Time": 8.494418563321233} +{"Pretrain/Learning Rate": 1.4979751053355307e-07, "Pretrain/Loss": 1.9798190593719482, "Pretrain/Loss (Raw)": 1.6904363632202148, "Pretrain/Step": 18428, "Pretrain/Step Time": 8.492744805291295} +{"Pretrain/Learning Rate": 1.4933384481827517e-07, "Pretrain/Loss": 1.9804842472076416, "Pretrain/Loss (Raw)": 1.942855954170227, "Pretrain/Step": 18429, "Pretrain/Step Time": 8.493794227018952} +{"Pretrain/Learning Rate": 1.4887089565444045e-07, "Pretrain/Loss": 1.979703426361084, "Pretrain/Loss (Raw)": 1.868243932723999, "Pretrain/Step": 18430, "Pretrain/Step Time": 8.491850260645151} +{"Pretrain/Learning Rate": 1.4840866305539102e-07, "Pretrain/Loss": 1.9800984859466553, "Pretrain/Loss (Raw)": 2.032867908477783, "Pretrain/Step": 18431, "Pretrain/Step Time": 8.490638494491577} +{"Pretrain/Learning Rate": 1.4794714703446066e-07, "Pretrain/Loss": 1.9811396598815918, "Pretrain/Loss (Raw)": 1.9979926347732544, "Pretrain/Step": 18432, "Pretrain/Step Time": 8.486823666840792} +{"Pretrain/Learning Rate": 1.474863476049554e-07, "Pretrain/Loss": 1.9808201789855957, "Pretrain/Loss (Raw)": 1.956441044807434, "Pretrain/Step": 18433, "Pretrain/Step Time": 8.488961840048432} +{"Pretrain/Learning Rate": 1.470262647801618e-07, "Pretrain/Loss": 1.9810092449188232, "Pretrain/Loss (Raw)": 1.9489037990570068, "Pretrain/Step": 18434, "Pretrain/Step Time": 8.48628580570221} +{"Pretrain/Learning Rate": 1.4656689857334426e-07, "Pretrain/Loss": 1.9819941520690918, "Pretrain/Loss (Raw)": 2.0696656703948975, "Pretrain/Step": 18435, "Pretrain/Step Time": 8.486036822199821} +{"Pretrain/Learning Rate": 1.4610824899775055e-07, "Pretrain/Loss": 1.9813854694366455, "Pretrain/Loss (Raw)": 1.9391547441482544, "Pretrain/Step": 18436, "Pretrain/Step Time": 8.487460372969508} +{"Pretrain/Learning Rate": 1.456503160666034e-07, "Pretrain/Loss": 1.9811692237854004, "Pretrain/Loss (Raw)": 2.000216007232666, "Pretrain/Step": 18437, "Pretrain/Step Time": 8.487834066152573} +{"Pretrain/Learning Rate": 1.451930997931089e-07, "Pretrain/Loss": 1.9801136255264282, "Pretrain/Loss (Raw)": 1.8593080043792725, "Pretrain/Step": 18438, "Pretrain/Step Time": 8.490442719310522} +{"Pretrain/Learning Rate": 1.4473660019045098e-07, "Pretrain/Loss": 1.9828240871429443, "Pretrain/Loss (Raw)": 2.24735164642334, "Pretrain/Step": 18439, "Pretrain/Step Time": 8.48548024892807} +{"Pretrain/Learning Rate": 1.4428081727179132e-07, "Pretrain/Loss": 1.980607509613037, "Pretrain/Loss (Raw)": 1.7661561965942383, "Pretrain/Step": 18440, "Pretrain/Step Time": 8.486996939405799} +{"Pretrain/Learning Rate": 1.438257510502694e-07, "Pretrain/Loss": 1.9809541702270508, "Pretrain/Loss (Raw)": 2.11025333404541, "Pretrain/Step": 18441, "Pretrain/Step Time": 8.486256621778011} +{"Pretrain/Learning Rate": 1.4337140153901086e-07, "Pretrain/Loss": 1.9787474870681763, "Pretrain/Loss (Raw)": 1.8259363174438477, "Pretrain/Step": 18442, "Pretrain/Step Time": 8.48520733602345} +{"Pretrain/Learning Rate": 1.4291776875111627e-07, "Pretrain/Loss": 1.9799323081970215, "Pretrain/Loss (Raw)": 2.0787525177001953, "Pretrain/Step": 18443, "Pretrain/Step Time": 8.482643472030759} +{"Pretrain/Learning Rate": 1.4246485269966691e-07, "Pretrain/Loss": 1.9809144735336304, "Pretrain/Loss (Raw)": 2.142383337020874, "Pretrain/Step": 18444, "Pretrain/Step Time": 8.485355772078037} +{"Pretrain/Learning Rate": 1.420126533977162e-07, "Pretrain/Loss": 1.980615496635437, "Pretrain/Loss (Raw)": 1.9596543312072754, "Pretrain/Step": 18445, "Pretrain/Step Time": 8.483464494347572} +{"Pretrain/Learning Rate": 1.4156117085830644e-07, "Pretrain/Loss": 1.9803650379180908, "Pretrain/Loss (Raw)": 1.9345452785491943, "Pretrain/Step": 18446, "Pretrain/Step Time": 8.494452705606818} +{"Pretrain/Learning Rate": 1.411104050944606e-07, "Pretrain/Loss": 1.9807738065719604, "Pretrain/Loss (Raw)": 2.1455695629119873, "Pretrain/Step": 18447, "Pretrain/Step Time": 8.490355458110571} +{"Pretrain/Learning Rate": 1.4066035611916828e-07, "Pretrain/Loss": 1.9800976514816284, "Pretrain/Loss (Raw)": 1.9998191595077515, "Pretrain/Step": 18448, "Pretrain/Step Time": 8.489174585789442} +{"Pretrain/Learning Rate": 1.4021102394541076e-07, "Pretrain/Loss": 1.9791953563690186, "Pretrain/Loss (Raw)": 1.8584935665130615, "Pretrain/Step": 18449, "Pretrain/Step Time": 8.490649761632085} +{"Pretrain/Learning Rate": 1.3976240858614153e-07, "Pretrain/Loss": 1.9806175231933594, "Pretrain/Loss (Raw)": 2.0875089168548584, "Pretrain/Step": 18450, "Pretrain/Step Time": 8.4909305293113} +{"Pretrain/Learning Rate": 1.393145100543003e-07, "Pretrain/Loss": 1.9802601337432861, "Pretrain/Loss (Raw)": 1.9665113687515259, "Pretrain/Step": 18451, "Pretrain/Step Time": 8.489096578210592} +{"Pretrain/Learning Rate": 1.388673283628017e-07, "Pretrain/Loss": 1.9826514720916748, "Pretrain/Loss (Raw)": 2.1481316089630127, "Pretrain/Step": 18452, "Pretrain/Step Time": 8.495364557951689} +{"Pretrain/Learning Rate": 1.3842086352453264e-07, "Pretrain/Loss": 1.984233021736145, "Pretrain/Loss (Raw)": 2.116072416305542, "Pretrain/Step": 18453, "Pretrain/Step Time": 8.496139451861382} +{"Pretrain/Learning Rate": 1.3797511555237452e-07, "Pretrain/Loss": 1.982762098312378, "Pretrain/Loss (Raw)": 1.9367300271987915, "Pretrain/Step": 18454, "Pretrain/Step Time": 8.49272770434618} +{"Pretrain/Learning Rate": 1.3753008445917815e-07, "Pretrain/Loss": 1.982757806777954, "Pretrain/Loss (Raw)": 1.9919567108154297, "Pretrain/Step": 18455, "Pretrain/Step Time": 8.494686301797628} +{"Pretrain/Learning Rate": 1.3708577025777214e-07, "Pretrain/Loss": 1.9819210767745972, "Pretrain/Loss (Raw)": 1.9079222679138184, "Pretrain/Step": 18456, "Pretrain/Step Time": 8.49076702259481} +{"Pretrain/Learning Rate": 1.3664217296097405e-07, "Pretrain/Loss": 1.9815659523010254, "Pretrain/Loss (Raw)": 1.9489312171936035, "Pretrain/Step": 18457, "Pretrain/Step Time": 8.492414213716984} +{"Pretrain/Learning Rate": 1.3619929258156805e-07, "Pretrain/Loss": 1.9810965061187744, "Pretrain/Loss (Raw)": 1.8805772066116333, "Pretrain/Step": 18458, "Pretrain/Step Time": 8.490518607199192} +{"Pretrain/Learning Rate": 1.3575712913233009e-07, "Pretrain/Loss": 1.9790685176849365, "Pretrain/Loss (Raw)": 1.8042194843292236, "Pretrain/Step": 18459, "Pretrain/Step Time": 8.488498345017433} +{"Pretrain/Learning Rate": 1.3531568262600547e-07, "Pretrain/Loss": 1.979537010192871, "Pretrain/Loss (Raw)": 1.995129108428955, "Pretrain/Step": 18460, "Pretrain/Step Time": 8.488670531660318} +{"Pretrain/Learning Rate": 1.3487495307532572e-07, "Pretrain/Loss": 1.9787715673446655, "Pretrain/Loss (Raw)": 1.87905752658844, "Pretrain/Step": 18461, "Pretrain/Step Time": 8.49371099844575} +{"Pretrain/Learning Rate": 1.344349404930001e-07, "Pretrain/Loss": 1.978861927986145, "Pretrain/Loss (Raw)": 1.9691447019577026, "Pretrain/Step": 18462, "Pretrain/Step Time": 8.49276509694755} +{"Pretrain/Learning Rate": 1.3399564489171013e-07, "Pretrain/Loss": 1.9783668518066406, "Pretrain/Loss (Raw)": 1.939263939857483, "Pretrain/Step": 18463, "Pretrain/Step Time": 8.495390210300684} +{"Pretrain/Learning Rate": 1.33557066284129e-07, "Pretrain/Loss": 1.9789113998413086, "Pretrain/Loss (Raw)": 1.934834599494934, "Pretrain/Step": 18464, "Pretrain/Step Time": 8.491780638694763} +{"Pretrain/Learning Rate": 1.3311920468289664e-07, "Pretrain/Loss": 1.9810981750488281, "Pretrain/Loss (Raw)": 2.3078877925872803, "Pretrain/Step": 18465, "Pretrain/Step Time": 8.492715448141098} +{"Pretrain/Learning Rate": 1.3268206010064454e-07, "Pretrain/Loss": 1.9802721738815308, "Pretrain/Loss (Raw)": 2.0602402687072754, "Pretrain/Step": 18466, "Pretrain/Step Time": 8.494700871407986} +{"Pretrain/Learning Rate": 1.3224563254997658e-07, "Pretrain/Loss": 1.98190438747406, "Pretrain/Loss (Raw)": 2.1572275161743164, "Pretrain/Step": 18467, "Pretrain/Step Time": 8.49617520160973} +{"Pretrain/Learning Rate": 1.3180992204347153e-07, "Pretrain/Loss": 1.9786367416381836, "Pretrain/Loss (Raw)": 1.7387663125991821, "Pretrain/Step": 18468, "Pretrain/Step Time": 8.494046680629253} +{"Pretrain/Learning Rate": 1.3137492859369992e-07, "Pretrain/Loss": 1.9786949157714844, "Pretrain/Loss (Raw)": 2.0027761459350586, "Pretrain/Step": 18469, "Pretrain/Step Time": 8.498231248930097} +{"Pretrain/Learning Rate": 1.3094065221319895e-07, "Pretrain/Loss": 1.9812332391738892, "Pretrain/Loss (Raw)": 2.1732428073883057, "Pretrain/Step": 18470, "Pretrain/Step Time": 8.495012756437063} +{"Pretrain/Learning Rate": 1.3050709291449193e-07, "Pretrain/Loss": 1.9844938516616821, "Pretrain/Loss (Raw)": 2.2391653060913086, "Pretrain/Step": 18471, "Pretrain/Step Time": 8.492548270151019} +{"Pretrain/Learning Rate": 1.300742507100827e-07, "Pretrain/Loss": 1.9838382005691528, "Pretrain/Loss (Raw)": 2.0487711429595947, "Pretrain/Step": 18472, "Pretrain/Step Time": 8.492808263748884} +{"Pretrain/Learning Rate": 1.2964212561245026e-07, "Pretrain/Loss": 1.9852403402328491, "Pretrain/Loss (Raw)": 2.185210943222046, "Pretrain/Step": 18473, "Pretrain/Step Time": 8.495368454605341} +{"Pretrain/Learning Rate": 1.2921071763405401e-07, "Pretrain/Loss": 1.9850032329559326, "Pretrain/Loss (Raw)": 1.9607627391815186, "Pretrain/Step": 18474, "Pretrain/Step Time": 8.492009920999408} +{"Pretrain/Learning Rate": 1.2878002678733402e-07, "Pretrain/Loss": 1.9855386018753052, "Pretrain/Loss (Raw)": 2.1369540691375732, "Pretrain/Step": 18475, "Pretrain/Step Time": 8.497949071228504} +{"Pretrain/Learning Rate": 1.2835005308471093e-07, "Pretrain/Loss": 1.9819709062576294, "Pretrain/Loss (Raw)": 1.6610103845596313, "Pretrain/Step": 18476, "Pretrain/Step Time": 8.490868847817183} +{"Pretrain/Learning Rate": 1.279207965385776e-07, "Pretrain/Loss": 1.9801501035690308, "Pretrain/Loss (Raw)": 1.8955070972442627, "Pretrain/Step": 18477, "Pretrain/Step Time": 8.492431303486228} +{"Pretrain/Learning Rate": 1.2749225716131575e-07, "Pretrain/Loss": 1.9815583229064941, "Pretrain/Loss (Raw)": 2.127732038497925, "Pretrain/Step": 18478, "Pretrain/Step Time": 8.496513513848186} +{"Pretrain/Learning Rate": 1.270644349652822e-07, "Pretrain/Loss": 1.980723261833191, "Pretrain/Loss (Raw)": 2.040036201477051, "Pretrain/Step": 18479, "Pretrain/Step Time": 8.500005094334483} +{"Pretrain/Learning Rate": 1.2663732996280875e-07, "Pretrain/Loss": 1.9813382625579834, "Pretrain/Loss (Raw)": 2.05560564994812, "Pretrain/Step": 18480, "Pretrain/Step Time": 8.495901178568602} +{"Pretrain/Learning Rate": 1.262109421662161e-07, "Pretrain/Loss": 1.9842349290847778, "Pretrain/Loss (Raw)": 2.4168293476104736, "Pretrain/Step": 18481, "Pretrain/Step Time": 8.499766672030091} +{"Pretrain/Learning Rate": 1.257852715877944e-07, "Pretrain/Loss": 1.983240008354187, "Pretrain/Loss (Raw)": 1.778146743774414, "Pretrain/Step": 18482, "Pretrain/Step Time": 8.503166675567627} +{"Pretrain/Learning Rate": 1.253603182398172e-07, "Pretrain/Loss": 1.9843870401382446, "Pretrain/Loss (Raw)": 1.9798691272735596, "Pretrain/Step": 18483, "Pretrain/Step Time": 8.500628115609288} +{"Pretrain/Learning Rate": 1.249360821345441e-07, "Pretrain/Loss": 1.9822466373443604, "Pretrain/Loss (Raw)": 1.7649824619293213, "Pretrain/Step": 18484, "Pretrain/Step Time": 8.502514403313398} +{"Pretrain/Learning Rate": 1.245125632841987e-07, "Pretrain/Loss": 1.9810352325439453, "Pretrain/Loss (Raw)": 1.908864140510559, "Pretrain/Step": 18485, "Pretrain/Step Time": 8.502730270847678} +{"Pretrain/Learning Rate": 1.2408976170100172e-07, "Pretrain/Loss": 1.9820345640182495, "Pretrain/Loss (Raw)": 2.134174108505249, "Pretrain/Step": 18486, "Pretrain/Step Time": 8.505798792466521} +{"Pretrain/Learning Rate": 1.2366767739713792e-07, "Pretrain/Loss": 1.983229398727417, "Pretrain/Loss (Raw)": 2.112335205078125, "Pretrain/Step": 18487, "Pretrain/Step Time": 8.502719795331359} +{"Pretrain/Learning Rate": 1.2324631038478084e-07, "Pretrain/Loss": 1.9828232526779175, "Pretrain/Loss (Raw)": 1.8935801982879639, "Pretrain/Step": 18488, "Pretrain/Step Time": 8.505073765292764} +{"Pretrain/Learning Rate": 1.2282566067607915e-07, "Pretrain/Loss": 1.9824060201644897, "Pretrain/Loss (Raw)": 2.0338852405548096, "Pretrain/Step": 18489, "Pretrain/Step Time": 8.505057049915195} +{"Pretrain/Learning Rate": 1.224057282831592e-07, "Pretrain/Loss": 1.9838863611221313, "Pretrain/Loss (Raw)": 1.9313850402832031, "Pretrain/Step": 18490, "Pretrain/Step Time": 8.50139164738357} +{"Pretrain/Learning Rate": 1.2198651321813637e-07, "Pretrain/Loss": 1.9864449501037598, "Pretrain/Loss (Raw)": 2.0675086975097656, "Pretrain/Step": 18491, "Pretrain/Step Time": 8.500073842704296} +{"Pretrain/Learning Rate": 1.2156801549309538e-07, "Pretrain/Loss": 1.9885776042938232, "Pretrain/Loss (Raw)": 2.066289186477661, "Pretrain/Step": 18492, "Pretrain/Step Time": 8.499745424836874} +{"Pretrain/Learning Rate": 1.2115023512009882e-07, "Pretrain/Loss": 1.9887865781784058, "Pretrain/Loss (Raw)": 1.874289870262146, "Pretrain/Step": 18493, "Pretrain/Step Time": 8.500503789633512} +{"Pretrain/Learning Rate": 1.2073317211120094e-07, "Pretrain/Loss": 1.9856858253479004, "Pretrain/Loss (Raw)": 1.8884280920028687, "Pretrain/Step": 18494, "Pretrain/Step Time": 8.503398669883609} +{"Pretrain/Learning Rate": 1.2031682647841991e-07, "Pretrain/Loss": 1.9862550497055054, "Pretrain/Loss (Raw)": 2.0176870822906494, "Pretrain/Step": 18495, "Pretrain/Step Time": 8.501669432967901} +{"Pretrain/Learning Rate": 1.1990119823376554e-07, "Pretrain/Loss": 1.988242745399475, "Pretrain/Loss (Raw)": 2.1098880767822266, "Pretrain/Step": 18496, "Pretrain/Step Time": 8.501168079674244} +{"Pretrain/Learning Rate": 1.1948628738921997e-07, "Pretrain/Loss": 1.9856014251708984, "Pretrain/Loss (Raw)": 1.8767547607421875, "Pretrain/Step": 18497, "Pretrain/Step Time": 8.499596262350678} +{"Pretrain/Learning Rate": 1.1907209395674857e-07, "Pretrain/Loss": 1.9853211641311646, "Pretrain/Loss (Raw)": 2.088514566421509, "Pretrain/Step": 18498, "Pretrain/Step Time": 8.499410290271044} +{"Pretrain/Learning Rate": 1.1865861794829181e-07, "Pretrain/Loss": 1.98471200466156, "Pretrain/Loss (Raw)": 1.8149724006652832, "Pretrain/Step": 18499, "Pretrain/Step Time": 8.50074390694499} +{"Pretrain/Learning Rate": 1.1824585937577626e-07, "Pretrain/Loss": 1.9832196235656738, "Pretrain/Loss (Raw)": 1.9636865854263306, "Pretrain/Step": 18500, "Pretrain/Step Time": 8.500677268952131} +{"Pretrain/Learning Rate": 1.1783381825109796e-07, "Pretrain/Loss": 1.9820408821105957, "Pretrain/Loss (Raw)": 1.6153943538665771, "Pretrain/Step": 18501, "Pretrain/Step Time": 8.499655120074749} +{"Pretrain/Learning Rate": 1.1742249458614463e-07, "Pretrain/Loss": 1.978087067604065, "Pretrain/Loss (Raw)": 1.6058682203292847, "Pretrain/Step": 18502, "Pretrain/Step Time": 8.507227381691337} +{"Pretrain/Learning Rate": 1.1701188839276789e-07, "Pretrain/Loss": 1.978123664855957, "Pretrain/Loss (Raw)": 2.0873546600341797, "Pretrain/Step": 18503, "Pretrain/Step Time": 8.504756286740303} +{"Pretrain/Learning Rate": 1.166019996828166e-07, "Pretrain/Loss": 1.9806487560272217, "Pretrain/Loss (Raw)": 2.1343302726745605, "Pretrain/Step": 18504, "Pretrain/Step Time": 8.505183501169086} +{"Pretrain/Learning Rate": 1.1619282846810075e-07, "Pretrain/Loss": 1.9796444177627563, "Pretrain/Loss (Raw)": 1.9053081274032593, "Pretrain/Step": 18505, "Pretrain/Step Time": 8.50069940648973} +{"Pretrain/Learning Rate": 1.1578437476042758e-07, "Pretrain/Loss": 1.9801898002624512, "Pretrain/Loss (Raw)": 2.112217426300049, "Pretrain/Step": 18506, "Pretrain/Step Time": 8.500836344435811} +{"Pretrain/Learning Rate": 1.1537663857156544e-07, "Pretrain/Loss": 1.9800310134887695, "Pretrain/Loss (Raw)": 2.070772647857666, "Pretrain/Step": 18507, "Pretrain/Step Time": 8.497143357992172} +{"Pretrain/Learning Rate": 1.1496961991327715e-07, "Pretrain/Loss": 1.981747031211853, "Pretrain/Loss (Raw)": 2.131511926651001, "Pretrain/Step": 18508, "Pretrain/Step Time": 8.495935751125216} +{"Pretrain/Learning Rate": 1.1456331879729776e-07, "Pretrain/Loss": 1.980482816696167, "Pretrain/Loss (Raw)": 1.855250358581543, "Pretrain/Step": 18509, "Pretrain/Step Time": 8.495349429547787} +{"Pretrain/Learning Rate": 1.1415773523534012e-07, "Pretrain/Loss": 1.9818146228790283, "Pretrain/Loss (Raw)": 1.996932864189148, "Pretrain/Step": 18510, "Pretrain/Step Time": 8.498137461021543} +{"Pretrain/Learning Rate": 1.1375286923910323e-07, "Pretrain/Loss": 1.9801057577133179, "Pretrain/Loss (Raw)": 1.9195257425308228, "Pretrain/Step": 18511, "Pretrain/Step Time": 8.495410978794098} +{"Pretrain/Learning Rate": 1.1334872082025549e-07, "Pretrain/Loss": 1.9786181449890137, "Pretrain/Loss (Raw)": 1.8006651401519775, "Pretrain/Step": 18512, "Pretrain/Step Time": 8.498576819896698} +{"Pretrain/Learning Rate": 1.1294528999045707e-07, "Pretrain/Loss": 1.9760048389434814, "Pretrain/Loss (Raw)": 2.035515785217285, "Pretrain/Step": 18513, "Pretrain/Step Time": 8.495603896677494} +{"Pretrain/Learning Rate": 1.1254257676133473e-07, "Pretrain/Loss": 1.9759315252304077, "Pretrain/Loss (Raw)": 1.9882712364196777, "Pretrain/Step": 18514, "Pretrain/Step Time": 8.495774112641811} +{"Pretrain/Learning Rate": 1.1214058114450144e-07, "Pretrain/Loss": 1.97835373878479, "Pretrain/Loss (Raw)": 2.2914648056030273, "Pretrain/Step": 18515, "Pretrain/Step Time": 8.491361999884248} +{"Pretrain/Learning Rate": 1.1173930315155346e-07, "Pretrain/Loss": 1.9778488874435425, "Pretrain/Loss (Raw)": 2.019115924835205, "Pretrain/Step": 18516, "Pretrain/Step Time": 8.490841392427683} +{"Pretrain/Learning Rate": 1.1133874279405377e-07, "Pretrain/Loss": 1.9776612520217896, "Pretrain/Loss (Raw)": 1.8866376876831055, "Pretrain/Step": 18517, "Pretrain/Step Time": 8.482642641291022} +{"Pretrain/Learning Rate": 1.1093890008355978e-07, "Pretrain/Loss": 1.9800654649734497, "Pretrain/Loss (Raw)": 2.0985634326934814, "Pretrain/Step": 18518, "Pretrain/Step Time": 8.485837172716856} +{"Pretrain/Learning Rate": 1.1053977503159563e-07, "Pretrain/Loss": 1.9817702770233154, "Pretrain/Loss (Raw)": 2.19818377494812, "Pretrain/Step": 18519, "Pretrain/Step Time": 8.489936493337154} +{"Pretrain/Learning Rate": 1.1014136764966875e-07, "Pretrain/Loss": 1.9842102527618408, "Pretrain/Loss (Raw)": 2.0391247272491455, "Pretrain/Step": 18520, "Pretrain/Step Time": 8.48690427094698} +{"Pretrain/Learning Rate": 1.0974367794927276e-07, "Pretrain/Loss": 1.9850103855133057, "Pretrain/Loss (Raw)": 2.0955166816711426, "Pretrain/Step": 18521, "Pretrain/Step Time": 8.488940436393023} +{"Pretrain/Learning Rate": 1.0934670594186792e-07, "Pretrain/Loss": 1.9826314449310303, "Pretrain/Loss (Raw)": 1.6917126178741455, "Pretrain/Step": 18522, "Pretrain/Step Time": 8.489535490050912} +{"Pretrain/Learning Rate": 1.0895045163890615e-07, "Pretrain/Loss": 1.9817990064620972, "Pretrain/Loss (Raw)": 1.9688587188720703, "Pretrain/Step": 18523, "Pretrain/Step Time": 8.486917288973927} +{"Pretrain/Learning Rate": 1.085549150518117e-07, "Pretrain/Loss": 1.9815380573272705, "Pretrain/Loss (Raw)": 2.087441921234131, "Pretrain/Step": 18524, "Pretrain/Step Time": 8.486289028078318} +{"Pretrain/Learning Rate": 1.0816009619198653e-07, "Pretrain/Loss": 1.9815146923065186, "Pretrain/Loss (Raw)": 1.8486367464065552, "Pretrain/Step": 18525, "Pretrain/Step Time": 8.485769672319293} +{"Pretrain/Learning Rate": 1.0776599507082152e-07, "Pretrain/Loss": 1.9859322309494019, "Pretrain/Loss (Raw)": 2.341749429702759, "Pretrain/Step": 18526, "Pretrain/Step Time": 8.480048952624202} +{"Pretrain/Learning Rate": 1.073726116996715e-07, "Pretrain/Loss": 1.9851422309875488, "Pretrain/Loss (Raw)": 1.9310697317123413, "Pretrain/Step": 18527, "Pretrain/Step Time": 8.483078021556139} +{"Pretrain/Learning Rate": 1.0697994608988848e-07, "Pretrain/Loss": 1.9853246212005615, "Pretrain/Loss (Raw)": 1.9445832967758179, "Pretrain/Step": 18528, "Pretrain/Step Time": 8.48468534834683} +{"Pretrain/Learning Rate": 1.0658799825278565e-07, "Pretrain/Loss": 1.9875143766403198, "Pretrain/Loss (Raw)": 2.1213793754577637, "Pretrain/Step": 18529, "Pretrain/Step Time": 8.484354557469487} +{"Pretrain/Learning Rate": 1.0619676819967339e-07, "Pretrain/Loss": 1.9849878549575806, "Pretrain/Loss (Raw)": 1.8309584856033325, "Pretrain/Step": 18530, "Pretrain/Step Time": 8.49236218072474} +{"Pretrain/Learning Rate": 1.0580625594182603e-07, "Pretrain/Loss": 1.9875154495239258, "Pretrain/Loss (Raw)": 2.1732234954833984, "Pretrain/Step": 18531, "Pretrain/Step Time": 8.486443750560284} +{"Pretrain/Learning Rate": 1.0541646149050677e-07, "Pretrain/Loss": 1.9889256954193115, "Pretrain/Loss (Raw)": 1.953551173210144, "Pretrain/Step": 18532, "Pretrain/Step Time": 8.486572779715061} +{"Pretrain/Learning Rate": 1.0502738485695384e-07, "Pretrain/Loss": 1.9860957860946655, "Pretrain/Loss (Raw)": 1.997817039489746, "Pretrain/Step": 18533, "Pretrain/Step Time": 8.482409372925758} +{"Pretrain/Learning Rate": 1.0463902605238607e-07, "Pretrain/Loss": 1.9831342697143555, "Pretrain/Loss (Raw)": 2.052649974822998, "Pretrain/Step": 18534, "Pretrain/Step Time": 8.478007843717933} +{"Pretrain/Learning Rate": 1.0425138508800281e-07, "Pretrain/Loss": 1.9832344055175781, "Pretrain/Loss (Raw)": 2.0317206382751465, "Pretrain/Step": 18535, "Pretrain/Step Time": 8.480911508202553} +{"Pretrain/Learning Rate": 1.0386446197498123e-07, "Pretrain/Loss": 1.9823224544525146, "Pretrain/Loss (Raw)": 1.8783446550369263, "Pretrain/Step": 18536, "Pretrain/Step Time": 8.487339114770293} +{"Pretrain/Learning Rate": 1.034782567244763e-07, "Pretrain/Loss": 1.9859668016433716, "Pretrain/Loss (Raw)": 2.116675615310669, "Pretrain/Step": 18537, "Pretrain/Step Time": 8.484301880002022} +{"Pretrain/Learning Rate": 1.0309276934762357e-07, "Pretrain/Loss": 1.9855366945266724, "Pretrain/Loss (Raw)": 1.9482461214065552, "Pretrain/Step": 18538, "Pretrain/Step Time": 8.48419028148055} +{"Pretrain/Learning Rate": 1.0270799985554191e-07, "Pretrain/Loss": 1.9843913316726685, "Pretrain/Loss (Raw)": 1.909332513809204, "Pretrain/Step": 18539, "Pretrain/Step Time": 8.48257315158844} +{"Pretrain/Learning Rate": 1.0232394825932245e-07, "Pretrain/Loss": 1.9833636283874512, "Pretrain/Loss (Raw)": 1.6773709058761597, "Pretrain/Step": 18540, "Pretrain/Step Time": 8.480785539373755} +{"Pretrain/Learning Rate": 1.0194061457003968e-07, "Pretrain/Loss": 1.9832050800323486, "Pretrain/Loss (Raw)": 1.9331904649734497, "Pretrain/Step": 18541, "Pretrain/Step Time": 8.483175840228796} +{"Pretrain/Learning Rate": 1.0155799879874861e-07, "Pretrain/Loss": 1.983597993850708, "Pretrain/Loss (Raw)": 1.8271247148513794, "Pretrain/Step": 18542, "Pretrain/Step Time": 8.480784058570862} +{"Pretrain/Learning Rate": 1.0117610095647934e-07, "Pretrain/Loss": 1.9843864440917969, "Pretrain/Loss (Raw)": 2.029442548751831, "Pretrain/Step": 18543, "Pretrain/Step Time": 8.484641505405307} +{"Pretrain/Learning Rate": 1.0079492105424526e-07, "Pretrain/Loss": 1.9847099781036377, "Pretrain/Loss (Raw)": 1.9534022808074951, "Pretrain/Step": 18544, "Pretrain/Step Time": 8.484410181641579} +{"Pretrain/Learning Rate": 1.004144591030376e-07, "Pretrain/Loss": 1.9848699569702148, "Pretrain/Loss (Raw)": 1.9898736476898193, "Pretrain/Step": 18545, "Pretrain/Step Time": 8.4847327824682} +{"Pretrain/Learning Rate": 1.0003471511382534e-07, "Pretrain/Loss": 1.9845025539398193, "Pretrain/Loss (Raw)": 2.0514211654663086, "Pretrain/Step": 18546, "Pretrain/Step Time": 8.489594655111432} +{"Pretrain/Learning Rate": 9.965568909755806e-08, "Pretrain/Loss": 1.9853790998458862, "Pretrain/Loss (Raw)": 1.9778403043746948, "Pretrain/Step": 18547, "Pretrain/Step Time": 8.487400859594345} +{"Pretrain/Learning Rate": 9.927738106516593e-08, "Pretrain/Loss": 1.9864599704742432, "Pretrain/Loss (Raw)": 2.0493993759155273, "Pretrain/Step": 18548, "Pretrain/Step Time": 8.482492113485932} +{"Pretrain/Learning Rate": 9.889979102755687e-08, "Pretrain/Loss": 1.985948920249939, "Pretrain/Loss (Raw)": 1.8659306764602661, "Pretrain/Step": 18549, "Pretrain/Step Time": 8.478130144998431} +{"Pretrain/Learning Rate": 9.852291899561938e-08, "Pretrain/Loss": 1.9851486682891846, "Pretrain/Loss (Raw)": 2.0121161937713623, "Pretrain/Step": 18550, "Pretrain/Step Time": 8.481931803748012} +{"Pretrain/Learning Rate": 9.814676498021702e-08, "Pretrain/Loss": 1.9824256896972656, "Pretrain/Loss (Raw)": 1.8058855533599854, "Pretrain/Step": 18551, "Pretrain/Step Time": 8.486768873408437} +{"Pretrain/Learning Rate": 9.777132899219943e-08, "Pretrain/Loss": 1.9816079139709473, "Pretrain/Loss (Raw)": 1.8761621713638306, "Pretrain/Step": 18552, "Pretrain/Step Time": 8.485117113217711} +{"Pretrain/Learning Rate": 9.739661104238851e-08, "Pretrain/Loss": 1.9816980361938477, "Pretrain/Loss (Raw)": 1.9909783601760864, "Pretrain/Step": 18553, "Pretrain/Step Time": 8.486713118851185} +{"Pretrain/Learning Rate": 9.702261114159228e-08, "Pretrain/Loss": 1.9821176528930664, "Pretrain/Loss (Raw)": 2.0561437606811523, "Pretrain/Step": 18554, "Pretrain/Step Time": 8.484189534559846} +{"Pretrain/Learning Rate": 9.664932930059378e-08, "Pretrain/Loss": 1.9862816333770752, "Pretrain/Loss (Raw)": 2.0383148193359375, "Pretrain/Step": 18555, "Pretrain/Step Time": 8.48061558790505} +{"Pretrain/Learning Rate": 9.627676553015663e-08, "Pretrain/Loss": 1.98722505569458, "Pretrain/Loss (Raw)": 1.8112190961837769, "Pretrain/Step": 18556, "Pretrain/Step Time": 8.47583362646401} +{"Pretrain/Learning Rate": 9.590491984102224e-08, "Pretrain/Loss": 1.9887468814849854, "Pretrain/Loss (Raw)": 2.1376402378082275, "Pretrain/Step": 18557, "Pretrain/Step Time": 8.481698505580425} +{"Pretrain/Learning Rate": 9.553379224391534e-08, "Pretrain/Loss": 1.9912775754928589, "Pretrain/Loss (Raw)": 2.1921701431274414, "Pretrain/Step": 18558, "Pretrain/Step Time": 8.478894878178835} +{"Pretrain/Learning Rate": 9.516338274953296e-08, "Pretrain/Loss": 1.9907883405685425, "Pretrain/Loss (Raw)": 1.9702471494674683, "Pretrain/Step": 18559, "Pretrain/Step Time": 8.486032783985138} +{"Pretrain/Learning Rate": 9.47936913685582e-08, "Pretrain/Loss": 1.9916105270385742, "Pretrain/Loss (Raw)": 2.1032416820526123, "Pretrain/Step": 18560, "Pretrain/Step Time": 8.484569994732738} +{"Pretrain/Learning Rate": 9.442471811165199e-08, "Pretrain/Loss": 1.9922055006027222, "Pretrain/Loss (Raw)": 2.032602310180664, "Pretrain/Step": 18561, "Pretrain/Step Time": 8.493704326450825} +{"Pretrain/Learning Rate": 9.405646298944748e-08, "Pretrain/Loss": 1.993326187133789, "Pretrain/Loss (Raw)": 2.0923357009887695, "Pretrain/Step": 18562, "Pretrain/Step Time": 8.493387632071972} +{"Pretrain/Learning Rate": 9.368892601257228e-08, "Pretrain/Loss": 1.9938912391662598, "Pretrain/Loss (Raw)": 2.14198899269104, "Pretrain/Step": 18563, "Pretrain/Step Time": 8.488609284162521} +{"Pretrain/Learning Rate": 9.332210719161516e-08, "Pretrain/Loss": 1.9951131343841553, "Pretrain/Loss (Raw)": 2.095566511154175, "Pretrain/Step": 18564, "Pretrain/Step Time": 8.485265046358109} +{"Pretrain/Learning Rate": 9.29560065371593e-08, "Pretrain/Loss": 1.9951258897781372, "Pretrain/Loss (Raw)": 2.001849412918091, "Pretrain/Step": 18565, "Pretrain/Step Time": 8.483354683965445} +{"Pretrain/Learning Rate": 9.259062405975738e-08, "Pretrain/Loss": 1.9949121475219727, "Pretrain/Loss (Raw)": 1.8319475650787354, "Pretrain/Step": 18566, "Pretrain/Step Time": 8.484512615948915} +{"Pretrain/Learning Rate": 9.222595976994541e-08, "Pretrain/Loss": 1.9925322532653809, "Pretrain/Loss (Raw)": 1.9427130222320557, "Pretrain/Step": 18567, "Pretrain/Step Time": 8.490412387996912} +{"Pretrain/Learning Rate": 9.186201367824276e-08, "Pretrain/Loss": 1.9945420026779175, "Pretrain/Loss (Raw)": 2.023420810699463, "Pretrain/Step": 18568, "Pretrain/Step Time": 8.489162690937519} +{"Pretrain/Learning Rate": 9.14987857951355e-08, "Pretrain/Loss": 1.994269847869873, "Pretrain/Loss (Raw)": 2.0754311084747314, "Pretrain/Step": 18569, "Pretrain/Step Time": 8.48877733387053} +{"Pretrain/Learning Rate": 9.113627613110409e-08, "Pretrain/Loss": 1.9994430541992188, "Pretrain/Loss (Raw)": 2.488093376159668, "Pretrain/Step": 18570, "Pretrain/Step Time": 8.487771466374397} +{"Pretrain/Learning Rate": 9.077448469659854e-08, "Pretrain/Loss": 1.9993817806243896, "Pretrain/Loss (Raw)": 2.0709142684936523, "Pretrain/Step": 18571, "Pretrain/Step Time": 8.488600727170706} +{"Pretrain/Learning Rate": 9.041341150204941e-08, "Pretrain/Loss": 1.9972548484802246, "Pretrain/Loss (Raw)": 1.870119571685791, "Pretrain/Step": 18572, "Pretrain/Step Time": 8.485736297443509} +{"Pretrain/Learning Rate": 9.005305655787055e-08, "Pretrain/Loss": 1.9962362051010132, "Pretrain/Loss (Raw)": 1.829275131225586, "Pretrain/Step": 18573, "Pretrain/Step Time": 8.487272068858147} +{"Pretrain/Learning Rate": 8.96934198744509e-08, "Pretrain/Loss": 1.9965441226959229, "Pretrain/Loss (Raw)": 1.9739588499069214, "Pretrain/Step": 18574, "Pretrain/Step Time": 8.481444848701358} +{"Pretrain/Learning Rate": 8.933450146216271e-08, "Pretrain/Loss": 1.9952929019927979, "Pretrain/Loss (Raw)": 1.9854109287261963, "Pretrain/Step": 18575, "Pretrain/Step Time": 8.484175935387611} +{"Pretrain/Learning Rate": 8.897630133135048e-08, "Pretrain/Loss": 1.992720365524292, "Pretrain/Loss (Raw)": 1.6705387830734253, "Pretrain/Step": 18576, "Pretrain/Step Time": 8.488628100603819} +{"Pretrain/Learning Rate": 8.861881949234763e-08, "Pretrain/Loss": 1.9936730861663818, "Pretrain/Loss (Raw)": 1.9804575443267822, "Pretrain/Step": 18577, "Pretrain/Step Time": 8.487861812114716} +{"Pretrain/Learning Rate": 8.826205595545978e-08, "Pretrain/Loss": 1.993504524230957, "Pretrain/Loss (Raw)": 2.0659048557281494, "Pretrain/Step": 18578, "Pretrain/Step Time": 8.489748299121857} +{"Pretrain/Learning Rate": 8.790601073097316e-08, "Pretrain/Loss": 1.992957353591919, "Pretrain/Loss (Raw)": 1.8964698314666748, "Pretrain/Step": 18579, "Pretrain/Step Time": 8.485908241942525} +{"Pretrain/Learning Rate": 8.755068382915455e-08, "Pretrain/Loss": 1.9920865297317505, "Pretrain/Loss (Raw)": 2.036682367324829, "Pretrain/Step": 18580, "Pretrain/Step Time": 8.481406055390835} +{"Pretrain/Learning Rate": 8.719607526024853e-08, "Pretrain/Loss": 1.990821123123169, "Pretrain/Loss (Raw)": 1.9541056156158447, "Pretrain/Step": 18581, "Pretrain/Step Time": 8.48262595757842} +{"Pretrain/Learning Rate": 8.684218503448304e-08, "Pretrain/Loss": 1.9924774169921875, "Pretrain/Loss (Raw)": 2.1487324237823486, "Pretrain/Step": 18582, "Pretrain/Step Time": 8.483678936958313} +{"Pretrain/Learning Rate": 8.648901316206104e-08, "Pretrain/Loss": 1.9928719997406006, "Pretrain/Loss (Raw)": 2.0424671173095703, "Pretrain/Step": 18583, "Pretrain/Step Time": 8.481027375906706} +{"Pretrain/Learning Rate": 8.613655965316603e-08, "Pretrain/Loss": 1.9925930500030518, "Pretrain/Loss (Raw)": 1.872200608253479, "Pretrain/Step": 18584, "Pretrain/Step Time": 8.486751751974225} +{"Pretrain/Learning Rate": 8.578482451795933e-08, "Pretrain/Loss": 1.9938973188400269, "Pretrain/Loss (Raw)": 2.115891218185425, "Pretrain/Step": 18585, "Pretrain/Step Time": 8.488736107945442} +{"Pretrain/Learning Rate": 8.543380776658283e-08, "Pretrain/Loss": 1.995046854019165, "Pretrain/Loss (Raw)": 2.0277152061462402, "Pretrain/Step": 18586, "Pretrain/Step Time": 8.489979974925518} +{"Pretrain/Learning Rate": 8.508350940915899e-08, "Pretrain/Loss": 1.9974536895751953, "Pretrain/Loss (Raw)": 2.1122941970825195, "Pretrain/Step": 18587, "Pretrain/Step Time": 8.488525396212935} +{"Pretrain/Learning Rate": 8.473392945578806e-08, "Pretrain/Loss": 1.99636709690094, "Pretrain/Loss (Raw)": 1.856034755706787, "Pretrain/Step": 18588, "Pretrain/Step Time": 8.486516896635294} +{"Pretrain/Learning Rate": 8.438506791655088e-08, "Pretrain/Loss": 1.9963582754135132, "Pretrain/Loss (Raw)": 1.8779386281967163, "Pretrain/Step": 18589, "Pretrain/Step Time": 8.483527354896069} +{"Pretrain/Learning Rate": 8.403692480150604e-08, "Pretrain/Loss": 1.99576735496521, "Pretrain/Loss (Raw)": 1.8935070037841797, "Pretrain/Step": 18590, "Pretrain/Step Time": 8.485362775623798} +{"Pretrain/Learning Rate": 8.368950012069276e-08, "Pretrain/Loss": 1.9963587522506714, "Pretrain/Loss (Raw)": 2.0149571895599365, "Pretrain/Step": 18591, "Pretrain/Step Time": 8.48399499990046} +{"Pretrain/Learning Rate": 8.334279388412525e-08, "Pretrain/Loss": 1.9965624809265137, "Pretrain/Loss (Raw)": 1.9609112739562988, "Pretrain/Step": 18592, "Pretrain/Step Time": 8.485889449715614} +{"Pretrain/Learning Rate": 8.299680610180661e-08, "Pretrain/Loss": 1.9955254793167114, "Pretrain/Loss (Raw)": 2.1751580238342285, "Pretrain/Step": 18593, "Pretrain/Step Time": 8.485561534762383} +{"Pretrain/Learning Rate": 8.265153678370664e-08, "Pretrain/Loss": 1.9944264888763428, "Pretrain/Loss (Raw)": 1.9195934534072876, "Pretrain/Step": 18594, "Pretrain/Step Time": 8.48323805257678} +{"Pretrain/Learning Rate": 8.230698593978681e-08, "Pretrain/Loss": 1.9922142028808594, "Pretrain/Loss (Raw)": 1.8740307092666626, "Pretrain/Step": 18595, "Pretrain/Step Time": 8.480656368657947} +{"Pretrain/Learning Rate": 8.196315357997809e-08, "Pretrain/Loss": 1.9932191371917725, "Pretrain/Loss (Raw)": 1.8674015998840332, "Pretrain/Step": 18596, "Pretrain/Step Time": 8.480505913496017} +{"Pretrain/Learning Rate": 8.162003971419474e-08, "Pretrain/Loss": 1.9933717250823975, "Pretrain/Loss (Raw)": 2.0223097801208496, "Pretrain/Step": 18597, "Pretrain/Step Time": 8.477421075105667} +{"Pretrain/Learning Rate": 8.127764435233165e-08, "Pretrain/Loss": 1.9904837608337402, "Pretrain/Loss (Raw)": 1.803576111793518, "Pretrain/Step": 18598, "Pretrain/Step Time": 8.477879432961345} +{"Pretrain/Learning Rate": 8.093596750426147e-08, "Pretrain/Loss": 1.9887986183166504, "Pretrain/Loss (Raw)": 2.023472309112549, "Pretrain/Step": 18599, "Pretrain/Step Time": 8.47858602926135} +{"Pretrain/Learning Rate": 8.059500917983742e-08, "Pretrain/Loss": 1.9881045818328857, "Pretrain/Loss (Raw)": 1.9599285125732422, "Pretrain/Step": 18600, "Pretrain/Step Time": 8.483367789536715} +{"Pretrain/Learning Rate": 8.025476938888776e-08, "Pretrain/Loss": 1.984378695487976, "Pretrain/Loss (Raw)": 1.7083003520965576, "Pretrain/Step": 18601, "Pretrain/Step Time": 8.484198305755854} +{"Pretrain/Learning Rate": 7.991524814122408e-08, "Pretrain/Loss": 1.9841749668121338, "Pretrain/Loss (Raw)": 1.934699296951294, "Pretrain/Step": 18602, "Pretrain/Step Time": 8.486607497557998} +{"Pretrain/Learning Rate": 7.957644544663578e-08, "Pretrain/Loss": 1.9827934503555298, "Pretrain/Loss (Raw)": 1.9601011276245117, "Pretrain/Step": 18603, "Pretrain/Step Time": 8.485178453847766} +{"Pretrain/Learning Rate": 7.92383613148956e-08, "Pretrain/Loss": 1.986013650894165, "Pretrain/Loss (Raw)": 2.0732061862945557, "Pretrain/Step": 18604, "Pretrain/Step Time": 8.486561296507716} +{"Pretrain/Learning Rate": 7.890099575574849e-08, "Pretrain/Loss": 1.9864637851715088, "Pretrain/Loss (Raw)": 1.9531142711639404, "Pretrain/Step": 18605, "Pretrain/Step Time": 8.486220279708505} +{"Pretrain/Learning Rate": 7.856434877892004e-08, "Pretrain/Loss": 1.9862185716629028, "Pretrain/Loss (Raw)": 2.0963430404663086, "Pretrain/Step": 18606, "Pretrain/Step Time": 8.480026321485639} +{"Pretrain/Learning Rate": 7.82284203941247e-08, "Pretrain/Loss": 1.986265778541565, "Pretrain/Loss (Raw)": 2.0460760593414307, "Pretrain/Step": 18607, "Pretrain/Step Time": 8.482396321371198} +{"Pretrain/Learning Rate": 7.789321061104082e-08, "Pretrain/Loss": 1.9859122037887573, "Pretrain/Loss (Raw)": 2.0103578567504883, "Pretrain/Step": 18608, "Pretrain/Step Time": 8.486839229241014} +{"Pretrain/Learning Rate": 7.755871943933845e-08, "Pretrain/Loss": 1.9812133312225342, "Pretrain/Loss (Raw)": 1.8153653144836426, "Pretrain/Step": 18609, "Pretrain/Step Time": 8.483001425862312} +{"Pretrain/Learning Rate": 7.722494688866267e-08, "Pretrain/Loss": 1.9812952280044556, "Pretrain/Loss (Raw)": 1.788653016090393, "Pretrain/Step": 18610, "Pretrain/Step Time": 8.484988564625382} +{"Pretrain/Learning Rate": 7.689189296863353e-08, "Pretrain/Loss": 1.9811797142028809, "Pretrain/Loss (Raw)": 1.9650753736495972, "Pretrain/Step": 18611, "Pretrain/Step Time": 8.485480982810259} +{"Pretrain/Learning Rate": 7.655955768886003e-08, "Pretrain/Loss": 1.9821722507476807, "Pretrain/Loss (Raw)": 1.8920234441757202, "Pretrain/Step": 18612, "Pretrain/Step Time": 8.483173782005906} +{"Pretrain/Learning Rate": 7.622794105892061e-08, "Pretrain/Loss": 1.9818718433380127, "Pretrain/Loss (Raw)": 1.8704125881195068, "Pretrain/Step": 18613, "Pretrain/Step Time": 8.477983433753252} +{"Pretrain/Learning Rate": 7.589704308837708e-08, "Pretrain/Loss": 1.982025384902954, "Pretrain/Loss (Raw)": 2.153830051422119, "Pretrain/Step": 18614, "Pretrain/Step Time": 8.476420084014535} +{"Pretrain/Learning Rate": 7.55668637867718e-08, "Pretrain/Loss": 1.9805893898010254, "Pretrain/Loss (Raw)": 1.9285049438476562, "Pretrain/Step": 18615, "Pretrain/Step Time": 8.477774793282151} +{"Pretrain/Learning Rate": 7.52374031636277e-08, "Pretrain/Loss": 1.9805920124053955, "Pretrain/Loss (Raw)": 1.8939248323440552, "Pretrain/Step": 18616, "Pretrain/Step Time": 8.47725821658969} +{"Pretrain/Learning Rate": 7.490866122843998e-08, "Pretrain/Loss": 1.9799370765686035, "Pretrain/Loss (Raw)": 1.9500677585601807, "Pretrain/Step": 18617, "Pretrain/Step Time": 8.47941443696618} +{"Pretrain/Learning Rate": 7.458063799068993e-08, "Pretrain/Loss": 1.9802050590515137, "Pretrain/Loss (Raw)": 1.96566641330719, "Pretrain/Step": 18618, "Pretrain/Step Time": 8.482969053089619} +{"Pretrain/Learning Rate": 7.425333345983943e-08, "Pretrain/Loss": 1.9795689582824707, "Pretrain/Loss (Raw)": 1.9860931634902954, "Pretrain/Step": 18619, "Pretrain/Step Time": 8.485068483278155} +{"Pretrain/Learning Rate": 7.392674764531981e-08, "Pretrain/Loss": 1.9811880588531494, "Pretrain/Loss (Raw)": 2.2735395431518555, "Pretrain/Step": 18620, "Pretrain/Step Time": 8.486509289592505} +{"Pretrain/Learning Rate": 7.360088055654857e-08, "Pretrain/Loss": 1.9817936420440674, "Pretrain/Loss (Raw)": 1.9517937898635864, "Pretrain/Step": 18621, "Pretrain/Step Time": 8.482544461265206} +{"Pretrain/Learning Rate": 7.327573220292928e-08, "Pretrain/Loss": 1.9819252490997314, "Pretrain/Loss (Raw)": 1.9052821397781372, "Pretrain/Step": 18622, "Pretrain/Step Time": 8.478872682899237} +{"Pretrain/Learning Rate": 7.295130259382665e-08, "Pretrain/Loss": 1.9813482761383057, "Pretrain/Loss (Raw)": 1.9438399076461792, "Pretrain/Step": 18623, "Pretrain/Step Time": 8.4771932605654} +{"Pretrain/Learning Rate": 7.262759173860544e-08, "Pretrain/Loss": 1.9824930429458618, "Pretrain/Loss (Raw)": 2.2564191818237305, "Pretrain/Step": 18624, "Pretrain/Step Time": 8.478627493605018} +{"Pretrain/Learning Rate": 7.230459964659153e-08, "Pretrain/Loss": 1.9843566417694092, "Pretrain/Loss (Raw)": 2.1153042316436768, "Pretrain/Step": 18625, "Pretrain/Step Time": 8.477693865075707} +{"Pretrain/Learning Rate": 7.198232632710244e-08, "Pretrain/Loss": 1.9822593927383423, "Pretrain/Loss (Raw)": 1.8200480937957764, "Pretrain/Step": 18626, "Pretrain/Step Time": 8.481494227424264} +{"Pretrain/Learning Rate": 7.166077178943076e-08, "Pretrain/Loss": 1.9838850498199463, "Pretrain/Loss (Raw)": 2.0230705738067627, "Pretrain/Step": 18627, "Pretrain/Step Time": 8.480888932943344} +{"Pretrain/Learning Rate": 7.133993604284684e-08, "Pretrain/Loss": 1.983655571937561, "Pretrain/Loss (Raw)": 1.9343101978302002, "Pretrain/Step": 18628, "Pretrain/Step Time": 8.478927059099078} +{"Pretrain/Learning Rate": 7.101981909660437e-08, "Pretrain/Loss": 1.987731695175171, "Pretrain/Loss (Raw)": 2.1371214389801025, "Pretrain/Step": 18629, "Pretrain/Step Time": 8.474439965561032} +{"Pretrain/Learning Rate": 7.070042095992934e-08, "Pretrain/Loss": 1.990812063217163, "Pretrain/Loss (Raw)": 2.0001678466796875, "Pretrain/Step": 18630, "Pretrain/Step Time": 8.473013620823622} +{"Pretrain/Learning Rate": 7.038174164203381e-08, "Pretrain/Loss": 1.990767478942871, "Pretrain/Loss (Raw)": 2.0816445350646973, "Pretrain/Step": 18631, "Pretrain/Step Time": 8.474190335720778} +{"Pretrain/Learning Rate": 7.006378115210766e-08, "Pretrain/Loss": 1.9895939826965332, "Pretrain/Loss (Raw)": 1.9841134548187256, "Pretrain/Step": 18632, "Pretrain/Step Time": 8.4745135884732} +{"Pretrain/Learning Rate": 6.974653949931575e-08, "Pretrain/Loss": 1.9909422397613525, "Pretrain/Loss (Raw)": 2.0779037475585938, "Pretrain/Step": 18633, "Pretrain/Step Time": 8.479562854394317} +{"Pretrain/Learning Rate": 6.943001669280913e-08, "Pretrain/Loss": 1.9900357723236084, "Pretrain/Loss (Raw)": 1.9961713552474976, "Pretrain/Step": 18634, "Pretrain/Step Time": 8.485651608556509} +{"Pretrain/Learning Rate": 6.911421274171382e-08, "Pretrain/Loss": 1.990419864654541, "Pretrain/Loss (Raw)": 2.119934320449829, "Pretrain/Step": 18635, "Pretrain/Step Time": 8.48726400732994} +{"Pretrain/Learning Rate": 6.879912765513363e-08, "Pretrain/Loss": 1.9883503913879395, "Pretrain/Loss (Raw)": 1.8666350841522217, "Pretrain/Step": 18636, "Pretrain/Step Time": 8.487586215138435} +{"Pretrain/Learning Rate": 6.848476144215577e-08, "Pretrain/Loss": 1.9918861389160156, "Pretrain/Loss (Raw)": 2.307814598083496, "Pretrain/Step": 18637, "Pretrain/Step Time": 8.486909473314881} +{"Pretrain/Learning Rate": 6.81711141118424e-08, "Pretrain/Loss": 1.991905927658081, "Pretrain/Loss (Raw)": 1.9994736909866333, "Pretrain/Step": 18638, "Pretrain/Step Time": 8.484289284795523} +{"Pretrain/Learning Rate": 6.785818567324187e-08, "Pretrain/Loss": 1.9918434619903564, "Pretrain/Loss (Raw)": 1.9115257263183594, "Pretrain/Step": 18639, "Pretrain/Step Time": 8.488746801391244} +{"Pretrain/Learning Rate": 6.754597613537472e-08, "Pretrain/Loss": 1.9934587478637695, "Pretrain/Loss (Raw)": 2.0074291229248047, "Pretrain/Step": 18640, "Pretrain/Step Time": 8.484448093920946} +{"Pretrain/Learning Rate": 6.72344855072421e-08, "Pretrain/Loss": 1.9942688941955566, "Pretrain/Loss (Raw)": 2.13922381401062, "Pretrain/Step": 18641, "Pretrain/Step Time": 8.484994143247604} +{"Pretrain/Learning Rate": 6.69237137978257e-08, "Pretrain/Loss": 1.9945622682571411, "Pretrain/Loss (Raw)": 2.0258076190948486, "Pretrain/Step": 18642, "Pretrain/Step Time": 8.482915697619319} +{"Pretrain/Learning Rate": 6.661366101609057e-08, "Pretrain/Loss": 1.9963568449020386, "Pretrain/Loss (Raw)": 2.5211727619171143, "Pretrain/Step": 18643, "Pretrain/Step Time": 8.490898506715894} +{"Pretrain/Learning Rate": 6.630432717097124e-08, "Pretrain/Loss": 1.995303750038147, "Pretrain/Loss (Raw)": 1.8843286037445068, "Pretrain/Step": 18644, "Pretrain/Step Time": 8.487662769854069} +{"Pretrain/Learning Rate": 6.599571227138834e-08, "Pretrain/Loss": 1.9939124584197998, "Pretrain/Loss (Raw)": 1.7085464000701904, "Pretrain/Step": 18645, "Pretrain/Step Time": 8.490518059581518} +{"Pretrain/Learning Rate": 6.56878163262431e-08, "Pretrain/Loss": 1.9912827014923096, "Pretrain/Loss (Raw)": 1.7619549036026, "Pretrain/Step": 18646, "Pretrain/Step Time": 8.489477973431349} +{"Pretrain/Learning Rate": 6.538063934441452e-08, "Pretrain/Loss": 1.9911386966705322, "Pretrain/Loss (Raw)": 2.1797592639923096, "Pretrain/Step": 18647, "Pretrain/Step Time": 8.48704437352717} +{"Pretrain/Learning Rate": 6.507418133475385e-08, "Pretrain/Loss": 1.9900784492492676, "Pretrain/Loss (Raw)": 1.9034074544906616, "Pretrain/Step": 18648, "Pretrain/Step Time": 8.486334005370736} +{"Pretrain/Learning Rate": 6.476844230610125e-08, "Pretrain/Loss": 1.987152338027954, "Pretrain/Loss (Raw)": 1.7209666967391968, "Pretrain/Step": 18649, "Pretrain/Step Time": 8.487389672547579} +{"Pretrain/Learning Rate": 6.446342226727464e-08, "Pretrain/Loss": 1.9901307821273804, "Pretrain/Loss (Raw)": 2.0729565620422363, "Pretrain/Step": 18650, "Pretrain/Step Time": 8.489359641447663} +{"Pretrain/Learning Rate": 6.415912122706702e-08, "Pretrain/Loss": 1.9909751415252686, "Pretrain/Loss (Raw)": 2.0769333839416504, "Pretrain/Step": 18651, "Pretrain/Step Time": 8.491310251876712} +{"Pretrain/Learning Rate": 6.385553919425191e-08, "Pretrain/Loss": 1.9885340929031372, "Pretrain/Loss (Raw)": 1.7749959230422974, "Pretrain/Step": 18652, "Pretrain/Step Time": 8.494751887395978} +{"Pretrain/Learning Rate": 6.355267617758065e-08, "Pretrain/Loss": 1.9910175800323486, "Pretrain/Loss (Raw)": 2.1665279865264893, "Pretrain/Step": 18653, "Pretrain/Step Time": 8.494514489546418} +{"Pretrain/Learning Rate": 6.325053218579346e-08, "Pretrain/Loss": 1.9866870641708374, "Pretrain/Loss (Raw)": 1.7874339818954468, "Pretrain/Step": 18654, "Pretrain/Step Time": 8.491187993437052} +{"Pretrain/Learning Rate": 6.29491072275945e-08, "Pretrain/Loss": 1.9864537715911865, "Pretrain/Loss (Raw)": 1.9012043476104736, "Pretrain/Step": 18655, "Pretrain/Step Time": 8.489965915679932} +{"Pretrain/Learning Rate": 6.26484013116796e-08, "Pretrain/Loss": 1.9871628284454346, "Pretrain/Loss (Raw)": 2.0353403091430664, "Pretrain/Step": 18656, "Pretrain/Step Time": 8.489875212311745} +{"Pretrain/Learning Rate": 6.234841444671957e-08, "Pretrain/Loss": 1.9865880012512207, "Pretrain/Loss (Raw)": 2.047809600830078, "Pretrain/Step": 18657, "Pretrain/Step Time": 8.488144354894757} +{"Pretrain/Learning Rate": 6.20491466413603e-08, "Pretrain/Loss": 1.9869930744171143, "Pretrain/Loss (Raw)": 1.882806658744812, "Pretrain/Step": 18658, "Pretrain/Step Time": 8.487543124705553} +{"Pretrain/Learning Rate": 6.175059790423654e-08, "Pretrain/Loss": 1.9854671955108643, "Pretrain/Loss (Raw)": 1.9779131412506104, "Pretrain/Step": 18659, "Pretrain/Step Time": 8.486700028181076} +{"Pretrain/Learning Rate": 6.145276824395252e-08, "Pretrain/Loss": 1.9842357635498047, "Pretrain/Loss (Raw)": 1.7959141731262207, "Pretrain/Step": 18660, "Pretrain/Step Time": 8.4917230643332} +{"Pretrain/Learning Rate": 6.115565766909858e-08, "Pretrain/Loss": 1.9832289218902588, "Pretrain/Loss (Raw)": 1.8689433336257935, "Pretrain/Step": 18661, "Pretrain/Step Time": 8.491061760112643} +{"Pretrain/Learning Rate": 6.085926618824012e-08, "Pretrain/Loss": 1.9828135967254639, "Pretrain/Loss (Raw)": 1.9995019435882568, "Pretrain/Step": 18662, "Pretrain/Step Time": 8.491780428215861} +{"Pretrain/Learning Rate": 6.056359380992305e-08, "Pretrain/Loss": 1.9821527004241943, "Pretrain/Loss (Raw)": 1.9471122026443481, "Pretrain/Step": 18663, "Pretrain/Step Time": 8.490185773000121} +{"Pretrain/Learning Rate": 6.026864054267389e-08, "Pretrain/Loss": 1.981710433959961, "Pretrain/Loss (Raw)": 1.8217450380325317, "Pretrain/Step": 18664, "Pretrain/Step Time": 8.488870834931731} +{"Pretrain/Learning Rate": 5.997440639499696e-08, "Pretrain/Loss": 1.9794058799743652, "Pretrain/Loss (Raw)": 1.8216813802719116, "Pretrain/Step": 18665, "Pretrain/Step Time": 8.488775068894029} +{"Pretrain/Learning Rate": 5.968089137537713e-08, "Pretrain/Loss": 1.9803770780563354, "Pretrain/Loss (Raw)": 2.0725700855255127, "Pretrain/Step": 18666, "Pretrain/Step Time": 8.49504023604095} +{"Pretrain/Learning Rate": 5.938809549227708e-08, "Pretrain/Loss": 1.9812843799591064, "Pretrain/Loss (Raw)": 2.025470018386841, "Pretrain/Step": 18667, "Pretrain/Step Time": 8.494793638586998} +{"Pretrain/Learning Rate": 5.9096018754140056e-08, "Pretrain/Loss": 1.9844785928726196, "Pretrain/Loss (Raw)": 2.086228609085083, "Pretrain/Step": 18668, "Pretrain/Step Time": 8.495729668065906} +{"Pretrain/Learning Rate": 5.8804661169384326e-08, "Pretrain/Loss": 1.9858605861663818, "Pretrain/Loss (Raw)": 2.1100869178771973, "Pretrain/Step": 18669, "Pretrain/Step Time": 8.495225602760911} +{"Pretrain/Learning Rate": 5.8514022746417044e-08, "Pretrain/Loss": 1.9866178035736084, "Pretrain/Loss (Raw)": 1.9240493774414062, "Pretrain/Step": 18670, "Pretrain/Step Time": 8.497472608461976} +{"Pretrain/Learning Rate": 5.8224103493614845e-08, "Pretrain/Loss": 1.9862060546875, "Pretrain/Loss (Raw)": 1.9767214059829712, "Pretrain/Step": 18671, "Pretrain/Step Time": 8.489847965538502} +{"Pretrain/Learning Rate": 5.793490341933494e-08, "Pretrain/Loss": 1.9866433143615723, "Pretrain/Loss (Raw)": 2.0093913078308105, "Pretrain/Step": 18672, "Pretrain/Step Time": 8.494899235665798} +{"Pretrain/Learning Rate": 5.764642253192065e-08, "Pretrain/Loss": 1.9858732223510742, "Pretrain/Loss (Raw)": 1.891303300857544, "Pretrain/Step": 18673, "Pretrain/Step Time": 8.495397688820958} +{"Pretrain/Learning Rate": 5.7358660839690325e-08, "Pretrain/Loss": 1.98546302318573, "Pretrain/Loss (Raw)": 1.9988982677459717, "Pretrain/Step": 18674, "Pretrain/Step Time": 8.494408074766397} +{"Pretrain/Learning Rate": 5.707161835093733e-08, "Pretrain/Loss": 1.9846999645233154, "Pretrain/Loss (Raw)": 1.8801742792129517, "Pretrain/Step": 18675, "Pretrain/Step Time": 8.495142675936222} +{"Pretrain/Learning Rate": 5.6785295073941146e-08, "Pretrain/Loss": 1.9853384494781494, "Pretrain/Loss (Raw)": 2.131114959716797, "Pretrain/Step": 18676, "Pretrain/Step Time": 8.495910160243511} +{"Pretrain/Learning Rate": 5.649969101695907e-08, "Pretrain/Loss": 1.9856418371200562, "Pretrain/Loss (Raw)": 1.9047737121582031, "Pretrain/Step": 18677, "Pretrain/Step Time": 8.498777534812689} +{"Pretrain/Learning Rate": 5.6214806188220616e-08, "Pretrain/Loss": 1.9868624210357666, "Pretrain/Loss (Raw)": 2.1683521270751953, "Pretrain/Step": 18678, "Pretrain/Step Time": 8.49630118533969} +{"Pretrain/Learning Rate": 5.5930640595946995e-08, "Pretrain/Loss": 1.9862966537475586, "Pretrain/Loss (Raw)": 1.7334740161895752, "Pretrain/Step": 18679, "Pretrain/Step Time": 8.492179417982697} +{"Pretrain/Learning Rate": 5.564719424832887e-08, "Pretrain/Loss": 1.9886471033096313, "Pretrain/Loss (Raw)": 2.1770167350769043, "Pretrain/Step": 18680, "Pretrain/Step Time": 8.491196533665061} +{"Pretrain/Learning Rate": 5.536446715353749e-08, "Pretrain/Loss": 1.9875423908233643, "Pretrain/Loss (Raw)": 1.849577784538269, "Pretrain/Step": 18681, "Pretrain/Step Time": 8.49080815166235} +{"Pretrain/Learning Rate": 5.5082459319730215e-08, "Pretrain/Loss": 1.9845131635665894, "Pretrain/Loss (Raw)": 1.6683995723724365, "Pretrain/Step": 18682, "Pretrain/Step Time": 8.493591088801622} +{"Pretrain/Learning Rate": 5.4801170755031104e-08, "Pretrain/Loss": 1.984662413597107, "Pretrain/Loss (Raw)": 2.0574214458465576, "Pretrain/Step": 18683, "Pretrain/Step Time": 8.494457924738526} +{"Pretrain/Learning Rate": 5.4520601467558664e-08, "Pretrain/Loss": 1.9838242530822754, "Pretrain/Loss (Raw)": 1.703938364982605, "Pretrain/Step": 18684, "Pretrain/Step Time": 8.496666653081775} +{"Pretrain/Learning Rate": 5.424075146539531e-08, "Pretrain/Loss": 1.982155680656433, "Pretrain/Loss (Raw)": 1.924052119255066, "Pretrain/Step": 18685, "Pretrain/Step Time": 8.489957785233855} +{"Pretrain/Learning Rate": 5.3961620756617926e-08, "Pretrain/Loss": 1.9798840284347534, "Pretrain/Loss (Raw)": 1.9014092683792114, "Pretrain/Step": 18686, "Pretrain/Step Time": 8.490511734038591} +{"Pretrain/Learning Rate": 5.368320934927007e-08, "Pretrain/Loss": 1.9816118478775024, "Pretrain/Loss (Raw)": 2.191396951675415, "Pretrain/Step": 18687, "Pretrain/Step Time": 8.48392635397613} +{"Pretrain/Learning Rate": 5.340551725138143e-08, "Pretrain/Loss": 1.979567050933838, "Pretrain/Loss (Raw)": 1.8415241241455078, "Pretrain/Step": 18688, "Pretrain/Step Time": 8.487728118896484} +{"Pretrain/Learning Rate": 5.3128544470956723e-08, "Pretrain/Loss": 1.9802284240722656, "Pretrain/Loss (Raw)": 2.117245674133301, "Pretrain/Step": 18689, "Pretrain/Step Time": 8.481467947363853} +{"Pretrain/Learning Rate": 5.285229101598399e-08, "Pretrain/Loss": 1.9792661666870117, "Pretrain/Loss (Raw)": 1.9691741466522217, "Pretrain/Step": 18690, "Pretrain/Step Time": 8.480020025745034} +{"Pretrain/Learning Rate": 5.257675689443187e-08, "Pretrain/Loss": 1.9783066511154175, "Pretrain/Loss (Raw)": 2.019171714782715, "Pretrain/Step": 18691, "Pretrain/Step Time": 8.481354959309101} +{"Pretrain/Learning Rate": 5.230194211424122e-08, "Pretrain/Loss": 1.9776362180709839, "Pretrain/Loss (Raw)": 2.0097498893737793, "Pretrain/Step": 18692, "Pretrain/Step Time": 8.486532881855965} +{"Pretrain/Learning Rate": 5.202784668333349e-08, "Pretrain/Loss": 1.9761128425598145, "Pretrain/Loss (Raw)": 1.8068406581878662, "Pretrain/Step": 18693, "Pretrain/Step Time": 8.489294692873955} +{"Pretrain/Learning Rate": 5.175447060961902e-08, "Pretrain/Loss": 1.978264331817627, "Pretrain/Loss (Raw)": 2.107344388961792, "Pretrain/Step": 18694, "Pretrain/Step Time": 8.49020903557539} +{"Pretrain/Learning Rate": 5.148181390097762e-08, "Pretrain/Loss": 1.9788082838058472, "Pretrain/Loss (Raw)": 2.0123450756073, "Pretrain/Step": 18695, "Pretrain/Step Time": 8.484788339585066} +{"Pretrain/Learning Rate": 5.1209876565269654e-08, "Pretrain/Loss": 1.9766120910644531, "Pretrain/Loss (Raw)": 1.742309331893921, "Pretrain/Step": 18696, "Pretrain/Step Time": 8.48824979737401} +{"Pretrain/Learning Rate": 5.093865861033609e-08, "Pretrain/Loss": 1.9765870571136475, "Pretrain/Loss (Raw)": 2.0722312927246094, "Pretrain/Step": 18697, "Pretrain/Step Time": 8.48760186508298} +{"Pretrain/Learning Rate": 5.066816004399844e-08, "Pretrain/Loss": 1.9729251861572266, "Pretrain/Loss (Raw)": 2.01936936378479, "Pretrain/Step": 18698, "Pretrain/Step Time": 8.491733057424426} +{"Pretrain/Learning Rate": 5.039838087405879e-08, "Pretrain/Loss": 1.972819209098816, "Pretrain/Loss (Raw)": 2.057349920272827, "Pretrain/Step": 18699, "Pretrain/Step Time": 8.491763042286038} +{"Pretrain/Learning Rate": 5.012932110829149e-08, "Pretrain/Loss": 1.9743459224700928, "Pretrain/Loss (Raw)": 2.06554913520813, "Pretrain/Step": 18700, "Pretrain/Step Time": 8.488277811557055} +{"Pretrain/Learning Rate": 4.9860980754456997e-08, "Pretrain/Loss": 1.9763349294662476, "Pretrain/Loss (Raw)": 2.083858013153076, "Pretrain/Step": 18701, "Pretrain/Step Time": 8.488491645082831} +{"Pretrain/Learning Rate": 4.9593359820290785e-08, "Pretrain/Loss": 1.9756062030792236, "Pretrain/Loss (Raw)": 1.88068687915802, "Pretrain/Step": 18702, "Pretrain/Step Time": 8.486961718648672} +{"Pretrain/Learning Rate": 4.932645831351446e-08, "Pretrain/Loss": 1.9774324893951416, "Pretrain/Loss (Raw)": 2.219162940979004, "Pretrain/Step": 18703, "Pretrain/Step Time": 8.483968887478113} +{"Pretrain/Learning Rate": 4.906027624181908e-08, "Pretrain/Loss": 1.9789988994598389, "Pretrain/Loss (Raw)": 1.8710484504699707, "Pretrain/Step": 18704, "Pretrain/Step Time": 8.481310414150357} +{"Pretrain/Learning Rate": 4.879481361288185e-08, "Pretrain/Loss": 1.9766429662704468, "Pretrain/Loss (Raw)": 1.6788958311080933, "Pretrain/Step": 18705, "Pretrain/Step Time": 8.487435713410378} +{"Pretrain/Learning Rate": 4.853007043435498e-08, "Pretrain/Loss": 1.9756298065185547, "Pretrain/Loss (Raw)": 1.9362246990203857, "Pretrain/Step": 18706, "Pretrain/Step Time": 8.484375026077032} +{"Pretrain/Learning Rate": 4.8266046713874026e-08, "Pretrain/Loss": 1.9797444343566895, "Pretrain/Loss (Raw)": 2.4231503009796143, "Pretrain/Step": 18707, "Pretrain/Step Time": 8.486174698919058} +{"Pretrain/Learning Rate": 4.800274245905512e-08, "Pretrain/Loss": 1.9804272651672363, "Pretrain/Loss (Raw)": 2.124070167541504, "Pretrain/Step": 18708, "Pretrain/Step Time": 8.481375323608518} +{"Pretrain/Learning Rate": 4.7740157677483854e-08, "Pretrain/Loss": 1.9816969633102417, "Pretrain/Loss (Raw)": 2.1166179180145264, "Pretrain/Step": 18709, "Pretrain/Step Time": 8.486633082851768} +{"Pretrain/Learning Rate": 4.7478292376734735e-08, "Pretrain/Loss": 1.980711817741394, "Pretrain/Loss (Raw)": 2.022641897201538, "Pretrain/Step": 18710, "Pretrain/Step Time": 8.486505286768079} +{"Pretrain/Learning Rate": 4.7217146564360045e-08, "Pretrain/Loss": 1.9811276197433472, "Pretrain/Loss (Raw)": 2.0956881046295166, "Pretrain/Step": 18711, "Pretrain/Step Time": 8.490047667175531} +{"Pretrain/Learning Rate": 4.695672024788989e-08, "Pretrain/Loss": 1.9817039966583252, "Pretrain/Loss (Raw)": 1.945966362953186, "Pretrain/Step": 18712, "Pretrain/Step Time": 8.48268255777657} +{"Pretrain/Learning Rate": 4.669701343482935e-08, "Pretrain/Loss": 1.9813964366912842, "Pretrain/Loss (Raw)": 2.0765388011932373, "Pretrain/Step": 18713, "Pretrain/Step Time": 8.481189223006368} +{"Pretrain/Learning Rate": 4.6438026132669676e-08, "Pretrain/Loss": 1.978381633758545, "Pretrain/Loss (Raw)": 1.641821026802063, "Pretrain/Step": 18714, "Pretrain/Step Time": 8.486091800034046} +{"Pretrain/Learning Rate": 4.6179758348879884e-08, "Pretrain/Loss": 1.9788618087768555, "Pretrain/Loss (Raw)": 2.173753499984741, "Pretrain/Step": 18715, "Pretrain/Step Time": 8.487047398462892} +{"Pretrain/Learning Rate": 4.5922210090904026e-08, "Pretrain/Loss": 1.9781627655029297, "Pretrain/Loss (Raw)": 1.7665587663650513, "Pretrain/Step": 18716, "Pretrain/Step Time": 8.490676490589976} +{"Pretrain/Learning Rate": 4.566538136616949e-08, "Pretrain/Loss": 1.9787170886993408, "Pretrain/Loss (Raw)": 1.948893427848816, "Pretrain/Step": 18717, "Pretrain/Step Time": 8.488866562023759} +{"Pretrain/Learning Rate": 4.540927218208424e-08, "Pretrain/Loss": 1.980413556098938, "Pretrain/Loss (Raw)": 2.1106598377227783, "Pretrain/Step": 18718, "Pretrain/Step Time": 8.49350779876113} +{"Pretrain/Learning Rate": 4.5153882546028484e-08, "Pretrain/Loss": 1.9803646802902222, "Pretrain/Loss (Raw)": 2.0086865425109863, "Pretrain/Step": 18719, "Pretrain/Step Time": 8.489933939650655} +{"Pretrain/Learning Rate": 4.489921246537132e-08, "Pretrain/Loss": 1.9807745218276978, "Pretrain/Loss (Raw)": 2.0133748054504395, "Pretrain/Step": 18720, "Pretrain/Step Time": 8.489241441711783} +{"Pretrain/Learning Rate": 4.464526194745133e-08, "Pretrain/Loss": 1.9781885147094727, "Pretrain/Loss (Raw)": 1.84415602684021, "Pretrain/Step": 18721, "Pretrain/Step Time": 8.488596653565764} +{"Pretrain/Learning Rate": 4.439203099959322e-08, "Pretrain/Loss": 1.977830171585083, "Pretrain/Loss (Raw)": 1.873708724975586, "Pretrain/Step": 18722, "Pretrain/Step Time": 8.49246433377266} +{"Pretrain/Learning Rate": 4.413951962909668e-08, "Pretrain/Loss": 1.9782907962799072, "Pretrain/Loss (Raw)": 1.9330165386199951, "Pretrain/Step": 18723, "Pretrain/Step Time": 8.498647678643465} +{"Pretrain/Learning Rate": 4.3887727843247575e-08, "Pretrain/Loss": 1.979053020477295, "Pretrain/Loss (Raw)": 1.9649397134780884, "Pretrain/Step": 18724, "Pretrain/Step Time": 8.494367457926273} +{"Pretrain/Learning Rate": 4.3636655649301194e-08, "Pretrain/Loss": 1.9795688390731812, "Pretrain/Loss (Raw)": 2.0883421897888184, "Pretrain/Step": 18725, "Pretrain/Step Time": 8.500943725928664} +{"Pretrain/Learning Rate": 4.3386303054498976e-08, "Pretrain/Loss": 1.980443000793457, "Pretrain/Loss (Raw)": 1.915467381477356, "Pretrain/Step": 18726, "Pretrain/Step Time": 8.498910577967763} +{"Pretrain/Learning Rate": 4.313667006605737e-08, "Pretrain/Loss": 1.9795747995376587, "Pretrain/Loss (Raw)": 1.912354588508606, "Pretrain/Step": 18727, "Pretrain/Step Time": 8.49998065829277} +{"Pretrain/Learning Rate": 4.2887756691178946e-08, "Pretrain/Loss": 1.9800748825073242, "Pretrain/Loss (Raw)": 2.0239322185516357, "Pretrain/Step": 18728, "Pretrain/Step Time": 8.492706833407283} +{"Pretrain/Learning Rate": 4.2639562937038525e-08, "Pretrain/Loss": 1.9816386699676514, "Pretrain/Loss (Raw)": 1.9084666967391968, "Pretrain/Step": 18729, "Pretrain/Step Time": 8.490152049809694} +{"Pretrain/Learning Rate": 4.2392088810791486e-08, "Pretrain/Loss": 1.982172966003418, "Pretrain/Loss (Raw)": 2.0030970573425293, "Pretrain/Step": 18730, "Pretrain/Step Time": 8.491631539538503} +{"Pretrain/Learning Rate": 4.214533431957657e-08, "Pretrain/Loss": 1.9817490577697754, "Pretrain/Loss (Raw)": 1.9058207273483276, "Pretrain/Step": 18731, "Pretrain/Step Time": 8.493172600865364} +{"Pretrain/Learning Rate": 4.189929947050475e-08, "Pretrain/Loss": 1.978595495223999, "Pretrain/Loss (Raw)": 1.669557809829712, "Pretrain/Step": 18732, "Pretrain/Step Time": 8.497560570016503} +{"Pretrain/Learning Rate": 4.165398427067313e-08, "Pretrain/Loss": 1.9778072834014893, "Pretrain/Loss (Raw)": 1.852219581604004, "Pretrain/Step": 18733, "Pretrain/Step Time": 8.495256520807743} +{"Pretrain/Learning Rate": 4.140938872715105e-08, "Pretrain/Loss": 1.9765063524246216, "Pretrain/Loss (Raw)": 1.9298356771469116, "Pretrain/Step": 18734, "Pretrain/Step Time": 8.496262051165104} +{"Pretrain/Learning Rate": 4.1165512846999545e-08, "Pretrain/Loss": 1.9746323823928833, "Pretrain/Loss (Raw)": 1.8062011003494263, "Pretrain/Step": 18735, "Pretrain/Step Time": 8.49500997364521} +{"Pretrain/Learning Rate": 4.092235663724353e-08, "Pretrain/Loss": 1.9755792617797852, "Pretrain/Loss (Raw)": 2.1315548419952393, "Pretrain/Step": 18736, "Pretrain/Step Time": 8.48914834111929} +{"Pretrain/Learning Rate": 4.067992010489685e-08, "Pretrain/Loss": 1.9774203300476074, "Pretrain/Loss (Raw)": 2.0510385036468506, "Pretrain/Step": 18737, "Pretrain/Step Time": 8.488527061417699} +{"Pretrain/Learning Rate": 4.043820325694836e-08, "Pretrain/Loss": 1.9812700748443604, "Pretrain/Loss (Raw)": 2.2814035415649414, "Pretrain/Step": 18738, "Pretrain/Step Time": 8.48621103912592} +{"Pretrain/Learning Rate": 4.019720610037025e-08, "Pretrain/Loss": 1.9816055297851562, "Pretrain/Loss (Raw)": 2.0080149173736572, "Pretrain/Step": 18739, "Pretrain/Step Time": 8.493568511679769} +{"Pretrain/Learning Rate": 3.995692864210976e-08, "Pretrain/Loss": 1.983475923538208, "Pretrain/Loss (Raw)": 2.1314265727996826, "Pretrain/Step": 18740, "Pretrain/Step Time": 8.497064296156168} +{"Pretrain/Learning Rate": 3.971737088909466e-08, "Pretrain/Loss": 1.983760118484497, "Pretrain/Loss (Raw)": 1.9068025350570679, "Pretrain/Step": 18741, "Pretrain/Step Time": 8.5071652084589} +{"Pretrain/Learning Rate": 3.9478532848236107e-08, "Pretrain/Loss": 1.9837156534194946, "Pretrain/Loss (Raw)": 2.1481194496154785, "Pretrain/Step": 18742, "Pretrain/Step Time": 8.506987372413278} +{"Pretrain/Learning Rate": 3.924041452641469e-08, "Pretrain/Loss": 1.9844764471054077, "Pretrain/Loss (Raw)": 2.0259077548980713, "Pretrain/Step": 18743, "Pretrain/Step Time": 8.507477419450879} +{"Pretrain/Learning Rate": 3.900301593049993e-08, "Pretrain/Loss": 1.985640287399292, "Pretrain/Loss (Raw)": 2.04288911819458, "Pretrain/Step": 18744, "Pretrain/Step Time": 8.504602050408721} +{"Pretrain/Learning Rate": 3.876633706733912e-08, "Pretrain/Loss": 1.9871388673782349, "Pretrain/Loss (Raw)": 2.141876220703125, "Pretrain/Step": 18745, "Pretrain/Step Time": 8.500806665048003} +{"Pretrain/Learning Rate": 3.853037794375458e-08, "Pretrain/Loss": 1.9875216484069824, "Pretrain/Loss (Raw)": 2.014677047729492, "Pretrain/Step": 18746, "Pretrain/Step Time": 8.501443797722459} +{"Pretrain/Learning Rate": 3.829513856654921e-08, "Pretrain/Loss": 1.988008975982666, "Pretrain/Loss (Raw)": 2.0484561920166016, "Pretrain/Step": 18747, "Pretrain/Step Time": 8.498369140550494} +{"Pretrain/Learning Rate": 3.8060618942506454e-08, "Pretrain/Loss": 1.9858397245407104, "Pretrain/Loss (Raw)": 1.9958895444869995, "Pretrain/Step": 18748, "Pretrain/Step Time": 8.500747300684452} +{"Pretrain/Learning Rate": 3.782681907838759e-08, "Pretrain/Loss": 1.9860097169876099, "Pretrain/Loss (Raw)": 1.9735429286956787, "Pretrain/Step": 18749, "Pretrain/Step Time": 8.501493267714977} +{"Pretrain/Learning Rate": 3.759373898093721e-08, "Pretrain/Loss": 1.9863276481628418, "Pretrain/Loss (Raw)": 1.9459744691848755, "Pretrain/Step": 18750, "Pretrain/Step Time": 8.505163315683603} +{"Pretrain/Learning Rate": 3.736137865687217e-08, "Pretrain/Loss": 1.9854822158813477, "Pretrain/Loss (Raw)": 1.8356298208236694, "Pretrain/Step": 18751, "Pretrain/Step Time": 8.508573241531849} +{"Pretrain/Learning Rate": 3.712973811289544e-08, "Pretrain/Loss": 1.9842009544372559, "Pretrain/Loss (Raw)": 2.0924127101898193, "Pretrain/Step": 18752, "Pretrain/Step Time": 8.507348636165261} +{"Pretrain/Learning Rate": 3.689881735568501e-08, "Pretrain/Loss": 1.9849879741668701, "Pretrain/Loss (Raw)": 2.216052293777466, "Pretrain/Step": 18753, "Pretrain/Step Time": 8.50395074672997} +{"Pretrain/Learning Rate": 3.666861639189667e-08, "Pretrain/Loss": 1.9877912998199463, "Pretrain/Loss (Raw)": 2.1788723468780518, "Pretrain/Step": 18754, "Pretrain/Step Time": 8.497460424900055} +{"Pretrain/Learning Rate": 3.6439135228175105e-08, "Pretrain/Loss": 1.9879580736160278, "Pretrain/Loss (Raw)": 2.0444083213806152, "Pretrain/Step": 18755, "Pretrain/Step Time": 8.497256295755506} +{"Pretrain/Learning Rate": 3.6210373871131684e-08, "Pretrain/Loss": 1.9870967864990234, "Pretrain/Loss (Raw)": 1.824079990386963, "Pretrain/Step": 18756, "Pretrain/Step Time": 8.502966862171888} +{"Pretrain/Learning Rate": 3.5982332327361145e-08, "Pretrain/Loss": 1.9859840869903564, "Pretrain/Loss (Raw)": 1.994695782661438, "Pretrain/Step": 18757, "Pretrain/Step Time": 8.50646672025323} +{"Pretrain/Learning Rate": 3.5755010603444325e-08, "Pretrain/Loss": 1.9858423471450806, "Pretrain/Loss (Raw)": 1.9820189476013184, "Pretrain/Step": 18758, "Pretrain/Step Time": 8.504763767123222} +{"Pretrain/Learning Rate": 3.552840870593155e-08, "Pretrain/Loss": 1.9868457317352295, "Pretrain/Loss (Raw)": 2.210083484649658, "Pretrain/Step": 18759, "Pretrain/Step Time": 8.50245102494955} +{"Pretrain/Learning Rate": 3.530252664135925e-08, "Pretrain/Loss": 1.9863172769546509, "Pretrain/Loss (Raw)": 1.9164763689041138, "Pretrain/Step": 18760, "Pretrain/Step Time": 8.500668531283736} +{"Pretrain/Learning Rate": 3.507736441624165e-08, "Pretrain/Loss": 1.9864795207977295, "Pretrain/Loss (Raw)": 2.0986452102661133, "Pretrain/Step": 18761, "Pretrain/Step Time": 8.496952952817082} +{"Pretrain/Learning Rate": 3.485292203706525e-08, "Pretrain/Loss": 1.9875479936599731, "Pretrain/Loss (Raw)": 2.1329472064971924, "Pretrain/Step": 18762, "Pretrain/Step Time": 8.49243925884366} +{"Pretrain/Learning Rate": 3.462919951030819e-08, "Pretrain/Loss": 1.9899815320968628, "Pretrain/Loss (Raw)": 2.431432008743286, "Pretrain/Step": 18763, "Pretrain/Step Time": 8.490923779085279} +{"Pretrain/Learning Rate": 3.440619684241808e-08, "Pretrain/Loss": 1.9892561435699463, "Pretrain/Loss (Raw)": 1.773793339729309, "Pretrain/Step": 18764, "Pretrain/Step Time": 8.492431171238422} +{"Pretrain/Learning Rate": 3.4183914039825904e-08, "Pretrain/Loss": 1.9874454736709595, "Pretrain/Loss (Raw)": 2.076045513153076, "Pretrain/Step": 18765, "Pretrain/Step Time": 8.490835020318627} +{"Pretrain/Learning Rate": 3.3962351108940414e-08, "Pretrain/Loss": 1.987891435623169, "Pretrain/Loss (Raw)": 2.056546449661255, "Pretrain/Step": 18766, "Pretrain/Step Time": 8.489465156570077} +{"Pretrain/Learning Rate": 3.3741508056148174e-08, "Pretrain/Loss": 1.9892857074737549, "Pretrain/Loss (Raw)": 2.0899996757507324, "Pretrain/Step": 18767, "Pretrain/Step Time": 8.492921156808734} +{"Pretrain/Learning Rate": 3.3521384887824634e-08, "Pretrain/Loss": 1.9885773658752441, "Pretrain/Loss (Raw)": 1.916765570640564, "Pretrain/Step": 18768, "Pretrain/Step Time": 8.492683766409755} +{"Pretrain/Learning Rate": 3.3301981610306396e-08, "Pretrain/Loss": 1.9858081340789795, "Pretrain/Loss (Raw)": 1.784766674041748, "Pretrain/Step": 18769, "Pretrain/Step Time": 8.488773081451654} +{"Pretrain/Learning Rate": 3.308329822993006e-08, "Pretrain/Loss": 1.9841313362121582, "Pretrain/Loss (Raw)": 1.8111672401428223, "Pretrain/Step": 18770, "Pretrain/Step Time": 8.48854810744524} +{"Pretrain/Learning Rate": 3.286533475299336e-08, "Pretrain/Loss": 1.9804967641830444, "Pretrain/Loss (Raw)": 2.0559444427490234, "Pretrain/Step": 18771, "Pretrain/Step Time": 8.487371139228344} +{"Pretrain/Learning Rate": 3.2648091185785713e-08, "Pretrain/Loss": 1.9803318977355957, "Pretrain/Loss (Raw)": 1.8632310628890991, "Pretrain/Step": 18772, "Pretrain/Step Time": 8.491644186899066} +{"Pretrain/Learning Rate": 3.243156753456877e-08, "Pretrain/Loss": 1.9826033115386963, "Pretrain/Loss (Raw)": 1.9992852210998535, "Pretrain/Step": 18773, "Pretrain/Step Time": 8.492007803171873} +{"Pretrain/Learning Rate": 3.2215763805584776e-08, "Pretrain/Loss": 1.9852029085159302, "Pretrain/Loss (Raw)": 2.094721794128418, "Pretrain/Step": 18774, "Pretrain/Step Time": 8.490730991587043} +{"Pretrain/Learning Rate": 3.200068000505929e-08, "Pretrain/Loss": 1.9828801155090332, "Pretrain/Loss (Raw)": 1.8824220895767212, "Pretrain/Step": 18775, "Pretrain/Step Time": 8.488738542422652} +{"Pretrain/Learning Rate": 3.1786316139192917e-08, "Pretrain/Loss": 1.9839239120483398, "Pretrain/Loss (Raw)": 2.037010669708252, "Pretrain/Step": 18776, "Pretrain/Step Time": 8.488341281190515} +{"Pretrain/Learning Rate": 3.1572672214169596e-08, "Pretrain/Loss": 1.9871208667755127, "Pretrain/Loss (Raw)": 2.1301839351654053, "Pretrain/Step": 18777, "Pretrain/Step Time": 8.488197408616543} +{"Pretrain/Learning Rate": 3.135974823614274e-08, "Pretrain/Loss": 1.9849252700805664, "Pretrain/Loss (Raw)": 1.7919199466705322, "Pretrain/Step": 18778, "Pretrain/Step Time": 8.487979730591178} +{"Pretrain/Learning Rate": 3.114754421125743e-08, "Pretrain/Loss": 1.9845380783081055, "Pretrain/Loss (Raw)": 2.0273613929748535, "Pretrain/Step": 18779, "Pretrain/Step Time": 8.486802026629448} +{"Pretrain/Learning Rate": 3.0936060145630996e-08, "Pretrain/Loss": 1.9853907823562622, "Pretrain/Loss (Raw)": 1.8841474056243896, "Pretrain/Step": 18780, "Pretrain/Step Time": 8.48232945613563} +{"Pretrain/Learning Rate": 3.072529604536134e-08, "Pretrain/Loss": 1.9838526248931885, "Pretrain/Loss (Raw)": 1.9696613550186157, "Pretrain/Step": 18781, "Pretrain/Step Time": 8.485573768615723} +{"Pretrain/Learning Rate": 3.0515251916524155e-08, "Pretrain/Loss": 1.9853214025497437, "Pretrain/Loss (Raw)": 1.9754295349121094, "Pretrain/Step": 18782, "Pretrain/Step Time": 8.491034433245659} +{"Pretrain/Learning Rate": 3.030592776517849e-08, "Pretrain/Loss": 1.9855132102966309, "Pretrain/Loss (Raw)": 1.9257477521896362, "Pretrain/Step": 18783, "Pretrain/Step Time": 8.494604181498289} +{"Pretrain/Learning Rate": 3.0097323597358394e-08, "Pretrain/Loss": 1.984954595565796, "Pretrain/Loss (Raw)": 1.9638378620147705, "Pretrain/Step": 18784, "Pretrain/Step Time": 8.491678619757295} +{"Pretrain/Learning Rate": 2.988943941908129e-08, "Pretrain/Loss": 1.9863765239715576, "Pretrain/Loss (Raw)": 2.229823112487793, "Pretrain/Step": 18785, "Pretrain/Step Time": 8.48932782560587} +{"Pretrain/Learning Rate": 2.968227523633682e-08, "Pretrain/Loss": 1.9872775077819824, "Pretrain/Loss (Raw)": 1.9981416463851929, "Pretrain/Step": 18786, "Pretrain/Step Time": 8.48630136065185} +{"Pretrain/Learning Rate": 2.947583105510354e-08, "Pretrain/Loss": 1.9889233112335205, "Pretrain/Loss (Raw)": 2.188554525375366, "Pretrain/Step": 18787, "Pretrain/Step Time": 8.488828400149941} +{"Pretrain/Learning Rate": 2.9270106881329474e-08, "Pretrain/Loss": 1.992050290107727, "Pretrain/Loss (Raw)": 2.196173667907715, "Pretrain/Step": 18788, "Pretrain/Step Time": 8.48709373921156} +{"Pretrain/Learning Rate": 2.9065102720948756e-08, "Pretrain/Loss": 1.9933232069015503, "Pretrain/Loss (Raw)": 2.0318822860717773, "Pretrain/Step": 18789, "Pretrain/Step Time": 8.486884528771043} +{"Pretrain/Learning Rate": 2.8860818579873327e-08, "Pretrain/Loss": 1.991382360458374, "Pretrain/Loss (Raw)": 1.751084566116333, "Pretrain/Step": 18790, "Pretrain/Step Time": 8.490160824730992} +{"Pretrain/Learning Rate": 2.865725446399292e-08, "Pretrain/Loss": 1.991480827331543, "Pretrain/Loss (Raw)": 1.9597119092941284, "Pretrain/Step": 18791, "Pretrain/Step Time": 8.492584938183427} +{"Pretrain/Learning Rate": 2.8454410379175066e-08, "Pretrain/Loss": 1.992841362953186, "Pretrain/Loss (Raw)": 1.9958674907684326, "Pretrain/Step": 18792, "Pretrain/Step Time": 8.486576052382588} +{"Pretrain/Learning Rate": 2.8252286331273413e-08, "Pretrain/Loss": 1.9967026710510254, "Pretrain/Loss (Raw)": 2.315957546234131, "Pretrain/Step": 18793, "Pretrain/Step Time": 8.486516961827874} +{"Pretrain/Learning Rate": 2.8050882326111082e-08, "Pretrain/Loss": 1.996680498123169, "Pretrain/Loss (Raw)": 2.0697197914123535, "Pretrain/Step": 18794, "Pretrain/Step Time": 8.481552435085177} +{"Pretrain/Learning Rate": 2.7850198369497316e-08, "Pretrain/Loss": 1.9961652755737305, "Pretrain/Loss (Raw)": 1.9595056772232056, "Pretrain/Step": 18795, "Pretrain/Step Time": 8.482259701937437} +{"Pretrain/Learning Rate": 2.7650234467221926e-08, "Pretrain/Loss": 1.9944534301757812, "Pretrain/Loss (Raw)": 1.8671185970306396, "Pretrain/Step": 18796, "Pretrain/Step Time": 8.486588573083282} +{"Pretrain/Learning Rate": 2.7450990625044192e-08, "Pretrain/Loss": 1.9938559532165527, "Pretrain/Loss (Raw)": 2.0336050987243652, "Pretrain/Step": 18797, "Pretrain/Step Time": 8.482253916561604} +{"Pretrain/Learning Rate": 2.72524668487123e-08, "Pretrain/Loss": 1.9943301677703857, "Pretrain/Loss (Raw)": 1.984763503074646, "Pretrain/Step": 18798, "Pretrain/Step Time": 8.48219844698906} +{"Pretrain/Learning Rate": 2.7054663143954995e-08, "Pretrain/Loss": 1.993462085723877, "Pretrain/Loss (Raw)": 1.8656208515167236, "Pretrain/Step": 18799, "Pretrain/Step Time": 8.48627483844757} +{"Pretrain/Learning Rate": 2.6857579516467725e-08, "Pretrain/Loss": 1.9920501708984375, "Pretrain/Loss (Raw)": 1.8286347389221191, "Pretrain/Step": 18800, "Pretrain/Step Time": 8.484911927953362} +{"Pretrain/Learning Rate": 2.6661215971937602e-08, "Pretrain/Loss": 1.992987871170044, "Pretrain/Loss (Raw)": 2.0113437175750732, "Pretrain/Step": 18801, "Pretrain/Step Time": 8.484485868364573} +{"Pretrain/Learning Rate": 2.6465572516029547e-08, "Pretrain/Loss": 1.9938039779663086, "Pretrain/Loss (Raw)": 2.103358745574951, "Pretrain/Step": 18802, "Pretrain/Step Time": 8.482393257319927} +{"Pretrain/Learning Rate": 2.6270649154377937e-08, "Pretrain/Loss": 1.9943616390228271, "Pretrain/Loss (Raw)": 1.9515440464019775, "Pretrain/Step": 18803, "Pretrain/Step Time": 8.477671032771468} +{"Pretrain/Learning Rate": 2.6076445892608826e-08, "Pretrain/Loss": 1.992917776107788, "Pretrain/Loss (Raw)": 1.9463131427764893, "Pretrain/Step": 18804, "Pretrain/Step Time": 8.478220945224166} +{"Pretrain/Learning Rate": 2.5882962736320515e-08, "Pretrain/Loss": 1.9935297966003418, "Pretrain/Loss (Raw)": 1.983119249343872, "Pretrain/Step": 18805, "Pretrain/Step Time": 8.478514689952135} +{"Pretrain/Learning Rate": 2.56901996910891e-08, "Pretrain/Loss": 1.9916448593139648, "Pretrain/Loss (Raw)": 1.9270691871643066, "Pretrain/Step": 18806, "Pretrain/Step Time": 8.483245505020022} +{"Pretrain/Learning Rate": 2.54981567624768e-08, "Pretrain/Loss": 1.9954801797866821, "Pretrain/Loss (Raw)": 2.2243926525115967, "Pretrain/Step": 18807, "Pretrain/Step Time": 8.481330608949065} +{"Pretrain/Learning Rate": 2.5306833956018072e-08, "Pretrain/Loss": 1.99595046043396, "Pretrain/Loss (Raw)": 2.237212657928467, "Pretrain/Step": 18808, "Pretrain/Step Time": 8.485258888453245} +{"Pretrain/Learning Rate": 2.511623127723073e-08, "Pretrain/Loss": 1.997100830078125, "Pretrain/Loss (Raw)": 1.9968061447143555, "Pretrain/Step": 18809, "Pretrain/Step Time": 8.483342420309782} +{"Pretrain/Learning Rate": 2.492634873161037e-08, "Pretrain/Loss": 2.0000295639038086, "Pretrain/Loss (Raw)": 2.04331111907959, "Pretrain/Step": 18810, "Pretrain/Step Time": 8.479477433487773} +{"Pretrain/Learning Rate": 2.4737186324633177e-08, "Pretrain/Loss": 1.999601125717163, "Pretrain/Loss (Raw)": 2.002573251724243, "Pretrain/Step": 18811, "Pretrain/Step Time": 8.480315940454602} +{"Pretrain/Learning Rate": 2.454874406175589e-08, "Pretrain/Loss": 2.0012757778167725, "Pretrain/Loss (Raw)": 1.918298363685608, "Pretrain/Step": 18812, "Pretrain/Step Time": 8.487642299383879} +{"Pretrain/Learning Rate": 2.4361021948404728e-08, "Pretrain/Loss": 1.9998879432678223, "Pretrain/Loss (Raw)": 1.7463911771774292, "Pretrain/Step": 18813, "Pretrain/Step Time": 8.491302870213985} +{"Pretrain/Learning Rate": 2.4174019989997575e-08, "Pretrain/Loss": 2.001697540283203, "Pretrain/Loss (Raw)": 2.1330347061157227, "Pretrain/Step": 18814, "Pretrain/Step Time": 8.492924945428967} +{"Pretrain/Learning Rate": 2.3987738191927345e-08, "Pretrain/Loss": 2.000598430633545, "Pretrain/Loss (Raw)": 2.0507397651672363, "Pretrain/Step": 18815, "Pretrain/Step Time": 8.496428726240993} +{"Pretrain/Learning Rate": 2.3802176559561963e-08, "Pretrain/Loss": 2.004972457885742, "Pretrain/Loss (Raw)": 2.401392936706543, "Pretrain/Step": 18816, "Pretrain/Step Time": 8.492633495479822} +{"Pretrain/Learning Rate": 2.3617335098255478e-08, "Pretrain/Loss": 2.003387928009033, "Pretrain/Loss (Raw)": 1.9144102334976196, "Pretrain/Step": 18817, "Pretrain/Step Time": 8.489882752299309} +{"Pretrain/Learning Rate": 2.343321381333419e-08, "Pretrain/Loss": 2.003584384918213, "Pretrain/Loss (Raw)": 1.9943090677261353, "Pretrain/Step": 18818, "Pretrain/Step Time": 8.490571450442076} +{"Pretrain/Learning Rate": 2.3249812710110507e-08, "Pretrain/Loss": 2.0029072761535645, "Pretrain/Loss (Raw)": 1.9325180053710938, "Pretrain/Step": 18819, "Pretrain/Step Time": 8.489524368196726} +{"Pretrain/Learning Rate": 2.3067131793871875e-08, "Pretrain/Loss": 2.002162456512451, "Pretrain/Loss (Raw)": 1.9144201278686523, "Pretrain/Step": 18820, "Pretrain/Step Time": 8.486485300585628} +{"Pretrain/Learning Rate": 2.2885171069880752e-08, "Pretrain/Loss": 2.0047948360443115, "Pretrain/Loss (Raw)": 2.143789529800415, "Pretrain/Step": 18821, "Pretrain/Step Time": 8.486897116526961} +{"Pretrain/Learning Rate": 2.270393054339126e-08, "Pretrain/Loss": 2.005563735961914, "Pretrain/Loss (Raw)": 2.2057344913482666, "Pretrain/Step": 18822, "Pretrain/Step Time": 8.484759882092476} +{"Pretrain/Learning Rate": 2.2523410219627005e-08, "Pretrain/Loss": 2.0057249069213867, "Pretrain/Loss (Raw)": 2.032985210418701, "Pretrain/Step": 18823, "Pretrain/Step Time": 8.49399895593524} +{"Pretrain/Learning Rate": 2.2343610103789382e-08, "Pretrain/Loss": 2.0076217651367188, "Pretrain/Loss (Raw)": 1.98514986038208, "Pretrain/Step": 18824, "Pretrain/Step Time": 8.492924241349101} +{"Pretrain/Learning Rate": 2.2164530201068677e-08, "Pretrain/Loss": 2.003682851791382, "Pretrain/Loss (Raw)": 1.568013072013855, "Pretrain/Step": 18825, "Pretrain/Step Time": 8.494304774329066} +{"Pretrain/Learning Rate": 2.1986170516621886e-08, "Pretrain/Loss": 2.003648281097412, "Pretrain/Loss (Raw)": 2.0149214267730713, "Pretrain/Step": 18826, "Pretrain/Step Time": 8.492107715457678} +{"Pretrain/Learning Rate": 2.1808531055597657e-08, "Pretrain/Loss": 2.003053665161133, "Pretrain/Loss (Raw)": 1.981258511543274, "Pretrain/Step": 18827, "Pretrain/Step Time": 8.494169272482395} +{"Pretrain/Learning Rate": 2.1631611823116906e-08, "Pretrain/Loss": 2.00376296043396, "Pretrain/Loss (Raw)": 2.1563501358032227, "Pretrain/Step": 18828, "Pretrain/Step Time": 8.495725877583027} +{"Pretrain/Learning Rate": 2.1455412824278322e-08, "Pretrain/Loss": 2.0071680545806885, "Pretrain/Loss (Raw)": 2.5197134017944336, "Pretrain/Step": 18829, "Pretrain/Step Time": 8.49324250780046} +{"Pretrain/Learning Rate": 2.1279934064166728e-08, "Pretrain/Loss": 2.009896993637085, "Pretrain/Loss (Raw)": 2.2299797534942627, "Pretrain/Step": 18830, "Pretrain/Step Time": 8.494447270408273} +{"Pretrain/Learning Rate": 2.110517554783642e-08, "Pretrain/Loss": 2.009634017944336, "Pretrain/Loss (Raw)": 2.1855111122131348, "Pretrain/Step": 18831, "Pretrain/Step Time": 8.496162831783295} +{"Pretrain/Learning Rate": 2.093113728033058e-08, "Pretrain/Loss": 2.0109403133392334, "Pretrain/Loss (Raw)": 2.0382442474365234, "Pretrain/Step": 18832, "Pretrain/Step Time": 8.495643872767687} +{"Pretrain/Learning Rate": 2.0757819266664648e-08, "Pretrain/Loss": 2.0142664909362793, "Pretrain/Loss (Raw)": 2.104640007019043, "Pretrain/Step": 18833, "Pretrain/Step Time": 8.49051639251411} +{"Pretrain/Learning Rate": 2.058522151184017e-08, "Pretrain/Loss": 2.0157864093780518, "Pretrain/Loss (Raw)": 2.1307830810546875, "Pretrain/Step": 18834, "Pretrain/Step Time": 8.492771353572607} +{"Pretrain/Learning Rate": 2.0413344020830948e-08, "Pretrain/Loss": 2.011770725250244, "Pretrain/Loss (Raw)": 1.9091360569000244, "Pretrain/Step": 18835, "Pretrain/Step Time": 8.49298476614058} +{"Pretrain/Learning Rate": 2.024218679859413e-08, "Pretrain/Loss": 2.010450839996338, "Pretrain/Loss (Raw)": 1.9551130533218384, "Pretrain/Step": 18836, "Pretrain/Step Time": 8.496910454705358} +{"Pretrain/Learning Rate": 2.0071749850061883e-08, "Pretrain/Loss": 2.0114569664001465, "Pretrain/Loss (Raw)": 2.2454216480255127, "Pretrain/Step": 18837, "Pretrain/Step Time": 8.489121479913592} +{"Pretrain/Learning Rate": 1.9902033180152492e-08, "Pretrain/Loss": 2.0096445083618164, "Pretrain/Loss (Raw)": 1.7906640768051147, "Pretrain/Step": 18838, "Pretrain/Step Time": 8.494297614321113} +{"Pretrain/Learning Rate": 1.9733036793759264e-08, "Pretrain/Loss": 2.0044991970062256, "Pretrain/Loss (Raw)": 1.4370648860931396, "Pretrain/Step": 18839, "Pretrain/Step Time": 8.489252928644419} +{"Pretrain/Learning Rate": 1.9564760695753303e-08, "Pretrain/Loss": 2.004807949066162, "Pretrain/Loss (Raw)": 1.9855085611343384, "Pretrain/Step": 18840, "Pretrain/Step Time": 8.49957481585443} +{"Pretrain/Learning Rate": 1.9397204890986288e-08, "Pretrain/Loss": 2.004788637161255, "Pretrain/Loss (Raw)": 2.0740604400634766, "Pretrain/Step": 18841, "Pretrain/Step Time": 8.49685818515718} +{"Pretrain/Learning Rate": 1.9230369384293233e-08, "Pretrain/Loss": 2.0087437629699707, "Pretrain/Loss (Raw)": 2.1480519771575928, "Pretrain/Step": 18842, "Pretrain/Step Time": 8.495102792978287} +{"Pretrain/Learning Rate": 1.9064254180478636e-08, "Pretrain/Loss": 2.0066041946411133, "Pretrain/Loss (Raw)": 1.8999274969100952, "Pretrain/Step": 18843, "Pretrain/Step Time": 8.498270446434617} +{"Pretrain/Learning Rate": 1.8898859284338654e-08, "Pretrain/Loss": 2.010195255279541, "Pretrain/Loss (Raw)": 2.2261791229248047, "Pretrain/Step": 18844, "Pretrain/Step Time": 8.497706910595298} +{"Pretrain/Learning Rate": 1.8734184700638923e-08, "Pretrain/Loss": 2.0101118087768555, "Pretrain/Loss (Raw)": 1.9382448196411133, "Pretrain/Step": 18845, "Pretrain/Step Time": 8.499167481437325} +{"Pretrain/Learning Rate": 1.8570230434125645e-08, "Pretrain/Loss": 2.0088605880737305, "Pretrain/Loss (Raw)": 1.950467824935913, "Pretrain/Step": 18846, "Pretrain/Step Time": 8.49435105547309} +{"Pretrain/Learning Rate": 1.8406996489533923e-08, "Pretrain/Loss": 2.0091090202331543, "Pretrain/Loss (Raw)": 2.040511131286621, "Pretrain/Step": 18847, "Pretrain/Step Time": 8.496489414945245} +{"Pretrain/Learning Rate": 1.8244482871562772e-08, "Pretrain/Loss": 2.008180856704712, "Pretrain/Loss (Raw)": 1.8945688009262085, "Pretrain/Step": 18848, "Pretrain/Step Time": 8.499928463250399} +{"Pretrain/Learning Rate": 1.8082689584900113e-08, "Pretrain/Loss": 2.0099985599517822, "Pretrain/Loss (Raw)": 2.0768213272094727, "Pretrain/Step": 18849, "Pretrain/Step Time": 8.495698895305395} +{"Pretrain/Learning Rate": 1.7921616634214434e-08, "Pretrain/Loss": 2.0125908851623535, "Pretrain/Loss (Raw)": 2.205517292022705, "Pretrain/Step": 18850, "Pretrain/Step Time": 8.49707529693842} +{"Pretrain/Learning Rate": 1.7761264024146462e-08, "Pretrain/Loss": 2.012788772583008, "Pretrain/Loss (Raw)": 1.9583494663238525, "Pretrain/Step": 18851, "Pretrain/Step Time": 8.490575348958373} +{"Pretrain/Learning Rate": 1.760163175932028e-08, "Pretrain/Loss": 2.014477252960205, "Pretrain/Loss (Raw)": 2.181088447570801, "Pretrain/Step": 18852, "Pretrain/Step Time": 8.491084787994623} +{"Pretrain/Learning Rate": 1.744271984434054e-08, "Pretrain/Loss": 2.0142788887023926, "Pretrain/Loss (Raw)": 2.0629076957702637, "Pretrain/Step": 18853, "Pretrain/Step Time": 8.486246462911367} +{"Pretrain/Learning Rate": 1.7284528283786905e-08, "Pretrain/Loss": 2.01438570022583, "Pretrain/Loss (Raw)": 1.9291319847106934, "Pretrain/Step": 18854, "Pretrain/Step Time": 8.493686113506556} +{"Pretrain/Learning Rate": 1.7127057082225174e-08, "Pretrain/Loss": 2.0142202377319336, "Pretrain/Loss (Raw)": 1.8911865949630737, "Pretrain/Step": 18855, "Pretrain/Step Time": 8.49176524952054} +{"Pretrain/Learning Rate": 1.6970306244190603e-08, "Pretrain/Loss": 2.012312889099121, "Pretrain/Loss (Raw)": 1.7797893285751343, "Pretrain/Step": 18856, "Pretrain/Step Time": 8.498165383934975} +{"Pretrain/Learning Rate": 1.6814275774207357e-08, "Pretrain/Loss": 2.0139577388763428, "Pretrain/Loss (Raw)": 2.1190125942230225, "Pretrain/Step": 18857, "Pretrain/Step Time": 8.499103747308254} +{"Pretrain/Learning Rate": 1.6658965676771833e-08, "Pretrain/Loss": 2.0153253078460693, "Pretrain/Loss (Raw)": 2.178166389465332, "Pretrain/Step": 18858, "Pretrain/Step Time": 8.493047948926687} +{"Pretrain/Learning Rate": 1.6504375956361006e-08, "Pretrain/Loss": 2.0142102241516113, "Pretrain/Loss (Raw)": 1.7630975246429443, "Pretrain/Step": 18859, "Pretrain/Step Time": 8.489619135856628} +{"Pretrain/Learning Rate": 1.63505066174352e-08, "Pretrain/Loss": 2.0165021419525146, "Pretrain/Loss (Raw)": 1.9628995656967163, "Pretrain/Step": 18860, "Pretrain/Step Time": 8.490323079749942} +{"Pretrain/Learning Rate": 1.6197357664432533e-08, "Pretrain/Loss": 2.0173237323760986, "Pretrain/Loss (Raw)": 1.9573942422866821, "Pretrain/Step": 18861, "Pretrain/Step Time": 8.491207564249635} +{"Pretrain/Learning Rate": 1.6044929101763362e-08, "Pretrain/Loss": 2.0184895992279053, "Pretrain/Loss (Raw)": 2.0790672302246094, "Pretrain/Step": 18862, "Pretrain/Step Time": 8.493970623239875} +{"Pretrain/Learning Rate": 1.5893220933829723e-08, "Pretrain/Loss": 2.018673896789551, "Pretrain/Loss (Raw)": 1.829798936843872, "Pretrain/Step": 18863, "Pretrain/Step Time": 8.493594072759151} +{"Pretrain/Learning Rate": 1.5742233165000342e-08, "Pretrain/Loss": 2.016892910003662, "Pretrain/Loss (Raw)": 1.9035803079605103, "Pretrain/Step": 18864, "Pretrain/Step Time": 8.493597012013197} +{"Pretrain/Learning Rate": 1.559196579963007e-08, "Pretrain/Loss": 2.015152931213379, "Pretrain/Loss (Raw)": 1.8283261060714722, "Pretrain/Step": 18865, "Pretrain/Step Time": 8.49353395588696} +{"Pretrain/Learning Rate": 1.544241884205433e-08, "Pretrain/Loss": 2.010993719100952, "Pretrain/Loss (Raw)": 1.7490284442901611, "Pretrain/Step": 18866, "Pretrain/Step Time": 8.490815652534366} +{"Pretrain/Learning Rate": 1.5293592296580785e-08, "Pretrain/Loss": 2.0116918087005615, "Pretrain/Loss (Raw)": 2.0973634719848633, "Pretrain/Step": 18867, "Pretrain/Step Time": 8.484416285529733} +{"Pretrain/Learning Rate": 1.5145486167505997e-08, "Pretrain/Loss": 2.010713577270508, "Pretrain/Loss (Raw)": 2.0062108039855957, "Pretrain/Step": 18868, "Pretrain/Step Time": 8.480477245524526} +{"Pretrain/Learning Rate": 1.4998100459098774e-08, "Pretrain/Loss": 2.0136466026306152, "Pretrain/Loss (Raw)": 2.282236337661743, "Pretrain/Step": 18869, "Pretrain/Step Time": 8.472450444474816} +{"Pretrain/Learning Rate": 1.485143517560572e-08, "Pretrain/Loss": 2.0122454166412354, "Pretrain/Loss (Raw)": 1.9687632322311401, "Pretrain/Step": 18870, "Pretrain/Step Time": 8.475574953481555} +{"Pretrain/Learning Rate": 1.4705490321259563e-08, "Pretrain/Loss": 2.012843132019043, "Pretrain/Loss (Raw)": 2.1023988723754883, "Pretrain/Step": 18871, "Pretrain/Step Time": 8.4741883110255} +{"Pretrain/Learning Rate": 1.4560265900265268e-08, "Pretrain/Loss": 2.0134449005126953, "Pretrain/Loss (Raw)": 2.1199469566345215, "Pretrain/Step": 18872, "Pretrain/Step Time": 8.477397587150335} +{"Pretrain/Learning Rate": 1.441576191681393e-08, "Pretrain/Loss": 2.0114071369171143, "Pretrain/Loss (Raw)": 1.8810110092163086, "Pretrain/Step": 18873, "Pretrain/Step Time": 8.47597410902381} +{"Pretrain/Learning Rate": 1.4271978375068884e-08, "Pretrain/Loss": 2.0132670402526855, "Pretrain/Loss (Raw)": 2.2527928352355957, "Pretrain/Step": 18874, "Pretrain/Step Time": 8.47094239667058} +{"Pretrain/Learning Rate": 1.4128915279179589e-08, "Pretrain/Loss": 2.012850522994995, "Pretrain/Loss (Raw)": 1.9951201677322388, "Pretrain/Step": 18875, "Pretrain/Step Time": 8.472350327298045} +{"Pretrain/Learning Rate": 1.3986572633267748e-08, "Pretrain/Loss": 2.012115478515625, "Pretrain/Loss (Raw)": 1.9018033742904663, "Pretrain/Step": 18876, "Pretrain/Step Time": 8.474850906059146} +{"Pretrain/Learning Rate": 1.3844950441438409e-08, "Pretrain/Loss": 2.0139267444610596, "Pretrain/Loss (Raw)": 2.2053797245025635, "Pretrain/Step": 18877, "Pretrain/Step Time": 8.474638983607292} +{"Pretrain/Learning Rate": 1.3704048707777196e-08, "Pretrain/Loss": 2.0145602226257324, "Pretrain/Loss (Raw)": 2.027040719985962, "Pretrain/Step": 18878, "Pretrain/Step Time": 8.474312020465732} +{"Pretrain/Learning Rate": 1.3563867436344747e-08, "Pretrain/Loss": 2.015822410583496, "Pretrain/Loss (Raw)": 1.9972162246704102, "Pretrain/Step": 18879, "Pretrain/Step Time": 8.47199147939682} +{"Pretrain/Learning Rate": 1.3424406631185049e-08, "Pretrain/Loss": 2.0174508094787598, "Pretrain/Loss (Raw)": 2.300828695297241, "Pretrain/Step": 18880, "Pretrain/Step Time": 8.47266642935574} +{"Pretrain/Learning Rate": 1.3285666296317112e-08, "Pretrain/Loss": 2.0157175064086914, "Pretrain/Loss (Raw)": 1.9941951036453247, "Pretrain/Step": 18881, "Pretrain/Step Time": 8.474560771137476} +{"Pretrain/Learning Rate": 1.3147646435743288e-08, "Pretrain/Loss": 2.0144968032836914, "Pretrain/Loss (Raw)": 2.022630453109741, "Pretrain/Step": 18882, "Pretrain/Step Time": 8.477393556386232} +{"Pretrain/Learning Rate": 1.3010347053443728e-08, "Pretrain/Loss": 2.014153003692627, "Pretrain/Loss (Raw)": 2.0004148483276367, "Pretrain/Step": 18883, "Pretrain/Step Time": 8.476750930771232} +{"Pretrain/Learning Rate": 1.28737681533736e-08, "Pretrain/Loss": 2.0145177841186523, "Pretrain/Loss (Raw)": 1.8707795143127441, "Pretrain/Step": 18884, "Pretrain/Step Time": 8.472291924059391} +{"Pretrain/Learning Rate": 1.2737909739474196e-08, "Pretrain/Loss": 2.0146193504333496, "Pretrain/Loss (Raw)": 2.0076611042022705, "Pretrain/Step": 18885, "Pretrain/Step Time": 8.471453718841076} +{"Pretrain/Learning Rate": 1.2602771815664604e-08, "Pretrain/Loss": 2.0146825313568115, "Pretrain/Loss (Raw)": 1.9901185035705566, "Pretrain/Step": 18886, "Pretrain/Step Time": 8.472846560180187} +{"Pretrain/Learning Rate": 1.2468354385836157e-08, "Pretrain/Loss": 2.0117361545562744, "Pretrain/Loss (Raw)": 1.8329386711120605, "Pretrain/Step": 18887, "Pretrain/Step Time": 8.47499300353229} +{"Pretrain/Learning Rate": 1.2334657453869081e-08, "Pretrain/Loss": 2.0118484497070312, "Pretrain/Loss (Raw)": 1.9308537244796753, "Pretrain/Step": 18888, "Pretrain/Step Time": 8.477427270263433} +{"Pretrain/Learning Rate": 1.2201681023615853e-08, "Pretrain/Loss": 2.0101919174194336, "Pretrain/Loss (Raw)": 1.8865879774093628, "Pretrain/Step": 18889, "Pretrain/Step Time": 8.479016112163663} +{"Pretrain/Learning Rate": 1.2069425098912291e-08, "Pretrain/Loss": 2.0089755058288574, "Pretrain/Loss (Raw)": 1.9772967100143433, "Pretrain/Step": 18890, "Pretrain/Step Time": 8.475237753242254} +{"Pretrain/Learning Rate": 1.1937889683572011e-08, "Pretrain/Loss": 2.003541946411133, "Pretrain/Loss (Raw)": 1.735925316810608, "Pretrain/Step": 18891, "Pretrain/Step Time": 8.478686226531863} +{"Pretrain/Learning Rate": 1.1807074781389204e-08, "Pretrain/Loss": 2.0061402320861816, "Pretrain/Loss (Raw)": 2.106349229812622, "Pretrain/Step": 18892, "Pretrain/Step Time": 8.475345104932785} +{"Pretrain/Learning Rate": 1.16769803961303e-08, "Pretrain/Loss": 2.005220413208008, "Pretrain/Loss (Raw)": 1.9583115577697754, "Pretrain/Step": 18893, "Pretrain/Step Time": 8.479868223890662} +{"Pretrain/Learning Rate": 1.15476065315534e-08, "Pretrain/Loss": 2.004443645477295, "Pretrain/Loss (Raw)": 1.957135796546936, "Pretrain/Step": 18894, "Pretrain/Step Time": 8.480613842606544} +{"Pretrain/Learning Rate": 1.1418953191383309e-08, "Pretrain/Loss": 2.003551483154297, "Pretrain/Loss (Raw)": 1.975767970085144, "Pretrain/Step": 18895, "Pretrain/Step Time": 8.475166784599423} +{"Pretrain/Learning Rate": 1.1291020379330942e-08, "Pretrain/Loss": 2.0055341720581055, "Pretrain/Loss (Raw)": 2.1705901622772217, "Pretrain/Step": 18896, "Pretrain/Step Time": 8.477449465543032} +{"Pretrain/Learning Rate": 1.1163808099087792e-08, "Pretrain/Loss": 2.005622148513794, "Pretrain/Loss (Raw)": 1.7960076332092285, "Pretrain/Step": 18897, "Pretrain/Step Time": 8.480631105601788} +{"Pretrain/Learning Rate": 1.103731635432037e-08, "Pretrain/Loss": 2.0049550533294678, "Pretrain/Loss (Raw)": 1.7257862091064453, "Pretrain/Step": 18898, "Pretrain/Step Time": 8.481072686612606} +{"Pretrain/Learning Rate": 1.0911545148675762e-08, "Pretrain/Loss": 2.00502347946167, "Pretrain/Loss (Raw)": 2.064685583114624, "Pretrain/Step": 18899, "Pretrain/Step Time": 8.476634215563536} +{"Pretrain/Learning Rate": 1.0786494485781618e-08, "Pretrain/Loss": 2.0077810287475586, "Pretrain/Loss (Raw)": 2.216195583343506, "Pretrain/Step": 18900, "Pretrain/Step Time": 8.474875845015049} +{"Pretrain/Learning Rate": 1.0662164369240613e-08, "Pretrain/Loss": 2.007944107055664, "Pretrain/Loss (Raw)": 2.020164966583252, "Pretrain/Step": 18901, "Pretrain/Step Time": 8.472999781370163} +{"Pretrain/Learning Rate": 1.0538554802641543e-08, "Pretrain/Loss": 2.007935047149658, "Pretrain/Loss (Raw)": 2.0935659408569336, "Pretrain/Step": 18902, "Pretrain/Step Time": 8.472820203751326} +{"Pretrain/Learning Rate": 1.0415665789545448e-08, "Pretrain/Loss": 2.0072593688964844, "Pretrain/Loss (Raw)": 1.7959309816360474, "Pretrain/Step": 18903, "Pretrain/Step Time": 8.472327971830964} +{"Pretrain/Learning Rate": 1.0293497333496715e-08, "Pretrain/Loss": 2.0065338611602783, "Pretrain/Loss (Raw)": 1.9441449642181396, "Pretrain/Step": 18904, "Pretrain/Step Time": 8.474551668390632} +{"Pretrain/Learning Rate": 1.0172049438020304e-08, "Pretrain/Loss": 2.0035479068756104, "Pretrain/Loss (Raw)": 1.7479884624481201, "Pretrain/Step": 18905, "Pretrain/Step Time": 8.473991902545094} +{"Pretrain/Learning Rate": 1.0051322106613415e-08, "Pretrain/Loss": 2.0014824867248535, "Pretrain/Loss (Raw)": 1.5275530815124512, "Pretrain/Step": 18906, "Pretrain/Step Time": 8.473474357277155} +{"Pretrain/Learning Rate": 9.931315342762148e-09, "Pretrain/Loss": 2.001067876815796, "Pretrain/Loss (Raw)": 1.9742869138717651, "Pretrain/Step": 18907, "Pretrain/Step Time": 8.475801151245832} +{"Pretrain/Learning Rate": 9.812029149924851e-09, "Pretrain/Loss": 2.0019373893737793, "Pretrain/Loss (Raw)": 1.995422601699829, "Pretrain/Step": 18908, "Pretrain/Step Time": 8.476881856098771} +{"Pretrain/Learning Rate": 9.693463531540436e-09, "Pretrain/Loss": 2.0033984184265137, "Pretrain/Loss (Raw)": 2.1566884517669678, "Pretrain/Step": 18909, "Pretrain/Step Time": 8.472351104021072} +{"Pretrain/Learning Rate": 9.575618491025618e-09, "Pretrain/Loss": 2.004585027694702, "Pretrain/Loss (Raw)": 2.1273181438446045, "Pretrain/Step": 18910, "Pretrain/Step Time": 8.473113415762782} +{"Pretrain/Learning Rate": 9.458494031783227e-09, "Pretrain/Loss": 2.0064520835876465, "Pretrain/Loss (Raw)": 2.1647398471832275, "Pretrain/Step": 18911, "Pretrain/Step Time": 8.470262926071882} +{"Pretrain/Learning Rate": 9.342090157188343e-09, "Pretrain/Loss": 2.0066089630126953, "Pretrain/Loss (Raw)": 1.9839304685592651, "Pretrain/Step": 18912, "Pretrain/Step Time": 8.471561765298247} +{"Pretrain/Learning Rate": 9.226406870596616e-09, "Pretrain/Loss": 2.004331588745117, "Pretrain/Loss (Raw)": 1.9382989406585693, "Pretrain/Step": 18913, "Pretrain/Step Time": 8.474417915567756} +{"Pretrain/Learning Rate": 9.111444175341488e-09, "Pretrain/Loss": 2.004733085632324, "Pretrain/Loss (Raw)": 2.0495238304138184, "Pretrain/Step": 18914, "Pretrain/Step Time": 8.470070704817772} +{"Pretrain/Learning Rate": 8.997202074745303e-09, "Pretrain/Loss": 2.0046226978302, "Pretrain/Loss (Raw)": 2.1744329929351807, "Pretrain/Step": 18915, "Pretrain/Step Time": 8.472416615113616} +{"Pretrain/Learning Rate": 8.883680572094322e-09, "Pretrain/Loss": 2.002647638320923, "Pretrain/Loss (Raw)": 1.9433667659759521, "Pretrain/Step": 18916, "Pretrain/Step Time": 8.46972594410181} +{"Pretrain/Learning Rate": 8.770879670663701e-09, "Pretrain/Loss": 2.001098394393921, "Pretrain/Loss (Raw)": 1.8335812091827393, "Pretrain/Step": 18917, "Pretrain/Step Time": 8.470475627109408} +{"Pretrain/Learning Rate": 8.65879937370917e-09, "Pretrain/Loss": 2.002290725708008, "Pretrain/Loss (Raw)": 1.9037278890609741, "Pretrain/Step": 18918, "Pretrain/Step Time": 8.46791297197342} +{"Pretrain/Learning Rate": 8.547439684458702e-09, "Pretrain/Loss": 2.0034806728363037, "Pretrain/Loss (Raw)": 2.1119883060455322, "Pretrain/Step": 18919, "Pretrain/Step Time": 8.465290512889624} +{"Pretrain/Learning Rate": 8.436800606126393e-09, "Pretrain/Loss": 2.002589225769043, "Pretrain/Loss (Raw)": 1.8817819356918335, "Pretrain/Step": 18920, "Pretrain/Step Time": 8.466590318828821} +{"Pretrain/Learning Rate": 8.32688214190136e-09, "Pretrain/Loss": 1.9993526935577393, "Pretrain/Loss (Raw)": 1.9017077684402466, "Pretrain/Step": 18921, "Pretrain/Step Time": 8.4697658829391} +{"Pretrain/Learning Rate": 8.217684294950512e-09, "Pretrain/Loss": 1.9973455667495728, "Pretrain/Loss (Raw)": 1.8127756118774414, "Pretrain/Step": 18922, "Pretrain/Step Time": 8.471807304769754} +{"Pretrain/Learning Rate": 8.109207068426883e-09, "Pretrain/Loss": 1.9969232082366943, "Pretrain/Loss (Raw)": 1.9054535627365112, "Pretrain/Step": 18923, "Pretrain/Step Time": 8.47079772502184} +{"Pretrain/Learning Rate": 8.001450465455751e-09, "Pretrain/Loss": 1.9964735507965088, "Pretrain/Loss (Raw)": 1.809556007385254, "Pretrain/Step": 18924, "Pretrain/Step Time": 8.467176796868443} +{"Pretrain/Learning Rate": 7.89441448914574e-09, "Pretrain/Loss": 1.9974814653396606, "Pretrain/Loss (Raw)": 2.1626060009002686, "Pretrain/Step": 18925, "Pretrain/Step Time": 8.472309792414308} +{"Pretrain/Learning Rate": 7.788099142580495e-09, "Pretrain/Loss": 1.994942545890808, "Pretrain/Loss (Raw)": 1.659793734550476, "Pretrain/Step": 18926, "Pretrain/Step Time": 8.470245903357863} +{"Pretrain/Learning Rate": 7.682504428827009e-09, "Pretrain/Loss": 1.997110366821289, "Pretrain/Loss (Raw)": 2.1430916786193848, "Pretrain/Step": 18927, "Pretrain/Step Time": 8.466345984488726} +{"Pretrain/Learning Rate": 7.577630350930064e-09, "Pretrain/Loss": 1.9972296953201294, "Pretrain/Loss (Raw)": 1.8439172506332397, "Pretrain/Step": 18928, "Pretrain/Step Time": 8.466982094570994} +{"Pretrain/Learning Rate": 7.473476911912248e-09, "Pretrain/Loss": 1.9973763227462769, "Pretrain/Loss (Raw)": 2.030111074447632, "Pretrain/Step": 18929, "Pretrain/Step Time": 8.465655997395515} +{"Pretrain/Learning Rate": 7.370044114779484e-09, "Pretrain/Loss": 1.9963574409484863, "Pretrain/Loss (Raw)": 1.972953200340271, "Pretrain/Step": 18930, "Pretrain/Step Time": 8.465080378577113} +{"Pretrain/Learning Rate": 7.2673319625155e-09, "Pretrain/Loss": 1.998013973236084, "Pretrain/Loss (Raw)": 2.163564443588257, "Pretrain/Step": 18931, "Pretrain/Step Time": 8.461738184094429} +{"Pretrain/Learning Rate": 7.165340458076264e-09, "Pretrain/Loss": 2.0012364387512207, "Pretrain/Loss (Raw)": 2.358781337738037, "Pretrain/Step": 18932, "Pretrain/Step Time": 8.463386481627822} +{"Pretrain/Learning Rate": 7.064069604406642e-09, "Pretrain/Loss": 2.002314805984497, "Pretrain/Loss (Raw)": 2.12115478515625, "Pretrain/Step": 18933, "Pretrain/Step Time": 8.461422562599182} +{"Pretrain/Learning Rate": 6.963519404423746e-09, "Pretrain/Loss": 2.003129482269287, "Pretrain/Loss (Raw)": 2.031374454498291, "Pretrain/Step": 18934, "Pretrain/Step Time": 8.45977434515953} +{"Pretrain/Learning Rate": 6.863689861030809e-09, "Pretrain/Loss": 2.0017378330230713, "Pretrain/Loss (Raw)": 2.0462379455566406, "Pretrain/Step": 18935, "Pretrain/Step Time": 8.460356274619699} +{"Pretrain/Learning Rate": 6.7645809771033074e-09, "Pretrain/Loss": 1.9997797012329102, "Pretrain/Loss (Raw)": 1.9866029024124146, "Pretrain/Step": 18936, "Pretrain/Step Time": 8.455819517374039} +{"Pretrain/Learning Rate": 6.666192755502842e-09, "Pretrain/Loss": 1.9990248680114746, "Pretrain/Loss (Raw)": 1.9001842737197876, "Pretrain/Step": 18937, "Pretrain/Step Time": 8.456546820700169} +{"Pretrain/Learning Rate": 6.5685251990604825e-09, "Pretrain/Loss": 1.9985029697418213, "Pretrain/Loss (Raw)": 1.976475477218628, "Pretrain/Step": 18938, "Pretrain/Step Time": 8.461971713230014} +{"Pretrain/Learning Rate": 6.471578310596194e-09, "Pretrain/Loss": 1.9979405403137207, "Pretrain/Loss (Raw)": 1.9305917024612427, "Pretrain/Step": 18939, "Pretrain/Step Time": 8.459442084655166} +{"Pretrain/Learning Rate": 6.375352092904962e-09, "Pretrain/Loss": 1.9975813627243042, "Pretrain/Loss (Raw)": 1.8723307847976685, "Pretrain/Step": 18940, "Pretrain/Step Time": 8.454506104812026} +{"Pretrain/Learning Rate": 6.279846548762347e-09, "Pretrain/Loss": 2.0001962184906006, "Pretrain/Loss (Raw)": 2.081076145172119, "Pretrain/Step": 18941, "Pretrain/Step Time": 8.448578661307693} +{"Pretrain/Learning Rate": 6.185061680918925e-09, "Pretrain/Loss": 1.9986121654510498, "Pretrain/Loss (Raw)": 1.9302970170974731, "Pretrain/Step": 18942, "Pretrain/Step Time": 8.45350562594831} +{"Pretrain/Learning Rate": 6.090997492111394e-09, "Pretrain/Loss": 1.9972907304763794, "Pretrain/Loss (Raw)": 1.8815940618515015, "Pretrain/Step": 18943, "Pretrain/Step Time": 8.449404766783118} +{"Pretrain/Learning Rate": 5.997653985048701e-09, "Pretrain/Loss": 1.992736577987671, "Pretrain/Loss (Raw)": 1.8184542655944824, "Pretrain/Step": 18944, "Pretrain/Step Time": 8.450609793886542} +{"Pretrain/Learning Rate": 5.905031162423136e-09, "Pretrain/Loss": 1.990709662437439, "Pretrain/Loss (Raw)": 1.6549687385559082, "Pretrain/Step": 18945, "Pretrain/Step Time": 8.452554542571306} +{"Pretrain/Learning Rate": 5.8131290269103354e-09, "Pretrain/Loss": 1.9869062900543213, "Pretrain/Loss (Raw)": 1.5074641704559326, "Pretrain/Step": 18946, "Pretrain/Step Time": 8.454280868172646} +{"Pretrain/Learning Rate": 5.7219475811526316e-09, "Pretrain/Loss": 1.9890499114990234, "Pretrain/Loss (Raw)": 2.206915855407715, "Pretrain/Step": 18947, "Pretrain/Step Time": 8.452969955280423} +{"Pretrain/Learning Rate": 5.631486827784027e-09, "Pretrain/Loss": 1.9905116558074951, "Pretrain/Loss (Raw)": 2.1015172004699707, "Pretrain/Step": 18948, "Pretrain/Step Time": 8.449076743796468} +{"Pretrain/Learning Rate": 5.541746769410772e-09, "Pretrain/Loss": 1.9900774955749512, "Pretrain/Loss (Raw)": 2.0882158279418945, "Pretrain/Step": 18949, "Pretrain/Step Time": 8.447684722021222} +{"Pretrain/Learning Rate": 5.45272740862246e-09, "Pretrain/Loss": 1.9887375831604004, "Pretrain/Loss (Raw)": 2.0342323780059814, "Pretrain/Step": 18950, "Pretrain/Step Time": 8.4469592012465} +{"Pretrain/Learning Rate": 5.364428747986483e-09, "Pretrain/Loss": 1.9889469146728516, "Pretrain/Loss (Raw)": 2.059788942337036, "Pretrain/Step": 18951, "Pretrain/Step Time": 8.438028203323483} +{"Pretrain/Learning Rate": 5.276850790045251e-09, "Pretrain/Loss": 1.9887018203735352, "Pretrain/Loss (Raw)": 1.953782558441162, "Pretrain/Step": 18952, "Pretrain/Step Time": 8.436039244756103} +{"Pretrain/Learning Rate": 5.189993537324523e-09, "Pretrain/Loss": 1.9917194843292236, "Pretrain/Loss (Raw)": 1.9542598724365234, "Pretrain/Step": 18953, "Pretrain/Step Time": 8.437000662088394} +{"Pretrain/Learning Rate": 5.103856992330624e-09, "Pretrain/Loss": 1.990921974182129, "Pretrain/Loss (Raw)": 1.9128321409225464, "Pretrain/Step": 18954, "Pretrain/Step Time": 8.438066879287362} +{"Pretrain/Learning Rate": 5.018441157547682e-09, "Pretrain/Loss": 1.988952875137329, "Pretrain/Loss (Raw)": 1.7292144298553467, "Pretrain/Step": 18955, "Pretrain/Step Time": 8.43589204736054} +{"Pretrain/Learning Rate": 4.933746035437614e-09, "Pretrain/Loss": 1.9880151748657227, "Pretrain/Loss (Raw)": 2.0363309383392334, "Pretrain/Step": 18956, "Pretrain/Step Time": 8.433558467775583} +{"Pretrain/Learning Rate": 4.849771628442912e-09, "Pretrain/Loss": 1.9842791557312012, "Pretrain/Loss (Raw)": 2.041498899459839, "Pretrain/Step": 18957, "Pretrain/Step Time": 8.43866970576346} +{"Pretrain/Learning Rate": 4.766517938983861e-09, "Pretrain/Loss": 1.9819813966751099, "Pretrain/Loss (Raw)": 1.935871958732605, "Pretrain/Step": 18958, "Pretrain/Step Time": 8.439147602766752} +{"Pretrain/Learning Rate": 4.683984969464095e-09, "Pretrain/Loss": 1.9794789552688599, "Pretrain/Loss (Raw)": 1.8652029037475586, "Pretrain/Step": 18959, "Pretrain/Step Time": 8.440170073881745} +{"Pretrain/Learning Rate": 4.60217272225949e-09, "Pretrain/Loss": 1.9791851043701172, "Pretrain/Loss (Raw)": 2.0006258487701416, "Pretrain/Step": 18960, "Pretrain/Step Time": 8.438815919682384} +{"Pretrain/Learning Rate": 4.521081199729271e-09, "Pretrain/Loss": 1.9764089584350586, "Pretrain/Loss (Raw)": 1.7492997646331787, "Pretrain/Step": 18961, "Pretrain/Step Time": 8.441860565915704} +{"Pretrain/Learning Rate": 4.440710404213233e-09, "Pretrain/Loss": 1.977543830871582, "Pretrain/Loss (Raw)": 2.27604079246521, "Pretrain/Step": 18962, "Pretrain/Step Time": 8.442030569538474} +{"Pretrain/Learning Rate": 4.361060338031742e-09, "Pretrain/Loss": 1.9754236936569214, "Pretrain/Loss (Raw)": 1.6377530097961426, "Pretrain/Step": 18963, "Pretrain/Step Time": 8.442138060927391} +{"Pretrain/Learning Rate": 4.282131003474632e-09, "Pretrain/Loss": 1.9757899045944214, "Pretrain/Loss (Raw)": 2.001981019973755, "Pretrain/Step": 18964, "Pretrain/Step Time": 8.442689357325435} +{"Pretrain/Learning Rate": 4.203922402823412e-09, "Pretrain/Loss": 1.9720745086669922, "Pretrain/Loss (Raw)": 1.7698558568954468, "Pretrain/Step": 18965, "Pretrain/Step Time": 8.441226257011294} +{"Pretrain/Learning Rate": 4.12643453832906e-09, "Pretrain/Loss": 1.9743139743804932, "Pretrain/Loss (Raw)": 2.0773167610168457, "Pretrain/Step": 18966, "Pretrain/Step Time": 8.439657483249903} +{"Pretrain/Learning Rate": 4.049667412231451e-09, "Pretrain/Loss": 1.977729320526123, "Pretrain/Loss (Raw)": 1.8742414712905884, "Pretrain/Step": 18967, "Pretrain/Step Time": 8.445032693445683} +{"Pretrain/Learning Rate": 3.9736210267399265e-09, "Pretrain/Loss": 1.9809327125549316, "Pretrain/Loss (Raw)": 2.3955397605895996, "Pretrain/Step": 18968, "Pretrain/Step Time": 8.439345587044954} +{"Pretrain/Learning Rate": 3.898295384044403e-09, "Pretrain/Loss": 1.980010986328125, "Pretrain/Loss (Raw)": 1.9560625553131104, "Pretrain/Step": 18969, "Pretrain/Step Time": 8.441263735294342} +{"Pretrain/Learning Rate": 3.823690486323694e-09, "Pretrain/Loss": 1.9778189659118652, "Pretrain/Loss (Raw)": 1.8674744367599487, "Pretrain/Step": 18970, "Pretrain/Step Time": 8.443669514730573} +{"Pretrain/Learning Rate": 3.74980633572608e-09, "Pretrain/Loss": 1.9797722101211548, "Pretrain/Loss (Raw)": 2.1499505043029785, "Pretrain/Step": 18971, "Pretrain/Step Time": 8.43768429942429} +{"Pretrain/Learning Rate": 3.676642934380414e-09, "Pretrain/Loss": 1.9765996932983398, "Pretrain/Loss (Raw)": 1.8201014995574951, "Pretrain/Step": 18972, "Pretrain/Step Time": 8.438311895355582} +{"Pretrain/Learning Rate": 3.6042002843961196e-09, "Pretrain/Loss": 1.9774599075317383, "Pretrain/Loss (Raw)": 2.048349380493164, "Pretrain/Step": 18973, "Pretrain/Step Time": 8.439014134928584} +{"Pretrain/Learning Rate": 3.5324783878659673e-09, "Pretrain/Loss": 1.9774837493896484, "Pretrain/Loss (Raw)": 1.9535064697265625, "Pretrain/Step": 18974, "Pretrain/Step Time": 8.44193760305643} +{"Pretrain/Learning Rate": 3.4614772468549715e-09, "Pretrain/Loss": 1.979764699935913, "Pretrain/Loss (Raw)": 2.332491874694824, "Pretrain/Step": 18975, "Pretrain/Step Time": 8.444703582674265} +{"Pretrain/Learning Rate": 3.3911968634087188e-09, "Pretrain/Loss": 1.9793386459350586, "Pretrain/Loss (Raw)": 1.840031623840332, "Pretrain/Step": 18976, "Pretrain/Step Time": 8.441770680248737} +{"Pretrain/Learning Rate": 3.321637239558917e-09, "Pretrain/Loss": 1.9777860641479492, "Pretrain/Loss (Raw)": 1.878087043762207, "Pretrain/Step": 18977, "Pretrain/Step Time": 8.44250769354403} +{"Pretrain/Learning Rate": 3.252798377306743e-09, "Pretrain/Loss": 1.976285457611084, "Pretrain/Loss (Raw)": 2.0134332180023193, "Pretrain/Step": 18978, "Pretrain/Step Time": 8.443937296047807} +{"Pretrain/Learning Rate": 3.1846802786394957e-09, "Pretrain/Loss": 1.9764025211334229, "Pretrain/Loss (Raw)": 1.9733387231826782, "Pretrain/Step": 18979, "Pretrain/Step Time": 8.441227328032255} +{"Pretrain/Learning Rate": 3.117282945519495e-09, "Pretrain/Loss": 1.9747456312179565, "Pretrain/Loss (Raw)": 1.9690020084381104, "Pretrain/Step": 18980, "Pretrain/Step Time": 8.444061310961843} +{"Pretrain/Learning Rate": 3.050606379889631e-09, "Pretrain/Loss": 1.9745612144470215, "Pretrain/Loss (Raw)": 2.0392966270446777, "Pretrain/Step": 18981, "Pretrain/Step Time": 8.442862713709474} +{"Pretrain/Learning Rate": 2.984650583676141e-09, "Pretrain/Loss": 1.9739527702331543, "Pretrain/Loss (Raw)": 1.8512624502182007, "Pretrain/Step": 18982, "Pretrain/Step Time": 8.436648136004806} +{"Pretrain/Learning Rate": 2.919415558777505e-09, "Pretrain/Loss": 1.9760897159576416, "Pretrain/Loss (Raw)": 2.1647071838378906, "Pretrain/Step": 18983, "Pretrain/Step Time": 8.43864157795906} +{"Pretrain/Learning Rate": 2.8549013070755526e-09, "Pretrain/Loss": 1.976392149925232, "Pretrain/Loss (Raw)": 1.8185137510299683, "Pretrain/Step": 18984, "Pretrain/Step Time": 8.435697859153152} +{"Pretrain/Learning Rate": 2.7911078304299064e-09, "Pretrain/Loss": 1.9728058576583862, "Pretrain/Loss (Raw)": 1.6599485874176025, "Pretrain/Step": 18985, "Pretrain/Step Time": 8.4333072360605} +{"Pretrain/Learning Rate": 2.728035130683537e-09, "Pretrain/Loss": 1.9702019691467285, "Pretrain/Loss (Raw)": 1.84488046169281, "Pretrain/Step": 18986, "Pretrain/Step Time": 8.43789511360228} +{"Pretrain/Learning Rate": 2.6656832096488836e-09, "Pretrain/Loss": 1.9722918272018433, "Pretrain/Loss (Raw)": 2.0306026935577393, "Pretrain/Step": 18987, "Pretrain/Step Time": 8.443072417750955} +{"Pretrain/Learning Rate": 2.6040520691300585e-09, "Pretrain/Loss": 1.9721745252609253, "Pretrain/Loss (Raw)": 1.9478833675384521, "Pretrain/Step": 18988, "Pretrain/Step Time": 8.44248222373426} +{"Pretrain/Learning Rate": 2.543141710900643e-09, "Pretrain/Loss": 1.9735639095306396, "Pretrain/Loss (Raw)": 2.1352460384368896, "Pretrain/Step": 18989, "Pretrain/Step Time": 8.440021933987737} +{"Pretrain/Learning Rate": 2.4829521367175645e-09, "Pretrain/Loss": 1.9727778434753418, "Pretrain/Loss (Raw)": 1.9784462451934814, "Pretrain/Step": 18990, "Pretrain/Step Time": 8.44013286754489} +{"Pretrain/Learning Rate": 2.4234833483155474e-09, "Pretrain/Loss": 1.9735181331634521, "Pretrain/Loss (Raw)": 1.9245562553405762, "Pretrain/Step": 18991, "Pretrain/Step Time": 8.438908336684108} +{"Pretrain/Learning Rate": 2.364735347412661e-09, "Pretrain/Loss": 1.9754045009613037, "Pretrain/Loss (Raw)": 2.1450355052948, "Pretrain/Step": 18992, "Pretrain/Step Time": 8.440249383449554} +{"Pretrain/Learning Rate": 2.306708135696445e-09, "Pretrain/Loss": 1.9774243831634521, "Pretrain/Loss (Raw)": 2.0868563652038574, "Pretrain/Step": 18993, "Pretrain/Step Time": 8.43958943337202} +{"Pretrain/Learning Rate": 2.2494017148488865e-09, "Pretrain/Loss": 1.9802640676498413, "Pretrain/Loss (Raw)": 2.112522602081299, "Pretrain/Step": 18994, "Pretrain/Step Time": 8.446950074285269} +{"Pretrain/Learning Rate": 2.1928160865131165e-09, "Pretrain/Loss": 1.9789903163909912, "Pretrain/Loss (Raw)": 1.9343243837356567, "Pretrain/Step": 18995, "Pretrain/Step Time": 8.443777481094003} +{"Pretrain/Learning Rate": 2.136951252326713e-09, "Pretrain/Loss": 1.9793989658355713, "Pretrain/Loss (Raw)": 2.0585062503814697, "Pretrain/Step": 18996, "Pretrain/Step Time": 8.443095149472356} +{"Pretrain/Learning Rate": 2.0818072138995003e-09, "Pretrain/Loss": 1.9766298532485962, "Pretrain/Loss (Raw)": 1.9277927875518799, "Pretrain/Step": 18997, "Pretrain/Step Time": 8.445452867075801} +{"Pretrain/Learning Rate": 2.0273839728218723e-09, "Pretrain/Loss": 1.9765667915344238, "Pretrain/Loss (Raw)": 1.9606975317001343, "Pretrain/Step": 18998, "Pretrain/Step Time": 8.44254732131958} +{"Pretrain/Learning Rate": 1.9736815306620193e-09, "Pretrain/Loss": 1.9756522178649902, "Pretrain/Loss (Raw)": 1.9853278398513794, "Pretrain/Step": 18999, "Pretrain/Step Time": 8.44529365748167} +{"Pretrain/Learning Rate": 1.920699888968702e-09, "Pretrain/Loss": 1.974755048751831, "Pretrain/Loss (Raw)": 2.005122184753418, "Pretrain/Step": 19000, "Pretrain/Step Time": 8.447188407182693} +{"Pretrain/Learning Rate": 1.8684390492684778e-09, "Pretrain/Loss": 1.9773902893066406, "Pretrain/Loss (Raw)": 2.2183120250701904, "Pretrain/Step": 19001, "Pretrain/Step Time": 8.44821272790432} +{"Pretrain/Learning Rate": 1.8168990130684738e-09, "Pretrain/Loss": 1.9752795696258545, "Pretrain/Loss (Raw)": 1.9826233386993408, "Pretrain/Step": 19002, "Pretrain/Step Time": 8.451029688119888} +{"Pretrain/Learning Rate": 1.766079781856389e-09, "Pretrain/Loss": 1.9749443531036377, "Pretrain/Loss (Raw)": 1.9522101879119873, "Pretrain/Step": 19003, "Pretrain/Step Time": 8.451409235596657} +{"Pretrain/Learning Rate": 1.7159813570977179e-09, "Pretrain/Loss": 1.977422833442688, "Pretrain/Loss (Raw)": 2.2190489768981934, "Pretrain/Step": 19004, "Pretrain/Step Time": 8.444552272558212} +{"Pretrain/Learning Rate": 1.6666037402357503e-09, "Pretrain/Loss": 1.9745311737060547, "Pretrain/Loss (Raw)": 1.8352524042129517, "Pretrain/Step": 19005, "Pretrain/Step Time": 8.446052992716432} +{"Pretrain/Learning Rate": 1.6179469326943474e-09, "Pretrain/Loss": 1.9730052947998047, "Pretrain/Loss (Raw)": 1.8317244052886963, "Pretrain/Step": 19006, "Pretrain/Step Time": 8.445900563150644} +{"Pretrain/Learning Rate": 1.5700109358779413e-09, "Pretrain/Loss": 1.973656177520752, "Pretrain/Loss (Raw)": 2.0805249214172363, "Pretrain/Step": 19007, "Pretrain/Step Time": 8.449658932164311} +{"Pretrain/Learning Rate": 1.5227957511659841e-09, "Pretrain/Loss": 1.9694565534591675, "Pretrain/Loss (Raw)": 1.763275384902954, "Pretrain/Step": 19008, "Pretrain/Step Time": 8.452734181657434} +{"Pretrain/Learning Rate": 1.4763013799212744e-09, "Pretrain/Loss": 1.9687983989715576, "Pretrain/Loss (Raw)": 1.9099550247192383, "Pretrain/Step": 19009, "Pretrain/Step Time": 8.448394792154431} +{"Pretrain/Learning Rate": 1.4305278234844065e-09, "Pretrain/Loss": 1.968177318572998, "Pretrain/Loss (Raw)": 1.943124771118164, "Pretrain/Step": 19010, "Pretrain/Step Time": 8.455351388081908} +{"Pretrain/Learning Rate": 1.385475083176546e-09, "Pretrain/Loss": 1.967572569847107, "Pretrain/Loss (Raw)": 1.9230107069015503, "Pretrain/Step": 19011, "Pretrain/Step Time": 8.453281929716468} +{"Pretrain/Learning Rate": 1.341143160296654e-09, "Pretrain/Loss": 1.9694921970367432, "Pretrain/Loss (Raw)": 2.116483211517334, "Pretrain/Step": 19012, "Pretrain/Step Time": 8.451514419168234} +{"Pretrain/Learning Rate": 1.297532056118711e-09, "Pretrain/Loss": 1.9690406322479248, "Pretrain/Loss (Raw)": 1.9498718976974487, "Pretrain/Step": 19013, "Pretrain/Step Time": 8.456400401890278} +{"Pretrain/Learning Rate": 1.2546417719055958e-09, "Pretrain/Loss": 1.9694368839263916, "Pretrain/Loss (Raw)": 2.0408434867858887, "Pretrain/Step": 19014, "Pretrain/Step Time": 8.455083651468158} +{"Pretrain/Learning Rate": 1.2124723088924316e-09, "Pretrain/Loss": 1.9710434675216675, "Pretrain/Loss (Raw)": 2.038571357727051, "Pretrain/Step": 19015, "Pretrain/Step Time": 8.452450117096305} +{"Pretrain/Learning Rate": 1.1710236682949127e-09, "Pretrain/Loss": 1.9711790084838867, "Pretrain/Loss (Raw)": 1.948198676109314, "Pretrain/Step": 19016, "Pretrain/Step Time": 8.452183300629258} +{"Pretrain/Learning Rate": 1.1302958513065287e-09, "Pretrain/Loss": 1.9743051528930664, "Pretrain/Loss (Raw)": 2.2867350578308105, "Pretrain/Step": 19017, "Pretrain/Step Time": 8.450981261208653} +{"Pretrain/Learning Rate": 1.090288859104116e-09, "Pretrain/Loss": 1.9747424125671387, "Pretrain/Loss (Raw)": 2.033266067504883, "Pretrain/Step": 19018, "Pretrain/Step Time": 8.45097772590816} +{"Pretrain/Learning Rate": 1.0510026928395311e-09, "Pretrain/Loss": 1.9763808250427246, "Pretrain/Loss (Raw)": 1.9456535577774048, "Pretrain/Step": 19019, "Pretrain/Step Time": 8.446555064991117} +{"Pretrain/Learning Rate": 1.0124373536452014e-09, "Pretrain/Loss": 1.976019024848938, "Pretrain/Loss (Raw)": 2.060037851333618, "Pretrain/Step": 19020, "Pretrain/Step Time": 8.452292958274484} +{"Pretrain/Learning Rate": 9.745928426369011e-10, "Pretrain/Loss": 1.9774177074432373, "Pretrain/Loss (Raw)": 2.137328863143921, "Pretrain/Step": 19021, "Pretrain/Step Time": 8.4488924741745} +{"Pretrain/Learning Rate": 9.37469160899873e-10, "Pretrain/Loss": 1.977076768875122, "Pretrain/Loss (Raw)": 1.913511037826538, "Pretrain/Step": 19022, "Pretrain/Step Time": 8.449145121499896} +{"Pretrain/Learning Rate": 9.010663095082584e-10, "Pretrain/Loss": 1.9770795106887817, "Pretrain/Loss (Raw)": 1.976116418838501, "Pretrain/Step": 19023, "Pretrain/Step Time": 8.446785664185882} +{"Pretrain/Learning Rate": 8.65384289513993e-10, "Pretrain/Loss": 1.9731760025024414, "Pretrain/Loss (Raw)": 1.6709288358688354, "Pretrain/Step": 19024, "Pretrain/Step Time": 8.450728544965386} +{"Pretrain/Learning Rate": 8.304231019412578e-10, "Pretrain/Loss": 1.973125696182251, "Pretrain/Loss (Raw)": 1.7895689010620117, "Pretrain/Step": 19025, "Pretrain/Step Time": 8.453179657459259} +{"Pretrain/Learning Rate": 7.961827477975803e-10, "Pretrain/Loss": 1.9747822284698486, "Pretrain/Loss (Raw)": 1.937827467918396, "Pretrain/Step": 19026, "Pretrain/Step Time": 8.454866891726851} +{"Pretrain/Learning Rate": 7.626632280766099e-10, "Pretrain/Loss": 1.973568320274353, "Pretrain/Loss (Raw)": 1.9093096256256104, "Pretrain/Step": 19027, "Pretrain/Step Time": 8.454716876149178} +{"Pretrain/Learning Rate": 7.298645437386898e-10, "Pretrain/Loss": 1.9699821472167969, "Pretrain/Loss (Raw)": 1.7571666240692139, "Pretrain/Step": 19028, "Pretrain/Step Time": 8.45529523678124} +{"Pretrain/Learning Rate": 6.977866957330604e-10, "Pretrain/Loss": 1.9707766771316528, "Pretrain/Loss (Raw)": 2.121868133544922, "Pretrain/Step": 19029, "Pretrain/Step Time": 8.455745430663228} +{"Pretrain/Learning Rate": 6.664296849839824e-10, "Pretrain/Loss": 1.9699829816818237, "Pretrain/Loss (Raw)": 1.9919639825820923, "Pretrain/Step": 19030, "Pretrain/Step Time": 8.457145366817713} +{"Pretrain/Learning Rate": 6.357935123935122e-10, "Pretrain/Loss": 1.9722347259521484, "Pretrain/Loss (Raw)": 2.08415150642395, "Pretrain/Step": 19031, "Pretrain/Step Time": 8.46061778254807} +{"Pretrain/Learning Rate": 6.058781788470524e-10, "Pretrain/Loss": 1.9729143381118774, "Pretrain/Loss (Raw)": 2.0311427116394043, "Pretrain/Step": 19032, "Pretrain/Step Time": 8.457526134327054} +{"Pretrain/Learning Rate": 5.766836852050261e-10, "Pretrain/Loss": 1.9743281602859497, "Pretrain/Loss (Raw)": 1.928966999053955, "Pretrain/Step": 19033, "Pretrain/Step Time": 8.456489093601704} +{"Pretrain/Learning Rate": 5.482100323139782e-10, "Pretrain/Loss": 1.9787883758544922, "Pretrain/Loss (Raw)": 2.0984506607055664, "Pretrain/Step": 19034, "Pretrain/Step Time": 8.456595165655017} +{"Pretrain/Learning Rate": 5.204572209899228e-10, "Pretrain/Loss": 1.9780133962631226, "Pretrain/Loss (Raw)": 1.8750920295715332, "Pretrain/Step": 19035, "Pretrain/Step Time": 8.453005710616708} +{"Pretrain/Learning Rate": 4.934252520349958e-10, "Pretrain/Loss": 1.977471113204956, "Pretrain/Loss (Raw)": 1.9260131120681763, "Pretrain/Step": 19036, "Pretrain/Step Time": 8.457971841096878} +{"Pretrain/Learning Rate": 4.67114126229129e-10, "Pretrain/Loss": 1.9746766090393066, "Pretrain/Loss (Raw)": 1.7989957332611084, "Pretrain/Step": 19037, "Pretrain/Step Time": 8.46116016805172} +{"Pretrain/Learning Rate": 4.415238443300496e-10, "Pretrain/Loss": 1.9729115962982178, "Pretrain/Loss (Raw)": 1.9013956785202026, "Pretrain/Step": 19038, "Pretrain/Step Time": 8.454842308536172} +{"Pretrain/Learning Rate": 4.1665440707605587e-10, "Pretrain/Loss": 1.9683009386062622, "Pretrain/Loss (Raw)": 1.5745742321014404, "Pretrain/Step": 19039, "Pretrain/Step Time": 8.457782860845327} +{"Pretrain/Learning Rate": 3.9250581518601725e-10, "Pretrain/Loss": 1.9682581424713135, "Pretrain/Loss (Raw)": 1.9784444570541382, "Pretrain/Step": 19040, "Pretrain/Step Time": 8.460430124774575} +{"Pretrain/Learning Rate": 3.6907806935382317e-10, "Pretrain/Loss": 1.9693717956542969, "Pretrain/Loss (Raw)": 2.08085298538208, "Pretrain/Step": 19041, "Pretrain/Step Time": 8.461008543148637} +{"Pretrain/Learning Rate": 3.4637117025393406e-10, "Pretrain/Loss": 1.9690568447113037, "Pretrain/Loss (Raw)": 2.0092194080352783, "Pretrain/Step": 19042, "Pretrain/Step Time": 8.46380808390677} +{"Pretrain/Learning Rate": 3.243851185441571e-10, "Pretrain/Loss": 1.966500997543335, "Pretrain/Loss (Raw)": 1.8472645282745361, "Pretrain/Step": 19043, "Pretrain/Step Time": 8.466730196028948} +{"Pretrain/Learning Rate": 3.031199148573194e-10, "Pretrain/Loss": 1.9662469625473022, "Pretrain/Loss (Raw)": 1.9108566045761108, "Pretrain/Step": 19044, "Pretrain/Step Time": 8.464084878563881} +{"Pretrain/Learning Rate": 2.8257555980681915e-10, "Pretrain/Loss": 1.967970848083496, "Pretrain/Loss (Raw)": 2.054246187210083, "Pretrain/Step": 19045, "Pretrain/Step Time": 8.4638062864542} +{"Pretrain/Learning Rate": 2.627520539838502e-10, "Pretrain/Loss": 1.967200517654419, "Pretrain/Loss (Raw)": 1.8051047325134277, "Pretrain/Step": 19046, "Pretrain/Step Time": 8.462526984512806} +{"Pretrain/Learning Rate": 2.4364939796017726e-10, "Pretrain/Loss": 1.9661056995391846, "Pretrain/Loss (Raw)": 1.971867561340332, "Pretrain/Step": 19047, "Pretrain/Step Time": 8.465356113389134} +{"Pretrain/Learning Rate": 2.2526759228813642e-10, "Pretrain/Loss": 1.9671592712402344, "Pretrain/Loss (Raw)": 2.0166268348693848, "Pretrain/Step": 19048, "Pretrain/Step Time": 8.465263767167926} +{"Pretrain/Learning Rate": 2.0760663749508358e-10, "Pretrain/Loss": 1.966341257095337, "Pretrain/Loss (Raw)": 1.7970287799835205, "Pretrain/Step": 19049, "Pretrain/Step Time": 8.464694306254387} +{"Pretrain/Learning Rate": 1.9066653409449686e-10, "Pretrain/Loss": 1.971862554550171, "Pretrain/Loss (Raw)": 2.51949143409729, "Pretrain/Step": 19050, "Pretrain/Step Time": 8.464689636602998} +{"Pretrain/Learning Rate": 1.7444728256932331e-10, "Pretrain/Loss": 1.972697138786316, "Pretrain/Loss (Raw)": 2.0122785568237305, "Pretrain/Step": 19051, "Pretrain/Step Time": 8.470078211277723} +{"Pretrain/Learning Rate": 1.5894888339418324e-10, "Pretrain/Loss": 1.9736568927764893, "Pretrain/Loss (Raw)": 1.932403564453125, "Pretrain/Step": 19052, "Pretrain/Step Time": 8.467059789225459} +{"Pretrain/Learning Rate": 1.4417133700761476e-10, "Pretrain/Loss": 1.9740204811096191, "Pretrain/Loss (Raw)": 2.209155797958374, "Pretrain/Step": 19053, "Pretrain/Step Time": 8.466906549409032} +{"Pretrain/Learning Rate": 1.3011464384260484e-10, "Pretrain/Loss": 1.978163480758667, "Pretrain/Loss (Raw)": 2.190094470977783, "Pretrain/Step": 19054, "Pretrain/Step Time": 8.46509631536901} +{"Pretrain/Learning Rate": 1.1677880430438493e-10, "Pretrain/Loss": 1.9759025573730469, "Pretrain/Loss (Raw)": 1.853688359260559, "Pretrain/Step": 19055, "Pretrain/Step Time": 8.466290108859539} +{"Pretrain/Learning Rate": 1.041638187704308e-10, "Pretrain/Loss": 1.9730678796768188, "Pretrain/Loss (Raw)": 1.481068730354309, "Pretrain/Step": 19056, "Pretrain/Step Time": 8.468544520437717} +{"Pretrain/Learning Rate": 9.22696876126672e-11, "Pretrain/Loss": 1.974435806274414, "Pretrain/Loss (Raw)": 2.2052078247070312, "Pretrain/Step": 19057, "Pretrain/Step Time": 8.46913387440145} +{"Pretrain/Learning Rate": 8.109641116971212e-11, "Pretrain/Loss": 1.9747517108917236, "Pretrain/Loss (Raw)": 2.013383626937866, "Pretrain/Step": 19058, "Pretrain/Step Time": 8.472097778692842} +{"Pretrain/Learning Rate": 7.064398976353026e-11, "Pretrain/Loss": 1.9739320278167725, "Pretrain/Loss (Raw)": 2.058656930923462, "Pretrain/Step": 19059, "Pretrain/Step Time": 8.474113496020436} +{"Pretrain/Learning Rate": 6.091242369665739e-11, "Pretrain/Loss": 1.9700349569320679, "Pretrain/Loss (Raw)": 1.8599482774734497, "Pretrain/Step": 19060, "Pretrain/Step Time": 8.480325432494283} +{"Pretrain/Learning Rate": 5.1901713249424833e-11, "Pretrain/Loss": 1.9683854579925537, "Pretrain/Loss (Raw)": 1.910027265548706, "Pretrain/Step": 19061, "Pretrain/Step Time": 8.480520997196436} +{"Pretrain/Learning Rate": 4.3611858682734985e-11, "Pretrain/Loss": 1.9680123329162598, "Pretrain/Loss (Raw)": 1.983614444732666, "Pretrain/Step": 19062, "Pretrain/Step Time": 8.479260612279177} +{"Pretrain/Learning Rate": 3.60428602352858e-11, "Pretrain/Loss": 1.9673908948898315, "Pretrain/Loss (Raw)": 1.9666837453842163, "Pretrain/Step": 19063, "Pretrain/Step Time": 8.480282697826624} +{"Pretrain/Learning Rate": 2.9194718123570774e-11, "Pretrain/Loss": 1.9684951305389404, "Pretrain/Loss (Raw)": 2.1279537677764893, "Pretrain/Step": 19064, "Pretrain/Step Time": 8.481581123545766} +{"Pretrain/Learning Rate": 2.3067432544654488e-11, "Pretrain/Loss": 1.9681870937347412, "Pretrain/Loss (Raw)": 1.860738754272461, "Pretrain/Step": 19065, "Pretrain/Step Time": 8.483093211427331} +{"Pretrain/Learning Rate": 1.7661003678948184e-11, "Pretrain/Loss": 1.968529224395752, "Pretrain/Loss (Raw)": 2.0202763080596924, "Pretrain/Step": 19066, "Pretrain/Step Time": 8.477437635883689} +{"Pretrain/Learning Rate": 1.297543167910753e-11, "Pretrain/Loss": 1.9679994583129883, "Pretrain/Loss (Raw)": 1.862785816192627, "Pretrain/Step": 19067, "Pretrain/Step Time": 8.481518194079399} +{"Pretrain/Learning Rate": 9.010716681134845e-12, "Pretrain/Loss": 1.969957709312439, "Pretrain/Loss (Raw)": 2.122986078262329, "Pretrain/Step": 19068, "Pretrain/Step Time": 8.478307984769344} +{"Pretrain/Learning Rate": 5.766858801603547e-12, "Pretrain/Loss": 1.9685437679290771, "Pretrain/Loss (Raw)": 1.9000859260559082, "Pretrain/Step": 19069, "Pretrain/Step Time": 8.482636453583837} +{"Pretrain/Learning Rate": 3.2438581293314784e-12, "Pretrain/Loss": 1.9713691473007202, "Pretrain/Loss (Raw)": 2.29194974899292, "Pretrain/Step": 19070, "Pretrain/Step Time": 8.475736228749156} +{"Pretrain/Learning Rate": 1.4417147420342503e-12, "Pretrain/Loss": 1.9738433361053467, "Pretrain/Loss (Raw)": 2.198288679122925, "Pretrain/Step": 19071, "Pretrain/Step Time": 8.478763757273555} +{"Pretrain/Learning Rate": 3.6042868689634133e-13, "Pretrain/Loss": 1.9741710424423218, "Pretrain/Loss (Raw)": 1.8603953123092651, "Pretrain/Step": 19072, "Pretrain/Step Time": 8.482152888551354} +{"Pretrain/Learning Rate": 0.0, "Pretrain/Loss": 1.9757804870605469, "Pretrain/Loss (Raw)": 1.8609930276870728, "Pretrain/Step": 19073, "Pretrain/Step Time": 8.480708558112383} diff --git a/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/run-metrics.jsonl b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/run-metrics.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..db7997dd02becf7cfc691fb4e926f3246f0a6194 --- /dev/null +++ b/obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7/run-metrics.jsonl @@ -0,0 +1 @@ +{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "obelics", "dataset_resampled": true, "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_hq_single_pkl_pil:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl_pil/", "finetune_stage_components": ["/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/llava_v1_5_mix665k.json", "/fsx-training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/llava/data"], "max_num_images": 6, "min_num_images": 1, "train_num_samples": 4882814, "type": "obelics", "workers": 4}, "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "no-align+avgpool", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 128, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "resize-naive", "llm_backbone_id": "phi3-3b", "llm_max_length": 4096, "model_id": "phi3-3b-continue-training-hq-20b", "pretrain_epochs": 1, "pretrain_global_batch_size": 256, "pretrain_learning_rate": 5e-05, "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", "pretrain_max_grad_norm": 1.0, "pretrain_max_steps": 19073, "pretrain_per_device_batch_size": 8, "pretrain_train_strategy": "fsdp-full-shard", "pretrain_warmup_ratio": 0.03, "pretrain_weight_decay": 0.01, "reduce_in_full_precision": false, "type": "one-stage+7b", "vision_backbone_id": "siglip-vit-so400m-384px"}, "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", "pretrained_checkpoint": null, "run_id": "obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7", "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints/mllm_pretrain_checkpoints", "seed": 7, "stage": "pretrain", "trackers": ["jsonl", "wandb"], "wandb_entity": null, "wandb_project": "mmpretrain"}, "run_id": "obelics+phi3-3b-continue-training-hq-20b+stage-pretrain+x7"}