diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.8167.pt b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.8167.pt new file mode 100644 index 0000000000000000000000000000000000000000..2158e90fc5d4b37966d1793d3805055703104a2a --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-005000-epoch-00-loss=1.8167.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50449ea7df02d364976782380658c8e10fb061600fac752e898d6994fb32805b +size 15335044635 diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=1.9695.pt b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=1.9695.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9ded6e228e2459bb475959252b59b91fc184668 --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/checkpoints/step-009537-epoch-01-loss=1.9695.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e95c5b8551b0445cc199892df872a70277302dc45267d6b71cbb8073573599 +size 15335044635 diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.json b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e0ec3590d4a179570913d509927cf2b060f2f4ae --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.json @@ -0,0 +1,74 @@ +{ + "dataset": { + "align_stage_components": [ + "download/llava-laion-cc-sbu-558k/chat.json", + "download/llava-laion-cc-sbu-558k" + ], + "dataset_id": "obelics", + "dataset_resampled": true, + "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_dfn_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/", + "finetune_stage_components": [ + "/mnt/raid5/weizhi/llava/llava_v1_5_mix665k.json", + "/mnt/raid5/weizhi/llava/data" + ], + "max_num_images": 6, + "min_num_images": 1, + "train_num_samples": 2441407, + "type": "obelics", + "workers": 4 + }, + "model": { + "align_epochs": 1, + "align_global_batch_size": 256, + "align_learning_rate": 0.001, + "align_lr_scheduler_type": "linear-warmup+cosine-decay", + "align_max_grad_norm": 1.0, + "align_max_steps": null, + "align_per_device_batch_size": 16, + "align_train_strategy": "fsdp-shard-grad-op", + "align_warmup_ratio": 0.03, + "align_weight_decay": 0.0, + "arch_specifier": "no-align+avgpool", + "enable_gradient_checkpointing": true, + "enable_mixed_precision_training": true, + "finetune_epochs": 1, + "finetune_global_batch_size": 128, + "finetune_learning_rate": 2e-05, + "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", + "finetune_max_grad_norm": 1.0, + "finetune_max_steps": null, + "finetune_per_device_batch_size": 16, + "finetune_train_strategy": "fsdp-full-shard", + "finetune_warmup_ratio": 0.03, + "finetune_weight_decay": 0.1, + "image_resize_strategy": "resize-naive", + "llm_backbone_id": "phi3-3b", + "llm_max_length": 4096, + "model_id": "phi3-3b-continue-training-dfn", + "pretrain_epochs": 1, + "pretrain_global_batch_size": 256, + "pretrain_learning_rate": 5e-05, + "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", + "pretrain_max_grad_norm": 1.0, + "pretrain_max_steps": 9537, + "pretrain_per_device_batch_size": 8, + "pretrain_train_strategy": "fsdp-full-shard", + "pretrain_warmup_ratio": 0.03, + "pretrain_weight_decay": 0.01, + "reduce_in_full_precision": false, + "type": "one-stage+7b", + "vision_backbone_id": "siglip-vit-so400m-384px" + }, + "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", + "pretrained_checkpoint": null, + "run_id": "obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7", + "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints", + "seed": 7, + "stage": "pretrain", + "trackers": [ + "jsonl", + "wandb" + ], + "wandb_entity": null, + "wandb_project": "mmpretrain" +} \ No newline at end of file diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.yaml b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..5d0c6b78c56a0bd4393bcc06d30c682562616473 --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/config.yaml @@ -0,0 +1,67 @@ +dataset: + align_stage_components: + - download/llava-laion-cc-sbu-558k/chat.json + - download/llava-laion-cc-sbu-558k + dataset_id: obelics + dataset_resampled: true + dataset_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_dfn_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/ + finetune_stage_components: + - /mnt/raid5/weizhi/llava/llava_v1_5_mix665k.json + - /mnt/raid5/weizhi/llava/data + max_num_images: 6 + min_num_images: 1 + train_num_samples: 2441407 + type: obelics + workers: 4 +model: + align_epochs: 1 + align_global_batch_size: 256 + align_learning_rate: 0.001 + align_lr_scheduler_type: linear-warmup+cosine-decay + align_max_grad_norm: 1.0 + align_max_steps: null + align_per_device_batch_size: 16 + align_train_strategy: fsdp-shard-grad-op + align_warmup_ratio: 0.03 + align_weight_decay: 0.0 + arch_specifier: no-align+avgpool + enable_gradient_checkpointing: true + enable_mixed_precision_training: true + finetune_epochs: 1 + finetune_global_batch_size: 128 + finetune_learning_rate: 2.0e-05 + finetune_lr_scheduler_type: linear-warmup+cosine-decay + finetune_max_grad_norm: 1.0 + finetune_max_steps: null + finetune_per_device_batch_size: 16 + finetune_train_strategy: fsdp-full-shard + finetune_warmup_ratio: 0.03 + finetune_weight_decay: 0.1 + image_resize_strategy: resize-naive + llm_backbone_id: phi3-3b + llm_max_length: 4096 + model_id: phi3-3b-continue-training-dfn + pretrain_epochs: 1 + pretrain_global_batch_size: 256 + pretrain_learning_rate: 5.0e-05 + pretrain_lr_scheduler_type: linear-warmup+cosine-decay + pretrain_max_grad_norm: 1.0 + pretrain_max_steps: 9537 + pretrain_per_device_batch_size: 8 + pretrain_train_strategy: fsdp-full-shard + pretrain_warmup_ratio: 0.03 + pretrain_weight_decay: 0.01 + reduce_in_full_precision: false + type: one-stage+7b + vision_backbone_id: siglip-vit-so400m-384px +mount_path: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models +pretrained_checkpoint: null +run_id: obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7 +run_root_dir: /fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints +seed: 7 +stage: pretrain +trackers: +- jsonl +- wandb +wandb_entity: null +wandb_project: mmpretrain diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7.jsonl b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c16dc2e26b750a200b879c3de9d8b8bc1381a006 --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7.jsonl @@ -0,0 +1,9537 @@ +{"Pretrain/Learning Rate": 1.7482517482517484e-07, "Pretrain/Loss": 3.8894991874694824, "Pretrain/Loss (Raw)": 3.8894991874694824, "Pretrain/Step": 1, "Pretrain/Step Time": 33.36893820762634} +{"Pretrain/Learning Rate": 3.496503496503497e-07, "Pretrain/Loss": 3.7566332817077637, "Pretrain/Loss (Raw)": 3.623767375946045, "Pretrain/Step": 2, "Pretrain/Step Time": 21.028563737869263} +{"Pretrain/Learning Rate": 5.244755244755246e-07, "Pretrain/Loss": 3.8617606163024902, "Pretrain/Loss (Raw)": 4.072014808654785, "Pretrain/Step": 3, "Pretrain/Step Time": 16.73505695660909} +{"Pretrain/Learning Rate": 6.993006993006994e-07, "Pretrain/Loss": 3.936904191970825, "Pretrain/Loss (Raw)": 4.16233491897583, "Pretrain/Step": 4, "Pretrain/Step Time": 14.815589249134064} +{"Pretrain/Learning Rate": 8.741258741258743e-07, "Pretrain/Loss": 3.9310543537139893, "Pretrain/Loss (Raw)": 3.9076554775238037, "Pretrain/Step": 5, "Pretrain/Step Time": 13.498903703689574} +{"Pretrain/Learning Rate": 1.0489510489510491e-06, "Pretrain/Loss": 3.761594772338867, "Pretrain/Loss (Raw)": 2.9142959117889404, "Pretrain/Step": 6, "Pretrain/Step Time": 12.804352164268494} +{"Pretrain/Learning Rate": 1.2237762237762238e-06, "Pretrain/Loss": 3.957918167114258, "Pretrain/Loss (Raw)": 5.135859966278076, "Pretrain/Step": 7, "Pretrain/Step Time": 12.968994004385811} +{"Pretrain/Learning Rate": 1.3986013986013987e-06, "Pretrain/Loss": 3.860006809234619, "Pretrain/Loss (Raw)": 3.1746275424957275, "Pretrain/Step": 8, "Pretrain/Step Time": 12.418182790279388} +{"Pretrain/Learning Rate": 1.5734265734265736e-06, "Pretrain/Loss": 3.8062994480133057, "Pretrain/Loss (Raw)": 3.376638889312744, "Pretrain/Step": 9, "Pretrain/Step Time": 12.939719120661417} +{"Pretrain/Learning Rate": 1.7482517482517485e-06, "Pretrain/Loss": 3.9094979763031006, "Pretrain/Loss (Raw)": 4.838284015655518, "Pretrain/Step": 10, "Pretrain/Step Time": 12.55443708896637} +{"Pretrain/Learning Rate": 1.9230769230769234e-06, "Pretrain/Loss": 3.8874354362487793, "Pretrain/Loss (Raw)": 3.6668083667755127, "Pretrain/Step": 11, "Pretrain/Step Time": 12.24622123891657} +{"Pretrain/Learning Rate": 2.0979020979020983e-06, "Pretrain/Loss": 3.857403516769409, "Pretrain/Loss (Raw)": 3.52705717086792, "Pretrain/Step": 12, "Pretrain/Step Time": 12.163614273071289} +{"Pretrain/Learning Rate": 2.2727272727272728e-06, "Pretrain/Loss": 3.8359594345092773, "Pretrain/Loss (Raw)": 3.5786232948303223, "Pretrain/Step": 13, "Pretrain/Step Time": 11.896164453946627} +{"Pretrain/Learning Rate": 2.4475524475524477e-06, "Pretrain/Loss": 3.8424313068389893, "Pretrain/Loss (Raw)": 3.926572322845459, "Pretrain/Step": 14, "Pretrain/Step Time": 11.96382476602282} +{"Pretrain/Learning Rate": 2.6223776223776225e-06, "Pretrain/Loss": 3.8086774349212646, "Pretrain/Loss (Raw)": 3.336117744445801, "Pretrain/Step": 15, "Pretrain/Step Time": 11.862312157948812} +{"Pretrain/Learning Rate": 2.7972027972027974e-06, "Pretrain/Loss": 3.756086587905884, "Pretrain/Loss (Raw)": 2.9672276973724365, "Pretrain/Step": 16, "Pretrain/Step Time": 11.875931099057198} +{"Pretrain/Learning Rate": 2.9720279720279723e-06, "Pretrain/Loss": 3.7146620750427246, "Pretrain/Loss (Raw)": 3.0518651008605957, "Pretrain/Step": 17, "Pretrain/Step Time": 12.053339565501494} +{"Pretrain/Learning Rate": 3.1468531468531472e-06, "Pretrain/Loss": 3.6617953777313232, "Pretrain/Loss (Raw)": 2.763063430786133, "Pretrain/Step": 18, "Pretrain/Step Time": 12.100582745340136} +{"Pretrain/Learning Rate": 3.3216783216783217e-06, "Pretrain/Loss": 3.622372627258301, "Pretrain/Loss (Raw)": 2.9127678871154785, "Pretrain/Step": 19, "Pretrain/Step Time": 11.91103946535211} +{"Pretrain/Learning Rate": 3.496503496503497e-06, "Pretrain/Loss": 3.58227801322937, "Pretrain/Loss (Raw)": 2.820479393005371, "Pretrain/Step": 20, "Pretrain/Step Time": 11.774526703357697} +{"Pretrain/Learning Rate": 3.6713286713286715e-06, "Pretrain/Loss": 3.567016363143921, "Pretrain/Loss (Raw)": 3.2617790699005127, "Pretrain/Step": 21, "Pretrain/Step Time": 11.96100764047532} +{"Pretrain/Learning Rate": 3.846153846153847e-06, "Pretrain/Loss": 3.57159423828125, "Pretrain/Loss (Raw)": 3.6677279472351074, "Pretrain/Step": 22, "Pretrain/Step Time": 12.034447073936462} +{"Pretrain/Learning Rate": 4.020979020979021e-06, "Pretrain/Loss": 3.5659916400909424, "Pretrain/Loss (Raw)": 3.442739248275757, "Pretrain/Step": 23, "Pretrain/Step Time": 11.888847724251125} +{"Pretrain/Learning Rate": 4.195804195804197e-06, "Pretrain/Loss": 3.5320181846618652, "Pretrain/Loss (Raw)": 2.750622272491455, "Pretrain/Step": 24, "Pretrain/Step Time": 11.846547345320383} +{"Pretrain/Learning Rate": 4.370629370629371e-06, "Pretrain/Loss": 3.5012049674987793, "Pretrain/Loss (Raw)": 2.7617027759552, "Pretrain/Step": 25, "Pretrain/Step Time": 12.000730409622193} +{"Pretrain/Learning Rate": 4.5454545454545455e-06, "Pretrain/Loss": 3.476688861846924, "Pretrain/Loss (Raw)": 2.8637802600860596, "Pretrain/Step": 26, "Pretrain/Step Time": 11.995871956531818} +{"Pretrain/Learning Rate": 4.72027972027972e-06, "Pretrain/Loss": 3.4503095149993896, "Pretrain/Loss (Raw)": 2.764446973800659, "Pretrain/Step": 27, "Pretrain/Step Time": 12.02665059654801} +{"Pretrain/Learning Rate": 4.895104895104895e-06, "Pretrain/Loss": 3.432020664215088, "Pretrain/Loss (Raw)": 2.93821382522583, "Pretrain/Step": 28, "Pretrain/Step Time": 12.14872795343399} +{"Pretrain/Learning Rate": 5.06993006993007e-06, "Pretrain/Loss": 3.405959129333496, "Pretrain/Loss (Raw)": 2.6762442588806152, "Pretrain/Step": 29, "Pretrain/Step Time": 12.063370433346979} +{"Pretrain/Learning Rate": 5.244755244755245e-06, "Pretrain/Loss": 3.384737253189087, "Pretrain/Loss (Raw)": 2.7693049907684326, "Pretrain/Step": 30, "Pretrain/Step Time": 12.27836884657542} +{"Pretrain/Learning Rate": 5.419580419580419e-06, "Pretrain/Loss": 3.3637566566467285, "Pretrain/Loss (Raw)": 2.7343413829803467, "Pretrain/Step": 31, "Pretrain/Step Time": 12.15408868174399} +{"Pretrain/Learning Rate": 5.594405594405595e-06, "Pretrain/Loss": 3.338712692260742, "Pretrain/Loss (Raw)": 2.562344789505005, "Pretrain/Step": 32, "Pretrain/Step Time": 12.147332347929478} +{"Pretrain/Learning Rate": 5.76923076923077e-06, "Pretrain/Loss": 3.3086695671081543, "Pretrain/Loss (Raw)": 2.3472888469696045, "Pretrain/Step": 33, "Pretrain/Step Time": 12.02712860251918} +{"Pretrain/Learning Rate": 5.944055944055945e-06, "Pretrain/Loss": 3.2850534915924072, "Pretrain/Loss (Raw)": 2.50571870803833, "Pretrain/Step": 34, "Pretrain/Step Time": 12.023845595471998} +{"Pretrain/Learning Rate": 6.1188811188811196e-06, "Pretrain/Loss": 3.2656025886535645, "Pretrain/Loss (Raw)": 2.6042699813842773, "Pretrain/Step": 35, "Pretrain/Step Time": 11.959171220234461} +{"Pretrain/Learning Rate": 6.2937062937062944e-06, "Pretrain/Loss": 3.2566049098968506, "Pretrain/Loss (Raw)": 2.941687822341919, "Pretrain/Step": 36, "Pretrain/Step Time": 11.962148778968388} +{"Pretrain/Learning Rate": 6.468531468531469e-06, "Pretrain/Loss": 3.230924129486084, "Pretrain/Loss (Raw)": 2.306415319442749, "Pretrain/Step": 37, "Pretrain/Step Time": 11.953258804372838} +{"Pretrain/Learning Rate": 6.643356643356643e-06, "Pretrain/Loss": 3.2119743824005127, "Pretrain/Loss (Raw)": 2.510828733444214, "Pretrain/Step": 38, "Pretrain/Step Time": 11.864301317616514} +{"Pretrain/Learning Rate": 6.818181818181818e-06, "Pretrain/Loss": 3.193474769592285, "Pretrain/Loss (Raw)": 2.4905004501342773, "Pretrain/Step": 39, "Pretrain/Step Time": 11.965054872708443} +{"Pretrain/Learning Rate": 6.993006993006994e-06, "Pretrain/Loss": 3.17541766166687, "Pretrain/Loss (Raw)": 2.471189498901367, "Pretrain/Step": 40, "Pretrain/Step Time": 11.92178699374199} +{"Pretrain/Learning Rate": 7.167832167832168e-06, "Pretrain/Loss": 3.1608996391296387, "Pretrain/Loss (Raw)": 2.580183267593384, "Pretrain/Step": 41, "Pretrain/Step Time": 12.06594284569345} +{"Pretrain/Learning Rate": 7.342657342657343e-06, "Pretrain/Loss": 3.1537084579467773, "Pretrain/Loss (Raw)": 2.8588547706604004, "Pretrain/Step": 42, "Pretrain/Step Time": 11.987700229599362} +{"Pretrain/Learning Rate": 7.517482517482517e-06, "Pretrain/Loss": 3.1328654289245605, "Pretrain/Loss (Raw)": 2.257464647293091, "Pretrain/Step": 43, "Pretrain/Step Time": 12.05769711317018} +{"Pretrain/Learning Rate": 7.692307692307694e-06, "Pretrain/Loss": 3.1162314414978027, "Pretrain/Loss (Raw)": 2.400967836380005, "Pretrain/Step": 44, "Pretrain/Step Time": 11.987738674337214} +{"Pretrain/Learning Rate": 7.867132867132867e-06, "Pretrain/Loss": 3.101541519165039, "Pretrain/Loss (Raw)": 2.4551913738250732, "Pretrain/Step": 45, "Pretrain/Step Time": 11.93748336368137} +{"Pretrain/Learning Rate": 8.041958041958042e-06, "Pretrain/Loss": 3.0867621898651123, "Pretrain/Loss (Raw)": 2.421684503555298, "Pretrain/Step": 46, "Pretrain/Step Time": 11.94977955714516} +{"Pretrain/Learning Rate": 8.216783216783217e-06, "Pretrain/Loss": 3.0948257446289062, "Pretrain/Loss (Raw)": 3.4657716751098633, "Pretrain/Step": 47, "Pretrain/Step Time": 11.892402024979287} +{"Pretrain/Learning Rate": 8.391608391608393e-06, "Pretrain/Loss": 3.0758140087127686, "Pretrain/Loss (Raw)": 2.1822478771209717, "Pretrain/Step": 48, "Pretrain/Step Time": 11.839107548197111} +{"Pretrain/Learning Rate": 8.566433566433566e-06, "Pretrain/Loss": 3.065105676651001, "Pretrain/Loss (Raw)": 2.5511209964752197, "Pretrain/Step": 49, "Pretrain/Step Time": 11.91234470873463} +{"Pretrain/Learning Rate": 8.741258741258741e-06, "Pretrain/Loss": 3.052373170852661, "Pretrain/Loss (Raw)": 2.4284791946411133, "Pretrain/Step": 50, "Pretrain/Step Time": 11.83723307132721} +{"Pretrain/Learning Rate": 8.916083916083918e-06, "Pretrain/Loss": 3.0407888889312744, "Pretrain/Loss (Raw)": 2.4615590572357178, "Pretrain/Step": 51, "Pretrain/Step Time": 11.79565443244635} +{"Pretrain/Learning Rate": 9.090909090909091e-06, "Pretrain/Loss": 3.0319766998291016, "Pretrain/Loss (Raw)": 2.5825610160827637, "Pretrain/Step": 52, "Pretrain/Step Time": 11.737327497739058} +{"Pretrain/Learning Rate": 9.265734265734266e-06, "Pretrain/Loss": 3.021334171295166, "Pretrain/Loss (Raw)": 2.4679250717163086, "Pretrain/Step": 53, "Pretrain/Step Time": 11.77728290827769} +{"Pretrain/Learning Rate": 9.44055944055944e-06, "Pretrain/Loss": 3.008605718612671, "Pretrain/Loss (Raw)": 2.3339924812316895, "Pretrain/Step": 54, "Pretrain/Step Time": 11.74110574633987} +{"Pretrain/Learning Rate": 9.615384615384616e-06, "Pretrain/Loss": 3.0039684772491455, "Pretrain/Loss (Raw)": 2.753572463989258, "Pretrain/Step": 55, "Pretrain/Step Time": 11.703945415670221} +{"Pretrain/Learning Rate": 9.79020979020979e-06, "Pretrain/Loss": 2.9915592670440674, "Pretrain/Loss (Raw)": 2.30904483795166, "Pretrain/Step": 56, "Pretrain/Step Time": 11.693684684378761} +{"Pretrain/Learning Rate": 9.965034965034966e-06, "Pretrain/Loss": 2.982963800430298, "Pretrain/Loss (Raw)": 2.5015993118286133, "Pretrain/Step": 57, "Pretrain/Step Time": 11.704938625034533} +{"Pretrain/Learning Rate": 1.013986013986014e-05, "Pretrain/Loss": 2.980400800704956, "Pretrain/Loss (Raw)": 2.8343262672424316, "Pretrain/Step": 58, "Pretrain/Step Time": 11.65294012941163} +{"Pretrain/Learning Rate": 1.0314685314685315e-05, "Pretrain/Loss": 2.973672389984131, "Pretrain/Loss (Raw)": 2.5834245681762695, "Pretrain/Step": 59, "Pretrain/Step Time": 11.738370830729856} +{"Pretrain/Learning Rate": 1.048951048951049e-05, "Pretrain/Loss": 2.963120698928833, "Pretrain/Loss (Raw)": 2.3405611515045166, "Pretrain/Step": 60, "Pretrain/Step Time": 11.687917447090149} +{"Pretrain/Learning Rate": 1.0664335664335665e-05, "Pretrain/Loss": 2.9525399208068848, "Pretrain/Loss (Raw)": 2.3177075386047363, "Pretrain/Step": 61, "Pretrain/Step Time": 11.653943800535359} +{"Pretrain/Learning Rate": 1.0839160839160838e-05, "Pretrain/Loss": 2.941657543182373, "Pretrain/Loss (Raw)": 2.2778210639953613, "Pretrain/Step": 62, "Pretrain/Step Time": 11.604603763549559} +{"Pretrain/Learning Rate": 1.1013986013986015e-05, "Pretrain/Loss": 2.935575008392334, "Pretrain/Loss (Raw)": 2.558450222015381, "Pretrain/Step": 63, "Pretrain/Step Time": 11.581333164184812} +{"Pretrain/Learning Rate": 1.118881118881119e-05, "Pretrain/Loss": 2.930685043334961, "Pretrain/Loss (Raw)": 2.6226346492767334, "Pretrain/Step": 64, "Pretrain/Step Time": 11.536587726324797} +{"Pretrain/Learning Rate": 1.1363636363636365e-05, "Pretrain/Loss": 2.9236629009246826, "Pretrain/Loss (Raw)": 2.4742302894592285, "Pretrain/Step": 65, "Pretrain/Step Time": 11.63589005103478} +{"Pretrain/Learning Rate": 1.153846153846154e-05, "Pretrain/Loss": 2.913391351699829, "Pretrain/Loss (Raw)": 2.2457544803619385, "Pretrain/Step": 66, "Pretrain/Step Time": 11.595840739481377} +{"Pretrain/Learning Rate": 1.1713286713286714e-05, "Pretrain/Loss": 2.9089622497558594, "Pretrain/Loss (Raw)": 2.616647720336914, "Pretrain/Step": 67, "Pretrain/Step Time": 11.551605655186211} +{"Pretrain/Learning Rate": 1.188811188811189e-05, "Pretrain/Loss": 2.916097402572632, "Pretrain/Loss (Raw)": 3.394138813018799, "Pretrain/Step": 68, "Pretrain/Step Time": 11.505937067901387} +{"Pretrain/Learning Rate": 1.2062937062937063e-05, "Pretrain/Loss": 2.9243521690368652, "Pretrain/Loss (Raw)": 3.485668182373047, "Pretrain/Step": 69, "Pretrain/Step Time": 11.585203613060107} +{"Pretrain/Learning Rate": 1.2237762237762239e-05, "Pretrain/Loss": 2.921539068222046, "Pretrain/Loss (Raw)": 2.727450370788574, "Pretrain/Step": 70, "Pretrain/Step Time": 11.54796506336757} +{"Pretrain/Learning Rate": 1.2412587412587414e-05, "Pretrain/Loss": 2.9161622524261475, "Pretrain/Loss (Raw)": 2.5397937297821045, "Pretrain/Step": 71, "Pretrain/Step Time": 11.525303031357241} +{"Pretrain/Learning Rate": 1.2587412587412589e-05, "Pretrain/Loss": 2.909897804260254, "Pretrain/Loss (Raw)": 2.465100049972534, "Pretrain/Step": 72, "Pretrain/Step Time": 11.47898433274693} +{"Pretrain/Learning Rate": 1.2762237762237764e-05, "Pretrain/Loss": 2.9023759365081787, "Pretrain/Loss (Raw)": 2.3608200550079346, "Pretrain/Step": 73, "Pretrain/Step Time": 11.491121406424535} +{"Pretrain/Learning Rate": 1.2937062937062939e-05, "Pretrain/Loss": 2.9017744064331055, "Pretrain/Loss (Raw)": 2.857846975326538, "Pretrain/Step": 74, "Pretrain/Step Time": 11.475047317711082} +{"Pretrain/Learning Rate": 1.3111888111888112e-05, "Pretrain/Loss": 2.8953123092651367, "Pretrain/Loss (Raw)": 2.4171273708343506, "Pretrain/Step": 75, "Pretrain/Step Time": 11.451805480321248} +{"Pretrain/Learning Rate": 1.3286713286713287e-05, "Pretrain/Loss": 2.8891232013702393, "Pretrain/Loss (Raw)": 2.4249417781829834, "Pretrain/Step": 76, "Pretrain/Step Time": 11.488923643764696} +{"Pretrain/Learning Rate": 1.3461538461538462e-05, "Pretrain/Loss": 2.8847672939300537, "Pretrain/Loss (Raw)": 2.553727865219116, "Pretrain/Step": 77, "Pretrain/Step Time": 11.523877400856513} +{"Pretrain/Learning Rate": 1.3636363636363637e-05, "Pretrain/Loss": 2.878950595855713, "Pretrain/Loss (Raw)": 2.4310312271118164, "Pretrain/Step": 78, "Pretrain/Step Time": 11.48289075264564} +{"Pretrain/Learning Rate": 1.381118881118881e-05, "Pretrain/Loss": 2.8751423358917236, "Pretrain/Loss (Raw)": 2.578096628189087, "Pretrain/Step": 79, "Pretrain/Step Time": 11.507657950437522} +{"Pretrain/Learning Rate": 1.3986013986013988e-05, "Pretrain/Loss": 2.872887372970581, "Pretrain/Loss (Raw)": 2.694772243499756, "Pretrain/Step": 80, "Pretrain/Step Time": 11.465653544664383} +{"Pretrain/Learning Rate": 1.4160839160839163e-05, "Pretrain/Loss": 2.865260124206543, "Pretrain/Loss (Raw)": 2.255074977874756, "Pretrain/Step": 81, "Pretrain/Step Time": 11.499631840505717} +{"Pretrain/Learning Rate": 1.4335664335664336e-05, "Pretrain/Loss": 2.8588478565216064, "Pretrain/Loss (Raw)": 2.3394577503204346, "Pretrain/Step": 82, "Pretrain/Step Time": 11.46878893782453} +{"Pretrain/Learning Rate": 1.4510489510489511e-05, "Pretrain/Loss": 2.8638601303100586, "Pretrain/Loss (Raw)": 3.2748889923095703, "Pretrain/Step": 83, "Pretrain/Step Time": 11.511506726942867} +{"Pretrain/Learning Rate": 1.4685314685314686e-05, "Pretrain/Loss": 2.8635802268981934, "Pretrain/Loss (Raw)": 2.840315818786621, "Pretrain/Step": 84, "Pretrain/Step Time": 11.481279784724826} +{"Pretrain/Learning Rate": 1.486013986013986e-05, "Pretrain/Loss": 2.860196352005005, "Pretrain/Loss (Raw)": 2.5759470462799072, "Pretrain/Step": 85, "Pretrain/Step Time": 11.485212522394518} +{"Pretrain/Learning Rate": 1.5034965034965034e-05, "Pretrain/Loss": 2.8536927700042725, "Pretrain/Loss (Raw)": 2.3008975982666016, "Pretrain/Step": 86, "Pretrain/Step Time": 11.465672409811685} +{"Pretrain/Learning Rate": 1.5209790209790212e-05, "Pretrain/Loss": 2.8487751483917236, "Pretrain/Loss (Raw)": 2.42586350440979, "Pretrain/Step": 87, "Pretrain/Step Time": 11.44684765804773} +{"Pretrain/Learning Rate": 1.5384615384615387e-05, "Pretrain/Loss": 2.8408830165863037, "Pretrain/Loss (Raw)": 2.1542601585388184, "Pretrain/Step": 88, "Pretrain/Step Time": 11.424329895864833} +{"Pretrain/Learning Rate": 1.555944055944056e-05, "Pretrain/Loss": 2.83492112159729, "Pretrain/Loss (Raw)": 2.3102920055389404, "Pretrain/Step": 89, "Pretrain/Step Time": 11.423274610819442} +{"Pretrain/Learning Rate": 1.5734265734265734e-05, "Pretrain/Loss": 2.8345463275909424, "Pretrain/Loss (Raw)": 2.801180124282837, "Pretrain/Step": 90, "Pretrain/Step Time": 11.401907369825576} +{"Pretrain/Learning Rate": 1.590909090909091e-05, "Pretrain/Loss": 2.8310654163360596, "Pretrain/Loss (Raw)": 2.5177652835845947, "Pretrain/Step": 91, "Pretrain/Step Time": 11.400237754151062} +{"Pretrain/Learning Rate": 1.6083916083916083e-05, "Pretrain/Loss": 2.8271491527557373, "Pretrain/Loss (Raw)": 2.4707934856414795, "Pretrain/Step": 92, "Pretrain/Step Time": 11.371369359285936} +{"Pretrain/Learning Rate": 1.625874125874126e-05, "Pretrain/Loss": 2.8229856491088867, "Pretrain/Loss (Raw)": 2.4399425983428955, "Pretrain/Step": 93, "Pretrain/Step Time": 11.35301253872533} +{"Pretrain/Learning Rate": 1.6433566433566433e-05, "Pretrain/Loss": 2.8201894760131836, "Pretrain/Loss (Raw)": 2.56014084815979, "Pretrain/Step": 94, "Pretrain/Step Time": 11.342093340894008} +{"Pretrain/Learning Rate": 1.660839160839161e-05, "Pretrain/Loss": 2.819171905517578, "Pretrain/Loss (Raw)": 2.723517656326294, "Pretrain/Step": 95, "Pretrain/Step Time": 11.315282369914808} +{"Pretrain/Learning Rate": 1.6783216783216786e-05, "Pretrain/Loss": 2.8124303817749023, "Pretrain/Loss (Raw)": 2.1719963550567627, "Pretrain/Step": 96, "Pretrain/Step Time": 11.288258574903011} +{"Pretrain/Learning Rate": 1.695804195804196e-05, "Pretrain/Loss": 2.8079283237457275, "Pretrain/Loss (Raw)": 2.3757402896881104, "Pretrain/Step": 97, "Pretrain/Step Time": 11.33269877777886} +{"Pretrain/Learning Rate": 1.7132867132867133e-05, "Pretrain/Loss": 2.803431272506714, "Pretrain/Loss (Raw)": 2.367213726043701, "Pretrain/Step": 98, "Pretrain/Step Time": 11.302485444107834} +{"Pretrain/Learning Rate": 1.730769230769231e-05, "Pretrain/Loss": 2.798374652862549, "Pretrain/Loss (Raw)": 2.3028080463409424, "Pretrain/Step": 99, "Pretrain/Step Time": 11.309131588598694} +{"Pretrain/Learning Rate": 1.7482517482517483e-05, "Pretrain/Loss": 2.793274402618408, "Pretrain/Loss (Raw)": 2.2883574962615967, "Pretrain/Step": 100, "Pretrain/Step Time": 11.3000803232193} +{"Pretrain/Learning Rate": 1.7657342657342656e-05, "Pretrain/Loss": 2.791534900665283, "Pretrain/Loss (Raw)": 2.617586374282837, "Pretrain/Step": 101, "Pretrain/Step Time": 11.310942843408867} +{"Pretrain/Learning Rate": 1.7832167832167836e-05, "Pretrain/Loss": 2.788464307785034, "Pretrain/Loss (Raw)": 2.4783127307891846, "Pretrain/Step": 102, "Pretrain/Step Time": 11.287714046590468} +{"Pretrain/Learning Rate": 1.800699300699301e-05, "Pretrain/Loss": 2.783656120300293, "Pretrain/Loss (Raw)": 2.2932558059692383, "Pretrain/Step": 103, "Pretrain/Step Time": 11.315183519159707} +{"Pretrain/Learning Rate": 1.8181818181818182e-05, "Pretrain/Loss": 2.779566764831543, "Pretrain/Loss (Raw)": 2.3583295345306396, "Pretrain/Step": 104, "Pretrain/Step Time": 11.290273742033886} +{"Pretrain/Learning Rate": 1.835664335664336e-05, "Pretrain/Loss": 2.7742929458618164, "Pretrain/Loss (Raw)": 2.225837469100952, "Pretrain/Step": 105, "Pretrain/Step Time": 11.27362554640997} +{"Pretrain/Learning Rate": 1.8531468531468532e-05, "Pretrain/Loss": 2.769951581954956, "Pretrain/Loss (Raw)": 2.3141119480133057, "Pretrain/Step": 106, "Pretrain/Step Time": 11.320447858774438} +{"Pretrain/Learning Rate": 1.8706293706293705e-05, "Pretrain/Loss": 2.7701022624969482, "Pretrain/Loss (Raw)": 2.7860524654388428, "Pretrain/Step": 107, "Pretrain/Step Time": 11.292806132931576} +{"Pretrain/Learning Rate": 1.888111888111888e-05, "Pretrain/Loss": 2.767958164215088, "Pretrain/Loss (Raw)": 2.5385427474975586, "Pretrain/Step": 108, "Pretrain/Step Time": 11.27070611053043} +{"Pretrain/Learning Rate": 1.9055944055944055e-05, "Pretrain/Loss": 2.766308069229126, "Pretrain/Loss (Raw)": 2.5881266593933105, "Pretrain/Step": 109, "Pretrain/Step Time": 11.302459327452773} +{"Pretrain/Learning Rate": 1.923076923076923e-05, "Pretrain/Loss": 2.76354718208313, "Pretrain/Loss (Raw)": 2.462620973587036, "Pretrain/Step": 110, "Pretrain/Step Time": 11.275669999556108} +{"Pretrain/Learning Rate": 1.9405594405594408e-05, "Pretrain/Loss": 2.7599291801452637, "Pretrain/Loss (Raw)": 2.3619253635406494, "Pretrain/Step": 111, "Pretrain/Step Time": 11.283183652001458} +{"Pretrain/Learning Rate": 1.958041958041958e-05, "Pretrain/Loss": 2.757410764694214, "Pretrain/Loss (Raw)": 2.477834463119507, "Pretrain/Step": 112, "Pretrain/Step Time": 11.259291154997689} +{"Pretrain/Learning Rate": 1.9755244755244758e-05, "Pretrain/Loss": 2.753443956375122, "Pretrain/Loss (Raw)": 2.3091633319854736, "Pretrain/Step": 113, "Pretrain/Step Time": 11.261349296147845} +{"Pretrain/Learning Rate": 1.993006993006993e-05, "Pretrain/Loss": 2.7490174770355225, "Pretrain/Loss (Raw)": 2.248831033706665, "Pretrain/Step": 114, "Pretrain/Step Time": 11.23595601006558} +{"Pretrain/Learning Rate": 2.0104895104895104e-05, "Pretrain/Loss": 2.7460622787475586, "Pretrain/Loss (Raw)": 2.4091925621032715, "Pretrain/Step": 115, "Pretrain/Step Time": 11.243792506922846} +{"Pretrain/Learning Rate": 2.027972027972028e-05, "Pretrain/Loss": 2.7427310943603516, "Pretrain/Loss (Raw)": 2.35960054397583, "Pretrain/Step": 116, "Pretrain/Step Time": 11.22361396098959} +{"Pretrain/Learning Rate": 2.0454545454545457e-05, "Pretrain/Loss": 2.742725372314453, "Pretrain/Loss (Raw)": 2.7420921325683594, "Pretrain/Step": 117, "Pretrain/Step Time": 11.204230777218811} +{"Pretrain/Learning Rate": 2.062937062937063e-05, "Pretrain/Loss": 2.7421298027038574, "Pretrain/Loss (Raw)": 2.672428846359253, "Pretrain/Step": 118, "Pretrain/Step Time": 11.1814553394156} +{"Pretrain/Learning Rate": 2.0804195804195807e-05, "Pretrain/Loss": 2.739409923553467, "Pretrain/Loss (Raw)": 2.418457269668579, "Pretrain/Step": 119, "Pretrain/Step Time": 11.163546456008397} +{"Pretrain/Learning Rate": 2.097902097902098e-05, "Pretrain/Loss": 2.7395591735839844, "Pretrain/Loss (Raw)": 2.757303237915039, "Pretrain/Step": 120, "Pretrain/Step Time": 11.156174810727437} +{"Pretrain/Learning Rate": 2.1153846153846154e-05, "Pretrain/Loss": 2.737565517425537, "Pretrain/Loss (Raw)": 2.4983937740325928, "Pretrain/Step": 121, "Pretrain/Step Time": 11.197650075944003} +{"Pretrain/Learning Rate": 2.132867132867133e-05, "Pretrain/Loss": 2.7342467308044434, "Pretrain/Loss (Raw)": 2.332669734954834, "Pretrain/Step": 122, "Pretrain/Step Time": 11.177505416948287} +{"Pretrain/Learning Rate": 2.1503496503496503e-05, "Pretrain/Loss": 2.7319600582122803, "Pretrain/Loss (Raw)": 2.4529592990875244, "Pretrain/Step": 123, "Pretrain/Step Time": 11.159686179665046} +{"Pretrain/Learning Rate": 2.1678321678321677e-05, "Pretrain/Loss": 2.7290477752685547, "Pretrain/Loss (Raw)": 2.370847225189209, "Pretrain/Step": 124, "Pretrain/Step Time": 11.148001922715094} +{"Pretrain/Learning Rate": 2.1853146853146857e-05, "Pretrain/Loss": 2.7302985191345215, "Pretrain/Loss (Raw)": 2.8853375911712646, "Pretrain/Step": 125, "Pretrain/Step Time": 11.128755187988281} +{"Pretrain/Learning Rate": 2.202797202797203e-05, "Pretrain/Loss": 2.726224660873413, "Pretrain/Loss (Raw)": 2.2169833183288574, "Pretrain/Step": 126, "Pretrain/Step Time": 11.18206675090487} +{"Pretrain/Learning Rate": 2.2202797202797203e-05, "Pretrain/Loss": 2.723215103149414, "Pretrain/Loss (Raw)": 2.3440518379211426, "Pretrain/Step": 127, "Pretrain/Step Time": 11.160160111630058} +{"Pretrain/Learning Rate": 2.237762237762238e-05, "Pretrain/Loss": 2.721311092376709, "Pretrain/Loss (Raw)": 2.479517936706543, "Pretrain/Step": 128, "Pretrain/Step Time": 11.156796915456653} +{"Pretrain/Learning Rate": 2.2552447552447553e-05, "Pretrain/Loss": 2.7116165161132812, "Pretrain/Loss (Raw)": 2.648613214492798, "Pretrain/Step": 129, "Pretrain/Step Time": 10.980103582143784} +{"Pretrain/Learning Rate": 2.272727272727273e-05, "Pretrain/Loss": 2.7032618522644043, "Pretrain/Loss (Raw)": 2.554356098175049, "Pretrain/Step": 130, "Pretrain/Step Time": 10.999120820313692} +{"Pretrain/Learning Rate": 2.2902097902097902e-05, "Pretrain/Loss": 2.6897945404052734, "Pretrain/Loss (Raw)": 2.348217725753784, "Pretrain/Step": 131, "Pretrain/Step Time": 11.00416929833591} +{"Pretrain/Learning Rate": 2.307692307692308e-05, "Pretrain/Loss": 2.6762163639068604, "Pretrain/Loss (Raw)": 2.42429518699646, "Pretrain/Step": 132, "Pretrain/Step Time": 11.019621970131993} +{"Pretrain/Learning Rate": 2.3251748251748252e-05, "Pretrain/Loss": 2.663663864135742, "Pretrain/Loss (Raw)": 2.3009486198425293, "Pretrain/Step": 133, "Pretrain/Step Time": 11.022768894210458} +{"Pretrain/Learning Rate": 2.342657342657343e-05, "Pretrain/Loss": 2.6585745811462402, "Pretrain/Loss (Raw)": 2.2628448009490967, "Pretrain/Step": 134, "Pretrain/Step Time": 11.081889186054468} +{"Pretrain/Learning Rate": 2.3601398601398602e-05, "Pretrain/Loss": 2.6371850967407227, "Pretrain/Loss (Raw)": 2.398005247116089, "Pretrain/Step": 135, "Pretrain/Step Time": 11.052885565906763} +{"Pretrain/Learning Rate": 2.377622377622378e-05, "Pretrain/Loss": 2.633523941040039, "Pretrain/Loss (Raw)": 2.7060298919677734, "Pretrain/Step": 136, "Pretrain/Step Time": 11.055948967114091} +{"Pretrain/Learning Rate": 2.3951048951048952e-05, "Pretrain/Loss": 2.627006769180298, "Pretrain/Loss (Raw)": 2.5424375534057617, "Pretrain/Step": 137, "Pretrain/Step Time": 10.989820821210742} +{"Pretrain/Learning Rate": 2.4125874125874125e-05, "Pretrain/Loss": 2.6074252128601074, "Pretrain/Loss (Raw)": 2.331839084625244, "Pretrain/Step": 138, "Pretrain/Step Time": 10.996584512293339} +{"Pretrain/Learning Rate": 2.43006993006993e-05, "Pretrain/Loss": 2.596860408782959, "Pretrain/Loss (Raw)": 2.3145322799682617, "Pretrain/Step": 139, "Pretrain/Step Time": 11.024858290329576} +{"Pretrain/Learning Rate": 2.4475524475524478e-05, "Pretrain/Loss": 2.587672233581543, "Pretrain/Loss (Raw)": 2.350952625274658, "Pretrain/Step": 140, "Pretrain/Step Time": 11.00336273573339} +{"Pretrain/Learning Rate": 2.465034965034965e-05, "Pretrain/Loss": 2.5822505950927734, "Pretrain/Loss (Raw)": 2.8846359252929688, "Pretrain/Step": 141, "Pretrain/Step Time": 11.068630825728178} +{"Pretrain/Learning Rate": 2.4825174825174828e-05, "Pretrain/Loss": 2.5707333087921143, "Pretrain/Loss (Raw)": 2.452362537384033, "Pretrain/Step": 142, "Pretrain/Step Time": 11.03392176516354} +{"Pretrain/Learning Rate": 2.5e-05, "Pretrain/Loss": 2.5638866424560547, "Pretrain/Loss (Raw)": 2.4597649574279785, "Pretrain/Step": 143, "Pretrain/Step Time": 11.06988281197846} +{"Pretrain/Learning Rate": 2.5174825174825178e-05, "Pretrain/Loss": 2.561479091644287, "Pretrain/Loss (Raw)": 2.659074544906616, "Pretrain/Step": 144, "Pretrain/Step Time": 11.041254693642259} +{"Pretrain/Learning Rate": 2.534965034965035e-05, "Pretrain/Loss": 2.558281421661377, "Pretrain/Loss (Raw)": 2.6425600051879883, "Pretrain/Step": 145, "Pretrain/Step Time": 11.017621245235205} +{"Pretrain/Learning Rate": 2.5524475524475528e-05, "Pretrain/Loss": 2.5547471046447754, "Pretrain/Loss (Raw)": 2.3106467723846436, "Pretrain/Step": 146, "Pretrain/Step Time": 10.98473814688623} +{"Pretrain/Learning Rate": 2.5699300699300697e-05, "Pretrain/Loss": 2.5501718521118164, "Pretrain/Loss (Raw)": 2.3271377086639404, "Pretrain/Step": 147, "Pretrain/Step Time": 11.05139765329659} +{"Pretrain/Learning Rate": 2.5874125874125877e-05, "Pretrain/Loss": 2.5468790531158447, "Pretrain/Loss (Raw)": 2.3990049362182617, "Pretrain/Step": 148, "Pretrain/Step Time": 11.050394797697663} +{"Pretrain/Learning Rate": 2.6048951048951047e-05, "Pretrain/Loss": 2.5413966178894043, "Pretrain/Loss (Raw)": 2.5600204467773438, "Pretrain/Step": 149, "Pretrain/Step Time": 11.043749524280429} +{"Pretrain/Learning Rate": 2.6223776223776224e-05, "Pretrain/Loss": 2.5311081409454346, "Pretrain/Loss (Raw)": 2.3507936000823975, "Pretrain/Step": 150, "Pretrain/Step Time": 11.004838110879064} +{"Pretrain/Learning Rate": 2.6398601398601404e-05, "Pretrain/Loss": 2.523383617401123, "Pretrain/Loss (Raw)": 2.4540176391601562, "Pretrain/Step": 151, "Pretrain/Step Time": 11.009416030719876} +{"Pretrain/Learning Rate": 2.6573426573426574e-05, "Pretrain/Loss": 2.520252227783203, "Pretrain/Loss (Raw)": 2.349823474884033, "Pretrain/Step": 152, "Pretrain/Step Time": 10.996139282360673} +{"Pretrain/Learning Rate": 2.674825174825175e-05, "Pretrain/Loss": 2.5217976570129395, "Pretrain/Loss (Raw)": 2.9595024585723877, "Pretrain/Step": 153, "Pretrain/Step Time": 10.942490505054593} +{"Pretrain/Learning Rate": 2.6923076923076923e-05, "Pretrain/Loss": 2.518054962158203, "Pretrain/Loss (Raw)": 2.384690284729004, "Pretrain/Step": 154, "Pretrain/Step Time": 10.915674895048141} +{"Pretrain/Learning Rate": 2.70979020979021e-05, "Pretrain/Loss": 2.515223979949951, "Pretrain/Loss (Raw)": 2.402117967605591, "Pretrain/Step": 155, "Pretrain/Step Time": 10.880591213703156} +{"Pretrain/Learning Rate": 2.7272727272727273e-05, "Pretrain/Loss": 2.5094141960144043, "Pretrain/Loss (Raw)": 2.194549798965454, "Pretrain/Step": 156, "Pretrain/Step Time": 10.82990500330925} +{"Pretrain/Learning Rate": 2.744755244755245e-05, "Pretrain/Loss": 2.5061163902282715, "Pretrain/Loss (Raw)": 2.2541332244873047, "Pretrain/Step": 157, "Pretrain/Step Time": 10.825770754367113} +{"Pretrain/Learning Rate": 2.762237762237762e-05, "Pretrain/Loss": 2.5039398670196533, "Pretrain/Loss (Raw)": 2.4906821250915527, "Pretrain/Step": 158, "Pretrain/Step Time": 10.763823265209794} +{"Pretrain/Learning Rate": 2.77972027972028e-05, "Pretrain/Loss": 2.501469373703003, "Pretrain/Loss (Raw)": 2.4181294441223145, "Pretrain/Step": 159, "Pretrain/Step Time": 10.798270152881742} +{"Pretrain/Learning Rate": 2.7972027972027976e-05, "Pretrain/Loss": 2.498223304748535, "Pretrain/Loss (Raw)": 2.1468467712402344, "Pretrain/Step": 160, "Pretrain/Step Time": 10.777941096574068} +{"Pretrain/Learning Rate": 2.8146853146853146e-05, "Pretrain/Loss": 2.4983174800872803, "Pretrain/Loss (Raw)": 2.3593549728393555, "Pretrain/Step": 161, "Pretrain/Step Time": 10.778861321508884} +{"Pretrain/Learning Rate": 2.8321678321678326e-05, "Pretrain/Loss": 2.4988203048706055, "Pretrain/Loss (Raw)": 2.570063591003418, "Pretrain/Step": 162, "Pretrain/Step Time": 10.76427473127842} +{"Pretrain/Learning Rate": 2.8496503496503496e-05, "Pretrain/Loss": 2.4955689907073975, "Pretrain/Loss (Raw)": 2.1881043910980225, "Pretrain/Step": 163, "Pretrain/Step Time": 10.792688904330134} +{"Pretrain/Learning Rate": 2.8671328671328672e-05, "Pretrain/Loss": 2.491485118865967, "Pretrain/Loss (Raw)": 2.418949842453003, "Pretrain/Step": 164, "Pretrain/Step Time": 10.793781822547317} +{"Pretrain/Learning Rate": 2.8846153846153845e-05, "Pretrain/Loss": 2.4903383255004883, "Pretrain/Loss (Raw)": 2.1596200466156006, "Pretrain/Step": 165, "Pretrain/Step Time": 10.77673066034913} +{"Pretrain/Learning Rate": 2.9020979020979022e-05, "Pretrain/Loss": 2.4895071983337402, "Pretrain/Loss (Raw)": 2.404438018798828, "Pretrain/Step": 166, "Pretrain/Step Time": 10.77952585555613} +{"Pretrain/Learning Rate": 2.91958041958042e-05, "Pretrain/Loss": 2.488068103790283, "Pretrain/Loss (Raw)": 2.3062965869903564, "Pretrain/Step": 167, "Pretrain/Step Time": 10.735434222966433} +{"Pretrain/Learning Rate": 2.9370629370629372e-05, "Pretrain/Loss": 2.487234115600586, "Pretrain/Loss (Raw)": 2.3644511699676514, "Pretrain/Step": 168, "Pretrain/Step Time": 10.731283409520984} +{"Pretrain/Learning Rate": 2.954545454545455e-05, "Pretrain/Loss": 2.4878740310668945, "Pretrain/Loss (Raw)": 2.66208553314209, "Pretrain/Step": 169, "Pretrain/Step Time": 10.694572884589434} +{"Pretrain/Learning Rate": 2.972027972027972e-05, "Pretrain/Loss": 2.4846668243408203, "Pretrain/Loss (Raw)": 2.4483301639556885, "Pretrain/Step": 170, "Pretrain/Step Time": 10.71172053180635} +{"Pretrain/Learning Rate": 2.9895104895104898e-05, "Pretrain/Loss": 2.48824405670166, "Pretrain/Loss (Raw)": 2.7153725624084473, "Pretrain/Step": 171, "Pretrain/Step Time": 10.663212412968278} +{"Pretrain/Learning Rate": 3.0069930069930068e-05, "Pretrain/Loss": 2.490882158279419, "Pretrain/Loss (Raw)": 2.738647937774658, "Pretrain/Step": 172, "Pretrain/Step Time": 10.680735521018505} +{"Pretrain/Learning Rate": 3.0244755244755245e-05, "Pretrain/Loss": 2.4907007217407227, "Pretrain/Loss (Raw)": 2.4319729804992676, "Pretrain/Step": 173, "Pretrain/Step Time": 10.67074342444539} +{"Pretrain/Learning Rate": 3.0419580419580425e-05, "Pretrain/Loss": 2.488356828689575, "Pretrain/Loss (Raw)": 2.1216495037078857, "Pretrain/Step": 174, "Pretrain/Step Time": 10.722579343244433} +{"Pretrain/Learning Rate": 3.0594405594405594e-05, "Pretrain/Loss": 2.4805963039398193, "Pretrain/Loss (Raw)": 2.4724159240722656, "Pretrain/Step": 175, "Pretrain/Step Time": 10.715711129829288} +{"Pretrain/Learning Rate": 3.0769230769230774e-05, "Pretrain/Loss": 2.4811501502990723, "Pretrain/Loss (Raw)": 2.253173828125, "Pretrain/Step": 176, "Pretrain/Step Time": 10.73338745906949} +{"Pretrain/Learning Rate": 3.094405594405594e-05, "Pretrain/Loss": 2.4807159900665283, "Pretrain/Loss (Raw)": 2.4955155849456787, "Pretrain/Step": 177, "Pretrain/Step Time": 10.68053451180458} +{"Pretrain/Learning Rate": 3.111888111888112e-05, "Pretrain/Loss": 2.4800684452056885, "Pretrain/Loss (Raw)": 2.345604181289673, "Pretrain/Step": 178, "Pretrain/Step Time": 10.703449562191963} +{"Pretrain/Learning Rate": 3.1293706293706294e-05, "Pretrain/Loss": 2.4791088104248047, "Pretrain/Loss (Raw)": 2.3387112617492676, "Pretrain/Step": 179, "Pretrain/Step Time": 10.700517281889915} +{"Pretrain/Learning Rate": 3.146853146853147e-05, "Pretrain/Loss": 2.4781360626220703, "Pretrain/Loss (Raw)": 2.4580748081207275, "Pretrain/Step": 180, "Pretrain/Step Time": 10.736877663061023} +{"Pretrain/Learning Rate": 3.164335664335665e-05, "Pretrain/Loss": 2.478336811065674, "Pretrain/Loss (Raw)": 2.4936063289642334, "Pretrain/Step": 181, "Pretrain/Step Time": 10.69641206599772} +{"Pretrain/Learning Rate": 3.181818181818182e-05, "Pretrain/Loss": 2.4800682067871094, "Pretrain/Loss (Raw)": 2.5555951595306396, "Pretrain/Step": 182, "Pretrain/Step Time": 10.698171682655811} +{"Pretrain/Learning Rate": 3.1993006993006994e-05, "Pretrain/Loss": 2.4779458045959473, "Pretrain/Loss (Raw)": 2.4819083213806152, "Pretrain/Step": 183, "Pretrain/Step Time": 10.715469870716333} +{"Pretrain/Learning Rate": 3.216783216783217e-05, "Pretrain/Loss": 2.476212978363037, "Pretrain/Loss (Raw)": 2.087247610092163, "Pretrain/Step": 184, "Pretrain/Step Time": 10.707610365003347} +{"Pretrain/Learning Rate": 3.234265734265735e-05, "Pretrain/Loss": 2.4728102684020996, "Pretrain/Loss (Raw)": 2.0660839080810547, "Pretrain/Step": 185, "Pretrain/Step Time": 10.718307280912995} +{"Pretrain/Learning Rate": 3.251748251748252e-05, "Pretrain/Loss": 2.4695584774017334, "Pretrain/Loss (Raw)": 2.418062686920166, "Pretrain/Step": 186, "Pretrain/Step Time": 10.719945764169097} +{"Pretrain/Learning Rate": 3.269230769230769e-05, "Pretrain/Loss": 2.4681127071380615, "Pretrain/Loss (Raw)": 2.398359775543213, "Pretrain/Step": 187, "Pretrain/Step Time": 10.654306983575225} +{"Pretrain/Learning Rate": 3.2867132867132866e-05, "Pretrain/Loss": 2.470256805419922, "Pretrain/Loss (Raw)": 2.6150193214416504, "Pretrain/Step": 188, "Pretrain/Step Time": 10.692748045548797} +{"Pretrain/Learning Rate": 3.3041958041958046e-05, "Pretrain/Loss": 2.4701340198516846, "Pretrain/Loss (Raw)": 2.301987648010254, "Pretrain/Step": 189, "Pretrain/Step Time": 10.688388833776116} +{"Pretrain/Learning Rate": 3.321678321678322e-05, "Pretrain/Loss": 2.470472812652588, "Pretrain/Loss (Raw)": 2.321183919906616, "Pretrain/Step": 190, "Pretrain/Step Time": 10.744945330545306} +{"Pretrain/Learning Rate": 3.339160839160839e-05, "Pretrain/Loss": 2.4683022499084473, "Pretrain/Loss (Raw)": 2.280608654022217, "Pretrain/Step": 191, "Pretrain/Step Time": 10.734640004113317} +{"Pretrain/Learning Rate": 3.356643356643357e-05, "Pretrain/Loss": 2.464643716812134, "Pretrain/Loss (Raw)": 2.154367685317993, "Pretrain/Step": 192, "Pretrain/Step Time": 10.802281688898802} +{"Pretrain/Learning Rate": 3.374125874125874e-05, "Pretrain/Loss": 2.4642157554626465, "Pretrain/Loss (Raw)": 2.4194302558898926, "Pretrain/Step": 193, "Pretrain/Step Time": 10.731603076681495} +{"Pretrain/Learning Rate": 3.391608391608392e-05, "Pretrain/Loss": 2.4644339084625244, "Pretrain/Loss (Raw)": 2.273695945739746, "Pretrain/Step": 194, "Pretrain/Step Time": 10.76376523077488} +{"Pretrain/Learning Rate": 3.409090909090909e-05, "Pretrain/Loss": 2.4632151126861572, "Pretrain/Loss (Raw)": 2.4606282711029053, "Pretrain/Step": 195, "Pretrain/Step Time": 10.764980329200625} +{"Pretrain/Learning Rate": 3.4265734265734265e-05, "Pretrain/Loss": 2.455355644226074, "Pretrain/Loss (Raw)": 2.3881289958953857, "Pretrain/Step": 196, "Pretrain/Step Time": 10.768046842887998} +{"Pretrain/Learning Rate": 3.4440559440559445e-05, "Pretrain/Loss": 2.4455716609954834, "Pretrain/Loss (Raw)": 2.2333340644836426, "Pretrain/Step": 197, "Pretrain/Step Time": 10.724771972745657} +{"Pretrain/Learning Rate": 3.461538461538462e-05, "Pretrain/Loss": 2.4454433917999268, "Pretrain/Loss (Raw)": 2.7110230922698975, "Pretrain/Step": 198, "Pretrain/Step Time": 10.737432297319174} +{"Pretrain/Learning Rate": 3.479020979020979e-05, "Pretrain/Loss": 2.446108818054199, "Pretrain/Loss (Raw)": 2.624985456466675, "Pretrain/Step": 199, "Pretrain/Step Time": 10.74567300081253} +{"Pretrain/Learning Rate": 3.4965034965034965e-05, "Pretrain/Loss": 2.4441585540771484, "Pretrain/Loss (Raw)": 2.2154664993286133, "Pretrain/Step": 200, "Pretrain/Step Time": 10.7589519508183} +{"Pretrain/Learning Rate": 3.5139860139860145e-05, "Pretrain/Loss": 2.4442098140716553, "Pretrain/Loss (Raw)": 2.3673856258392334, "Pretrain/Step": 201, "Pretrain/Step Time": 10.788501283153892} +{"Pretrain/Learning Rate": 3.531468531468531e-05, "Pretrain/Loss": 2.4406118392944336, "Pretrain/Loss (Raw)": 2.3972907066345215, "Pretrain/Step": 202, "Pretrain/Step Time": 10.773956706747413} +{"Pretrain/Learning Rate": 3.548951048951049e-05, "Pretrain/Loss": 2.4399633407592773, "Pretrain/Loss (Raw)": 2.334089517593384, "Pretrain/Step": 203, "Pretrain/Step Time": 10.77801881916821} +{"Pretrain/Learning Rate": 3.566433566433567e-05, "Pretrain/Loss": 2.4402682781219482, "Pretrain/Loss (Raw)": 2.463992118835449, "Pretrain/Step": 204, "Pretrain/Step Time": 10.783669520169497} +{"Pretrain/Learning Rate": 3.583916083916084e-05, "Pretrain/Loss": 2.437422752380371, "Pretrain/Loss (Raw)": 2.189509630203247, "Pretrain/Step": 205, "Pretrain/Step Time": 10.751660004258156} +{"Pretrain/Learning Rate": 3.601398601398602e-05, "Pretrain/Loss": 2.437290668487549, "Pretrain/Loss (Raw)": 2.414116859436035, "Pretrain/Step": 206, "Pretrain/Step Time": 10.80419510230422} +{"Pretrain/Learning Rate": 3.618881118881119e-05, "Pretrain/Loss": 2.43402099609375, "Pretrain/Loss (Raw)": 2.159611701965332, "Pretrain/Step": 207, "Pretrain/Step Time": 10.789899392053485} +{"Pretrain/Learning Rate": 3.6363636363636364e-05, "Pretrain/Loss": 2.4336726665496826, "Pretrain/Loss (Raw)": 2.650158643722534, "Pretrain/Step": 208, "Pretrain/Step Time": 10.836800774559379} +{"Pretrain/Learning Rate": 3.653846153846154e-05, "Pretrain/Loss": 2.4339966773986816, "Pretrain/Loss (Raw)": 2.2965328693389893, "Pretrain/Step": 209, "Pretrain/Step Time": 10.801496118307114} +{"Pretrain/Learning Rate": 3.671328671328672e-05, "Pretrain/Loss": 2.4364190101623535, "Pretrain/Loss (Raw)": 2.649536371231079, "Pretrain/Step": 210, "Pretrain/Step Time": 10.84221071191132} +{"Pretrain/Learning Rate": 3.688811188811189e-05, "Pretrain/Loss": 2.4277377128601074, "Pretrain/Loss (Raw)": 2.1636645793914795, "Pretrain/Step": 211, "Pretrain/Step Time": 10.79503259062767} +{"Pretrain/Learning Rate": 3.7062937062937064e-05, "Pretrain/Loss": 2.423584461212158, "Pretrain/Loss (Raw)": 2.308710813522339, "Pretrain/Step": 212, "Pretrain/Step Time": 10.844582518562675} +{"Pretrain/Learning Rate": 3.7237762237762244e-05, "Pretrain/Loss": 2.4214534759521484, "Pretrain/Loss (Raw)": 2.3031816482543945, "Pretrain/Step": 213, "Pretrain/Step Time": 10.81870624050498} +{"Pretrain/Learning Rate": 3.741258741258741e-05, "Pretrain/Loss": 2.4209961891174316, "Pretrain/Loss (Raw)": 2.242371082305908, "Pretrain/Step": 214, "Pretrain/Step Time": 10.85252613388002} +{"Pretrain/Learning Rate": 3.758741258741259e-05, "Pretrain/Loss": 2.4211463928222656, "Pretrain/Loss (Raw)": 2.445060968399048, "Pretrain/Step": 215, "Pretrain/Step Time": 10.839878587052226} +{"Pretrain/Learning Rate": 3.776223776223776e-05, "Pretrain/Loss": 2.4239308834075928, "Pretrain/Loss (Raw)": 2.510711908340454, "Pretrain/Step": 216, "Pretrain/Step Time": 10.89342244900763} +{"Pretrain/Learning Rate": 3.7937062937062936e-05, "Pretrain/Loss": 2.4242281913757324, "Pretrain/Loss (Raw)": 2.348339557647705, "Pretrain/Step": 217, "Pretrain/Step Time": 10.870664587244391} +{"Pretrain/Learning Rate": 3.811188811188811e-05, "Pretrain/Loss": 2.4217889308929443, "Pretrain/Loss (Raw)": 2.488942861557007, "Pretrain/Step": 218, "Pretrain/Step Time": 10.908666113391519} +{"Pretrain/Learning Rate": 3.828671328671329e-05, "Pretrain/Loss": 2.421212673187256, "Pretrain/Loss (Raw)": 2.444011688232422, "Pretrain/Step": 219, "Pretrain/Step Time": 10.888089329004288} +{"Pretrain/Learning Rate": 3.846153846153846e-05, "Pretrain/Loss": 2.4189138412475586, "Pretrain/Loss (Raw)": 2.176549196243286, "Pretrain/Step": 220, "Pretrain/Step Time": 10.959101350978017} +{"Pretrain/Learning Rate": 3.8636363636363636e-05, "Pretrain/Loss": 2.4177513122558594, "Pretrain/Loss (Raw)": 2.2911593914031982, "Pretrain/Step": 221, "Pretrain/Step Time": 10.95416583865881} +{"Pretrain/Learning Rate": 3.8811188811188816e-05, "Pretrain/Loss": 2.4182796478271484, "Pretrain/Loss (Raw)": 2.6277523040771484, "Pretrain/Step": 222, "Pretrain/Step Time": 11.007274802774191} +{"Pretrain/Learning Rate": 3.898601398601399e-05, "Pretrain/Loss": 2.4145402908325195, "Pretrain/Loss (Raw)": 2.2448785305023193, "Pretrain/Step": 223, "Pretrain/Step Time": 11.009402673691511} +{"Pretrain/Learning Rate": 3.916083916083916e-05, "Pretrain/Loss": 2.4146780967712402, "Pretrain/Loss (Raw)": 2.1896307468414307, "Pretrain/Step": 224, "Pretrain/Step Time": 11.047975953668356} +{"Pretrain/Learning Rate": 3.9335664335664336e-05, "Pretrain/Loss": 2.4135899543762207, "Pretrain/Loss (Raw)": 2.2364461421966553, "Pretrain/Step": 225, "Pretrain/Step Time": 10.993563989177346} +{"Pretrain/Learning Rate": 3.9510489510489516e-05, "Pretrain/Loss": 2.4130136966705322, "Pretrain/Loss (Raw)": 2.293461799621582, "Pretrain/Step": 226, "Pretrain/Step Time": 11.018499260768294} +{"Pretrain/Learning Rate": 3.968531468531469e-05, "Pretrain/Loss": 2.412639856338501, "Pretrain/Loss (Raw)": 2.25494647026062, "Pretrain/Step": 227, "Pretrain/Step Time": 10.994431782513857} +{"Pretrain/Learning Rate": 3.986013986013986e-05, "Pretrain/Loss": 2.41190242767334, "Pretrain/Loss (Raw)": 2.193964958190918, "Pretrain/Step": 228, "Pretrain/Step Time": 11.05681198835373} +{"Pretrain/Learning Rate": 4.0034965034965035e-05, "Pretrain/Loss": 2.4094600677490234, "Pretrain/Loss (Raw)": 2.3049662113189697, "Pretrain/Step": 229, "Pretrain/Step Time": 11.03147765994072} +{"Pretrain/Learning Rate": 4.020979020979021e-05, "Pretrain/Loss": 2.410174608230591, "Pretrain/Loss (Raw)": 2.5697779655456543, "Pretrain/Step": 230, "Pretrain/Step Time": 11.032752901315689} +{"Pretrain/Learning Rate": 4.038461538461539e-05, "Pretrain/Loss": 2.4101696014404297, "Pretrain/Loss (Raw)": 2.292625904083252, "Pretrain/Step": 231, "Pretrain/Step Time": 10.998680358752608} +{"Pretrain/Learning Rate": 4.055944055944056e-05, "Pretrain/Loss": 2.4101738929748535, "Pretrain/Loss (Raw)": 2.358877182006836, "Pretrain/Step": 232, "Pretrain/Step Time": 11.015523165464401} +{"Pretrain/Learning Rate": 4.0734265734265735e-05, "Pretrain/Loss": 2.4094982147216797, "Pretrain/Loss (Raw)": 2.139331340789795, "Pretrain/Step": 233, "Pretrain/Step Time": 11.007674973458052} +{"Pretrain/Learning Rate": 4.0909090909090915e-05, "Pretrain/Loss": 2.4092583656311035, "Pretrain/Loss (Raw)": 2.283405303955078, "Pretrain/Step": 234, "Pretrain/Step Time": 10.973567556589842} +{"Pretrain/Learning Rate": 4.108391608391609e-05, "Pretrain/Loss": 2.4070558547973633, "Pretrain/Loss (Raw)": 2.5041260719299316, "Pretrain/Step": 235, "Pretrain/Step Time": 10.977519892156124} +{"Pretrain/Learning Rate": 4.125874125874126e-05, "Pretrain/Loss": 2.4041147232055664, "Pretrain/Loss (Raw)": 2.162125587463379, "Pretrain/Step": 236, "Pretrain/Step Time": 11.00805339589715} +{"Pretrain/Learning Rate": 4.1433566433566434e-05, "Pretrain/Loss": 2.4039523601531982, "Pretrain/Loss (Raw)": 2.567323923110962, "Pretrain/Step": 237, "Pretrain/Step Time": 11.00213684886694} +{"Pretrain/Learning Rate": 4.1608391608391614e-05, "Pretrain/Loss": 2.4028239250183105, "Pretrain/Loss (Raw)": 2.3181817531585693, "Pretrain/Step": 238, "Pretrain/Step Time": 11.06036944128573} +{"Pretrain/Learning Rate": 4.178321678321678e-05, "Pretrain/Loss": 2.4044837951660156, "Pretrain/Loss (Raw)": 2.574384927749634, "Pretrain/Step": 239, "Pretrain/Step Time": 11.074048168957233} +{"Pretrain/Learning Rate": 4.195804195804196e-05, "Pretrain/Loss": 2.4030590057373047, "Pretrain/Loss (Raw)": 2.2954607009887695, "Pretrain/Step": 240, "Pretrain/Step Time": 11.089879201725125} +{"Pretrain/Learning Rate": 4.213286713286714e-05, "Pretrain/Loss": 2.4034371376037598, "Pretrain/Loss (Raw)": 2.357545852661133, "Pretrain/Step": 241, "Pretrain/Step Time": 11.095128383487463} +{"Pretrain/Learning Rate": 4.230769230769231e-05, "Pretrain/Loss": 2.4047327041625977, "Pretrain/Loss (Raw)": 2.414670467376709, "Pretrain/Step": 242, "Pretrain/Step Time": 11.110795367509127} +{"Pretrain/Learning Rate": 4.248251748251749e-05, "Pretrain/Loss": 2.4042015075683594, "Pretrain/Loss (Raw)": 2.3412158489227295, "Pretrain/Step": 243, "Pretrain/Step Time": 11.118271322920918} +{"Pretrain/Learning Rate": 4.265734265734266e-05, "Pretrain/Loss": 2.4017887115478516, "Pretrain/Loss (Raw)": 2.0507547855377197, "Pretrain/Step": 244, "Pretrain/Step Time": 11.125485952943563} +{"Pretrain/Learning Rate": 4.2832167832167833e-05, "Pretrain/Loss": 2.3984341621398926, "Pretrain/Loss (Raw)": 2.312704563140869, "Pretrain/Step": 245, "Pretrain/Step Time": 11.132691407576203} +{"Pretrain/Learning Rate": 4.300699300699301e-05, "Pretrain/Loss": 2.3943488597869873, "Pretrain/Loss (Raw)": 2.149527072906494, "Pretrain/Step": 246, "Pretrain/Step Time": 11.136513710021973} +{"Pretrain/Learning Rate": 4.318181818181819e-05, "Pretrain/Loss": 2.3948774337768555, "Pretrain/Loss (Raw)": 2.4860990047454834, "Pretrain/Step": 247, "Pretrain/Step Time": 11.170572016388178} +{"Pretrain/Learning Rate": 4.335664335664335e-05, "Pretrain/Loss": 2.3897016048431396, "Pretrain/Loss (Raw)": 2.0948078632354736, "Pretrain/Step": 248, "Pretrain/Step Time": 11.161952503025532} +{"Pretrain/Learning Rate": 4.353146853146853e-05, "Pretrain/Loss": 2.387913703918457, "Pretrain/Loss (Raw)": 2.2695329189300537, "Pretrain/Step": 249, "Pretrain/Step Time": 11.147333590313792} +{"Pretrain/Learning Rate": 4.370629370629371e-05, "Pretrain/Loss": 2.386606454849243, "Pretrain/Loss (Raw)": 2.165360450744629, "Pretrain/Step": 250, "Pretrain/Step Time": 11.162107339128852} +{"Pretrain/Learning Rate": 4.388111888111888e-05, "Pretrain/Loss": 2.384840488433838, "Pretrain/Loss (Raw)": 2.226909875869751, "Pretrain/Step": 251, "Pretrain/Step Time": 11.204890238121152} +{"Pretrain/Learning Rate": 4.405594405594406e-05, "Pretrain/Loss": 2.383296251296997, "Pretrain/Loss (Raw)": 2.1731979846954346, "Pretrain/Step": 252, "Pretrain/Step Time": 11.25552174821496} +{"Pretrain/Learning Rate": 4.423076923076923e-05, "Pretrain/Loss": 2.379055976867676, "Pretrain/Loss (Raw)": 2.3425540924072266, "Pretrain/Step": 253, "Pretrain/Step Time": 11.257416605949402} +{"Pretrain/Learning Rate": 4.4405594405594406e-05, "Pretrain/Loss": 2.3794472217559814, "Pretrain/Loss (Raw)": 2.2670738697052, "Pretrain/Step": 254, "Pretrain/Step Time": 11.18434327840805} +{"Pretrain/Learning Rate": 4.458041958041958e-05, "Pretrain/Loss": 2.37978458404541, "Pretrain/Loss (Raw)": 2.3872358798980713, "Pretrain/Step": 255, "Pretrain/Step Time": 11.185411574319005} +{"Pretrain/Learning Rate": 4.475524475524476e-05, "Pretrain/Loss": 2.3779332637786865, "Pretrain/Loss (Raw)": 2.242554187774658, "Pretrain/Step": 256, "Pretrain/Step Time": 11.185691552236676} +{"Pretrain/Learning Rate": 4.493006993006993e-05, "Pretrain/Loss": 2.3749442100524902, "Pretrain/Loss (Raw)": 2.2660136222839355, "Pretrain/Step": 257, "Pretrain/Step Time": 11.197624191641808} +{"Pretrain/Learning Rate": 4.5104895104895105e-05, "Pretrain/Loss": 2.3737151622772217, "Pretrain/Loss (Raw)": 2.3970260620117188, "Pretrain/Step": 258, "Pretrain/Step Time": 11.180298384279013} +{"Pretrain/Learning Rate": 4.5279720279720285e-05, "Pretrain/Loss": 2.3751723766326904, "Pretrain/Loss (Raw)": 2.5347437858581543, "Pretrain/Step": 259, "Pretrain/Step Time": 11.232837915420532} +{"Pretrain/Learning Rate": 4.545454545454546e-05, "Pretrain/Loss": 2.3740994930267334, "Pretrain/Loss (Raw)": 2.2869818210601807, "Pretrain/Step": 260, "Pretrain/Step Time": 11.252715788781643} +{"Pretrain/Learning Rate": 4.562937062937063e-05, "Pretrain/Loss": 2.373168468475342, "Pretrain/Loss (Raw)": 2.1817500591278076, "Pretrain/Step": 261, "Pretrain/Step Time": 11.257583685219288} +{"Pretrain/Learning Rate": 4.5804195804195805e-05, "Pretrain/Loss": 2.373019218444824, "Pretrain/Loss (Raw)": 2.243776559829712, "Pretrain/Step": 262, "Pretrain/Step Time": 11.210425676777959} +{"Pretrain/Learning Rate": 4.597902097902098e-05, "Pretrain/Loss": 2.370758295059204, "Pretrain/Loss (Raw)": 2.1085753440856934, "Pretrain/Step": 263, "Pretrain/Step Time": 11.246475547552109} +{"Pretrain/Learning Rate": 4.615384615384616e-05, "Pretrain/Loss": 2.368211030960083, "Pretrain/Loss (Raw)": 2.3799960613250732, "Pretrain/Step": 264, "Pretrain/Step Time": 11.277660990133882} +{"Pretrain/Learning Rate": 4.632867132867133e-05, "Pretrain/Loss": 2.3669025897979736, "Pretrain/Loss (Raw)": 2.3749446868896484, "Pretrain/Step": 265, "Pretrain/Step Time": 11.274895401671529} +{"Pretrain/Learning Rate": 4.6503496503496505e-05, "Pretrain/Loss": 2.369150400161743, "Pretrain/Loss (Raw)": 2.619574546813965, "Pretrain/Step": 266, "Pretrain/Step Time": 11.285995131358504} +{"Pretrain/Learning Rate": 4.667832167832168e-05, "Pretrain/Loss": 2.3700222969055176, "Pretrain/Loss (Raw)": 2.426150321960449, "Pretrain/Step": 267, "Pretrain/Step Time": 11.258145432919264} +{"Pretrain/Learning Rate": 4.685314685314686e-05, "Pretrain/Loss": 2.371507167816162, "Pretrain/Loss (Raw)": 2.5410242080688477, "Pretrain/Step": 268, "Pretrain/Step Time": 11.290635671466589} +{"Pretrain/Learning Rate": 4.702797202797203e-05, "Pretrain/Loss": 2.3671438694000244, "Pretrain/Loss (Raw)": 2.3261067867279053, "Pretrain/Step": 269, "Pretrain/Step Time": 11.248494073748589} +{"Pretrain/Learning Rate": 4.7202797202797204e-05, "Pretrain/Loss": 2.3659684658050537, "Pretrain/Loss (Raw)": 2.3019115924835205, "Pretrain/Step": 270, "Pretrain/Step Time": 11.247118251398206} +{"Pretrain/Learning Rate": 4.7377622377622384e-05, "Pretrain/Loss": 2.3677141666412354, "Pretrain/Loss (Raw)": 2.683199167251587, "Pretrain/Step": 271, "Pretrain/Step Time": 11.255748022347689} +{"Pretrain/Learning Rate": 4.755244755244756e-05, "Pretrain/Loss": 2.365025758743286, "Pretrain/Loss (Raw)": 2.3149847984313965, "Pretrain/Step": 272, "Pretrain/Step Time": 11.297422513365746} +{"Pretrain/Learning Rate": 4.772727272727273e-05, "Pretrain/Loss": 2.362440586090088, "Pretrain/Loss (Raw)": 2.311652898788452, "Pretrain/Step": 273, "Pretrain/Step Time": 11.296071592718363} +{"Pretrain/Learning Rate": 4.7902097902097904e-05, "Pretrain/Loss": 2.3617939949035645, "Pretrain/Loss (Raw)": 2.2278871536254883, "Pretrain/Step": 274, "Pretrain/Step Time": 11.293848553672433} +{"Pretrain/Learning Rate": 4.8076923076923084e-05, "Pretrain/Loss": 2.360621929168701, "Pretrain/Loss (Raw)": 2.177121877670288, "Pretrain/Step": 275, "Pretrain/Step Time": 11.25500663369894} +{"Pretrain/Learning Rate": 4.825174825174825e-05, "Pretrain/Loss": 2.358609199523926, "Pretrain/Loss (Raw)": 2.1413722038269043, "Pretrain/Step": 276, "Pretrain/Step Time": 11.28917733952403} +{"Pretrain/Learning Rate": 4.842657342657343e-05, "Pretrain/Loss": 2.356400966644287, "Pretrain/Loss (Raw)": 2.2773630619049072, "Pretrain/Step": 277, "Pretrain/Step Time": 11.24649634771049} +{"Pretrain/Learning Rate": 4.86013986013986e-05, "Pretrain/Loss": 2.3573193550109863, "Pretrain/Loss (Raw)": 2.468308925628662, "Pretrain/Step": 278, "Pretrain/Step Time": 11.294613359495997} +{"Pretrain/Learning Rate": 4.8776223776223776e-05, "Pretrain/Loss": 2.356204032897949, "Pretrain/Loss (Raw)": 2.311260461807251, "Pretrain/Step": 279, "Pretrain/Step Time": 11.287133142352104} +{"Pretrain/Learning Rate": 4.8951048951048956e-05, "Pretrain/Loss": 2.3554797172546387, "Pretrain/Loss (Raw)": 2.257132053375244, "Pretrain/Step": 280, "Pretrain/Step Time": 11.322633633390069} +{"Pretrain/Learning Rate": 4.912587412587413e-05, "Pretrain/Loss": 2.349809408187866, "Pretrain/Loss (Raw)": 2.2336807250976562, "Pretrain/Step": 281, "Pretrain/Step Time": 11.320302518084645} +{"Pretrain/Learning Rate": 4.93006993006993e-05, "Pretrain/Loss": 2.3487515449523926, "Pretrain/Loss (Raw)": 2.2492804527282715, "Pretrain/Step": 282, "Pretrain/Step Time": 11.365974372252822} +{"Pretrain/Learning Rate": 4.9475524475524476e-05, "Pretrain/Loss": 2.348630905151367, "Pretrain/Loss (Raw)": 2.3867275714874268, "Pretrain/Step": 283, "Pretrain/Step Time": 11.374029261991382} +{"Pretrain/Learning Rate": 4.9650349650349656e-05, "Pretrain/Loss": 2.3505702018737793, "Pretrain/Loss (Raw)": 2.4427835941314697, "Pretrain/Step": 284, "Pretrain/Step Time": 11.383415047079325} +{"Pretrain/Learning Rate": 4.982517482517482e-05, "Pretrain/Loss": 2.352383613586426, "Pretrain/Loss (Raw)": 2.4862215518951416, "Pretrain/Step": 285, "Pretrain/Step Time": 11.417584890499711} +{"Pretrain/Learning Rate": 5e-05, "Pretrain/Loss": 2.3508591651916504, "Pretrain/Loss (Raw)": 2.2955524921417236, "Pretrain/Step": 286, "Pretrain/Step Time": 11.40325465425849} +{"Pretrain/Learning Rate": 4.9999998558441094e-05, "Pretrain/Loss": 2.349522113800049, "Pretrain/Loss (Raw)": 2.2469863891601562, "Pretrain/Step": 287, "Pretrain/Step Time": 11.420004161074758} +{"Pretrain/Learning Rate": 4.999999423376456e-05, "Pretrain/Loss": 2.351378917694092, "Pretrain/Loss (Raw)": 2.384502649307251, "Pretrain/Step": 288, "Pretrain/Step Time": 11.41395664960146} +{"Pretrain/Learning Rate": 4.9999987025970884e-05, "Pretrain/Loss": 2.351292133331299, "Pretrain/Loss (Raw)": 2.348247528076172, "Pretrain/Step": 289, "Pretrain/Step Time": 11.41954500041902} +{"Pretrain/Learning Rate": 4.99999769350609e-05, "Pretrain/Loss": 2.348968505859375, "Pretrain/Loss (Raw)": 2.2726504802703857, "Pretrain/Step": 290, "Pretrain/Step Time": 11.50946923904121} +{"Pretrain/Learning Rate": 4.999996396103577e-05, "Pretrain/Loss": 2.3501834869384766, "Pretrain/Loss (Raw)": 2.343611478805542, "Pretrain/Step": 291, "Pretrain/Step Time": 11.472737332805991} +{"Pretrain/Learning Rate": 4.999994810389699e-05, "Pretrain/Loss": 2.348330020904541, "Pretrain/Loss (Raw)": 2.181739568710327, "Pretrain/Step": 292, "Pretrain/Step Time": 11.471605567261577} +{"Pretrain/Learning Rate": 4.999992936364639e-05, "Pretrain/Loss": 2.3493454456329346, "Pretrain/Loss (Raw)": 2.2895607948303223, "Pretrain/Step": 293, "Pretrain/Step Time": 11.470500463619828} +{"Pretrain/Learning Rate": 4.9999907740286136e-05, "Pretrain/Loss": 2.3485805988311768, "Pretrain/Loss (Raw)": 2.3065342903137207, "Pretrain/Step": 294, "Pretrain/Step Time": 11.55407308228314} +{"Pretrain/Learning Rate": 4.9999883233818724e-05, "Pretrain/Loss": 2.34641432762146, "Pretrain/Loss (Raw)": 2.0290117263793945, "Pretrain/Step": 295, "Pretrain/Step Time": 11.54303901270032} +{"Pretrain/Learning Rate": 4.999985584424696e-05, "Pretrain/Loss": 2.3453006744384766, "Pretrain/Loss (Raw)": 2.221916675567627, "Pretrain/Step": 296, "Pretrain/Step Time": 11.591800907626748} +{"Pretrain/Learning Rate": 4.999982557157403e-05, "Pretrain/Loss": 2.3404862880706787, "Pretrain/Loss (Raw)": 2.0458343029022217, "Pretrain/Step": 297, "Pretrain/Step Time": 11.557370226830244} +{"Pretrain/Learning Rate": 4.9999792415803405e-05, "Pretrain/Loss": 2.3390660285949707, "Pretrain/Loss (Raw)": 2.2665581703186035, "Pretrain/Step": 298, "Pretrain/Step Time": 11.592468274757266} +{"Pretrain/Learning Rate": 4.999975637693892e-05, "Pretrain/Loss": 2.3377609252929688, "Pretrain/Loss (Raw)": 2.5483036041259766, "Pretrain/Step": 299, "Pretrain/Step Time": 11.591245334595442} +{"Pretrain/Learning Rate": 4.999971745498472e-05, "Pretrain/Loss": 2.334757089614868, "Pretrain/Loss (Raw)": 2.3541696071624756, "Pretrain/Step": 300, "Pretrain/Step Time": 11.654743680730462} +{"Pretrain/Learning Rate": 4.999967564994531e-05, "Pretrain/Loss": 2.333979368209839, "Pretrain/Loss (Raw)": 2.3324368000030518, "Pretrain/Step": 301, "Pretrain/Step Time": 11.659596901386976} +{"Pretrain/Learning Rate": 4.999963096182549e-05, "Pretrain/Loss": 2.334537982940674, "Pretrain/Loss (Raw)": 2.1931216716766357, "Pretrain/Step": 302, "Pretrain/Step Time": 11.590359622612596} +{"Pretrain/Learning Rate": 4.9999583390630435e-05, "Pretrain/Loss": 2.333261489868164, "Pretrain/Loss (Raw)": 2.3090426921844482, "Pretrain/Step": 303, "Pretrain/Step Time": 11.593702655285597} +{"Pretrain/Learning Rate": 4.999953293636562e-05, "Pretrain/Loss": 2.3329660892486572, "Pretrain/Loss (Raw)": 2.2153561115264893, "Pretrain/Step": 304, "Pretrain/Step Time": 11.630044670775533} +{"Pretrain/Learning Rate": 4.9999479599036856e-05, "Pretrain/Loss": 2.3312480449676514, "Pretrain/Loss (Raw)": 2.2756223678588867, "Pretrain/Step": 305, "Pretrain/Step Time": 11.626040127128363} +{"Pretrain/Learning Rate": 4.9999423378650315e-05, "Pretrain/Loss": 2.3294596672058105, "Pretrain/Loss (Raw)": 2.1166725158691406, "Pretrain/Step": 306, "Pretrain/Step Time": 11.6446129437536} +{"Pretrain/Learning Rate": 4.9999364275212466e-05, "Pretrain/Loss": 2.330815315246582, "Pretrain/Loss (Raw)": 2.5122218132019043, "Pretrain/Step": 307, "Pretrain/Step Time": 11.639977471902966} +{"Pretrain/Learning Rate": 4.9999302288730126e-05, "Pretrain/Loss": 2.331418037414551, "Pretrain/Loss (Raw)": 2.535245656967163, "Pretrain/Step": 308, "Pretrain/Step Time": 11.734738165512681} +{"Pretrain/Learning Rate": 4.9999237419210445e-05, "Pretrain/Loss": 2.329470634460449, "Pretrain/Loss (Raw)": 2.2443454265594482, "Pretrain/Step": 309, "Pretrain/Step Time": 11.735157134011388} +{"Pretrain/Learning Rate": 4.99991696666609e-05, "Pretrain/Loss": 2.327326536178589, "Pretrain/Loss (Raw)": 2.281137466430664, "Pretrain/Step": 310, "Pretrain/Step Time": 11.725983878597617} +{"Pretrain/Learning Rate": 4.999909903108932e-05, "Pretrain/Loss": 2.327115774154663, "Pretrain/Loss (Raw)": 2.4549295902252197, "Pretrain/Step": 311, "Pretrain/Step Time": 11.705947430804372} +{"Pretrain/Learning Rate": 4.999902551250384e-05, "Pretrain/Loss": 2.328233242034912, "Pretrain/Loss (Raw)": 2.230286121368408, "Pretrain/Step": 312, "Pretrain/Step Time": 11.711197605356574} +{"Pretrain/Learning Rate": 4.999894911091293e-05, "Pretrain/Loss": 2.329500198364258, "Pretrain/Loss (Raw)": 2.2282533645629883, "Pretrain/Step": 313, "Pretrain/Step Time": 11.671973530203104} +{"Pretrain/Learning Rate": 4.999886982632541e-05, "Pretrain/Loss": 2.328338623046875, "Pretrain/Loss (Raw)": 2.2693939208984375, "Pretrain/Step": 314, "Pretrain/Step Time": 11.678261298686266} +{"Pretrain/Learning Rate": 4.999878765875042e-05, "Pretrain/Loss": 2.3272714614868164, "Pretrain/Loss (Raw)": 2.261739492416382, "Pretrain/Step": 315, "Pretrain/Step Time": 11.684775115922093} +{"Pretrain/Learning Rate": 4.999870260819745e-05, "Pretrain/Loss": 2.3239083290100098, "Pretrain/Loss (Raw)": 2.1845552921295166, "Pretrain/Step": 316, "Pretrain/Step Time": 11.709765939041972} +{"Pretrain/Learning Rate": 4.999861467467629e-05, "Pretrain/Loss": 2.3236775398254395, "Pretrain/Loss (Raw)": 2.2724437713623047, "Pretrain/Step": 317, "Pretrain/Step Time": 11.707053704187274} +{"Pretrain/Learning Rate": 4.9998523858197094e-05, "Pretrain/Loss": 2.3234784603118896, "Pretrain/Loss (Raw)": 2.295684576034546, "Pretrain/Step": 318, "Pretrain/Step Time": 11.705737706273794} +{"Pretrain/Learning Rate": 4.999843015877032e-05, "Pretrain/Loss": 2.3234167098999023, "Pretrain/Loss (Raw)": 2.2727088928222656, "Pretrain/Step": 319, "Pretrain/Step Time": 11.70474631153047} +{"Pretrain/Learning Rate": 4.99983335764068e-05, "Pretrain/Loss": 2.324338436126709, "Pretrain/Loss (Raw)": 2.272392511367798, "Pretrain/Step": 320, "Pretrain/Step Time": 11.672632213681936} +{"Pretrain/Learning Rate": 4.999823411111765e-05, "Pretrain/Loss": 2.323190212249756, "Pretrain/Loss (Raw)": 2.2724449634552, "Pretrain/Step": 321, "Pretrain/Step Time": 11.66785648278892} +{"Pretrain/Learning Rate": 4.999813176291433e-05, "Pretrain/Loss": 2.323389768600464, "Pretrain/Loss (Raw)": 2.2992212772369385, "Pretrain/Step": 322, "Pretrain/Step Time": 11.689672576263547} +{"Pretrain/Learning Rate": 4.999802653180868e-05, "Pretrain/Loss": 2.320666790008545, "Pretrain/Loss (Raw)": 2.1120715141296387, "Pretrain/Step": 323, "Pretrain/Step Time": 11.688867768272758} +{"Pretrain/Learning Rate": 4.9997918417812805e-05, "Pretrain/Loss": 2.319624900817871, "Pretrain/Loss (Raw)": 2.2548015117645264, "Pretrain/Step": 324, "Pretrain/Step Time": 11.69402245245874} +{"Pretrain/Learning Rate": 4.999780742093919e-05, "Pretrain/Loss": 2.3203060626983643, "Pretrain/Loss (Raw)": 2.32053279876709, "Pretrain/Step": 325, "Pretrain/Step Time": 11.673743300139904} +{"Pretrain/Learning Rate": 4.999769354120063e-05, "Pretrain/Loss": 2.3160343170166016, "Pretrain/Loss (Raw)": 2.1641972064971924, "Pretrain/Step": 326, "Pretrain/Step Time": 11.685390559956431} +{"Pretrain/Learning Rate": 4.9997576778610254e-05, "Pretrain/Loss": 2.3130321502685547, "Pretrain/Loss (Raw)": 2.2406997680664062, "Pretrain/Step": 327, "Pretrain/Step Time": 11.666449768468738} +{"Pretrain/Learning Rate": 4.999745713318154e-05, "Pretrain/Loss": 2.3142666816711426, "Pretrain/Loss (Raw)": 2.3735053539276123, "Pretrain/Step": 328, "Pretrain/Step Time": 11.678507037460804} +{"Pretrain/Learning Rate": 4.999733460492826e-05, "Pretrain/Loss": 2.3104779720306396, "Pretrain/Loss (Raw)": 1.882433533668518, "Pretrain/Step": 329, "Pretrain/Step Time": 11.62322985008359} +{"Pretrain/Learning Rate": 4.999720919386457e-05, "Pretrain/Loss": 2.3090803623199463, "Pretrain/Loss (Raw)": 2.218400001525879, "Pretrain/Step": 330, "Pretrain/Step Time": 11.636186560615897} +{"Pretrain/Learning Rate": 4.999708090000493e-05, "Pretrain/Loss": 2.308255672454834, "Pretrain/Loss (Raw)": 2.22851824760437, "Pretrain/Step": 331, "Pretrain/Step Time": 11.628649203106761} +{"Pretrain/Learning Rate": 4.999694972336413e-05, "Pretrain/Loss": 2.3067564964294434, "Pretrain/Loss (Raw)": 2.272117853164673, "Pretrain/Step": 332, "Pretrain/Step Time": 11.628554737195373} +{"Pretrain/Learning Rate": 4.9996815663957296e-05, "Pretrain/Loss": 2.306765556335449, "Pretrain/Loss (Raw)": 2.190669536590576, "Pretrain/Step": 333, "Pretrain/Step Time": 11.617485893890262} +{"Pretrain/Learning Rate": 4.9996678721799893e-05, "Pretrain/Loss": 2.308492422103882, "Pretrain/Loss (Raw)": 2.6351265907287598, "Pretrain/Step": 334, "Pretrain/Step Time": 11.616481760516763} +{"Pretrain/Learning Rate": 4.999653889690771e-05, "Pretrain/Loss": 2.310441017150879, "Pretrain/Loss (Raw)": 2.4090301990509033, "Pretrain/Step": 335, "Pretrain/Step Time": 11.591782508417964} +{"Pretrain/Learning Rate": 4.9996396189296865e-05, "Pretrain/Loss": 2.3078718185424805, "Pretrain/Loss (Raw)": 2.3213424682617188, "Pretrain/Step": 336, "Pretrain/Step Time": 11.588356425985694} +{"Pretrain/Learning Rate": 4.999625059898384e-05, "Pretrain/Loss": 2.3084592819213867, "Pretrain/Loss (Raw)": 2.3717119693756104, "Pretrain/Step": 337, "Pretrain/Step Time": 11.577794820070267} +{"Pretrain/Learning Rate": 4.99961021259854e-05, "Pretrain/Loss": 2.3050222396850586, "Pretrain/Loss (Raw)": 2.2095766067504883, "Pretrain/Step": 338, "Pretrain/Step Time": 11.61930333264172} +{"Pretrain/Learning Rate": 4.999595077031868e-05, "Pretrain/Loss": 2.3114144802093506, "Pretrain/Loss (Raw)": 2.981877565383911, "Pretrain/Step": 339, "Pretrain/Step Time": 11.615989692509174} +{"Pretrain/Learning Rate": 4.9995796532001136e-05, "Pretrain/Loss": 2.3108203411102295, "Pretrain/Loss (Raw)": 2.2326536178588867, "Pretrain/Step": 340, "Pretrain/Step Time": 11.612277070060372} +{"Pretrain/Learning Rate": 4.999563941105054e-05, "Pretrain/Loss": 2.310683012008667, "Pretrain/Loss (Raw)": 2.285630226135254, "Pretrain/Step": 341, "Pretrain/Step Time": 11.616835059598088} +{"Pretrain/Learning Rate": 4.9995479407485035e-05, "Pretrain/Loss": 2.310575008392334, "Pretrain/Loss (Raw)": 2.2285189628601074, "Pretrain/Step": 342, "Pretrain/Step Time": 11.615567248314619} +{"Pretrain/Learning Rate": 4.9995316521323066e-05, "Pretrain/Loss": 2.3094186782836914, "Pretrain/Loss (Raw)": 2.2970774173736572, "Pretrain/Step": 343, "Pretrain/Step Time": 11.619820531457663} +{"Pretrain/Learning Rate": 4.99951507525834e-05, "Pretrain/Loss": 2.308474540710449, "Pretrain/Loss (Raw)": 2.389861583709717, "Pretrain/Step": 344, "Pretrain/Step Time": 11.615418139845133} +{"Pretrain/Learning Rate": 4.999498210128518e-05, "Pretrain/Loss": 2.3074796199798584, "Pretrain/Loss (Raw)": 2.220982313156128, "Pretrain/Step": 345, "Pretrain/Step Time": 11.615287559106946} +{"Pretrain/Learning Rate": 4.9994810567447834e-05, "Pretrain/Loss": 2.306027412414551, "Pretrain/Loss (Raw)": 2.3030548095703125, "Pretrain/Step": 346, "Pretrain/Step Time": 11.600152652710676} +{"Pretrain/Learning Rate": 4.9994636151091165e-05, "Pretrain/Loss": 2.304955005645752, "Pretrain/Loss (Raw)": 2.306729793548584, "Pretrain/Step": 347, "Pretrain/Step Time": 11.598277324810624} +{"Pretrain/Learning Rate": 4.999445885223527e-05, "Pretrain/Loss": 2.3043761253356934, "Pretrain/Loss (Raw)": 2.1024599075317383, "Pretrain/Step": 348, "Pretrain/Step Time": 11.55357556976378} +{"Pretrain/Learning Rate": 4.99942786709006e-05, "Pretrain/Loss": 2.3033580780029297, "Pretrain/Loss (Raw)": 2.1608378887176514, "Pretrain/Step": 349, "Pretrain/Step Time": 11.557308431714773} +{"Pretrain/Learning Rate": 4.999409560710794e-05, "Pretrain/Loss": 2.3002500534057617, "Pretrain/Loss (Raw)": 2.229933977127075, "Pretrain/Step": 350, "Pretrain/Step Time": 11.503169486299157} +{"Pretrain/Learning Rate": 4.99939096608784e-05, "Pretrain/Loss": 2.3007302284240723, "Pretrain/Loss (Raw)": 2.3063478469848633, "Pretrain/Step": 351, "Pretrain/Step Time": 11.502798227593303} +{"Pretrain/Learning Rate": 4.999372083223343e-05, "Pretrain/Loss": 2.300628423690796, "Pretrain/Loss (Raw)": 2.176602602005005, "Pretrain/Step": 352, "Pretrain/Step Time": 11.489623924717307} +{"Pretrain/Learning Rate": 4.999352912119478e-05, "Pretrain/Loss": 2.3011221885681152, "Pretrain/Loss (Raw)": 2.299644947052002, "Pretrain/Step": 353, "Pretrain/Step Time": 11.492293402552605} +{"Pretrain/Learning Rate": 4.999333452778459e-05, "Pretrain/Loss": 2.3008804321289062, "Pretrain/Loss (Raw)": 2.2625393867492676, "Pretrain/Step": 354, "Pretrain/Step Time": 11.475800409913063} +{"Pretrain/Learning Rate": 4.999313705202529e-05, "Pretrain/Loss": 2.2999181747436523, "Pretrain/Loss (Raw)": 2.1317429542541504, "Pretrain/Step": 355, "Pretrain/Step Time": 11.471176372841} +{"Pretrain/Learning Rate": 4.999293669393965e-05, "Pretrain/Loss": 2.3006839752197266, "Pretrain/Loss (Raw)": 2.2920045852661133, "Pretrain/Step": 356, "Pretrain/Step Time": 11.448299845680594} +{"Pretrain/Learning Rate": 4.999273345355078e-05, "Pretrain/Loss": 2.3005404472351074, "Pretrain/Loss (Raw)": 2.2865912914276123, "Pretrain/Step": 357, "Pretrain/Step Time": 11.441700143739581} +{"Pretrain/Learning Rate": 4.9992527330882125e-05, "Pretrain/Loss": 2.297079086303711, "Pretrain/Loss (Raw)": 2.1267521381378174, "Pretrain/Step": 358, "Pretrain/Step Time": 11.449364546686411} +{"Pretrain/Learning Rate": 4.999231832595744e-05, "Pretrain/Loss": 2.296976089477539, "Pretrain/Loss (Raw)": 2.2794036865234375, "Pretrain/Step": 359, "Pretrain/Step Time": 11.446619091555476} +{"Pretrain/Learning Rate": 4.9992106438800846e-05, "Pretrain/Loss": 2.2963180541992188, "Pretrain/Loss (Raw)": 2.2746589183807373, "Pretrain/Step": 360, "Pretrain/Step Time": 11.450139032676816} +{"Pretrain/Learning Rate": 4.999189166943677e-05, "Pretrain/Loss": 2.2965173721313477, "Pretrain/Loss (Raw)": 2.164846181869507, "Pretrain/Step": 361, "Pretrain/Step Time": 11.47361901961267} +{"Pretrain/Learning Rate": 4.999167401788998e-05, "Pretrain/Loss": 2.296419620513916, "Pretrain/Loss (Raw)": 2.2709014415740967, "Pretrain/Step": 362, "Pretrain/Step Time": 11.46802812628448} +{"Pretrain/Learning Rate": 4.9991453484185577e-05, "Pretrain/Loss": 2.293527126312256, "Pretrain/Loss (Raw)": 2.1338934898376465, "Pretrain/Step": 363, "Pretrain/Step Time": 11.497961664572358} +{"Pretrain/Learning Rate": 4.999123006834899e-05, "Pretrain/Loss": 2.294205665588379, "Pretrain/Loss (Raw)": 2.248948097229004, "Pretrain/Step": 364, "Pretrain/Step Time": 11.479036377742887} +{"Pretrain/Learning Rate": 4.9991003770405994e-05, "Pretrain/Loss": 2.2930350303649902, "Pretrain/Loss (Raw)": 2.4175119400024414, "Pretrain/Step": 365, "Pretrain/Step Time": 11.477585883811116} +{"Pretrain/Learning Rate": 4.999077459038268e-05, "Pretrain/Loss": 2.2915244102478027, "Pretrain/Loss (Raw)": 2.1248106956481934, "Pretrain/Step": 366, "Pretrain/Step Time": 11.434038002043962} +{"Pretrain/Learning Rate": 4.9990542528305484e-05, "Pretrain/Loss": 2.2877135276794434, "Pretrain/Loss (Raw)": 2.086604595184326, "Pretrain/Step": 367, "Pretrain/Step Time": 11.41517186909914} +{"Pretrain/Learning Rate": 4.999030758420116e-05, "Pretrain/Loss": 2.2867634296417236, "Pretrain/Loss (Raw)": 2.173828125, "Pretrain/Step": 368, "Pretrain/Step Time": 11.427148140966892} +{"Pretrain/Learning Rate": 4.999006975809681e-05, "Pretrain/Loss": 2.285064697265625, "Pretrain/Loss (Raw)": 2.140132427215576, "Pretrain/Step": 369, "Pretrain/Step Time": 11.398505043238401} +{"Pretrain/Learning Rate": 4.998982905001986e-05, "Pretrain/Loss": 2.2852134704589844, "Pretrain/Loss (Raw)": 2.4336771965026855, "Pretrain/Step": 370, "Pretrain/Step Time": 11.409421814605594} +{"Pretrain/Learning Rate": 4.998958545999806e-05, "Pretrain/Loss": 2.2836217880249023, "Pretrain/Loss (Raw)": 2.1374759674072266, "Pretrain/Step": 371, "Pretrain/Step Time": 11.371658198535442} +{"Pretrain/Learning Rate": 4.998933898805951e-05, "Pretrain/Loss": 2.2847437858581543, "Pretrain/Loss (Raw)": 2.1943883895874023, "Pretrain/Step": 372, "Pretrain/Step Time": 11.36826617270708} +{"Pretrain/Learning Rate": 4.9989089634232645e-05, "Pretrain/Loss": 2.2859930992126465, "Pretrain/Loss (Raw)": 2.472606658935547, "Pretrain/Step": 373, "Pretrain/Step Time": 11.358396384865046} +{"Pretrain/Learning Rate": 4.9988837398546206e-05, "Pretrain/Loss": 2.2878530025482178, "Pretrain/Loss (Raw)": 2.387617826461792, "Pretrain/Step": 374, "Pretrain/Step Time": 11.410220945253968} +{"Pretrain/Learning Rate": 4.9988582281029284e-05, "Pretrain/Loss": 2.2865638732910156, "Pretrain/Loss (Raw)": 2.3210577964782715, "Pretrain/Step": 375, "Pretrain/Step Time": 11.370063045993447} +{"Pretrain/Learning Rate": 4.998832428171131e-05, "Pretrain/Loss": 2.2875051498413086, "Pretrain/Loss (Raw)": 2.2153160572052, "Pretrain/Step": 376, "Pretrain/Step Time": 11.376219399273396} +{"Pretrain/Learning Rate": 4.998806340062202e-05, "Pretrain/Loss": 2.287691116333008, "Pretrain/Loss (Raw)": 2.2933461666107178, "Pretrain/Step": 377, "Pretrain/Step Time": 11.33780095539987} +{"Pretrain/Learning Rate": 4.998779963779152e-05, "Pretrain/Loss": 2.2882773876190186, "Pretrain/Loss (Raw)": 2.240398406982422, "Pretrain/Step": 378, "Pretrain/Step Time": 11.340990575030446} +{"Pretrain/Learning Rate": 4.998753299325021e-05, "Pretrain/Loss": 2.2894911766052246, "Pretrain/Loss (Raw)": 2.382267951965332, "Pretrain/Step": 379, "Pretrain/Step Time": 11.296759089455009} +{"Pretrain/Learning Rate": 4.998726346702886e-05, "Pretrain/Loss": 2.290198564529419, "Pretrain/Loss (Raw)": 2.26374888420105, "Pretrain/Step": 380, "Pretrain/Step Time": 11.284816643223166} +{"Pretrain/Learning Rate": 4.998699105915854e-05, "Pretrain/Loss": 2.289616107940674, "Pretrain/Loss (Raw)": 2.268003463745117, "Pretrain/Step": 381, "Pretrain/Step Time": 11.27961110509932} +{"Pretrain/Learning Rate": 4.9986715769670665e-05, "Pretrain/Loss": 2.289473056793213, "Pretrain/Loss (Raw)": 2.2487478256225586, "Pretrain/Step": 382, "Pretrain/Step Time": 11.307612173259258} +{"Pretrain/Learning Rate": 4.998643759859699e-05, "Pretrain/Loss": 2.290067195892334, "Pretrain/Loss (Raw)": 2.4633045196533203, "Pretrain/Step": 383, "Pretrain/Step Time": 11.344206511974335} +{"Pretrain/Learning Rate": 4.998615654596959e-05, "Pretrain/Loss": 2.2888996601104736, "Pretrain/Loss (Raw)": 2.0931015014648438, "Pretrain/Step": 384, "Pretrain/Step Time": 11.325315047055483} +{"Pretrain/Learning Rate": 4.9985872611820885e-05, "Pretrain/Loss": 2.2900819778442383, "Pretrain/Loss (Raw)": 2.4173293113708496, "Pretrain/Step": 385, "Pretrain/Step Time": 11.315934946760535} +{"Pretrain/Learning Rate": 4.9985585796183605e-05, "Pretrain/Loss": 2.287722587585449, "Pretrain/Loss (Raw)": 2.0950403213500977, "Pretrain/Step": 386, "Pretrain/Step Time": 11.321168651804328} +{"Pretrain/Learning Rate": 4.998529609909084e-05, "Pretrain/Loss": 2.285149574279785, "Pretrain/Loss (Raw)": 2.205418109893799, "Pretrain/Step": 387, "Pretrain/Step Time": 11.272975351661444} +{"Pretrain/Learning Rate": 4.998500352057599e-05, "Pretrain/Loss": 2.2855334281921387, "Pretrain/Loss (Raw)": 2.3361055850982666, "Pretrain/Step": 388, "Pretrain/Step Time": 11.279984382912517} +{"Pretrain/Learning Rate": 4.9984708060672805e-05, "Pretrain/Loss": 2.2870988845825195, "Pretrain/Loss (Raw)": 2.382098913192749, "Pretrain/Step": 389, "Pretrain/Step Time": 11.281950194388628} +{"Pretrain/Learning Rate": 4.9984409719415345e-05, "Pretrain/Loss": 2.2867207527160645, "Pretrain/Loss (Raw)": 2.195375680923462, "Pretrain/Step": 390, "Pretrain/Step Time": 11.263463728129864} +{"Pretrain/Learning Rate": 4.9984108496838034e-05, "Pretrain/Loss": 2.2876596450805664, "Pretrain/Loss (Raw)": 2.228771686553955, "Pretrain/Step": 391, "Pretrain/Step Time": 11.244794443249702} +{"Pretrain/Learning Rate": 4.99838043929756e-05, "Pretrain/Loss": 2.2858598232269287, "Pretrain/Loss (Raw)": 2.1496121883392334, "Pretrain/Step": 392, "Pretrain/Step Time": 11.240715701133013} +{"Pretrain/Learning Rate": 4.9983497407863114e-05, "Pretrain/Loss": 2.2869315147399902, "Pretrain/Loss (Raw)": 2.5121381282806396, "Pretrain/Step": 393, "Pretrain/Step Time": 11.244235271587968} +{"Pretrain/Learning Rate": 4.9983187541535984e-05, "Pretrain/Loss": 2.2870988845825195, "Pretrain/Loss (Raw)": 2.6410086154937744, "Pretrain/Step": 394, "Pretrain/Step Time": 11.232418805360794} +{"Pretrain/Learning Rate": 4.998287479402994e-05, "Pretrain/Loss": 2.287297248840332, "Pretrain/Loss (Raw)": 2.451483726501465, "Pretrain/Step": 395, "Pretrain/Step Time": 11.236996337771416} +{"Pretrain/Learning Rate": 4.998255916538106e-05, "Pretrain/Loss": 2.2847726345062256, "Pretrain/Loss (Raw)": 2.217906951904297, "Pretrain/Step": 396, "Pretrain/Step Time": 11.244300374761224} +{"Pretrain/Learning Rate": 4.998224065562572e-05, "Pretrain/Loss": 2.2842254638671875, "Pretrain/Loss (Raw)": 2.256074905395508, "Pretrain/Step": 397, "Pretrain/Step Time": 11.236885277554393} +{"Pretrain/Learning Rate": 4.998191926480068e-05, "Pretrain/Loss": 2.2836427688598633, "Pretrain/Loss (Raw)": 2.227325201034546, "Pretrain/Step": 398, "Pretrain/Step Time": 11.24956583045423} +{"Pretrain/Learning Rate": 4.998159499294299e-05, "Pretrain/Loss": 2.28167724609375, "Pretrain/Loss (Raw)": 2.431619882583618, "Pretrain/Step": 399, "Pretrain/Step Time": 11.243615513667464} +{"Pretrain/Learning Rate": 4.998126784009005e-05, "Pretrain/Loss": 2.2804908752441406, "Pretrain/Loss (Raw)": 2.163105010986328, "Pretrain/Step": 400, "Pretrain/Step Time": 11.20656561665237} +{"Pretrain/Learning Rate": 4.998093780627958e-05, "Pretrain/Loss": 2.280221700668335, "Pretrain/Loss (Raw)": 2.277200222015381, "Pretrain/Step": 401, "Pretrain/Step Time": 11.225892441347241} +{"Pretrain/Learning Rate": 4.9980604891549656e-05, "Pretrain/Loss": 2.2804455757141113, "Pretrain/Loss (Raw)": 2.25656795501709, "Pretrain/Step": 402, "Pretrain/Step Time": 11.230268565937877} +{"Pretrain/Learning Rate": 4.998026909593865e-05, "Pretrain/Loss": 2.280944347381592, "Pretrain/Loss (Raw)": 2.240929126739502, "Pretrain/Step": 403, "Pretrain/Step Time": 11.257972089573741} +{"Pretrain/Learning Rate": 4.997993041948531e-05, "Pretrain/Loss": 2.2832772731781006, "Pretrain/Loss (Raw)": 2.440004587173462, "Pretrain/Step": 404, "Pretrain/Step Time": 11.220373744145036} +{"Pretrain/Learning Rate": 4.997958886222869e-05, "Pretrain/Loss": 2.2837142944335938, "Pretrain/Loss (Raw)": 2.333303451538086, "Pretrain/Step": 405, "Pretrain/Step Time": 11.283750930801034} +{"Pretrain/Learning Rate": 4.9979244424208165e-05, "Pretrain/Loss": 2.2818260192871094, "Pretrain/Loss (Raw)": 2.226576566696167, "Pretrain/Step": 406, "Pretrain/Step Time": 11.234580030664802} +{"Pretrain/Learning Rate": 4.997889710546347e-05, "Pretrain/Loss": 2.2802531719207764, "Pretrain/Loss (Raw)": 2.109971523284912, "Pretrain/Step": 407, "Pretrain/Step Time": 11.248712453991175} +{"Pretrain/Learning Rate": 4.9978546906034655e-05, "Pretrain/Loss": 2.2789926528930664, "Pretrain/Loss (Raw)": 2.0957822799682617, "Pretrain/Step": 408, "Pretrain/Step Time": 11.205668572336435} +{"Pretrain/Learning Rate": 4.997819382596212e-05, "Pretrain/Loss": 2.278717041015625, "Pretrain/Loss (Raw)": 2.198413372039795, "Pretrain/Step": 409, "Pretrain/Step Time": 11.209340197965503} +{"Pretrain/Learning Rate": 4.997783786528656e-05, "Pretrain/Loss": 2.279304265975952, "Pretrain/Loss (Raw)": 2.324432373046875, "Pretrain/Step": 410, "Pretrain/Step Time": 11.17719310335815} +{"Pretrain/Learning Rate": 4.997747902404904e-05, "Pretrain/Loss": 2.2783877849578857, "Pretrain/Loss (Raw)": 2.2694060802459717, "Pretrain/Step": 411, "Pretrain/Step Time": 11.177015325054526} +{"Pretrain/Learning Rate": 4.997711730229094e-05, "Pretrain/Loss": 2.276902675628662, "Pretrain/Loss (Raw)": 2.2526919841766357, "Pretrain/Step": 412, "Pretrain/Step Time": 11.16542011871934} +{"Pretrain/Learning Rate": 4.9976752700053975e-05, "Pretrain/Loss": 2.274735927581787, "Pretrain/Loss (Raw)": 2.2088799476623535, "Pretrain/Step": 413, "Pretrain/Step Time": 11.130686720833182} +{"Pretrain/Learning Rate": 4.9976385217380195e-05, "Pretrain/Loss": 2.2758774757385254, "Pretrain/Loss (Raw)": 2.4416825771331787, "Pretrain/Step": 414, "Pretrain/Step Time": 11.137129127979279} +{"Pretrain/Learning Rate": 4.997601485431198e-05, "Pretrain/Loss": 2.275263786315918, "Pretrain/Loss (Raw)": 2.1684439182281494, "Pretrain/Step": 415, "Pretrain/Step Time": 11.086750576272607} +{"Pretrain/Learning Rate": 4.997564161089204e-05, "Pretrain/Loss": 2.2738547325134277, "Pretrain/Loss (Raw)": 2.2041146755218506, "Pretrain/Step": 416, "Pretrain/Step Time": 11.117199044674635} +{"Pretrain/Learning Rate": 4.9975265487163424e-05, "Pretrain/Loss": 2.273040771484375, "Pretrain/Loss (Raw)": 2.2440598011016846, "Pretrain/Step": 417, "Pretrain/Step Time": 11.125403508543968} +{"Pretrain/Learning Rate": 4.997488648316951e-05, "Pretrain/Loss": 2.2734298706054688, "Pretrain/Loss (Raw)": 2.3224873542785645, "Pretrain/Step": 418, "Pretrain/Step Time": 11.02841455861926} +{"Pretrain/Learning Rate": 4.997450459895399e-05, "Pretrain/Loss": 2.272871494293213, "Pretrain/Loss (Raw)": 2.2721009254455566, "Pretrain/Step": 419, "Pretrain/Step Time": 11.078089501708746} +{"Pretrain/Learning Rate": 4.997411983456092e-05, "Pretrain/Loss": 2.272413969039917, "Pretrain/Loss (Raw)": 2.1232028007507324, "Pretrain/Step": 420, "Pretrain/Step Time": 11.058991372585297} +{"Pretrain/Learning Rate": 4.9973732190034674e-05, "Pretrain/Loss": 2.2716732025146484, "Pretrain/Loss (Raw)": 2.194718599319458, "Pretrain/Step": 421, "Pretrain/Step Time": 11.063134020194411} +{"Pretrain/Learning Rate": 4.9973341665419946e-05, "Pretrain/Loss": 2.2731127738952637, "Pretrain/Loss (Raw)": 2.4908359050750732, "Pretrain/Step": 422, "Pretrain/Step Time": 10.986892277374864} +{"Pretrain/Learning Rate": 4.997294826076178e-05, "Pretrain/Loss": 2.274742841720581, "Pretrain/Loss (Raw)": 2.2376627922058105, "Pretrain/Step": 423, "Pretrain/Step Time": 11.029891934245825} +{"Pretrain/Learning Rate": 4.9972551976105545e-05, "Pretrain/Loss": 2.274094581604004, "Pretrain/Loss (Raw)": 2.1389236450195312, "Pretrain/Step": 424, "Pretrain/Step Time": 10.982654029503465} +{"Pretrain/Learning Rate": 4.9972152811496945e-05, "Pretrain/Loss": 2.2773666381835938, "Pretrain/Loss (Raw)": 2.464665412902832, "Pretrain/Step": 425, "Pretrain/Step Time": 10.99744975566864} +{"Pretrain/Learning Rate": 4.9971750766982e-05, "Pretrain/Loss": 2.2769455909729004, "Pretrain/Loss (Raw)": 2.2126598358154297, "Pretrain/Step": 426, "Pretrain/Step Time": 10.942975252866745} +{"Pretrain/Learning Rate": 4.9971345842607095e-05, "Pretrain/Loss": 2.274648666381836, "Pretrain/Loss (Raw)": 2.2543044090270996, "Pretrain/Step": 427, "Pretrain/Step Time": 10.981511075049639} +{"Pretrain/Learning Rate": 4.997093803841891e-05, "Pretrain/Loss": 2.272783041000366, "Pretrain/Loss (Raw)": 2.115361213684082, "Pretrain/Step": 428, "Pretrain/Step Time": 10.908141497522593} +{"Pretrain/Learning Rate": 4.997052735446449e-05, "Pretrain/Loss": 2.2718112468719482, "Pretrain/Loss (Raw)": 2.208045721054077, "Pretrain/Step": 429, "Pretrain/Step Time": 10.935301903635263} +{"Pretrain/Learning Rate": 4.997011379079119e-05, "Pretrain/Loss": 2.2723469734191895, "Pretrain/Loss (Raw)": 2.261678695678711, "Pretrain/Step": 430, "Pretrain/Step Time": 10.920790068805218} +{"Pretrain/Learning Rate": 4.996969734744671e-05, "Pretrain/Loss": 2.27152681350708, "Pretrain/Loss (Raw)": 2.204092264175415, "Pretrain/Step": 431, "Pretrain/Step Time": 10.960215006023645} +{"Pretrain/Learning Rate": 4.996927802447906e-05, "Pretrain/Loss": 2.2728703022003174, "Pretrain/Loss (Raw)": 2.38729190826416, "Pretrain/Step": 432, "Pretrain/Step Time": 10.914090825244784} +{"Pretrain/Learning Rate": 4.9968855821936613e-05, "Pretrain/Loss": 2.2730603218078613, "Pretrain/Loss (Raw)": 2.2999372482299805, "Pretrain/Step": 433, "Pretrain/Step Time": 10.939506836235523} +{"Pretrain/Learning Rate": 4.9968430739868056e-05, "Pretrain/Loss": 2.2738242149353027, "Pretrain/Loss (Raw)": 2.214447021484375, "Pretrain/Step": 434, "Pretrain/Step Time": 10.9240433704108} +{"Pretrain/Learning Rate": 4.9968002778322406e-05, "Pretrain/Loss": 2.273332118988037, "Pretrain/Loss (Raw)": 2.44923734664917, "Pretrain/Step": 435, "Pretrain/Step Time": 10.924700809642673} +{"Pretrain/Learning Rate": 4.9967571937349034e-05, "Pretrain/Loss": 2.270704507827759, "Pretrain/Loss (Raw)": 2.1989309787750244, "Pretrain/Step": 436, "Pretrain/Step Time": 10.84517770074308} +{"Pretrain/Learning Rate": 4.996713821699761e-05, "Pretrain/Loss": 2.271137237548828, "Pretrain/Loss (Raw)": 2.2997498512268066, "Pretrain/Step": 437, "Pretrain/Step Time": 10.842155097052455} +{"Pretrain/Learning Rate": 4.9966701617318154e-05, "Pretrain/Loss": 2.2715835571289062, "Pretrain/Loss (Raw)": 2.3382792472839355, "Pretrain/Step": 438, "Pretrain/Step Time": 10.88964145258069} +{"Pretrain/Learning Rate": 4.996626213836103e-05, "Pretrain/Loss": 2.270885944366455, "Pretrain/Loss (Raw)": 2.365622043609619, "Pretrain/Step": 439, "Pretrain/Step Time": 10.8855707552284} +{"Pretrain/Learning Rate": 4.99658197801769e-05, "Pretrain/Loss": 2.2721710205078125, "Pretrain/Loss (Raw)": 2.394763946533203, "Pretrain/Step": 440, "Pretrain/Step Time": 10.911544790491462} +{"Pretrain/Learning Rate": 4.99653745428168e-05, "Pretrain/Loss": 2.2719807624816895, "Pretrain/Loss (Raw)": 2.203892707824707, "Pretrain/Step": 441, "Pretrain/Step Time": 10.910119006410241} +{"Pretrain/Learning Rate": 4.9964926426332056e-05, "Pretrain/Loss": 2.2713630199432373, "Pretrain/Loss (Raw)": 2.190314292907715, "Pretrain/Step": 442, "Pretrain/Step Time": 10.926839785650373} +{"Pretrain/Learning Rate": 4.9964475430774364e-05, "Pretrain/Loss": 2.2722935676574707, "Pretrain/Loss (Raw)": 2.3808820247650146, "Pretrain/Step": 443, "Pretrain/Step Time": 10.929180465638638} +{"Pretrain/Learning Rate": 4.996402155619573e-05, "Pretrain/Loss": 2.272555351257324, "Pretrain/Loss (Raw)": 2.218064546585083, "Pretrain/Step": 444, "Pretrain/Step Time": 10.888838935643435} +{"Pretrain/Learning Rate": 4.9963564802648494e-05, "Pretrain/Loss": 2.2713310718536377, "Pretrain/Loss (Raw)": 2.115725517272949, "Pretrain/Step": 445, "Pretrain/Step Time": 10.890232285484672} +{"Pretrain/Learning Rate": 4.9963105170185334e-05, "Pretrain/Loss": 2.2701451778411865, "Pretrain/Loss (Raw)": 2.14387845993042, "Pretrain/Step": 446, "Pretrain/Step Time": 10.84260543808341} +{"Pretrain/Learning Rate": 4.9962642658859255e-05, "Pretrain/Loss": 2.2698817253112793, "Pretrain/Loss (Raw)": 2.2389943599700928, "Pretrain/Step": 447, "Pretrain/Step Time": 10.839986773207784} +{"Pretrain/Learning Rate": 4.99621772687236e-05, "Pretrain/Loss": 2.2694480419158936, "Pretrain/Loss (Raw)": 2.216860771179199, "Pretrain/Step": 448, "Pretrain/Step Time": 10.811666741967201} +{"Pretrain/Learning Rate": 4.996170899983203e-05, "Pretrain/Loss": 2.26955509185791, "Pretrain/Loss (Raw)": 2.28615403175354, "Pretrain/Step": 449, "Pretrain/Step Time": 10.814209481701255} +{"Pretrain/Learning Rate": 4.9961237852238554e-05, "Pretrain/Loss": 2.2682273387908936, "Pretrain/Loss (Raw)": 2.1292548179626465, "Pretrain/Step": 450, "Pretrain/Step Time": 10.77535123564303} +{"Pretrain/Learning Rate": 4.996076382599752e-05, "Pretrain/Loss": 2.2700319290161133, "Pretrain/Loss (Raw)": 2.343104600906372, "Pretrain/Step": 451, "Pretrain/Step Time": 10.784667721018195} +{"Pretrain/Learning Rate": 4.996028692116357e-05, "Pretrain/Loss": 2.2694449424743652, "Pretrain/Loss (Raw)": 2.1796493530273438, "Pretrain/Step": 452, "Pretrain/Step Time": 10.821976510807872} +{"Pretrain/Learning Rate": 4.995980713779172e-05, "Pretrain/Loss": 2.2704288959503174, "Pretrain/Loss (Raw)": 2.44647216796875, "Pretrain/Step": 453, "Pretrain/Step Time": 10.833737039938569} +{"Pretrain/Learning Rate": 4.9959324475937297e-05, "Pretrain/Loss": 2.2712388038635254, "Pretrain/Loss (Raw)": 2.2678539752960205, "Pretrain/Step": 454, "Pretrain/Step Time": 10.848940571770072} +{"Pretrain/Learning Rate": 4.995883893565596e-05, "Pretrain/Loss": 2.269820213317871, "Pretrain/Loss (Raw)": 2.059147834777832, "Pretrain/Step": 455, "Pretrain/Step Time": 10.870787918567657} +{"Pretrain/Learning Rate": 4.995835051700371e-05, "Pretrain/Loss": 2.268174171447754, "Pretrain/Loss (Raw)": 2.1627719402313232, "Pretrain/Step": 456, "Pretrain/Step Time": 10.890056002885103} +{"Pretrain/Learning Rate": 4.995785922003687e-05, "Pretrain/Loss": 2.2704691886901855, "Pretrain/Loss (Raw)": 2.1762142181396484, "Pretrain/Step": 457, "Pretrain/Step Time": 10.891965914517641} +{"Pretrain/Learning Rate": 4.9957365044812097e-05, "Pretrain/Loss": 2.2729153633117676, "Pretrain/Loss (Raw)": 2.5315120220184326, "Pretrain/Step": 458, "Pretrain/Step Time": 10.886440079659224} +{"Pretrain/Learning Rate": 4.995686799138639e-05, "Pretrain/Loss": 2.2731966972351074, "Pretrain/Loss (Raw)": 2.264564275741577, "Pretrain/Step": 459, "Pretrain/Step Time": 10.879441175609827} +{"Pretrain/Learning Rate": 4.995636805981706e-05, "Pretrain/Loss": 2.272658348083496, "Pretrain/Loss (Raw)": 2.2032012939453125, "Pretrain/Step": 460, "Pretrain/Step Time": 10.861042331904173} +{"Pretrain/Learning Rate": 4.9955865250161774e-05, "Pretrain/Loss": 2.2717299461364746, "Pretrain/Loss (Raw)": 2.0718116760253906, "Pretrain/Step": 461, "Pretrain/Step Time": 10.858231775462627} +{"Pretrain/Learning Rate": 4.9955359562478504e-05, "Pretrain/Loss": 2.2681145668029785, "Pretrain/Loss (Raw)": 2.1723721027374268, "Pretrain/Step": 462, "Pretrain/Step Time": 10.815735699608922} +{"Pretrain/Learning Rate": 4.995485099682558e-05, "Pretrain/Loss": 2.266183614730835, "Pretrain/Loss (Raw)": 2.161863088607788, "Pretrain/Step": 463, "Pretrain/Step Time": 10.82750897668302} +{"Pretrain/Learning Rate": 4.995433955326165e-05, "Pretrain/Loss": 2.2667605876922607, "Pretrain/Loss (Raw)": 2.395171880722046, "Pretrain/Step": 464, "Pretrain/Step Time": 10.78794782049954} +{"Pretrain/Learning Rate": 4.995382523184569e-05, "Pretrain/Loss": 2.265878915786743, "Pretrain/Loss (Raw)": 2.258880138397217, "Pretrain/Step": 465, "Pretrain/Step Time": 10.788497567176819} +{"Pretrain/Learning Rate": 4.9953308032637016e-05, "Pretrain/Loss": 2.265176296234131, "Pretrain/Loss (Raw)": 2.1196341514587402, "Pretrain/Step": 466, "Pretrain/Step Time": 10.731625584885478} +{"Pretrain/Learning Rate": 4.995278795569528e-05, "Pretrain/Loss": 2.258807897567749, "Pretrain/Loss (Raw)": 2.1667330265045166, "Pretrain/Step": 467, "Pretrain/Step Time": 10.767208037897944} +{"Pretrain/Learning Rate": 4.995226500108046e-05, "Pretrain/Loss": 2.2580924034118652, "Pretrain/Loss (Raw)": 2.141073703765869, "Pretrain/Step": 468, "Pretrain/Step Time": 10.775906570255756} +{"Pretrain/Learning Rate": 4.995173916885285e-05, "Pretrain/Loss": 2.2575430870056152, "Pretrain/Loss (Raw)": 2.2152810096740723, "Pretrain/Step": 469, "Pretrain/Step Time": 10.771819211542606} +{"Pretrain/Learning Rate": 4.9951210459073105e-05, "Pretrain/Loss": 2.2587859630584717, "Pretrain/Loss (Raw)": 2.387638568878174, "Pretrain/Step": 470, "Pretrain/Step Time": 10.769870856776834} +{"Pretrain/Learning Rate": 4.99506788718022e-05, "Pretrain/Loss": 2.259500503540039, "Pretrain/Loss (Raw)": 2.388519763946533, "Pretrain/Step": 471, "Pretrain/Step Time": 10.773031610995531} +{"Pretrain/Learning Rate": 4.995014440710144e-05, "Pretrain/Loss": 2.259768009185791, "Pretrain/Loss (Raw)": 2.4240856170654297, "Pretrain/Step": 472, "Pretrain/Step Time": 10.767318783327937} +{"Pretrain/Learning Rate": 4.9949607065032445e-05, "Pretrain/Loss": 2.2605690956115723, "Pretrain/Loss (Raw)": 2.3235251903533936, "Pretrain/Step": 473, "Pretrain/Step Time": 10.769899055361748} +{"Pretrain/Learning Rate": 4.99490668456572e-05, "Pretrain/Loss": 2.2600655555725098, "Pretrain/Loss (Raw)": 2.2386162281036377, "Pretrain/Step": 474, "Pretrain/Step Time": 10.743090607225895} +{"Pretrain/Learning Rate": 4.994852374903801e-05, "Pretrain/Loss": 2.2600982189178467, "Pretrain/Loss (Raw)": 2.3109354972839355, "Pretrain/Step": 475, "Pretrain/Step Time": 10.744337134063244} +{"Pretrain/Learning Rate": 4.99479777752375e-05, "Pretrain/Loss": 2.2608895301818848, "Pretrain/Loss (Raw)": 2.203705072402954, "Pretrain/Step": 476, "Pretrain/Step Time": 10.723110994324088} +{"Pretrain/Learning Rate": 4.994742892431863e-05, "Pretrain/Loss": 2.2613868713378906, "Pretrain/Loss (Raw)": 2.2244985103607178, "Pretrain/Step": 477, "Pretrain/Step Time": 10.718815634027123} +{"Pretrain/Learning Rate": 4.99468771963447e-05, "Pretrain/Loss": 2.261300802230835, "Pretrain/Loss (Raw)": 2.2189552783966064, "Pretrain/Step": 478, "Pretrain/Step Time": 10.739104254171252} +{"Pretrain/Learning Rate": 4.994632259137935e-05, "Pretrain/Loss": 2.2606301307678223, "Pretrain/Loss (Raw)": 2.2204837799072266, "Pretrain/Step": 479, "Pretrain/Step Time": 10.748782277107239} +{"Pretrain/Learning Rate": 4.9945765109486506e-05, "Pretrain/Loss": 2.260546922683716, "Pretrain/Loss (Raw)": 2.165944814682007, "Pretrain/Step": 480, "Pretrain/Step Time": 10.730065478011966} +{"Pretrain/Learning Rate": 4.99452047507305e-05, "Pretrain/Loss": 2.2602877616882324, "Pretrain/Loss (Raw)": 2.2664785385131836, "Pretrain/Step": 481, "Pretrain/Step Time": 10.747079737484455} +{"Pretrain/Learning Rate": 4.994464151517593e-05, "Pretrain/Loss": 2.260118007659912, "Pretrain/Loss (Raw)": 2.2408249378204346, "Pretrain/Step": 482, "Pretrain/Step Time": 10.739147244021297} +{"Pretrain/Learning Rate": 4.994407540288775e-05, "Pretrain/Loss": 2.260892152786255, "Pretrain/Loss (Raw)": 2.230815887451172, "Pretrain/Step": 483, "Pretrain/Step Time": 10.749324599280953} +{"Pretrain/Learning Rate": 4.994350641393126e-05, "Pretrain/Loss": 2.26043701171875, "Pretrain/Loss (Raw)": 2.233750581741333, "Pretrain/Step": 484, "Pretrain/Step Time": 10.72306983731687} +{"Pretrain/Learning Rate": 4.9942934548372077e-05, "Pretrain/Loss": 2.258760929107666, "Pretrain/Loss (Raw)": 2.0720317363739014, "Pretrain/Step": 485, "Pretrain/Step Time": 10.725303364917636} +{"Pretrain/Learning Rate": 4.994235980627614e-05, "Pretrain/Loss": 2.2607407569885254, "Pretrain/Loss (Raw)": 2.3801846504211426, "Pretrain/Step": 486, "Pretrain/Step Time": 10.737627865746617} +{"Pretrain/Learning Rate": 4.9941782187709746e-05, "Pretrain/Loss": 2.2595813274383545, "Pretrain/Loss (Raw)": 2.1310207843780518, "Pretrain/Step": 487, "Pretrain/Step Time": 10.729829473420978} +{"Pretrain/Learning Rate": 4.994120169273949e-05, "Pretrain/Loss": 2.259769916534424, "Pretrain/Loss (Raw)": 2.298767566680908, "Pretrain/Step": 488, "Pretrain/Step Time": 10.729067761451006} +{"Pretrain/Learning Rate": 4.9940618321432344e-05, "Pretrain/Loss": 2.2605276107788086, "Pretrain/Loss (Raw)": 2.261833906173706, "Pretrain/Step": 489, "Pretrain/Step Time": 10.714403746649623} +{"Pretrain/Learning Rate": 4.994003207385556e-05, "Pretrain/Loss": 2.2612059116363525, "Pretrain/Loss (Raw)": 2.3577370643615723, "Pretrain/Step": 490, "Pretrain/Step Time": 10.714114215224981} +{"Pretrain/Learning Rate": 4.9939442950076755e-05, "Pretrain/Loss": 2.2621917724609375, "Pretrain/Loss (Raw)": 2.260087728500366, "Pretrain/Step": 491, "Pretrain/Step Time": 10.73540329001844} +{"Pretrain/Learning Rate": 4.9938850950163864e-05, "Pretrain/Loss": 2.263071060180664, "Pretrain/Loss (Raw)": 2.3614871501922607, "Pretrain/Step": 492, "Pretrain/Step Time": 10.726112434640527} +{"Pretrain/Learning Rate": 4.9938256074185174e-05, "Pretrain/Loss": 2.259406328201294, "Pretrain/Loss (Raw)": 1.9484288692474365, "Pretrain/Step": 493, "Pretrain/Step Time": 10.693936914205551} +{"Pretrain/Learning Rate": 4.993765832220928e-05, "Pretrain/Loss": 2.2617411613464355, "Pretrain/Loss (Raw)": 2.423659086227417, "Pretrain/Step": 494, "Pretrain/Step Time": 10.679879620671272} +{"Pretrain/Learning Rate": 4.993705769430511e-05, "Pretrain/Loss": 2.2646350860595703, "Pretrain/Loss (Raw)": 2.4570491313934326, "Pretrain/Step": 495, "Pretrain/Step Time": 10.65679756551981} +{"Pretrain/Learning Rate": 4.9936454190541945e-05, "Pretrain/Loss": 2.2650866508483887, "Pretrain/Loss (Raw)": 2.2316136360168457, "Pretrain/Step": 496, "Pretrain/Step Time": 10.642112094908953} +{"Pretrain/Learning Rate": 4.993584781098939e-05, "Pretrain/Loss": 2.2661213874816895, "Pretrain/Loss (Raw)": 2.272587299346924, "Pretrain/Step": 497, "Pretrain/Step Time": 10.652578387409449} +{"Pretrain/Learning Rate": 4.993523855571735e-05, "Pretrain/Loss": 2.2650158405303955, "Pretrain/Loss (Raw)": 2.2921671867370605, "Pretrain/Step": 498, "Pretrain/Step Time": 10.632972341030836} +{"Pretrain/Learning Rate": 4.99346264247961e-05, "Pretrain/Loss": 2.2648162841796875, "Pretrain/Loss (Raw)": 2.111937999725342, "Pretrain/Step": 499, "Pretrain/Step Time": 10.641362074762583} +{"Pretrain/Learning Rate": 4.993401141829625e-05, "Pretrain/Loss": 2.264981269836426, "Pretrain/Loss (Raw)": 2.2155051231384277, "Pretrain/Step": 500, "Pretrain/Step Time": 10.644404914230108} +{"Pretrain/Learning Rate": 4.99333935362887e-05, "Pretrain/Loss": 2.262969970703125, "Pretrain/Loss (Raw)": 2.2151405811309814, "Pretrain/Step": 501, "Pretrain/Step Time": 10.664286656305194} +{"Pretrain/Learning Rate": 4.993277277884471e-05, "Pretrain/Loss": 2.2628002166748047, "Pretrain/Loss (Raw)": 2.3659002780914307, "Pretrain/Step": 502, "Pretrain/Step Time": 10.624316500499845} +{"Pretrain/Learning Rate": 4.993214914603588e-05, "Pretrain/Loss": 2.263683319091797, "Pretrain/Loss (Raw)": 2.4341087341308594, "Pretrain/Step": 503, "Pretrain/Step Time": 10.626152047887444} +{"Pretrain/Learning Rate": 4.993152263793414e-05, "Pretrain/Loss": 2.2648167610168457, "Pretrain/Loss (Raw)": 2.3604161739349365, "Pretrain/Step": 504, "Pretrain/Step Time": 10.68281596340239} +{"Pretrain/Learning Rate": 4.993089325461171e-05, "Pretrain/Loss": 2.263371467590332, "Pretrain/Loss (Raw)": 2.108323812484741, "Pretrain/Step": 505, "Pretrain/Step Time": 10.685850845649838} +{"Pretrain/Learning Rate": 4.99302609961412e-05, "Pretrain/Loss": 2.263641834259033, "Pretrain/Loss (Raw)": 2.2750084400177, "Pretrain/Step": 506, "Pretrain/Step Time": 10.698597403243184} +{"Pretrain/Learning Rate": 4.9929625862595516e-05, "Pretrain/Loss": 2.2629237174987793, "Pretrain/Loss (Raw)": 2.290350914001465, "Pretrain/Step": 507, "Pretrain/Step Time": 10.697773266583681} +{"Pretrain/Learning Rate": 4.9928987854047905e-05, "Pretrain/Loss": 2.2614076137542725, "Pretrain/Loss (Raw)": 2.0696725845336914, "Pretrain/Step": 508, "Pretrain/Step Time": 10.718528293073177} +{"Pretrain/Learning Rate": 4.992834697057195e-05, "Pretrain/Loss": 2.2604942321777344, "Pretrain/Loss (Raw)": 2.151113271713257, "Pretrain/Step": 509, "Pretrain/Step Time": 10.719148863106966} +{"Pretrain/Learning Rate": 4.992770321224155e-05, "Pretrain/Loss": 2.260852336883545, "Pretrain/Loss (Raw)": 2.2945728302001953, "Pretrain/Step": 510, "Pretrain/Step Time": 10.693468084558845} +{"Pretrain/Learning Rate": 4.992705657913095e-05, "Pretrain/Loss": 2.257972240447998, "Pretrain/Loss (Raw)": 2.094637870788574, "Pretrain/Step": 511, "Pretrain/Step Time": 10.660327963531017} +{"Pretrain/Learning Rate": 4.9926407071314736e-05, "Pretrain/Loss": 2.2593908309936523, "Pretrain/Loss (Raw)": 2.274730682373047, "Pretrain/Step": 512, "Pretrain/Step Time": 10.683747075498104} +{"Pretrain/Learning Rate": 4.9925754688867796e-05, "Pretrain/Loss": 2.2572693824768066, "Pretrain/Loss (Raw)": 2.145768880844116, "Pretrain/Step": 513, "Pretrain/Step Time": 10.679910339415073} +{"Pretrain/Learning Rate": 4.992509943186537e-05, "Pretrain/Loss": 2.25834059715271, "Pretrain/Loss (Raw)": 2.2321407794952393, "Pretrain/Step": 514, "Pretrain/Step Time": 10.673357589170337} +{"Pretrain/Learning Rate": 4.992444130038302e-05, "Pretrain/Loss": 2.2583484649658203, "Pretrain/Loss (Raw)": 2.206395149230957, "Pretrain/Step": 515, "Pretrain/Step Time": 10.678861821070313} +{"Pretrain/Learning Rate": 4.992378029449666e-05, "Pretrain/Loss": 2.2581048011779785, "Pretrain/Loss (Raw)": 2.3049263954162598, "Pretrain/Step": 516, "Pretrain/Step Time": 10.655529372394085} +{"Pretrain/Learning Rate": 4.9923116414282514e-05, "Pretrain/Loss": 2.255962371826172, "Pretrain/Loss (Raw)": 2.1078853607177734, "Pretrain/Step": 517, "Pretrain/Step Time": 10.676147695630789} +{"Pretrain/Learning Rate": 4.992244965981714e-05, "Pretrain/Loss": 2.2560603618621826, "Pretrain/Loss (Raw)": 2.207923650741577, "Pretrain/Step": 518, "Pretrain/Step Time": 10.75916388630867} +{"Pretrain/Learning Rate": 4.9921780031177425e-05, "Pretrain/Loss": 2.255892753601074, "Pretrain/Loss (Raw)": 2.2072925567626953, "Pretrain/Step": 519, "Pretrain/Step Time": 10.733068060129881} +{"Pretrain/Learning Rate": 4.992110752844061e-05, "Pretrain/Loss": 2.254545211791992, "Pretrain/Loss (Raw)": 1.977173089981079, "Pretrain/Step": 520, "Pretrain/Step Time": 10.739432234317064} +{"Pretrain/Learning Rate": 4.992043215168424e-05, "Pretrain/Loss": 2.253033399581909, "Pretrain/Loss (Raw)": 2.318612575531006, "Pretrain/Step": 521, "Pretrain/Step Time": 10.755280829966068} +{"Pretrain/Learning Rate": 4.99197539009862e-05, "Pretrain/Loss": 2.2489495277404785, "Pretrain/Loss (Raw)": 2.1182944774627686, "Pretrain/Step": 522, "Pretrain/Step Time": 10.7882289160043} +{"Pretrain/Learning Rate": 4.9919072776424726e-05, "Pretrain/Loss": 2.246203899383545, "Pretrain/Loss (Raw)": 2.1000115871429443, "Pretrain/Step": 523, "Pretrain/Step Time": 10.782407807186246} +{"Pretrain/Learning Rate": 4.9918388778078347e-05, "Pretrain/Loss": 2.2453036308288574, "Pretrain/Loss (Raw)": 2.102677583694458, "Pretrain/Step": 524, "Pretrain/Step Time": 10.761186845600605} +{"Pretrain/Learning Rate": 4.991770190602596e-05, "Pretrain/Loss": 2.2450594902038574, "Pretrain/Loss (Raw)": 2.2248146533966064, "Pretrain/Step": 525, "Pretrain/Step Time": 10.78558393754065} +{"Pretrain/Learning Rate": 4.991701216034677e-05, "Pretrain/Loss": 2.246302366256714, "Pretrain/Loss (Raw)": 2.3864212036132812, "Pretrain/Step": 526, "Pretrain/Step Time": 10.78154556080699} +{"Pretrain/Learning Rate": 4.9916319541120324e-05, "Pretrain/Loss": 2.245131015777588, "Pretrain/Loss (Raw)": 2.2816669940948486, "Pretrain/Step": 527, "Pretrain/Step Time": 10.772511880844831} +{"Pretrain/Learning Rate": 4.99156240484265e-05, "Pretrain/Loss": 2.245227098464966, "Pretrain/Loss (Raw)": 2.1754310131073, "Pretrain/Step": 528, "Pretrain/Step Time": 10.79172501899302} +{"Pretrain/Learning Rate": 4.9914925682345504e-05, "Pretrain/Loss": 2.2445077896118164, "Pretrain/Loss (Raw)": 2.1851282119750977, "Pretrain/Step": 529, "Pretrain/Step Time": 10.784068809822202} +{"Pretrain/Learning Rate": 4.991422444295788e-05, "Pretrain/Loss": 2.244290351867676, "Pretrain/Loss (Raw)": 2.228729486465454, "Pretrain/Step": 530, "Pretrain/Step Time": 10.779601799324155} +{"Pretrain/Learning Rate": 4.9913520330344486e-05, "Pretrain/Loss": 2.2438080310821533, "Pretrain/Loss (Raw)": 2.1791837215423584, "Pretrain/Step": 531, "Pretrain/Step Time": 10.72955627925694} +{"Pretrain/Learning Rate": 4.991281334458654e-05, "Pretrain/Loss": 2.242645263671875, "Pretrain/Loss (Raw)": 2.291182279586792, "Pretrain/Step": 532, "Pretrain/Step Time": 10.7630714494735} +{"Pretrain/Learning Rate": 4.991210348576556e-05, "Pretrain/Loss": 2.241464853286743, "Pretrain/Loss (Raw)": 2.1822166442871094, "Pretrain/Step": 533, "Pretrain/Step Time": 10.713990224525332} +{"Pretrain/Learning Rate": 4.991139075396342e-05, "Pretrain/Loss": 2.240438222885132, "Pretrain/Loss (Raw)": 2.0951619148254395, "Pretrain/Step": 534, "Pretrain/Step Time": 10.75570254959166} +{"Pretrain/Learning Rate": 4.991067514926231e-05, "Pretrain/Loss": 2.240659713745117, "Pretrain/Loss (Raw)": 2.1383349895477295, "Pretrain/Step": 535, "Pretrain/Step Time": 10.748561706393957} +{"Pretrain/Learning Rate": 4.990995667174476e-05, "Pretrain/Loss": 2.2415714263916016, "Pretrain/Loss (Raw)": 2.212437152862549, "Pretrain/Step": 536, "Pretrain/Step Time": 10.790622115135193} +{"Pretrain/Learning Rate": 4.990923532149362e-05, "Pretrain/Loss": 2.241736650466919, "Pretrain/Loss (Raw)": 2.219604015350342, "Pretrain/Step": 537, "Pretrain/Step Time": 10.794960208237171} +{"Pretrain/Learning Rate": 4.990851109859209e-05, "Pretrain/Loss": 2.24234938621521, "Pretrain/Loss (Raw)": 2.4028639793395996, "Pretrain/Step": 538, "Pretrain/Step Time": 10.791041297838092} +{"Pretrain/Learning Rate": 4.9907784003123695e-05, "Pretrain/Loss": 2.241129159927368, "Pretrain/Loss (Raw)": 2.1131951808929443, "Pretrain/Step": 539, "Pretrain/Step Time": 10.87221178226173} +{"Pretrain/Learning Rate": 4.9907054035172273e-05, "Pretrain/Loss": 2.2395553588867188, "Pretrain/Loss (Raw)": 2.0512235164642334, "Pretrain/Step": 540, "Pretrain/Step Time": 10.884016774594784} +{"Pretrain/Learning Rate": 4.9906321194822014e-05, "Pretrain/Loss": 2.2393388748168945, "Pretrain/Loss (Raw)": 2.1811981201171875, "Pretrain/Step": 541, "Pretrain/Step Time": 10.887168711051345} +{"Pretrain/Learning Rate": 4.9905585482157436e-05, "Pretrain/Loss": 2.238215446472168, "Pretrain/Loss (Raw)": 2.2979016304016113, "Pretrain/Step": 542, "Pretrain/Step Time": 10.916788376867771} +{"Pretrain/Learning Rate": 4.990484689726338e-05, "Pretrain/Loss": 2.239234209060669, "Pretrain/Loss (Raw)": 2.2988104820251465, "Pretrain/Step": 543, "Pretrain/Step Time": 10.979469386860728} +{"Pretrain/Learning Rate": 4.990410544022502e-05, "Pretrain/Loss": 2.2395811080932617, "Pretrain/Loss (Raw)": 2.248525381088257, "Pretrain/Step": 544, "Pretrain/Step Time": 11.001698456704617} +{"Pretrain/Learning Rate": 4.9903361111127864e-05, "Pretrain/Loss": 2.238995313644409, "Pretrain/Loss (Raw)": 2.169083833694458, "Pretrain/Step": 545, "Pretrain/Step Time": 10.991471016779542} +{"Pretrain/Learning Rate": 4.990261391005777e-05, "Pretrain/Loss": 2.238051176071167, "Pretrain/Loss (Raw)": 2.2016401290893555, "Pretrain/Step": 546, "Pretrain/Step Time": 11.036730470135808} +{"Pretrain/Learning Rate": 4.9901863837100886e-05, "Pretrain/Loss": 2.237637519836426, "Pretrain/Loss (Raw)": 2.2191622257232666, "Pretrain/Step": 547, "Pretrain/Step Time": 11.010672055184841} +{"Pretrain/Learning Rate": 4.9901110892343724e-05, "Pretrain/Loss": 2.238393783569336, "Pretrain/Loss (Raw)": 2.2199862003326416, "Pretrain/Step": 548, "Pretrain/Step Time": 11.013538111001253} +{"Pretrain/Learning Rate": 4.9900355075873116e-05, "Pretrain/Loss": 2.2371985912323, "Pretrain/Loss (Raw)": 2.0417544841766357, "Pretrain/Step": 549, "Pretrain/Step Time": 11.063260221853852} +{"Pretrain/Learning Rate": 4.989959638777623e-05, "Pretrain/Loss": 2.2339982986450195, "Pretrain/Loss (Raw)": 2.081163167953491, "Pretrain/Step": 550, "Pretrain/Step Time": 11.065490793436766} +{"Pretrain/Learning Rate": 4.989883482814056e-05, "Pretrain/Loss": 2.2326712608337402, "Pretrain/Loss (Raw)": 2.0678389072418213, "Pretrain/Step": 551, "Pretrain/Step Time": 11.03493077494204} +{"Pretrain/Learning Rate": 4.989807039705392e-05, "Pretrain/Loss": 2.233626365661621, "Pretrain/Loss (Raw)": 2.2611584663391113, "Pretrain/Step": 552, "Pretrain/Step Time": 11.050079829990864} +{"Pretrain/Learning Rate": 4.989730309460449e-05, "Pretrain/Loss": 2.231640338897705, "Pretrain/Loss (Raw)": 2.2104780673980713, "Pretrain/Step": 553, "Pretrain/Step Time": 11.042795551940799} +{"Pretrain/Learning Rate": 4.989653292088074e-05, "Pretrain/Loss": 2.231110095977783, "Pretrain/Loss (Raw)": 2.1447510719299316, "Pretrain/Step": 554, "Pretrain/Step Time": 11.109831023961306} +{"Pretrain/Learning Rate": 4.9895759875971495e-05, "Pretrain/Loss": 2.2313997745513916, "Pretrain/Loss (Raw)": 2.2914106845855713, "Pretrain/Step": 555, "Pretrain/Step Time": 11.072409816086292} +{"Pretrain/Learning Rate": 4.9894983959965915e-05, "Pretrain/Loss": 2.2313780784606934, "Pretrain/Loss (Raw)": 2.112558126449585, "Pretrain/Step": 556, "Pretrain/Step Time": 11.153780858963728} +{"Pretrain/Learning Rate": 4.989420517295347e-05, "Pretrain/Loss": 2.231501817703247, "Pretrain/Loss (Raw)": 2.22390079498291, "Pretrain/Step": 557, "Pretrain/Step Time": 11.12133097089827} +{"Pretrain/Learning Rate": 4.9893423515023986e-05, "Pretrain/Loss": 2.230660915374756, "Pretrain/Loss (Raw)": 2.154050588607788, "Pretrain/Step": 558, "Pretrain/Step Time": 11.15726543776691} +{"Pretrain/Learning Rate": 4.9892638986267594e-05, "Pretrain/Loss": 2.2314467430114746, "Pretrain/Loss (Raw)": 2.3046669960021973, "Pretrain/Step": 559, "Pretrain/Step Time": 11.119478473439813} +{"Pretrain/Learning Rate": 4.989185158677478e-05, "Pretrain/Loss": 2.2292776107788086, "Pretrain/Loss (Raw)": 2.109644889831543, "Pretrain/Step": 560, "Pretrain/Step Time": 11.156371992081404} +{"Pretrain/Learning Rate": 4.9891061316636346e-05, "Pretrain/Loss": 2.2281713485717773, "Pretrain/Loss (Raw)": 2.1583356857299805, "Pretrain/Step": 561, "Pretrain/Step Time": 11.141435727477074} +{"Pretrain/Learning Rate": 4.9890268175943425e-05, "Pretrain/Loss": 2.2283687591552734, "Pretrain/Loss (Raw)": 2.239708185195923, "Pretrain/Step": 562, "Pretrain/Step Time": 11.117203325033188} +{"Pretrain/Learning Rate": 4.9889472164787496e-05, "Pretrain/Loss": 2.226686477661133, "Pretrain/Loss (Raw)": 2.2338974475860596, "Pretrain/Step": 563, "Pretrain/Step Time": 11.164046877995133} +{"Pretrain/Learning Rate": 4.9888673283260355e-05, "Pretrain/Loss": 2.2266597747802734, "Pretrain/Loss (Raw)": 2.1955206394195557, "Pretrain/Step": 564, "Pretrain/Step Time": 11.108966307714581} +{"Pretrain/Learning Rate": 4.9887871531454134e-05, "Pretrain/Loss": 2.226433277130127, "Pretrain/Loss (Raw)": 2.270777463912964, "Pretrain/Step": 565, "Pretrain/Step Time": 11.108725380152464} +{"Pretrain/Learning Rate": 4.988706690946129e-05, "Pretrain/Loss": 2.2231931686401367, "Pretrain/Loss (Raw)": 1.9235334396362305, "Pretrain/Step": 566, "Pretrain/Step Time": 11.081012407317758} +{"Pretrain/Learning Rate": 4.9886259417374616e-05, "Pretrain/Loss": 2.2228493690490723, "Pretrain/Loss (Raw)": 2.321629524230957, "Pretrain/Step": 567, "Pretrain/Step Time": 11.100228602066636} +{"Pretrain/Learning Rate": 4.988544905528724e-05, "Pretrain/Loss": 2.2235212326049805, "Pretrain/Loss (Raw)": 2.480757474899292, "Pretrain/Step": 568, "Pretrain/Step Time": 11.096332648769021} +{"Pretrain/Learning Rate": 4.9884635823292615e-05, "Pretrain/Loss": 2.223773956298828, "Pretrain/Loss (Raw)": 2.2362303733825684, "Pretrain/Step": 569, "Pretrain/Step Time": 11.169462539255619} +{"Pretrain/Learning Rate": 4.988381972148452e-05, "Pretrain/Loss": 2.2237138748168945, "Pretrain/Loss (Raw)": 2.1826298236846924, "Pretrain/Step": 570, "Pretrain/Step Time": 11.143144151195884} +{"Pretrain/Learning Rate": 4.9883000749957086e-05, "Pretrain/Loss": 2.2217092514038086, "Pretrain/Loss (Raw)": 2.124307155609131, "Pretrain/Step": 571, "Pretrain/Step Time": 11.211235979571939} +{"Pretrain/Learning Rate": 4.988217890880475e-05, "Pretrain/Loss": 2.221116304397583, "Pretrain/Loss (Raw)": 2.1421265602111816, "Pretrain/Step": 572, "Pretrain/Step Time": 11.194772858172655} +{"Pretrain/Learning Rate": 4.98813541981223e-05, "Pretrain/Loss": 2.2188053131103516, "Pretrain/Loss (Raw)": 1.8199262619018555, "Pretrain/Step": 573, "Pretrain/Step Time": 11.240548498928547} +{"Pretrain/Learning Rate": 4.988052661800483e-05, "Pretrain/Loss": 2.2184183597564697, "Pretrain/Loss (Raw)": 2.0943777561187744, "Pretrain/Step": 574, "Pretrain/Step Time": 11.230789557099342} +{"Pretrain/Learning Rate": 4.98796961685478e-05, "Pretrain/Loss": 2.2180721759796143, "Pretrain/Loss (Raw)": 2.1946756839752197, "Pretrain/Step": 575, "Pretrain/Step Time": 11.281846340745687} +{"Pretrain/Learning Rate": 4.987886284984695e-05, "Pretrain/Loss": 2.2185773849487305, "Pretrain/Loss (Raw)": 2.2815167903900146, "Pretrain/Step": 576, "Pretrain/Step Time": 11.271918457001448} +{"Pretrain/Learning Rate": 4.987802666199842e-05, "Pretrain/Loss": 2.2175796031951904, "Pretrain/Loss (Raw)": 2.1584558486938477, "Pretrain/Step": 577, "Pretrain/Step Time": 11.344137715175748} +{"Pretrain/Learning Rate": 4.987718760509863e-05, "Pretrain/Loss": 2.218583106994629, "Pretrain/Loss (Raw)": 2.25766921043396, "Pretrain/Step": 578, "Pretrain/Step Time": 11.326530624181032} +{"Pretrain/Learning Rate": 4.987634567924433e-05, "Pretrain/Loss": 2.214766025543213, "Pretrain/Loss (Raw)": 1.8545414209365845, "Pretrain/Step": 579, "Pretrain/Step Time": 11.350202690809965} +{"Pretrain/Learning Rate": 4.9875500884532634e-05, "Pretrain/Loss": 2.2164719104766846, "Pretrain/Loss (Raw)": 2.3980133533477783, "Pretrain/Step": 580, "Pretrain/Step Time": 11.30948299728334} +{"Pretrain/Learning Rate": 4.987465322106095e-05, "Pretrain/Loss": 2.2146236896514893, "Pretrain/Loss (Raw)": 2.2098801136016846, "Pretrain/Step": 581, "Pretrain/Step Time": 11.335335602983832} +{"Pretrain/Learning Rate": 4.987380268892705e-05, "Pretrain/Loss": 2.2145538330078125, "Pretrain/Loss (Raw)": 2.2589304447174072, "Pretrain/Step": 582, "Pretrain/Step Time": 11.29603628627956} +{"Pretrain/Learning Rate": 4.987294928822901e-05, "Pretrain/Loss": 2.213735342025757, "Pretrain/Loss (Raw)": 1.9543737173080444, "Pretrain/Step": 583, "Pretrain/Step Time": 11.31771544367075} +{"Pretrain/Learning Rate": 4.9872093019065255e-05, "Pretrain/Loss": 2.2153611183166504, "Pretrain/Loss (Raw)": 2.3708455562591553, "Pretrain/Step": 584, "Pretrain/Step Time": 11.300424739718437} +{"Pretrain/Learning Rate": 4.987123388153453e-05, "Pretrain/Loss": 2.2148027420043945, "Pretrain/Loss (Raw)": 2.104776620864868, "Pretrain/Step": 585, "Pretrain/Step Time": 11.319791039451957} +{"Pretrain/Learning Rate": 4.9870371875735916e-05, "Pretrain/Loss": 2.2133352756500244, "Pretrain/Loss (Raw)": 2.3436617851257324, "Pretrain/Step": 586, "Pretrain/Step Time": 11.38794507458806} +{"Pretrain/Learning Rate": 4.986950700176882e-05, "Pretrain/Loss": 2.2116196155548096, "Pretrain/Loss (Raw)": 2.0449633598327637, "Pretrain/Step": 587, "Pretrain/Step Time": 11.387745009735227} +{"Pretrain/Learning Rate": 4.9868639259732996e-05, "Pretrain/Loss": 2.212440252304077, "Pretrain/Loss (Raw)": 2.3082332611083984, "Pretrain/Step": 588, "Pretrain/Step Time": 11.410156523808837} +{"Pretrain/Learning Rate": 4.986776864972851e-05, "Pretrain/Loss": 2.213963270187378, "Pretrain/Loss (Raw)": 2.2667462825775146, "Pretrain/Step": 589, "Pretrain/Step Time": 11.424696015194058} +{"Pretrain/Learning Rate": 4.9866895171855756e-05, "Pretrain/Loss": 2.214869499206543, "Pretrain/Loss (Raw)": 2.2883894443511963, "Pretrain/Step": 590, "Pretrain/Step Time": 11.44194764085114} +{"Pretrain/Learning Rate": 4.9866018826215475e-05, "Pretrain/Loss": 2.2147574424743652, "Pretrain/Loss (Raw)": 2.147520065307617, "Pretrain/Step": 591, "Pretrain/Step Time": 11.504431877285242} +{"Pretrain/Learning Rate": 4.9865139612908736e-05, "Pretrain/Loss": 2.2144622802734375, "Pretrain/Loss (Raw)": 2.3573968410491943, "Pretrain/Step": 592, "Pretrain/Step Time": 11.51046708598733} +{"Pretrain/Learning Rate": 4.9864257532036924e-05, "Pretrain/Loss": 2.214665412902832, "Pretrain/Loss (Raw)": 2.284895181655884, "Pretrain/Step": 593, "Pretrain/Step Time": 11.528480473905802} +{"Pretrain/Learning Rate": 4.9863372583701765e-05, "Pretrain/Loss": 2.2150750160217285, "Pretrain/Loss (Raw)": 2.1720356941223145, "Pretrain/Step": 594, "Pretrain/Step Time": 11.540958262979984} +{"Pretrain/Learning Rate": 4.9862484768005324e-05, "Pretrain/Loss": 2.214754104614258, "Pretrain/Loss (Raw)": 2.125659465789795, "Pretrain/Step": 595, "Pretrain/Step Time": 11.511769648641348} +{"Pretrain/Learning Rate": 4.986159408504999e-05, "Pretrain/Loss": 2.2152023315429688, "Pretrain/Loss (Raw)": 2.1984639167785645, "Pretrain/Step": 596, "Pretrain/Step Time": 11.497543826699257} +{"Pretrain/Learning Rate": 4.986070053493846e-05, "Pretrain/Loss": 2.214931011199951, "Pretrain/Loss (Raw)": 2.1805598735809326, "Pretrain/Step": 597, "Pretrain/Step Time": 11.50507765635848} +{"Pretrain/Learning Rate": 4.985980411777381e-05, "Pretrain/Loss": 2.214780807495117, "Pretrain/Loss (Raw)": 2.3683817386627197, "Pretrain/Step": 598, "Pretrain/Step Time": 11.524483012035489} +{"Pretrain/Learning Rate": 4.9858904833659404e-05, "Pretrain/Loss": 2.2132456302642822, "Pretrain/Loss (Raw)": 2.192026376724243, "Pretrain/Step": 599, "Pretrain/Step Time": 11.518872160464525} +{"Pretrain/Learning Rate": 4.985800268269895e-05, "Pretrain/Loss": 2.210618734359741, "Pretrain/Loss (Raw)": 2.087839365005493, "Pretrain/Step": 600, "Pretrain/Step Time": 11.54844106733799} +{"Pretrain/Learning Rate": 4.9857097664996486e-05, "Pretrain/Loss": 2.211538076400757, "Pretrain/Loss (Raw)": 2.4411985874176025, "Pretrain/Step": 601, "Pretrain/Step Time": 11.546156907454133} +{"Pretrain/Learning Rate": 4.98561897806564e-05, "Pretrain/Loss": 2.2100749015808105, "Pretrain/Loss (Raw)": 2.051320791244507, "Pretrain/Step": 602, "Pretrain/Step Time": 11.545507617294788} +{"Pretrain/Learning Rate": 4.985527902978337e-05, "Pretrain/Loss": 2.2094993591308594, "Pretrain/Loss (Raw)": 2.2372887134552, "Pretrain/Step": 603, "Pretrain/Step Time": 11.54488186724484} +{"Pretrain/Learning Rate": 4.985436541248245e-05, "Pretrain/Loss": 2.208291530609131, "Pretrain/Loss (Raw)": 2.049107074737549, "Pretrain/Step": 604, "Pretrain/Step Time": 11.592479519546032} +{"Pretrain/Learning Rate": 4.985344892885899e-05, "Pretrain/Loss": 2.208465576171875, "Pretrain/Loss (Raw)": 2.2467339038848877, "Pretrain/Step": 605, "Pretrain/Step Time": 11.600142560899258} +{"Pretrain/Learning Rate": 4.985252957901869e-05, "Pretrain/Loss": 2.208308696746826, "Pretrain/Loss (Raw)": 2.1989142894744873, "Pretrain/Step": 606, "Pretrain/Step Time": 11.591137252748013} +{"Pretrain/Learning Rate": 4.985160736306756e-05, "Pretrain/Loss": 2.2079873085021973, "Pretrain/Loss (Raw)": 2.1793413162231445, "Pretrain/Step": 607, "Pretrain/Step Time": 11.591185877099633} +{"Pretrain/Learning Rate": 4.985068228111198e-05, "Pretrain/Loss": 2.2091808319091797, "Pretrain/Loss (Raw)": 2.3187220096588135, "Pretrain/Step": 608, "Pretrain/Step Time": 11.63519754447043} +{"Pretrain/Learning Rate": 4.984975433325861e-05, "Pretrain/Loss": 2.20880389213562, "Pretrain/Loss (Raw)": 2.2182211875915527, "Pretrain/Step": 609, "Pretrain/Step Time": 11.6302643828094} +{"Pretrain/Learning Rate": 4.9848823519614475e-05, "Pretrain/Loss": 2.206561803817749, "Pretrain/Loss (Raw)": 1.9538397789001465, "Pretrain/Step": 610, "Pretrain/Step Time": 11.697744809091091} +{"Pretrain/Learning Rate": 4.9847889840286924e-05, "Pretrain/Loss": 2.2073514461517334, "Pretrain/Loss (Raw)": 2.3318796157836914, "Pretrain/Step": 611, "Pretrain/Step Time": 11.694415805861354} +{"Pretrain/Learning Rate": 4.984695329538362e-05, "Pretrain/Loss": 2.206127643585205, "Pretrain/Loss (Raw)": 2.0770978927612305, "Pretrain/Step": 612, "Pretrain/Step Time": 11.67711040750146} +{"Pretrain/Learning Rate": 4.984601388501258e-05, "Pretrain/Loss": 2.206979751586914, "Pretrain/Loss (Raw)": 2.18110990524292, "Pretrain/Step": 613, "Pretrain/Step Time": 11.683846842497587} +{"Pretrain/Learning Rate": 4.9845071609282145e-05, "Pretrain/Loss": 2.2060136795043945, "Pretrain/Loss (Raw)": 2.25653076171875, "Pretrain/Step": 614, "Pretrain/Step Time": 11.701062843203545} +{"Pretrain/Learning Rate": 4.984412646830098e-05, "Pretrain/Loss": 2.206712245941162, "Pretrain/Loss (Raw)": 2.220421075820923, "Pretrain/Step": 615, "Pretrain/Step Time": 11.720397744327784} +{"Pretrain/Learning Rate": 4.9843178462178084e-05, "Pretrain/Loss": 2.2043724060058594, "Pretrain/Loss (Raw)": 1.999260663986206, "Pretrain/Step": 616, "Pretrain/Step Time": 11.759899076074362} +{"Pretrain/Learning Rate": 4.984222759102277e-05, "Pretrain/Loss": 2.202744960784912, "Pretrain/Loss (Raw)": 2.0535407066345215, "Pretrain/Step": 617, "Pretrain/Step Time": 11.760936439037323} +{"Pretrain/Learning Rate": 4.984127385494472e-05, "Pretrain/Loss": 2.201630115509033, "Pretrain/Loss (Raw)": 2.215045928955078, "Pretrain/Step": 618, "Pretrain/Step Time": 11.792172310873866} +{"Pretrain/Learning Rate": 4.984031725405392e-05, "Pretrain/Loss": 2.2009997367858887, "Pretrain/Loss (Raw)": 2.179360866546631, "Pretrain/Step": 619, "Pretrain/Step Time": 11.743181146681309} +{"Pretrain/Learning Rate": 4.983935778846067e-05, "Pretrain/Loss": 2.200248956680298, "Pretrain/Loss (Raw)": 2.2654166221618652, "Pretrain/Step": 620, "Pretrain/Step Time": 11.826764211058617} +{"Pretrain/Learning Rate": 4.9838395458275636e-05, "Pretrain/Loss": 2.1998863220214844, "Pretrain/Loss (Raw)": 1.9019941091537476, "Pretrain/Step": 621, "Pretrain/Step Time": 11.815494805574417} +{"Pretrain/Learning Rate": 4.98374302636098e-05, "Pretrain/Loss": 2.197105884552002, "Pretrain/Loss (Raw)": 2.0677616596221924, "Pretrain/Step": 622, "Pretrain/Step Time": 11.864228148013353} +{"Pretrain/Learning Rate": 4.983646220457446e-05, "Pretrain/Loss": 2.1943559646606445, "Pretrain/Loss (Raw)": 2.105090618133545, "Pretrain/Step": 623, "Pretrain/Step Time": 11.864032754674554} +{"Pretrain/Learning Rate": 4.9835491281281274e-05, "Pretrain/Loss": 2.193565607070923, "Pretrain/Loss (Raw)": 2.1304333209991455, "Pretrain/Step": 624, "Pretrain/Step Time": 11.900633918121457} +{"Pretrain/Learning Rate": 4.9834517493842196e-05, "Pretrain/Loss": 2.192091703414917, "Pretrain/Loss (Raw)": 2.083925485610962, "Pretrain/Step": 625, "Pretrain/Step Time": 11.944791374728084} +{"Pretrain/Learning Rate": 4.983354084236954e-05, "Pretrain/Loss": 2.1916654109954834, "Pretrain/Loss (Raw)": 2.2376017570495605, "Pretrain/Step": 626, "Pretrain/Step Time": 11.940552163869143} +{"Pretrain/Learning Rate": 4.983256132697594e-05, "Pretrain/Loss": 2.1921191215515137, "Pretrain/Loss (Raw)": 2.170001745223999, "Pretrain/Step": 627, "Pretrain/Step Time": 11.963570496067405} +{"Pretrain/Learning Rate": 4.983157894777435e-05, "Pretrain/Loss": 2.192265033721924, "Pretrain/Loss (Raw)": 2.2341747283935547, "Pretrain/Step": 628, "Pretrain/Step Time": 11.958698313683271} +{"Pretrain/Learning Rate": 4.983059370487806e-05, "Pretrain/Loss": 2.1911239624023438, "Pretrain/Loss (Raw)": 2.0690879821777344, "Pretrain/Step": 629, "Pretrain/Step Time": 12.001466270536184} +{"Pretrain/Learning Rate": 4.9829605598400705e-05, "Pretrain/Loss": 2.1896228790283203, "Pretrain/Loss (Raw)": 2.173752546310425, "Pretrain/Step": 630, "Pretrain/Step Time": 11.986629569903016} +{"Pretrain/Learning Rate": 4.982861462845623e-05, "Pretrain/Loss": 2.188079357147217, "Pretrain/Loss (Raw)": 2.2365429401397705, "Pretrain/Step": 631, "Pretrain/Step Time": 11.99965982325375} +{"Pretrain/Learning Rate": 4.982762079515892e-05, "Pretrain/Loss": 2.1868581771850586, "Pretrain/Loss (Raw)": 2.2041168212890625, "Pretrain/Step": 632, "Pretrain/Step Time": 11.961144572123885} +{"Pretrain/Learning Rate": 4.982662409862339e-05, "Pretrain/Loss": 2.187199115753174, "Pretrain/Loss (Raw)": 2.1519899368286133, "Pretrain/Step": 633, "Pretrain/Step Time": 11.958549499511719} +{"Pretrain/Learning Rate": 4.9825624538964576e-05, "Pretrain/Loss": 2.186527729034424, "Pretrain/Loss (Raw)": 2.189025402069092, "Pretrain/Step": 634, "Pretrain/Step Time": 12.01099581643939} +{"Pretrain/Learning Rate": 4.982462211629776e-05, "Pretrain/Loss": 2.1871633529663086, "Pretrain/Loss (Raw)": 2.3717637062072754, "Pretrain/Step": 635, "Pretrain/Step Time": 12.009200531989336} +{"Pretrain/Learning Rate": 4.9823616830738546e-05, "Pretrain/Loss": 2.188701868057251, "Pretrain/Loss (Raw)": 2.266575574874878, "Pretrain/Step": 636, "Pretrain/Step Time": 11.941923538222909} +{"Pretrain/Learning Rate": 4.9822608682402866e-05, "Pretrain/Loss": 2.1888067722320557, "Pretrain/Loss (Raw)": 2.1645424365997314, "Pretrain/Step": 637, "Pretrain/Step Time": 11.968737598508596} +{"Pretrain/Learning Rate": 4.9821597671406984e-05, "Pretrain/Loss": 2.1887922286987305, "Pretrain/Loss (Raw)": 2.29272723197937, "Pretrain/Step": 638, "Pretrain/Step Time": 11.986077386885881} +{"Pretrain/Learning Rate": 4.982058379786749e-05, "Pretrain/Loss": 2.189634084701538, "Pretrain/Loss (Raw)": 2.2023794651031494, "Pretrain/Step": 639, "Pretrain/Step Time": 11.984697354957461} +{"Pretrain/Learning Rate": 4.9819567061901327e-05, "Pretrain/Loss": 2.1885123252868652, "Pretrain/Loss (Raw)": 2.1311378479003906, "Pretrain/Step": 640, "Pretrain/Step Time": 11.963015981018543} +{"Pretrain/Learning Rate": 4.981854746362573e-05, "Pretrain/Loss": 2.1858510971069336, "Pretrain/Loss (Raw)": 1.8051393032073975, "Pretrain/Step": 641, "Pretrain/Step Time": 11.945955771952868} +{"Pretrain/Learning Rate": 4.981752500315829e-05, "Pretrain/Loss": 2.1858673095703125, "Pretrain/Loss (Raw)": 2.2341935634613037, "Pretrain/Step": 642, "Pretrain/Step Time": 11.997958416119218} +{"Pretrain/Learning Rate": 4.981649968061692e-05, "Pretrain/Loss": 2.1848559379577637, "Pretrain/Loss (Raw)": 2.0769736766815186, "Pretrain/Step": 643, "Pretrain/Step Time": 12.036693824455142} +{"Pretrain/Learning Rate": 4.981547149611987e-05, "Pretrain/Loss": 2.1836936473846436, "Pretrain/Loss (Raw)": 2.156142234802246, "Pretrain/Step": 644, "Pretrain/Step Time": 12.01921391300857} +{"Pretrain/Learning Rate": 4.9814440449785715e-05, "Pretrain/Loss": 2.185227394104004, "Pretrain/Loss (Raw)": 2.304218053817749, "Pretrain/Step": 645, "Pretrain/Step Time": 11.993271432816982} +{"Pretrain/Learning Rate": 4.9813406541733355e-05, "Pretrain/Loss": 2.185572624206543, "Pretrain/Loss (Raw)": 2.2521138191223145, "Pretrain/Step": 646, "Pretrain/Step Time": 11.925680300220847} +{"Pretrain/Learning Rate": 4.981236977208203e-05, "Pretrain/Loss": 2.1863436698913574, "Pretrain/Loss (Raw)": 2.3059840202331543, "Pretrain/Step": 647, "Pretrain/Step Time": 11.976426001638174} +{"Pretrain/Learning Rate": 4.98113301409513e-05, "Pretrain/Loss": 2.1861352920532227, "Pretrain/Loss (Raw)": 1.9504932165145874, "Pretrain/Step": 648, "Pretrain/Step Time": 11.95994584262371} +{"Pretrain/Learning Rate": 4.981028764846106e-05, "Pretrain/Loss": 2.185610294342041, "Pretrain/Loss (Raw)": 2.2514193058013916, "Pretrain/Step": 649, "Pretrain/Step Time": 11.981546025723219} +{"Pretrain/Learning Rate": 4.980924229473155e-05, "Pretrain/Loss": 2.1869523525238037, "Pretrain/Loss (Raw)": 2.2900588512420654, "Pretrain/Step": 650, "Pretrain/Step Time": 11.93823591247201} +{"Pretrain/Learning Rate": 4.980819407988331e-05, "Pretrain/Loss": 2.1883115768432617, "Pretrain/Loss (Raw)": 2.2740180492401123, "Pretrain/Step": 651, "Pretrain/Step Time": 11.980698674917221} +{"Pretrain/Learning Rate": 4.980714300403723e-05, "Pretrain/Loss": 2.1890978813171387, "Pretrain/Loss (Raw)": 2.203312873840332, "Pretrain/Step": 652, "Pretrain/Step Time": 11.974025383591652} +{"Pretrain/Learning Rate": 4.9806089067314515e-05, "Pretrain/Loss": 2.1884121894836426, "Pretrain/Loss (Raw)": 2.137038469314575, "Pretrain/Step": 653, "Pretrain/Step Time": 12.001495974138379} +{"Pretrain/Learning Rate": 4.980503226983673e-05, "Pretrain/Loss": 2.1862475872039795, "Pretrain/Loss (Raw)": 2.109360456466675, "Pretrain/Step": 654, "Pretrain/Step Time": 11.994690174236894} +{"Pretrain/Learning Rate": 4.980397261172573e-05, "Pretrain/Loss": 2.1862430572509766, "Pretrain/Loss (Raw)": 2.281099796295166, "Pretrain/Step": 655, "Pretrain/Step Time": 11.955178059637547} +{"Pretrain/Learning Rate": 4.9802910093103725e-05, "Pretrain/Loss": 2.1863210201263428, "Pretrain/Loss (Raw)": 2.185392379760742, "Pretrain/Step": 656, "Pretrain/Step Time": 11.934474751353264} +{"Pretrain/Learning Rate": 4.980184471409326e-05, "Pretrain/Loss": 2.1883537769317627, "Pretrain/Loss (Raw)": 2.4453237056732178, "Pretrain/Step": 657, "Pretrain/Step Time": 11.997547378763556} +{"Pretrain/Learning Rate": 4.980077647481719e-05, "Pretrain/Loss": 2.1879470348358154, "Pretrain/Loss (Raw)": 2.1766645908355713, "Pretrain/Step": 658, "Pretrain/Step Time": 12.011768460273743} +{"Pretrain/Learning Rate": 4.979970537539871e-05, "Pretrain/Loss": 2.188304901123047, "Pretrain/Loss (Raw)": 2.2250208854675293, "Pretrain/Step": 659, "Pretrain/Step Time": 12.01755090802908} +{"Pretrain/Learning Rate": 4.979863141596135e-05, "Pretrain/Loss": 2.187908411026001, "Pretrain/Loss (Raw)": 2.2404048442840576, "Pretrain/Step": 660, "Pretrain/Step Time": 11.987680520862341} +{"Pretrain/Learning Rate": 4.979755459662896e-05, "Pretrain/Loss": 2.187681198120117, "Pretrain/Loss (Raw)": 2.1531147956848145, "Pretrain/Step": 661, "Pretrain/Step Time": 12.029431868344545} +{"Pretrain/Learning Rate": 4.979647491752572e-05, "Pretrain/Loss": 2.1871747970581055, "Pretrain/Loss (Raw)": 2.0303735733032227, "Pretrain/Step": 662, "Pretrain/Step Time": 12.025043275207281} +{"Pretrain/Learning Rate": 4.979539237877615e-05, "Pretrain/Loss": 2.1871347427368164, "Pretrain/Loss (Raw)": 2.1331729888916016, "Pretrain/Step": 663, "Pretrain/Step Time": 12.021158820018172} +{"Pretrain/Learning Rate": 4.979430698050509e-05, "Pretrain/Loss": 2.1875360012054443, "Pretrain/Loss (Raw)": 2.263831853866577, "Pretrain/Step": 664, "Pretrain/Step Time": 12.027503959834576} +{"Pretrain/Learning Rate": 4.979321872283772e-05, "Pretrain/Loss": 2.185866355895996, "Pretrain/Loss (Raw)": 2.005871534347534, "Pretrain/Step": 665, "Pretrain/Step Time": 12.017480686306953} +{"Pretrain/Learning Rate": 4.979212760589953e-05, "Pretrain/Loss": 2.1809229850769043, "Pretrain/Loss (Raw)": 1.7700977325439453, "Pretrain/Step": 666, "Pretrain/Step Time": 12.034366136416793} +{"Pretrain/Learning Rate": 4.9791033629816364e-05, "Pretrain/Loss": 2.1817426681518555, "Pretrain/Loss (Raw)": 2.2181363105773926, "Pretrain/Step": 667, "Pretrain/Step Time": 11.97352970391512} +{"Pretrain/Learning Rate": 4.978993679471438e-05, "Pretrain/Loss": 2.181105136871338, "Pretrain/Loss (Raw)": 1.9696253538131714, "Pretrain/Step": 668, "Pretrain/Step Time": 11.980524117127061} +{"Pretrain/Learning Rate": 4.978883710072008e-05, "Pretrain/Loss": 2.181504487991333, "Pretrain/Loss (Raw)": 2.2323083877563477, "Pretrain/Step": 669, "Pretrain/Step Time": 12.00064130499959} +{"Pretrain/Learning Rate": 4.978773454796026e-05, "Pretrain/Loss": 2.1813716888427734, "Pretrain/Loss (Raw)": 2.280910015106201, "Pretrain/Step": 670, "Pretrain/Step Time": 11.99651861935854} +{"Pretrain/Learning Rate": 4.9786629136562095e-05, "Pretrain/Loss": 2.181272506713867, "Pretrain/Loss (Raw)": 2.2861380577087402, "Pretrain/Step": 671, "Pretrain/Step Time": 11.941019371151924} +{"Pretrain/Learning Rate": 4.978552086665306e-05, "Pretrain/Loss": 2.1796581745147705, "Pretrain/Loss (Raw)": 2.0418739318847656, "Pretrain/Step": 672, "Pretrain/Step Time": 11.924976222217083} +{"Pretrain/Learning Rate": 4.9784409738360973e-05, "Pretrain/Loss": 2.1777169704437256, "Pretrain/Loss (Raw)": 1.920601725578308, "Pretrain/Step": 673, "Pretrain/Step Time": 11.926599107682705} +{"Pretrain/Learning Rate": 4.978329575181395e-05, "Pretrain/Loss": 2.176102638244629, "Pretrain/Loss (Raw)": 1.9949747323989868, "Pretrain/Step": 674, "Pretrain/Step Time": 11.92407988011837} +{"Pretrain/Learning Rate": 4.978217890714049e-05, "Pretrain/Loss": 2.1753547191619873, "Pretrain/Loss (Raw)": 2.123453378677368, "Pretrain/Step": 675, "Pretrain/Step Time": 11.899503584951162} +{"Pretrain/Learning Rate": 4.978105920446938e-05, "Pretrain/Loss": 2.175096273422241, "Pretrain/Loss (Raw)": 2.1869122982025146, "Pretrain/Step": 676, "Pretrain/Step Time": 11.92054270580411} +{"Pretrain/Learning Rate": 4.977993664392975e-05, "Pretrain/Loss": 2.1759490966796875, "Pretrain/Loss (Raw)": 2.1508944034576416, "Pretrain/Step": 677, "Pretrain/Step Time": 11.871845895424485} +{"Pretrain/Learning Rate": 4.9778811225651056e-05, "Pretrain/Loss": 2.176581859588623, "Pretrain/Loss (Raw)": 2.1621508598327637, "Pretrain/Step": 678, "Pretrain/Step Time": 11.905232669785619} +{"Pretrain/Learning Rate": 4.9777682949763096e-05, "Pretrain/Loss": 2.1775031089782715, "Pretrain/Loss (Raw)": 2.1857967376708984, "Pretrain/Step": 679, "Pretrain/Step Time": 11.895851291716099} +{"Pretrain/Learning Rate": 4.9776551816395975e-05, "Pretrain/Loss": 2.177121639251709, "Pretrain/Loss (Raw)": 2.2123122215270996, "Pretrain/Step": 680, "Pretrain/Step Time": 11.948157548904419} +{"Pretrain/Learning Rate": 4.977541782568015e-05, "Pretrain/Loss": 2.1756398677825928, "Pretrain/Loss (Raw)": 2.0207977294921875, "Pretrain/Step": 681, "Pretrain/Step Time": 11.938789455220103} +{"Pretrain/Learning Rate": 4.97742809777464e-05, "Pretrain/Loss": 2.1770551204681396, "Pretrain/Loss (Raw)": 2.325928211212158, "Pretrain/Step": 682, "Pretrain/Step Time": 11.916376527398825} +{"Pretrain/Learning Rate": 4.9773141272725824e-05, "Pretrain/Loss": 2.175581455230713, "Pretrain/Loss (Raw)": 2.1027772426605225, "Pretrain/Step": 683, "Pretrain/Step Time": 11.915624151006341} +{"Pretrain/Learning Rate": 4.9771998710749864e-05, "Pretrain/Loss": 2.1749043464660645, "Pretrain/Loss (Raw)": 2.0258915424346924, "Pretrain/Step": 684, "Pretrain/Step Time": 11.840362034738064} +{"Pretrain/Learning Rate": 4.977085329195028e-05, "Pretrain/Loss": 2.1750292778015137, "Pretrain/Loss (Raw)": 2.239873170852661, "Pretrain/Step": 685, "Pretrain/Step Time": 11.849265910685062} +{"Pretrain/Learning Rate": 4.9769705016459164e-05, "Pretrain/Loss": 2.1753945350646973, "Pretrain/Loss (Raw)": 2.2008185386657715, "Pretrain/Step": 686, "Pretrain/Step Time": 11.834446487948298} +{"Pretrain/Learning Rate": 4.976855388440896e-05, "Pretrain/Loss": 2.1737060546875, "Pretrain/Loss (Raw)": 2.0885684490203857, "Pretrain/Step": 687, "Pretrain/Step Time": 11.83239652402699} +{"Pretrain/Learning Rate": 4.97673998959324e-05, "Pretrain/Loss": 2.1723952293395996, "Pretrain/Loss (Raw)": 1.9418344497680664, "Pretrain/Step": 688, "Pretrain/Step Time": 11.832518514245749} +{"Pretrain/Learning Rate": 4.976624305116259e-05, "Pretrain/Loss": 2.173442840576172, "Pretrain/Loss (Raw)": 2.2924187183380127, "Pretrain/Step": 689, "Pretrain/Step Time": 11.831923514604568} +{"Pretrain/Learning Rate": 4.9765083350232913e-05, "Pretrain/Loss": 2.1722660064697266, "Pretrain/Loss (Raw)": 2.089068651199341, "Pretrain/Step": 690, "Pretrain/Step Time": 11.851820604875684} +{"Pretrain/Learning Rate": 4.976392079327713e-05, "Pretrain/Loss": 2.1718788146972656, "Pretrain/Loss (Raw)": 2.184343099594116, "Pretrain/Step": 691, "Pretrain/Step Time": 11.828730950132012} +{"Pretrain/Learning Rate": 4.976275538042932e-05, "Pretrain/Loss": 2.1723146438598633, "Pretrain/Loss (Raw)": 2.251333713531494, "Pretrain/Step": 692, "Pretrain/Step Time": 11.840782061219215} +{"Pretrain/Learning Rate": 4.976158711182386e-05, "Pretrain/Loss": 2.170156478881836, "Pretrain/Loss (Raw)": 1.9945119619369507, "Pretrain/Step": 693, "Pretrain/Step Time": 11.851603899151087} +{"Pretrain/Learning Rate": 4.9760415987595496e-05, "Pretrain/Loss": 2.173461437225342, "Pretrain/Loss (Raw)": 2.3465492725372314, "Pretrain/Step": 694, "Pretrain/Step Time": 11.86990376189351} +{"Pretrain/Learning Rate": 4.9759242007879295e-05, "Pretrain/Loss": 2.172614574432373, "Pretrain/Loss (Raw)": 2.213278293609619, "Pretrain/Step": 695, "Pretrain/Step Time": 11.858945157378912} +{"Pretrain/Learning Rate": 4.975806517281062e-05, "Pretrain/Loss": 2.1693530082702637, "Pretrain/Loss (Raw)": 2.063262939453125, "Pretrain/Step": 696, "Pretrain/Step Time": 11.834341136738658} +{"Pretrain/Learning Rate": 4.975688548252522e-05, "Pretrain/Loss": 2.168137311935425, "Pretrain/Loss (Raw)": 2.080580711364746, "Pretrain/Step": 697, "Pretrain/Step Time": 11.762499380856752} +{"Pretrain/Learning Rate": 4.9755702937159124e-05, "Pretrain/Loss": 2.168405532836914, "Pretrain/Loss (Raw)": 2.21700382232666, "Pretrain/Step": 698, "Pretrain/Step Time": 11.814122730866075} +{"Pretrain/Learning Rate": 4.975451753684871e-05, "Pretrain/Loss": 2.1685824394226074, "Pretrain/Loss (Raw)": 2.1469194889068604, "Pretrain/Step": 699, "Pretrain/Step Time": 11.777871742844582} +{"Pretrain/Learning Rate": 4.975332928173069e-05, "Pretrain/Loss": 2.1693296432495117, "Pretrain/Loss (Raw)": 2.237778663635254, "Pretrain/Step": 700, "Pretrain/Step Time": 11.780150486156344} +{"Pretrain/Learning Rate": 4.975213817194209e-05, "Pretrain/Loss": 2.171008825302124, "Pretrain/Loss (Raw)": 2.034858226776123, "Pretrain/Step": 701, "Pretrain/Step Time": 11.796223308891058} +{"Pretrain/Learning Rate": 4.975094420762029e-05, "Pretrain/Loss": 2.169398546218872, "Pretrain/Loss (Raw)": 1.8882771730422974, "Pretrain/Step": 702, "Pretrain/Step Time": 11.854441687464714} +{"Pretrain/Learning Rate": 4.9749747388902964e-05, "Pretrain/Loss": 2.1698107719421387, "Pretrain/Loss (Raw)": 2.247434616088867, "Pretrain/Step": 703, "Pretrain/Step Time": 11.805224986746907} +{"Pretrain/Learning Rate": 4.974854771592815e-05, "Pretrain/Loss": 2.1705987453460693, "Pretrain/Loss (Raw)": 2.382359266281128, "Pretrain/Step": 704, "Pretrain/Step Time": 11.80576728656888} +{"Pretrain/Learning Rate": 4.974734518883419e-05, "Pretrain/Loss": 2.1698665618896484, "Pretrain/Loss (Raw)": 2.064732074737549, "Pretrain/Step": 705, "Pretrain/Step Time": 11.757497204467654} +{"Pretrain/Learning Rate": 4.974613980775977e-05, "Pretrain/Loss": 2.170186758041382, "Pretrain/Loss (Raw)": 2.2986674308776855, "Pretrain/Step": 706, "Pretrain/Step Time": 11.75910715945065} +{"Pretrain/Learning Rate": 4.974493157284391e-05, "Pretrain/Loss": 2.17588472366333, "Pretrain/Loss (Raw)": 2.5838913917541504, "Pretrain/Step": 707, "Pretrain/Step Time": 11.73742744885385} +{"Pretrain/Learning Rate": 4.974372048422593e-05, "Pretrain/Loss": 2.174452304840088, "Pretrain/Loss (Raw)": 2.2146668434143066, "Pretrain/Step": 708, "Pretrain/Step Time": 11.739592155441642} +{"Pretrain/Learning Rate": 4.974250654204551e-05, "Pretrain/Loss": 2.172142505645752, "Pretrain/Loss (Raw)": 1.9142191410064697, "Pretrain/Step": 709, "Pretrain/Step Time": 11.699308052659035} +{"Pretrain/Learning Rate": 4.974128974644264e-05, "Pretrain/Loss": 2.172222137451172, "Pretrain/Loss (Raw)": 2.2690999507904053, "Pretrain/Step": 710, "Pretrain/Step Time": 11.762782720848918} +{"Pretrain/Learning Rate": 4.9740070097557656e-05, "Pretrain/Loss": 2.1736738681793213, "Pretrain/Loss (Raw)": 2.1402158737182617, "Pretrain/Step": 711, "Pretrain/Step Time": 11.74178852327168} +{"Pretrain/Learning Rate": 4.973884759553121e-05, "Pretrain/Loss": 2.171802520751953, "Pretrain/Loss (Raw)": 2.131303310394287, "Pretrain/Step": 712, "Pretrain/Step Time": 11.760281266644597} +{"Pretrain/Learning Rate": 4.973762224050428e-05, "Pretrain/Loss": 2.1716341972351074, "Pretrain/Loss (Raw)": 2.0832135677337646, "Pretrain/Step": 713, "Pretrain/Step Time": 11.803249757736921} +{"Pretrain/Learning Rate": 4.973639403261819e-05, "Pretrain/Loss": 2.172236680984497, "Pretrain/Loss (Raw)": 2.420813798904419, "Pretrain/Step": 714, "Pretrain/Step Time": 11.728761466220021} +{"Pretrain/Learning Rate": 4.9735162972014584e-05, "Pretrain/Loss": 2.1731619834899902, "Pretrain/Loss (Raw)": 2.163381814956665, "Pretrain/Step": 715, "Pretrain/Step Time": 11.819557355716825} +{"Pretrain/Learning Rate": 4.9733929058835425e-05, "Pretrain/Loss": 2.17130708694458, "Pretrain/Loss (Raw)": 2.0708398818969727, "Pretrain/Step": 716, "Pretrain/Step Time": 11.771570416167378} +{"Pretrain/Learning Rate": 4.973269229322301e-05, "Pretrain/Loss": 2.1698532104492188, "Pretrain/Loss (Raw)": 2.080641269683838, "Pretrain/Step": 717, "Pretrain/Step Time": 11.757153576239944} +{"Pretrain/Learning Rate": 4.973145267531998e-05, "Pretrain/Loss": 2.169766664505005, "Pretrain/Loss (Raw)": 2.2773118019104004, "Pretrain/Step": 718, "Pretrain/Step Time": 11.792174531146884} +{"Pretrain/Learning Rate": 4.973021020526929e-05, "Pretrain/Loss": 2.1708054542541504, "Pretrain/Loss (Raw)": 2.2804603576660156, "Pretrain/Step": 719, "Pretrain/Step Time": 11.718012480065227} +{"Pretrain/Learning Rate": 4.972896488321422e-05, "Pretrain/Loss": 2.1695609092712402, "Pretrain/Loss (Raw)": 2.1981067657470703, "Pretrain/Step": 720, "Pretrain/Step Time": 11.715828470885754} +{"Pretrain/Learning Rate": 4.97277167092984e-05, "Pretrain/Loss": 2.1691298484802246, "Pretrain/Loss (Raw)": 2.2296955585479736, "Pretrain/Step": 721, "Pretrain/Step Time": 11.710974365472794} +{"Pretrain/Learning Rate": 4.972646568366577e-05, "Pretrain/Loss": 2.1691489219665527, "Pretrain/Loss (Raw)": 2.174511432647705, "Pretrain/Step": 722, "Pretrain/Step Time": 11.676318511366844} +{"Pretrain/Learning Rate": 4.9725211806460604e-05, "Pretrain/Loss": 2.16972279548645, "Pretrain/Loss (Raw)": 2.199096918106079, "Pretrain/Step": 723, "Pretrain/Step Time": 11.690939238294959} +{"Pretrain/Learning Rate": 4.97239550778275e-05, "Pretrain/Loss": 2.1691489219665527, "Pretrain/Loss (Raw)": 2.125025749206543, "Pretrain/Step": 724, "Pretrain/Step Time": 11.656761437654495} +{"Pretrain/Learning Rate": 4.972269549791139e-05, "Pretrain/Loss": 2.1693496704101562, "Pretrain/Loss (Raw)": 2.206249952316284, "Pretrain/Step": 725, "Pretrain/Step Time": 11.662287188693881} +{"Pretrain/Learning Rate": 4.9721433066857535e-05, "Pretrain/Loss": 2.166942596435547, "Pretrain/Loss (Raw)": 2.060267925262451, "Pretrain/Step": 726, "Pretrain/Step Time": 11.66795651614666} +{"Pretrain/Learning Rate": 4.9720167784811535e-05, "Pretrain/Loss": 2.1656863689422607, "Pretrain/Loss (Raw)": 2.0312297344207764, "Pretrain/Step": 727, "Pretrain/Step Time": 11.676770439371467} +{"Pretrain/Learning Rate": 4.97188996519193e-05, "Pretrain/Loss": 2.1648025512695312, "Pretrain/Loss (Raw)": 1.9747140407562256, "Pretrain/Step": 728, "Pretrain/Step Time": 11.596577689051628} +{"Pretrain/Learning Rate": 4.971762866832708e-05, "Pretrain/Loss": 2.162675380706787, "Pretrain/Loss (Raw)": 2.1689391136169434, "Pretrain/Step": 729, "Pretrain/Step Time": 11.60270657017827} +{"Pretrain/Learning Rate": 4.971635483418144e-05, "Pretrain/Loss": 2.163072347640991, "Pretrain/Loss (Raw)": 2.1021130084991455, "Pretrain/Step": 730, "Pretrain/Step Time": 11.63974104449153} +{"Pretrain/Learning Rate": 4.97150781496293e-05, "Pretrain/Loss": 2.1625285148620605, "Pretrain/Loss (Raw)": 2.167677640914917, "Pretrain/Step": 731, "Pretrain/Step Time": 11.63874844275415} +{"Pretrain/Learning Rate": 4.971379861481789e-05, "Pretrain/Loss": 2.1640329360961914, "Pretrain/Loss (Raw)": 2.2417025566101074, "Pretrain/Step": 732, "Pretrain/Step Time": 11.594164036214352} +{"Pretrain/Learning Rate": 4.9712516229894756e-05, "Pretrain/Loss": 2.1637966632843018, "Pretrain/Loss (Raw)": 2.2164697647094727, "Pretrain/Step": 733, "Pretrain/Step Time": 11.641120191663504} +{"Pretrain/Learning Rate": 4.971123099500781e-05, "Pretrain/Loss": 2.1636195182800293, "Pretrain/Loss (Raw)": 2.176240921020508, "Pretrain/Step": 734, "Pretrain/Step Time": 11.617698833346367} +{"Pretrain/Learning Rate": 4.970994291030526e-05, "Pretrain/Loss": 2.16310977935791, "Pretrain/Loss (Raw)": 2.1140947341918945, "Pretrain/Step": 735, "Pretrain/Step Time": 11.673327947035432} +{"Pretrain/Learning Rate": 4.970865197593566e-05, "Pretrain/Loss": 2.161923885345459, "Pretrain/Loss (Raw)": 2.1669113636016846, "Pretrain/Step": 736, "Pretrain/Step Time": 11.619366338476539} +{"Pretrain/Learning Rate": 4.9707358192047885e-05, "Pretrain/Loss": 2.1609809398651123, "Pretrain/Loss (Raw)": 2.0975401401519775, "Pretrain/Step": 737, "Pretrain/Step Time": 11.613354494795203} +{"Pretrain/Learning Rate": 4.970606155879113e-05, "Pretrain/Loss": 2.1632986068725586, "Pretrain/Loss (Raw)": 2.2504940032958984, "Pretrain/Step": 738, "Pretrain/Step Time": 11.551699349656701} +{"Pretrain/Learning Rate": 4.970476207631494e-05, "Pretrain/Loss": 2.1616580486297607, "Pretrain/Loss (Raw)": 2.121877670288086, "Pretrain/Step": 739, "Pretrain/Step Time": 11.577043104916811} +{"Pretrain/Learning Rate": 4.970345974476918e-05, "Pretrain/Loss": 2.1615328788757324, "Pretrain/Loss (Raw)": 2.06107497215271, "Pretrain/Step": 740, "Pretrain/Step Time": 11.565624553710222} +{"Pretrain/Learning Rate": 4.970215456430403e-05, "Pretrain/Loss": 2.160332202911377, "Pretrain/Loss (Raw)": 2.027453660964966, "Pretrain/Step": 741, "Pretrain/Step Time": 11.639449952170253} +{"Pretrain/Learning Rate": 4.970084653507001e-05, "Pretrain/Loss": 2.1622159481048584, "Pretrain/Loss (Raw)": 2.4976308345794678, "Pretrain/Step": 742, "Pretrain/Step Time": 11.596416870132089} +{"Pretrain/Learning Rate": 4.969953565721799e-05, "Pretrain/Loss": 2.161644458770752, "Pretrain/Loss (Raw)": 2.147263288497925, "Pretrain/Step": 743, "Pretrain/Step Time": 11.604091262444854} +{"Pretrain/Learning Rate": 4.969822193089911e-05, "Pretrain/Loss": 2.163421630859375, "Pretrain/Loss (Raw)": 2.2267565727233887, "Pretrain/Step": 744, "Pretrain/Step Time": 11.543148260563612} +{"Pretrain/Learning Rate": 4.969690535626491e-05, "Pretrain/Loss": 2.1652026176452637, "Pretrain/Loss (Raw)": 2.281522750854492, "Pretrain/Step": 745, "Pretrain/Step Time": 11.613259520381689} +{"Pretrain/Learning Rate": 4.96955859334672e-05, "Pretrain/Loss": 2.1657345294952393, "Pretrain/Loss (Raw)": 2.2830936908721924, "Pretrain/Step": 746, "Pretrain/Step Time": 11.560865867882967} +{"Pretrain/Learning Rate": 4.9694263662658156e-05, "Pretrain/Loss": 2.166822910308838, "Pretrain/Loss (Raw)": 2.318683624267578, "Pretrain/Step": 747, "Pretrain/Step Time": 11.559917880222201} +{"Pretrain/Learning Rate": 4.9692938543990265e-05, "Pretrain/Loss": 2.1651201248168945, "Pretrain/Loss (Raw)": 2.0474534034729004, "Pretrain/Step": 748, "Pretrain/Step Time": 11.473018379881978} +{"Pretrain/Learning Rate": 4.969161057761634e-05, "Pretrain/Loss": 2.167994976043701, "Pretrain/Loss (Raw)": 2.26997447013855, "Pretrain/Step": 749, "Pretrain/Step Time": 11.482351215556264} +{"Pretrain/Learning Rate": 4.969027976368954e-05, "Pretrain/Loss": 2.16656231880188, "Pretrain/Loss (Raw)": 1.8843779563903809, "Pretrain/Step": 750, "Pretrain/Step Time": 11.435032026842237} +{"Pretrain/Learning Rate": 4.968894610236332e-05, "Pretrain/Loss": 2.1673879623413086, "Pretrain/Loss (Raw)": 2.2108070850372314, "Pretrain/Step": 751, "Pretrain/Step Time": 11.531598323956132} +{"Pretrain/Learning Rate": 4.968760959379151e-05, "Pretrain/Loss": 2.1673707962036133, "Pretrain/Loss (Raw)": 2.12821364402771, "Pretrain/Step": 752, "Pretrain/Step Time": 11.481515534222126} +{"Pretrain/Learning Rate": 4.968627023812822e-05, "Pretrain/Loss": 2.1678037643432617, "Pretrain/Loss (Raw)": 2.139338731765747, "Pretrain/Step": 753, "Pretrain/Step Time": 11.494337432086468} +{"Pretrain/Learning Rate": 4.968492803552793e-05, "Pretrain/Loss": 2.1671948432922363, "Pretrain/Loss (Raw)": 2.1596739292144775, "Pretrain/Step": 754, "Pretrain/Step Time": 11.496281489729881} +{"Pretrain/Learning Rate": 4.968358298614541e-05, "Pretrain/Loss": 2.1673593521118164, "Pretrain/Loss (Raw)": 2.191042184829712, "Pretrain/Step": 755, "Pretrain/Step Time": 11.499179668724537} +{"Pretrain/Learning Rate": 4.968223509013579e-05, "Pretrain/Loss": 2.1666016578674316, "Pretrain/Loss (Raw)": 2.1371822357177734, "Pretrain/Step": 756, "Pretrain/Step Time": 11.495427001267672} +{"Pretrain/Learning Rate": 4.968088434765452e-05, "Pretrain/Loss": 2.170903205871582, "Pretrain/Loss (Raw)": 2.619699716567993, "Pretrain/Step": 757, "Pretrain/Step Time": 11.449643351137638} +{"Pretrain/Learning Rate": 4.967953075885736e-05, "Pretrain/Loss": 2.1691057682037354, "Pretrain/Loss (Raw)": 1.9436652660369873, "Pretrain/Step": 758, "Pretrain/Step Time": 11.449546551331878} +{"Pretrain/Learning Rate": 4.9678174323900415e-05, "Pretrain/Loss": 2.1688809394836426, "Pretrain/Loss (Raw)": 2.2077815532684326, "Pretrain/Step": 759, "Pretrain/Step Time": 11.457062086090446} +{"Pretrain/Learning Rate": 4.9676815042940125e-05, "Pretrain/Loss": 2.1661601066589355, "Pretrain/Loss (Raw)": 1.855843186378479, "Pretrain/Step": 760, "Pretrain/Step Time": 11.427340146154165} +{"Pretrain/Learning Rate": 4.967545291613325e-05, "Pretrain/Loss": 2.164956569671631, "Pretrain/Loss (Raw)": 1.997938632965088, "Pretrain/Step": 761, "Pretrain/Step Time": 11.426533877849579} +{"Pretrain/Learning Rate": 4.967408794363686e-05, "Pretrain/Loss": 2.165452241897583, "Pretrain/Loss (Raw)": 2.252470016479492, "Pretrain/Step": 762, "Pretrain/Step Time": 11.350116992369294} +{"Pretrain/Learning Rate": 4.9672720125608384e-05, "Pretrain/Loss": 2.163137435913086, "Pretrain/Loss (Raw)": 2.0754778385162354, "Pretrain/Step": 763, "Pretrain/Step Time": 11.368597129359841} +{"Pretrain/Learning Rate": 4.9671349462205565e-05, "Pretrain/Loss": 2.162169933319092, "Pretrain/Loss (Raw)": 2.1427149772644043, "Pretrain/Step": 764, "Pretrain/Step Time": 11.368202723562717} +{"Pretrain/Learning Rate": 4.966997595358647e-05, "Pretrain/Loss": 2.161815643310547, "Pretrain/Loss (Raw)": 2.1192281246185303, "Pretrain/Step": 765, "Pretrain/Step Time": 11.393907764926553} +{"Pretrain/Learning Rate": 4.966859959990949e-05, "Pretrain/Loss": 2.1600253582000732, "Pretrain/Loss (Raw)": 2.063540458679199, "Pretrain/Step": 766, "Pretrain/Step Time": 11.378140218555927} +{"Pretrain/Learning Rate": 4.966722040133337e-05, "Pretrain/Loss": 2.1589269638061523, "Pretrain/Loss (Raw)": 2.06178879737854, "Pretrain/Step": 767, "Pretrain/Step Time": 11.427525669336319} +{"Pretrain/Learning Rate": 4.9665838358017156e-05, "Pretrain/Loss": 2.1603078842163086, "Pretrain/Loss (Raw)": 2.307908058166504, "Pretrain/Step": 768, "Pretrain/Step Time": 11.42650156095624} +{"Pretrain/Learning Rate": 4.966445347012023e-05, "Pretrain/Loss": 2.163583278656006, "Pretrain/Loss (Raw)": 2.2243919372558594, "Pretrain/Step": 769, "Pretrain/Step Time": 11.492504691705108} +{"Pretrain/Learning Rate": 4.9663065737802316e-05, "Pretrain/Loss": 2.1628167629241943, "Pretrain/Loss (Raw)": 2.1360700130462646, "Pretrain/Step": 770, "Pretrain/Step Time": 11.437601981684566} +{"Pretrain/Learning Rate": 4.9661675161223435e-05, "Pretrain/Loss": 2.165694236755371, "Pretrain/Loss (Raw)": 2.4453020095825195, "Pretrain/Step": 771, "Pretrain/Step Time": 11.449448715895414} +{"Pretrain/Learning Rate": 4.966028174054397e-05, "Pretrain/Loss": 2.1654183864593506, "Pretrain/Loss (Raw)": 2.120821475982666, "Pretrain/Step": 772, "Pretrain/Step Time": 11.446960527449846} +{"Pretrain/Learning Rate": 4.965888547592461e-05, "Pretrain/Loss": 2.1639256477355957, "Pretrain/Loss (Raw)": 2.113128185272217, "Pretrain/Step": 773, "Pretrain/Step Time": 11.446227269247174} +{"Pretrain/Learning Rate": 4.965748636752638e-05, "Pretrain/Loss": 2.1631619930267334, "Pretrain/Loss (Raw)": 2.1543755531311035, "Pretrain/Step": 774, "Pretrain/Step Time": 11.454042632132769} +{"Pretrain/Learning Rate": 4.965608441551063e-05, "Pretrain/Loss": 2.1619129180908203, "Pretrain/Loss (Raw)": 2.146129846572876, "Pretrain/Step": 775, "Pretrain/Step Time": 11.445565355941653} +{"Pretrain/Learning Rate": 4.965467962003905e-05, "Pretrain/Loss": 2.1632089614868164, "Pretrain/Loss (Raw)": 2.1163554191589355, "Pretrain/Step": 776, "Pretrain/Step Time": 11.428788866847754} +{"Pretrain/Learning Rate": 4.965327198127363e-05, "Pretrain/Loss": 2.1628475189208984, "Pretrain/Loss (Raw)": 2.2051892280578613, "Pretrain/Step": 777, "Pretrain/Step Time": 11.427232833579183} +{"Pretrain/Learning Rate": 4.965186149937672e-05, "Pretrain/Loss": 2.1605801582336426, "Pretrain/Loss (Raw)": 1.999831199645996, "Pretrain/Step": 778, "Pretrain/Step Time": 11.443093912675977} +{"Pretrain/Learning Rate": 4.9650448174510986e-05, "Pretrain/Loss": 2.159919023513794, "Pretrain/Loss (Raw)": 2.1893765926361084, "Pretrain/Step": 779, "Pretrain/Step Time": 11.404654802754521} +{"Pretrain/Learning Rate": 4.9649032006839404e-05, "Pretrain/Loss": 2.1592259407043457, "Pretrain/Loss (Raw)": 2.114581823348999, "Pretrain/Step": 780, "Pretrain/Step Time": 11.42642961256206} +{"Pretrain/Learning Rate": 4.964761299652529e-05, "Pretrain/Loss": 2.1591978073120117, "Pretrain/Loss (Raw)": 2.133465051651001, "Pretrain/Step": 781, "Pretrain/Step Time": 11.367863826453686} +{"Pretrain/Learning Rate": 4.9646191143732324e-05, "Pretrain/Loss": 2.16092586517334, "Pretrain/Loss (Raw)": 2.3305344581604004, "Pretrain/Step": 782, "Pretrain/Step Time": 11.406610051169991} +{"Pretrain/Learning Rate": 4.9644766448624444e-05, "Pretrain/Loss": 2.1595001220703125, "Pretrain/Loss (Raw)": 2.098634719848633, "Pretrain/Step": 783, "Pretrain/Step Time": 11.406099133193493} +{"Pretrain/Learning Rate": 4.9643338911365964e-05, "Pretrain/Loss": 2.1591639518737793, "Pretrain/Loss (Raw)": 2.142354965209961, "Pretrain/Step": 784, "Pretrain/Step Time": 11.466350339353085} +{"Pretrain/Learning Rate": 4.9641908532121525e-05, "Pretrain/Loss": 2.1564457416534424, "Pretrain/Loss (Raw)": 2.0973868370056152, "Pretrain/Step": 785, "Pretrain/Step Time": 11.369417570531368} +{"Pretrain/Learning Rate": 4.964047531105608e-05, "Pretrain/Loss": 2.1578140258789062, "Pretrain/Loss (Raw)": 2.351795196533203, "Pretrain/Step": 786, "Pretrain/Step Time": 11.43391034938395} +{"Pretrain/Learning Rate": 4.963903924833491e-05, "Pretrain/Loss": 2.157623052597046, "Pretrain/Loss (Raw)": 2.2006046772003174, "Pretrain/Step": 787, "Pretrain/Step Time": 11.428723128512502} +{"Pretrain/Learning Rate": 4.963760034412363e-05, "Pretrain/Loss": 2.156919240951538, "Pretrain/Loss (Raw)": 2.150294065475464, "Pretrain/Step": 788, "Pretrain/Step Time": 11.442618120461702} +{"Pretrain/Learning Rate": 4.9636158598588185e-05, "Pretrain/Loss": 2.1577484607696533, "Pretrain/Loss (Raw)": 2.259248733520508, "Pretrain/Step": 789, "Pretrain/Step Time": 11.389846621081233} +{"Pretrain/Learning Rate": 4.9634714011894836e-05, "Pretrain/Loss": 2.158006191253662, "Pretrain/Loss (Raw)": 2.0633604526519775, "Pretrain/Step": 790, "Pretrain/Step Time": 11.364190066233277} +{"Pretrain/Learning Rate": 4.963326658421019e-05, "Pretrain/Loss": 2.158829689025879, "Pretrain/Loss (Raw)": 2.238600254058838, "Pretrain/Step": 791, "Pretrain/Step Time": 11.372476372867823} +{"Pretrain/Learning Rate": 4.9631816315701165e-05, "Pretrain/Loss": 2.1585140228271484, "Pretrain/Loss (Raw)": 2.2234041690826416, "Pretrain/Step": 792, "Pretrain/Step Time": 11.38875081203878} +{"Pretrain/Learning Rate": 4.9630363206535e-05, "Pretrain/Loss": 2.160701036453247, "Pretrain/Loss (Raw)": 2.2858245372772217, "Pretrain/Step": 793, "Pretrain/Step Time": 11.39181068353355} +{"Pretrain/Learning Rate": 4.962890725687931e-05, "Pretrain/Loss": 2.165898323059082, "Pretrain/Loss (Raw)": 2.4353456497192383, "Pretrain/Step": 794, "Pretrain/Step Time": 11.428224720060825} +{"Pretrain/Learning Rate": 4.962744846690196e-05, "Pretrain/Loss": 2.1659250259399414, "Pretrain/Loss (Raw)": 2.2215840816497803, "Pretrain/Step": 795, "Pretrain/Step Time": 11.400578951463103} +{"Pretrain/Learning Rate": 4.962598683677122e-05, "Pretrain/Loss": 2.166590690612793, "Pretrain/Loss (Raw)": 2.054816961288452, "Pretrain/Step": 796, "Pretrain/Step Time": 11.411499941721559} +{"Pretrain/Learning Rate": 4.9624522366655625e-05, "Pretrain/Loss": 2.1664633750915527, "Pretrain/Loss (Raw)": 2.2159900665283203, "Pretrain/Step": 797, "Pretrain/Step Time": 11.381976084783673} +{"Pretrain/Learning Rate": 4.962305505672408e-05, "Pretrain/Loss": 2.165536403656006, "Pretrain/Loss (Raw)": 2.1622836589813232, "Pretrain/Step": 798, "Pretrain/Step Time": 11.361747240647674} +{"Pretrain/Learning Rate": 4.96215849071458e-05, "Pretrain/Loss": 2.1616649627685547, "Pretrain/Loss (Raw)": 1.7906031608581543, "Pretrain/Step": 799, "Pretrain/Step Time": 11.355915131047368} +{"Pretrain/Learning Rate": 4.962011191809033e-05, "Pretrain/Loss": 2.1628665924072266, "Pretrain/Loss (Raw)": 2.1956467628479004, "Pretrain/Step": 800, "Pretrain/Step Time": 11.32064975053072} +{"Pretrain/Learning Rate": 4.961863608972753e-05, "Pretrain/Loss": 2.1646924018859863, "Pretrain/Loss (Raw)": 2.1543326377868652, "Pretrain/Step": 801, "Pretrain/Step Time": 11.32750490307808} +{"Pretrain/Learning Rate": 4.961715742222762e-05, "Pretrain/Loss": 2.165905714035034, "Pretrain/Loss (Raw)": 2.1502556800842285, "Pretrain/Step": 802, "Pretrain/Step Time": 11.284304052591324} +{"Pretrain/Learning Rate": 4.961567591576112e-05, "Pretrain/Loss": 2.1656014919281006, "Pretrain/Loss (Raw)": 2.0845460891723633, "Pretrain/Step": 803, "Pretrain/Step Time": 11.285459958016872} +{"Pretrain/Learning Rate": 4.961419157049887e-05, "Pretrain/Loss": 2.1639599800109863, "Pretrain/Loss (Raw)": 1.976760745048523, "Pretrain/Step": 804, "Pretrain/Step Time": 11.253913784399629} +{"Pretrain/Learning Rate": 4.9612704386612066e-05, "Pretrain/Loss": 2.162583351135254, "Pretrain/Loss (Raw)": 1.974678635597229, "Pretrain/Step": 805, "Pretrain/Step Time": 11.258528769016266} +{"Pretrain/Learning Rate": 4.9611214364272206e-05, "Pretrain/Loss": 2.162911891937256, "Pretrain/Loss (Raw)": 2.204204559326172, "Pretrain/Step": 806, "Pretrain/Step Time": 11.210842909291387} +{"Pretrain/Learning Rate": 4.960972150365114e-05, "Pretrain/Loss": 2.1626946926116943, "Pretrain/Loss (Raw)": 2.1580328941345215, "Pretrain/Step": 807, "Pretrain/Step Time": 11.228452436625957} +{"Pretrain/Learning Rate": 4.960822580492103e-05, "Pretrain/Loss": 2.1634552478790283, "Pretrain/Loss (Raw)": 2.3096516132354736, "Pretrain/Step": 808, "Pretrain/Step Time": 11.171111391857266} +{"Pretrain/Learning Rate": 4.960672726825436e-05, "Pretrain/Loss": 2.1655631065368652, "Pretrain/Loss (Raw)": 2.290595293045044, "Pretrain/Step": 809, "Pretrain/Step Time": 11.181059926748276} +{"Pretrain/Learning Rate": 4.960522589382395e-05, "Pretrain/Loss": 2.1639788150787354, "Pretrain/Loss (Raw)": 2.123117208480835, "Pretrain/Step": 810, "Pretrain/Step Time": 11.171118658035994} +{"Pretrain/Learning Rate": 4.960372168180294e-05, "Pretrain/Loss": 2.16378116607666, "Pretrain/Loss (Raw)": 2.077514886856079, "Pretrain/Step": 811, "Pretrain/Step Time": 11.176332438364625} +{"Pretrain/Learning Rate": 4.9602214632364816e-05, "Pretrain/Loss": 2.164623260498047, "Pretrain/Loss (Raw)": 2.133653402328491, "Pretrain/Step": 812, "Pretrain/Step Time": 11.195362323895097} +{"Pretrain/Learning Rate": 4.9600704745683367e-05, "Pretrain/Loss": 2.1639046669006348, "Pretrain/Loss (Raw)": 2.1479034423828125, "Pretrain/Step": 813, "Pretrain/Step Time": 11.195640759542584} +{"Pretrain/Learning Rate": 4.959919202193273e-05, "Pretrain/Loss": 2.1631979942321777, "Pretrain/Loss (Raw)": 2.1103591918945312, "Pretrain/Step": 814, "Pretrain/Step Time": 11.209135776385665} +{"Pretrain/Learning Rate": 4.959767646128735e-05, "Pretrain/Loss": 2.165384292602539, "Pretrain/Loss (Raw)": 2.3684144020080566, "Pretrain/Step": 815, "Pretrain/Step Time": 11.209527732804418} +{"Pretrain/Learning Rate": 4.959615806392201e-05, "Pretrain/Loss": 2.16709041595459, "Pretrain/Loss (Raw)": 2.1602227687835693, "Pretrain/Step": 816, "Pretrain/Step Time": 11.205349370837212} +{"Pretrain/Learning Rate": 4.959463683001182e-05, "Pretrain/Loss": 2.1666007041931152, "Pretrain/Loss (Raw)": 2.229738473892212, "Pretrain/Step": 817, "Pretrain/Step Time": 11.197460286319256} +{"Pretrain/Learning Rate": 4.959311275973223e-05, "Pretrain/Loss": 2.167400360107422, "Pretrain/Loss (Raw)": 2.191423177719116, "Pretrain/Step": 818, "Pretrain/Step Time": 11.225968265905976} +{"Pretrain/Learning Rate": 4.959158585325898e-05, "Pretrain/Loss": 2.166699171066284, "Pretrain/Loss (Raw)": 2.0946104526519775, "Pretrain/Step": 819, "Pretrain/Step Time": 11.20285820774734} +{"Pretrain/Learning Rate": 4.959005611076817e-05, "Pretrain/Loss": 2.1664376258850098, "Pretrain/Loss (Raw)": 2.217824935913086, "Pretrain/Step": 820, "Pretrain/Step Time": 11.300293654203415} +{"Pretrain/Learning Rate": 4.9588523532436214e-05, "Pretrain/Loss": 2.167536497116089, "Pretrain/Loss (Raw)": 2.13517689704895, "Pretrain/Step": 821, "Pretrain/Step Time": 11.29339049383998} +{"Pretrain/Learning Rate": 4.9586988118439863e-05, "Pretrain/Loss": 2.166564464569092, "Pretrain/Loss (Raw)": 2.22214937210083, "Pretrain/Step": 822, "Pretrain/Step Time": 11.25457145087421} +{"Pretrain/Learning Rate": 4.958544986895619e-05, "Pretrain/Loss": 2.1658458709716797, "Pretrain/Loss (Raw)": 2.1212692260742188, "Pretrain/Step": 823, "Pretrain/Step Time": 11.242752177640796} +{"Pretrain/Learning Rate": 4.958390878416258e-05, "Pretrain/Loss": 2.166494846343994, "Pretrain/Loss (Raw)": 2.1463334560394287, "Pretrain/Step": 824, "Pretrain/Step Time": 11.231345791369677} +{"Pretrain/Learning Rate": 4.9582364864236765e-05, "Pretrain/Loss": 2.167268753051758, "Pretrain/Loss (Raw)": 2.1796653270721436, "Pretrain/Step": 825, "Pretrain/Step Time": 11.230462234467268} +{"Pretrain/Learning Rate": 4.95808181093568e-05, "Pretrain/Loss": 2.166717767715454, "Pretrain/Loss (Raw)": 2.146458148956299, "Pretrain/Step": 826, "Pretrain/Step Time": 11.176658755168319} +{"Pretrain/Learning Rate": 4.9579268519701063e-05, "Pretrain/Loss": 2.1664137840270996, "Pretrain/Loss (Raw)": 2.1080074310302734, "Pretrain/Step": 827, "Pretrain/Step Time": 11.13945852406323} +{"Pretrain/Learning Rate": 4.957771609544826e-05, "Pretrain/Loss": 2.165879726409912, "Pretrain/Loss (Raw)": 2.1694366931915283, "Pretrain/Step": 828, "Pretrain/Step Time": 11.156136807054281} +{"Pretrain/Learning Rate": 4.957616083677742e-05, "Pretrain/Loss": 2.1672863960266113, "Pretrain/Loss (Raw)": 2.2149126529693604, "Pretrain/Step": 829, "Pretrain/Step Time": 11.151289325207472} +{"Pretrain/Learning Rate": 4.9574602743867916e-05, "Pretrain/Loss": 2.1701149940490723, "Pretrain/Loss (Raw)": 2.250312566757202, "Pretrain/Step": 830, "Pretrain/Step Time": 11.104145988821983} +{"Pretrain/Learning Rate": 4.957304181689941e-05, "Pretrain/Loss": 2.1688649654388428, "Pretrain/Loss (Raw)": 2.087435245513916, "Pretrain/Step": 831, "Pretrain/Step Time": 11.171077670529485} +{"Pretrain/Learning Rate": 4.957147805605194e-05, "Pretrain/Loss": 2.1674129962921143, "Pretrain/Loss (Raw)": 2.196502208709717, "Pretrain/Step": 832, "Pretrain/Step Time": 11.18888758867979} +{"Pretrain/Learning Rate": 4.956991146150583e-05, "Pretrain/Loss": 2.1687512397766113, "Pretrain/Loss (Raw)": 2.2360620498657227, "Pretrain/Step": 833, "Pretrain/Step Time": 11.219372717663646} +{"Pretrain/Learning Rate": 4.9568342033441755e-05, "Pretrain/Loss": 2.171764850616455, "Pretrain/Loss (Raw)": 2.6843936443328857, "Pretrain/Step": 834, "Pretrain/Step Time": 11.219399048015475} +{"Pretrain/Learning Rate": 4.956676977204071e-05, "Pretrain/Loss": 2.16772198677063, "Pretrain/Loss (Raw)": 2.066396951675415, "Pretrain/Step": 835, "Pretrain/Step Time": 11.25436720252037} +{"Pretrain/Learning Rate": 4.9565194677484e-05, "Pretrain/Loss": 2.167015314102173, "Pretrain/Loss (Raw)": 2.1242048740386963, "Pretrain/Step": 836, "Pretrain/Step Time": 11.251374227926135} +{"Pretrain/Learning Rate": 4.95636167499533e-05, "Pretrain/Loss": 2.168872117996216, "Pretrain/Loss (Raw)": 2.1518914699554443, "Pretrain/Step": 837, "Pretrain/Step Time": 11.351448249071836} +{"Pretrain/Learning Rate": 4.9562035989630564e-05, "Pretrain/Loss": 2.168044090270996, "Pretrain/Loss (Raw)": 2.1631078720092773, "Pretrain/Step": 838, "Pretrain/Step Time": 11.288419047370553} +{"Pretrain/Learning Rate": 4.95604523966981e-05, "Pretrain/Loss": 2.168026924133301, "Pretrain/Loss (Raw)": 2.138023614883423, "Pretrain/Step": 839, "Pretrain/Step Time": 11.318622471764684} +{"Pretrain/Learning Rate": 4.9558865971338524e-05, "Pretrain/Loss": 2.1689414978027344, "Pretrain/Loss (Raw)": 2.2483839988708496, "Pretrain/Step": 840, "Pretrain/Step Time": 11.276816930621862} +{"Pretrain/Learning Rate": 4.9557276713734805e-05, "Pretrain/Loss": 2.1686787605285645, "Pretrain/Loss (Raw)": 2.0495684146881104, "Pretrain/Step": 841, "Pretrain/Step Time": 11.209544867277145} +{"Pretrain/Learning Rate": 4.955568462407022e-05, "Pretrain/Loss": 2.1661014556884766, "Pretrain/Loss (Raw)": 2.0909206867218018, "Pretrain/Step": 842, "Pretrain/Step Time": 11.26674597710371} +{"Pretrain/Learning Rate": 4.955408970252837e-05, "Pretrain/Loss": 2.165036916732788, "Pretrain/Loss (Raw)": 2.0271315574645996, "Pretrain/Step": 843, "Pretrain/Step Time": 11.179239206016064} +{"Pretrain/Learning Rate": 4.955249194929319e-05, "Pretrain/Loss": 2.1631901264190674, "Pretrain/Loss (Raw)": 1.8344523906707764, "Pretrain/Step": 844, "Pretrain/Step Time": 11.195924494415522} +{"Pretrain/Learning Rate": 4.955089136454895e-05, "Pretrain/Loss": 2.1660070419311523, "Pretrain/Loss (Raw)": 2.4412124156951904, "Pretrain/Step": 845, "Pretrain/Step Time": 11.202280638739467} +{"Pretrain/Learning Rate": 4.954928794848023e-05, "Pretrain/Loss": 2.1653313636779785, "Pretrain/Loss (Raw)": 2.1907958984375, "Pretrain/Step": 846, "Pretrain/Step Time": 11.167880292981863} +{"Pretrain/Learning Rate": 4.954768170127194e-05, "Pretrain/Loss": 2.1628241539001465, "Pretrain/Loss (Raw)": 1.9595493078231812, "Pretrain/Step": 847, "Pretrain/Step Time": 11.236185954883695} +{"Pretrain/Learning Rate": 4.9546072623109325e-05, "Pretrain/Loss": 2.1628897190093994, "Pretrain/Loss (Raw)": 2.20650315284729, "Pretrain/Step": 848, "Pretrain/Step Time": 11.23000530898571} +{"Pretrain/Learning Rate": 4.954446071417795e-05, "Pretrain/Loss": 2.162105083465576, "Pretrain/Loss (Raw)": 2.129279851913452, "Pretrain/Step": 849, "Pretrain/Step Time": 11.308665366843343} +{"Pretrain/Learning Rate": 4.954284597466371e-05, "Pretrain/Loss": 2.163975477218628, "Pretrain/Loss (Raw)": 2.413908004760742, "Pretrain/Step": 850, "Pretrain/Step Time": 11.300122369080782} +{"Pretrain/Learning Rate": 4.954122840475281e-05, "Pretrain/Loss": 2.1631834506988525, "Pretrain/Loss (Raw)": 2.097722291946411, "Pretrain/Step": 851, "Pretrain/Step Time": 11.303667090833187} +{"Pretrain/Learning Rate": 4.9539608004631825e-05, "Pretrain/Loss": 2.1627821922302246, "Pretrain/Loss (Raw)": 2.0736560821533203, "Pretrain/Step": 852, "Pretrain/Step Time": 11.294736359268427} +{"Pretrain/Learning Rate": 4.9537984774487606e-05, "Pretrain/Loss": 2.1616272926330566, "Pretrain/Loss (Raw)": 2.058441162109375, "Pretrain/Step": 853, "Pretrain/Step Time": 11.343571092933416} +{"Pretrain/Learning Rate": 4.953635871450736e-05, "Pretrain/Loss": 2.161807060241699, "Pretrain/Loss (Raw)": 2.083275079727173, "Pretrain/Step": 854, "Pretrain/Step Time": 11.283226411789656} +{"Pretrain/Learning Rate": 4.95347298248786e-05, "Pretrain/Loss": 2.1627516746520996, "Pretrain/Loss (Raw)": 2.1521263122558594, "Pretrain/Step": 855, "Pretrain/Step Time": 11.324562847614288} +{"Pretrain/Learning Rate": 4.953309810578918e-05, "Pretrain/Loss": 2.1635351181030273, "Pretrain/Loss (Raw)": 2.074979305267334, "Pretrain/Step": 856, "Pretrain/Step Time": 11.326409589499235} +{"Pretrain/Learning Rate": 4.953146355742729e-05, "Pretrain/Loss": 2.1631035804748535, "Pretrain/Loss (Raw)": 2.113701105117798, "Pretrain/Step": 857, "Pretrain/Step Time": 11.39010338485241} +{"Pretrain/Learning Rate": 4.952982617998143e-05, "Pretrain/Loss": 2.1622133255004883, "Pretrain/Loss (Raw)": 1.9881865978240967, "Pretrain/Step": 858, "Pretrain/Step Time": 11.349949402734637} +{"Pretrain/Learning Rate": 4.952818597364043e-05, "Pretrain/Loss": 2.16143798828125, "Pretrain/Loss (Raw)": 2.0684115886688232, "Pretrain/Step": 859, "Pretrain/Step Time": 11.354239758104086} +{"Pretrain/Learning Rate": 4.952654293859344e-05, "Pretrain/Loss": 2.159754753112793, "Pretrain/Loss (Raw)": 2.0262410640716553, "Pretrain/Step": 860, "Pretrain/Step Time": 11.377077849581838} +{"Pretrain/Learning Rate": 4.952489707502993e-05, "Pretrain/Loss": 2.1581168174743652, "Pretrain/Loss (Raw)": 2.006819009780884, "Pretrain/Step": 861, "Pretrain/Step Time": 11.351609153673053} +{"Pretrain/Learning Rate": 4.952324838313974e-05, "Pretrain/Loss": 2.158437490463257, "Pretrain/Loss (Raw)": 2.2173025608062744, "Pretrain/Step": 862, "Pretrain/Step Time": 11.361161902546883} +{"Pretrain/Learning Rate": 4.9521596863112986e-05, "Pretrain/Loss": 2.1590189933776855, "Pretrain/Loss (Raw)": 2.1885416507720947, "Pretrain/Step": 863, "Pretrain/Step Time": 11.36947700381279} +{"Pretrain/Learning Rate": 4.951994251514013e-05, "Pretrain/Loss": 2.159207344055176, "Pretrain/Loss (Raw)": 2.191011667251587, "Pretrain/Step": 864, "Pretrain/Step Time": 11.379411628469825} +{"Pretrain/Learning Rate": 4.9518285339411966e-05, "Pretrain/Loss": 2.159003734588623, "Pretrain/Loss (Raw)": 2.071469783782959, "Pretrain/Step": 865, "Pretrain/Step Time": 11.366460299119353} +{"Pretrain/Learning Rate": 4.9516625336119595e-05, "Pretrain/Loss": 2.1591663360595703, "Pretrain/Loss (Raw)": 2.271293878555298, "Pretrain/Step": 866, "Pretrain/Step Time": 11.36821899190545} +{"Pretrain/Learning Rate": 4.951496250545446e-05, "Pretrain/Loss": 2.1602048873901367, "Pretrain/Loss (Raw)": 2.2548513412475586, "Pretrain/Step": 867, "Pretrain/Step Time": 11.35119622759521} +{"Pretrain/Learning Rate": 4.951329684760835e-05, "Pretrain/Loss": 2.160203218460083, "Pretrain/Loss (Raw)": 2.060838222503662, "Pretrain/Step": 868, "Pretrain/Step Time": 11.359961649402976} +{"Pretrain/Learning Rate": 4.951162836277332e-05, "Pretrain/Loss": 2.1616969108581543, "Pretrain/Loss (Raw)": 2.2186455726623535, "Pretrain/Step": 869, "Pretrain/Step Time": 11.296163780614734} +{"Pretrain/Learning Rate": 4.950995705114182e-05, "Pretrain/Loss": 2.160243511199951, "Pretrain/Loss (Raw)": 2.3115923404693604, "Pretrain/Step": 870, "Pretrain/Step Time": 11.343080163002014} +{"Pretrain/Learning Rate": 4.950828291290656e-05, "Pretrain/Loss": 2.16115665435791, "Pretrain/Loss (Raw)": 2.2641711235046387, "Pretrain/Step": 871, "Pretrain/Step Time": 11.321405598893762} +{"Pretrain/Learning Rate": 4.950660594826064e-05, "Pretrain/Loss": 2.158555030822754, "Pretrain/Loss (Raw)": 1.8937519788742065, "Pretrain/Step": 872, "Pretrain/Step Time": 11.330992003902793} +{"Pretrain/Learning Rate": 4.9504926157397436e-05, "Pretrain/Loss": 2.1573972702026367, "Pretrain/Loss (Raw)": 2.133284568786621, "Pretrain/Step": 873, "Pretrain/Step Time": 11.2823739759624} +{"Pretrain/Learning Rate": 4.950324354051068e-05, "Pretrain/Loss": 2.156250476837158, "Pretrain/Loss (Raw)": 2.136294364929199, "Pretrain/Step": 874, "Pretrain/Step Time": 11.331146655604243} +{"Pretrain/Learning Rate": 4.950155809779442e-05, "Pretrain/Loss": 2.1570534706115723, "Pretrain/Loss (Raw)": 2.4215188026428223, "Pretrain/Step": 875, "Pretrain/Step Time": 11.335905687883496} +{"Pretrain/Learning Rate": 4.9499869829443026e-05, "Pretrain/Loss": 2.156315565109253, "Pretrain/Loss (Raw)": 1.9529813528060913, "Pretrain/Step": 876, "Pretrain/Step Time": 11.405613427981734} +{"Pretrain/Learning Rate": 4.9498178735651184e-05, "Pretrain/Loss": 2.155695915222168, "Pretrain/Loss (Raw)": 2.1906473636627197, "Pretrain/Step": 877, "Pretrain/Step Time": 11.405025318264961} +{"Pretrain/Learning Rate": 4.949648481661394e-05, "Pretrain/Loss": 2.15877628326416, "Pretrain/Loss (Raw)": 2.278681516647339, "Pretrain/Step": 878, "Pretrain/Step Time": 11.472520330920815} +{"Pretrain/Learning Rate": 4.949478807252663e-05, "Pretrain/Loss": 2.160033702850342, "Pretrain/Loss (Raw)": 2.3717586994171143, "Pretrain/Step": 879, "Pretrain/Step Time": 11.37676803022623} +{"Pretrain/Learning Rate": 4.949308850358494e-05, "Pretrain/Loss": 2.158320903778076, "Pretrain/Loss (Raw)": 1.9089409112930298, "Pretrain/Step": 880, "Pretrain/Step Time": 11.395233234390616} +{"Pretrain/Learning Rate": 4.949138610998487e-05, "Pretrain/Loss": 2.1597561836242676, "Pretrain/Loss (Raw)": 2.3230698108673096, "Pretrain/Step": 881, "Pretrain/Step Time": 11.328648019582033} +{"Pretrain/Learning Rate": 4.9489680891922746e-05, "Pretrain/Loss": 2.159914016723633, "Pretrain/Loss (Raw)": 2.179896831512451, "Pretrain/Step": 882, "Pretrain/Step Time": 11.402980756014585} +{"Pretrain/Learning Rate": 4.948797284959522e-05, "Pretrain/Loss": 2.1610162258148193, "Pretrain/Loss (Raw)": 2.332131862640381, "Pretrain/Step": 883, "Pretrain/Step Time": 11.387728342786431} +{"Pretrain/Learning Rate": 4.948626198319928e-05, "Pretrain/Loss": 2.161658763885498, "Pretrain/Loss (Raw)": 2.2194268703460693, "Pretrain/Step": 884, "Pretrain/Step Time": 11.401524698361754} +{"Pretrain/Learning Rate": 4.948454829293222e-05, "Pretrain/Loss": 2.1581664085388184, "Pretrain/Loss (Raw)": 2.172680139541626, "Pretrain/Step": 885, "Pretrain/Step Time": 11.468704462051392} +{"Pretrain/Learning Rate": 4.9482831778991676e-05, "Pretrain/Loss": 2.1590631008148193, "Pretrain/Loss (Raw)": 2.058424949645996, "Pretrain/Step": 886, "Pretrain/Step Time": 11.468140561133623} +{"Pretrain/Learning Rate": 4.9481112441575605e-05, "Pretrain/Loss": 2.157693862915039, "Pretrain/Loss (Raw)": 2.032521963119507, "Pretrain/Step": 887, "Pretrain/Step Time": 11.447063805535436} +{"Pretrain/Learning Rate": 4.947939028088229e-05, "Pretrain/Loss": 2.160569667816162, "Pretrain/Loss (Raw)": 2.223949432373047, "Pretrain/Step": 888, "Pretrain/Step Time": 11.4478893391788} +{"Pretrain/Learning Rate": 4.947766529711033e-05, "Pretrain/Loss": 2.1627297401428223, "Pretrain/Loss (Raw)": 2.2744319438934326, "Pretrain/Step": 889, "Pretrain/Step Time": 11.520480027422309} +{"Pretrain/Learning Rate": 4.947593749045867e-05, "Pretrain/Loss": 2.164653778076172, "Pretrain/Loss (Raw)": 2.498713731765747, "Pretrain/Step": 890, "Pretrain/Step Time": 11.51132544502616} +{"Pretrain/Learning Rate": 4.947420686112657e-05, "Pretrain/Loss": 2.1648142337799072, "Pretrain/Loss (Raw)": 2.096057891845703, "Pretrain/Step": 891, "Pretrain/Step Time": 11.547523302957416} +{"Pretrain/Learning Rate": 4.9472473409313605e-05, "Pretrain/Loss": 2.1634716987609863, "Pretrain/Loss (Raw)": 1.9708540439605713, "Pretrain/Step": 892, "Pretrain/Step Time": 11.557564361020923} +{"Pretrain/Learning Rate": 4.947073713521968e-05, "Pretrain/Loss": 2.1640419960021973, "Pretrain/Loss (Raw)": 2.192200183868408, "Pretrain/Step": 893, "Pretrain/Step Time": 11.526238340884447} +{"Pretrain/Learning Rate": 4.9468998039045046e-05, "Pretrain/Loss": 2.1648011207580566, "Pretrain/Loss (Raw)": 2.1607232093811035, "Pretrain/Step": 894, "Pretrain/Step Time": 11.522794181481004} +{"Pretrain/Learning Rate": 4.946725612099026e-05, "Pretrain/Loss": 2.1688499450683594, "Pretrain/Loss (Raw)": 2.580045700073242, "Pretrain/Step": 895, "Pretrain/Step Time": 11.54447496496141} +{"Pretrain/Learning Rate": 4.9465511381256204e-05, "Pretrain/Loss": 2.1675069332122803, "Pretrain/Loss (Raw)": 2.1360056400299072, "Pretrain/Step": 896, "Pretrain/Step Time": 11.551685040816665} +{"Pretrain/Learning Rate": 4.946376382004408e-05, "Pretrain/Loss": 2.168062686920166, "Pretrain/Loss (Raw)": 2.295525550842285, "Pretrain/Step": 897, "Pretrain/Step Time": 11.515438847243786} +{"Pretrain/Learning Rate": 4.9462013437555446e-05, "Pretrain/Loss": 2.168776512145996, "Pretrain/Loss (Raw)": 2.2274329662323, "Pretrain/Step": 898, "Pretrain/Step Time": 11.527112634852529} +{"Pretrain/Learning Rate": 4.946026023399215e-05, "Pretrain/Loss": 2.1671690940856934, "Pretrain/Loss (Raw)": 2.2395811080932617, "Pretrain/Step": 899, "Pretrain/Step Time": 11.49787400662899} +{"Pretrain/Learning Rate": 4.9458504209556377e-05, "Pretrain/Loss": 2.1667635440826416, "Pretrain/Loss (Raw)": 2.06890869140625, "Pretrain/Step": 900, "Pretrain/Step Time": 11.493399837985635} +{"Pretrain/Learning Rate": 4.945674536445065e-05, "Pretrain/Loss": 2.167078971862793, "Pretrain/Loss (Raw)": 2.1535017490386963, "Pretrain/Step": 901, "Pretrain/Step Time": 11.50719072110951} +{"Pretrain/Learning Rate": 4.945498369887781e-05, "Pretrain/Loss": 2.166635751724243, "Pretrain/Loss (Raw)": 2.0976195335388184, "Pretrain/Step": 902, "Pretrain/Step Time": 11.4926494397223} +{"Pretrain/Learning Rate": 4.945321921304101e-05, "Pretrain/Loss": 2.16654109954834, "Pretrain/Loss (Raw)": 2.1340088844299316, "Pretrain/Step": 903, "Pretrain/Step Time": 11.449323089793324} +{"Pretrain/Learning Rate": 4.945145190714374e-05, "Pretrain/Loss": 2.1660799980163574, "Pretrain/Loss (Raw)": 2.0573275089263916, "Pretrain/Step": 904, "Pretrain/Step Time": 11.502996776252985} +{"Pretrain/Learning Rate": 4.944968178138982e-05, "Pretrain/Loss": 2.1655921936035156, "Pretrain/Loss (Raw)": 2.142787456512451, "Pretrain/Step": 905, "Pretrain/Step Time": 11.471732193604112} +{"Pretrain/Learning Rate": 4.944790883598339e-05, "Pretrain/Loss": 2.1664228439331055, "Pretrain/Loss (Raw)": 2.1061248779296875, "Pretrain/Step": 906, "Pretrain/Step Time": 11.503304803743958} +{"Pretrain/Learning Rate": 4.9446133071128905e-05, "Pretrain/Loss": 2.1661462783813477, "Pretrain/Loss (Raw)": 2.154008150100708, "Pretrain/Step": 907, "Pretrain/Step Time": 11.49698456004262} +{"Pretrain/Learning Rate": 4.944435448703116e-05, "Pretrain/Loss": 2.166581630706787, "Pretrain/Loss (Raw)": 2.1703109741210938, "Pretrain/Step": 908, "Pretrain/Step Time": 11.514261035248637} +{"Pretrain/Learning Rate": 4.944257308389528e-05, "Pretrain/Loss": 2.1670942306518555, "Pretrain/Loss (Raw)": 2.199073314666748, "Pretrain/Step": 909, "Pretrain/Step Time": 11.501403409987688} +{"Pretrain/Learning Rate": 4.944078886192668e-05, "Pretrain/Loss": 2.166095733642578, "Pretrain/Loss (Raw)": 2.202731132507324, "Pretrain/Step": 910, "Pretrain/Step Time": 11.521635245531797} +{"Pretrain/Learning Rate": 4.943900182133116e-05, "Pretrain/Loss": 2.1658682823181152, "Pretrain/Loss (Raw)": 2.0695183277130127, "Pretrain/Step": 911, "Pretrain/Step Time": 11.533115863800049} +{"Pretrain/Learning Rate": 4.943721196231477e-05, "Pretrain/Loss": 2.1662473678588867, "Pretrain/Loss (Raw)": 2.190859794616699, "Pretrain/Step": 912, "Pretrain/Step Time": 11.500009281560779} +{"Pretrain/Learning Rate": 4.943541928508395e-05, "Pretrain/Loss": 2.16646146774292, "Pretrain/Loss (Raw)": 2.1247920989990234, "Pretrain/Step": 913, "Pretrain/Step Time": 11.502805575728416} +{"Pretrain/Learning Rate": 4.9433623789845426e-05, "Pretrain/Loss": 2.16050386428833, "Pretrain/Loss (Raw)": 1.5892032384872437, "Pretrain/Step": 914, "Pretrain/Step Time": 11.440893108025193} +{"Pretrain/Learning Rate": 4.943182547680629e-05, "Pretrain/Loss": 2.1592211723327637, "Pretrain/Loss (Raw)": 2.036428451538086, "Pretrain/Step": 915, "Pretrain/Step Time": 11.465832613408566} +{"Pretrain/Learning Rate": 4.94300243461739e-05, "Pretrain/Loss": 2.159606695175171, "Pretrain/Loss (Raw)": 2.199652671813965, "Pretrain/Step": 916, "Pretrain/Step Time": 11.450279844924808} +{"Pretrain/Learning Rate": 4.9428220398155986e-05, "Pretrain/Loss": 2.1586434841156006, "Pretrain/Loss (Raw)": 2.1359593868255615, "Pretrain/Step": 917, "Pretrain/Step Time": 11.50797601789236} +{"Pretrain/Learning Rate": 4.94264136329606e-05, "Pretrain/Loss": 2.1595072746276855, "Pretrain/Loss (Raw)": 2.1739180088043213, "Pretrain/Step": 918, "Pretrain/Step Time": 11.507057312875986} +{"Pretrain/Learning Rate": 4.942460405079608e-05, "Pretrain/Loss": 2.1580593585968018, "Pretrain/Loss (Raw)": 2.0532658100128174, "Pretrain/Step": 919, "Pretrain/Step Time": 11.517215229570866} +{"Pretrain/Learning Rate": 4.942279165187113e-05, "Pretrain/Loss": 2.156151294708252, "Pretrain/Loss (Raw)": 1.9791488647460938, "Pretrain/Step": 920, "Pretrain/Step Time": 11.456083921715617} +{"Pretrain/Learning Rate": 4.9420976436394764e-05, "Pretrain/Loss": 2.1545462608337402, "Pretrain/Loss (Raw)": 2.0804176330566406, "Pretrain/Step": 921, "Pretrain/Step Time": 11.516041740775108} +{"Pretrain/Learning Rate": 4.941915840457632e-05, "Pretrain/Loss": 2.152021884918213, "Pretrain/Loss (Raw)": 2.1122052669525146, "Pretrain/Step": 922, "Pretrain/Step Time": 11.458130937069654} +{"Pretrain/Learning Rate": 4.941733755662545e-05, "Pretrain/Loss": 2.151962995529175, "Pretrain/Loss (Raw)": 2.214062213897705, "Pretrain/Step": 923, "Pretrain/Step Time": 11.482722859829664} +{"Pretrain/Learning Rate": 4.941551389275217e-05, "Pretrain/Loss": 2.1534488201141357, "Pretrain/Loss (Raw)": 2.244983673095703, "Pretrain/Step": 924, "Pretrain/Step Time": 11.454488411545753} +{"Pretrain/Learning Rate": 4.9413687413166777e-05, "Pretrain/Loss": 2.1533806324005127, "Pretrain/Loss (Raw)": 2.207275152206421, "Pretrain/Step": 925, "Pretrain/Step Time": 11.485851556062698} +{"Pretrain/Learning Rate": 4.94118581180799e-05, "Pretrain/Loss": 2.1537423133850098, "Pretrain/Loss (Raw)": 2.208563804626465, "Pretrain/Step": 926, "Pretrain/Step Time": 11.477589946240187} +{"Pretrain/Learning Rate": 4.9410026007702525e-05, "Pretrain/Loss": 2.155930757522583, "Pretrain/Loss (Raw)": 2.070749282836914, "Pretrain/Step": 927, "Pretrain/Step Time": 11.50396808795631} +{"Pretrain/Learning Rate": 4.940819108224592e-05, "Pretrain/Loss": 2.155768394470215, "Pretrain/Loss (Raw)": 2.174877166748047, "Pretrain/Step": 928, "Pretrain/Step Time": 11.514109620824456} +{"Pretrain/Learning Rate": 4.940635334192171e-05, "Pretrain/Loss": 2.1547842025756836, "Pretrain/Loss (Raw)": 2.0283498764038086, "Pretrain/Step": 929, "Pretrain/Step Time": 11.514211351051927} +{"Pretrain/Learning Rate": 4.940451278694181e-05, "Pretrain/Loss": 2.154949903488159, "Pretrain/Loss (Raw)": 2.1714444160461426, "Pretrain/Step": 930, "Pretrain/Step Time": 11.52487663924694} +{"Pretrain/Learning Rate": 4.9402669417518514e-05, "Pretrain/Loss": 2.1534934043884277, "Pretrain/Loss (Raw)": 1.8981269598007202, "Pretrain/Step": 931, "Pretrain/Step Time": 11.553369944915175} +{"Pretrain/Learning Rate": 4.940082323386439e-05, "Pretrain/Loss": 2.1539711952209473, "Pretrain/Loss (Raw)": 2.037893533706665, "Pretrain/Step": 932, "Pretrain/Step Time": 11.582969458773732} +{"Pretrain/Learning Rate": 4.939897423619234e-05, "Pretrain/Loss": 2.155709743499756, "Pretrain/Loss (Raw)": 2.197211265563965, "Pretrain/Step": 933, "Pretrain/Step Time": 11.621521012857556} +{"Pretrain/Learning Rate": 4.9397122424715624e-05, "Pretrain/Loss": 2.156749725341797, "Pretrain/Loss (Raw)": 2.337341070175171, "Pretrain/Step": 934, "Pretrain/Step Time": 11.640806470066309} +{"Pretrain/Learning Rate": 4.939526779964778e-05, "Pretrain/Loss": 2.154507637023926, "Pretrain/Loss (Raw)": 1.8710646629333496, "Pretrain/Step": 935, "Pretrain/Step Time": 11.639976765960455} +{"Pretrain/Learning Rate": 4.9393410361202694e-05, "Pretrain/Loss": 2.152920961380005, "Pretrain/Loss (Raw)": 2.1065287590026855, "Pretrain/Step": 936, "Pretrain/Step Time": 11.65726251155138} +{"Pretrain/Learning Rate": 4.9391550109594584e-05, "Pretrain/Loss": 2.1508069038391113, "Pretrain/Loss (Raw)": 2.020007610321045, "Pretrain/Step": 937, "Pretrain/Step Time": 11.666045671328902} +{"Pretrain/Learning Rate": 4.938968704503798e-05, "Pretrain/Loss": 2.150662660598755, "Pretrain/Loss (Raw)": 2.1046531200408936, "Pretrain/Step": 938, "Pretrain/Step Time": 11.629994245246053} +{"Pretrain/Learning Rate": 4.938782116774774e-05, "Pretrain/Loss": 2.1504392623901367, "Pretrain/Loss (Raw)": 2.0489096641540527, "Pretrain/Step": 939, "Pretrain/Step Time": 11.652648130431771} +{"Pretrain/Learning Rate": 4.938595247793903e-05, "Pretrain/Loss": 2.1502256393432617, "Pretrain/Loss (Raw)": 2.1063191890716553, "Pretrain/Step": 940, "Pretrain/Step Time": 11.61892037652433} +{"Pretrain/Learning Rate": 4.938408097582738e-05, "Pretrain/Loss": 2.1499862670898438, "Pretrain/Loss (Raw)": 2.117253541946411, "Pretrain/Step": 941, "Pretrain/Step Time": 11.701767379418015} +{"Pretrain/Learning Rate": 4.9382206661628615e-05, "Pretrain/Loss": 2.150712013244629, "Pretrain/Loss (Raw)": 2.203265905380249, "Pretrain/Step": 942, "Pretrain/Step Time": 11.673040384426713} +{"Pretrain/Learning Rate": 4.9380329535558887e-05, "Pretrain/Loss": 2.1493337154388428, "Pretrain/Loss (Raw)": 2.192004680633545, "Pretrain/Step": 943, "Pretrain/Step Time": 11.737786076962948} +{"Pretrain/Learning Rate": 4.9378449597834664e-05, "Pretrain/Loss": 2.1502816677093506, "Pretrain/Loss (Raw)": 2.2815423011779785, "Pretrain/Step": 944, "Pretrain/Step Time": 11.689962588250637} +{"Pretrain/Learning Rate": 4.937656684867276e-05, "Pretrain/Loss": 2.150994062423706, "Pretrain/Loss (Raw)": 2.320929527282715, "Pretrain/Step": 945, "Pretrain/Step Time": 11.722267096862197} +{"Pretrain/Learning Rate": 4.93746812882903e-05, "Pretrain/Loss": 2.1510353088378906, "Pretrain/Loss (Raw)": 2.1967194080352783, "Pretrain/Step": 946, "Pretrain/Step Time": 11.67697255127132} +{"Pretrain/Learning Rate": 4.937279291690474e-05, "Pretrain/Loss": 2.1515583992004395, "Pretrain/Loss (Raw)": 2.1615278720855713, "Pretrain/Step": 947, "Pretrain/Step Time": 11.727751227095723} +{"Pretrain/Learning Rate": 4.9370901734733856e-05, "Pretrain/Loss": 2.149914264678955, "Pretrain/Loss (Raw)": 2.0073626041412354, "Pretrain/Step": 948, "Pretrain/Step Time": 11.619897957891226} +{"Pretrain/Learning Rate": 4.936900774199573e-05, "Pretrain/Loss": 2.1491527557373047, "Pretrain/Loss (Raw)": 2.0377111434936523, "Pretrain/Step": 949, "Pretrain/Step Time": 11.61652634292841} +{"Pretrain/Learning Rate": 4.936711093890881e-05, "Pretrain/Loss": 2.1488428115844727, "Pretrain/Loss (Raw)": 2.182504653930664, "Pretrain/Step": 950, "Pretrain/Step Time": 11.625925937667489} +{"Pretrain/Learning Rate": 4.936521132569184e-05, "Pretrain/Loss": 2.1485767364501953, "Pretrain/Loss (Raw)": 2.0872185230255127, "Pretrain/Step": 951, "Pretrain/Step Time": 11.624826801940799} +{"Pretrain/Learning Rate": 4.936330890256388e-05, "Pretrain/Loss": 2.148900270462036, "Pretrain/Loss (Raw)": 2.187730312347412, "Pretrain/Step": 952, "Pretrain/Step Time": 11.664054546505213} +{"Pretrain/Learning Rate": 4.9361403669744336e-05, "Pretrain/Loss": 2.1484649181365967, "Pretrain/Loss (Raw)": 2.1239585876464844, "Pretrain/Step": 953, "Pretrain/Step Time": 11.670500317588449} +{"Pretrain/Learning Rate": 4.935949562745293e-05, "Pretrain/Loss": 2.1486377716064453, "Pretrain/Loss (Raw)": 2.168586492538452, "Pretrain/Step": 954, "Pretrain/Step Time": 11.730663368478417} +{"Pretrain/Learning Rate": 4.93575847759097e-05, "Pretrain/Loss": 2.147125244140625, "Pretrain/Loss (Raw)": 1.9143836498260498, "Pretrain/Step": 955, "Pretrain/Step Time": 11.730253759771585} +{"Pretrain/Learning Rate": 4.9355671115335015e-05, "Pretrain/Loss": 2.146153450012207, "Pretrain/Loss (Raw)": 2.045050621032715, "Pretrain/Step": 956, "Pretrain/Step Time": 11.740043284371495} +{"Pretrain/Learning Rate": 4.935375464594957e-05, "Pretrain/Loss": 2.1466410160064697, "Pretrain/Loss (Raw)": 2.2773053646087646, "Pretrain/Step": 957, "Pretrain/Step Time": 11.685894886031747} +{"Pretrain/Learning Rate": 4.9351835367974375e-05, "Pretrain/Loss": 2.1464130878448486, "Pretrain/Loss (Raw)": 2.221158027648926, "Pretrain/Step": 958, "Pretrain/Step Time": 11.67956592515111} +{"Pretrain/Learning Rate": 4.9349913281630786e-05, "Pretrain/Loss": 2.146852970123291, "Pretrain/Loss (Raw)": 2.143723964691162, "Pretrain/Step": 959, "Pretrain/Step Time": 11.65796815045178} +{"Pretrain/Learning Rate": 4.934798838714045e-05, "Pretrain/Loss": 2.147517204284668, "Pretrain/Loss (Raw)": 2.281533718109131, "Pretrain/Step": 960, "Pretrain/Step Time": 11.644973697140813} +{"Pretrain/Learning Rate": 4.9346060684725364e-05, "Pretrain/Loss": 2.146946430206299, "Pretrain/Loss (Raw)": 2.162999391555786, "Pretrain/Step": 961, "Pretrain/Step Time": 11.634060122072697} +{"Pretrain/Learning Rate": 4.934413017460784e-05, "Pretrain/Loss": 2.1415605545043945, "Pretrain/Loss (Raw)": 1.9950250387191772, "Pretrain/Step": 962, "Pretrain/Step Time": 11.646084817126393} +{"Pretrain/Learning Rate": 4.93421968570105e-05, "Pretrain/Loss": 2.142571449279785, "Pretrain/Loss (Raw)": 2.195787191390991, "Pretrain/Step": 963, "Pretrain/Step Time": 11.614881480112672} +{"Pretrain/Learning Rate": 4.934026073215633e-05, "Pretrain/Loss": 2.1424903869628906, "Pretrain/Loss (Raw)": 2.113807439804077, "Pretrain/Step": 964, "Pretrain/Step Time": 11.691224124282598} +{"Pretrain/Learning Rate": 4.933832180026858e-05, "Pretrain/Loss": 2.1425797939300537, "Pretrain/Loss (Raw)": 2.1633241176605225, "Pretrain/Step": 965, "Pretrain/Step Time": 11.599533380940557} +{"Pretrain/Learning Rate": 4.933638006157089e-05, "Pretrain/Loss": 2.1431028842926025, "Pretrain/Loss (Raw)": 2.2300827503204346, "Pretrain/Step": 966, "Pretrain/Step Time": 11.596722796559334} +{"Pretrain/Learning Rate": 4.933443551628717e-05, "Pretrain/Loss": 2.1433470249176025, "Pretrain/Loss (Raw)": 2.169267177581787, "Pretrain/Step": 967, "Pretrain/Step Time": 11.55373035557568} +{"Pretrain/Learning Rate": 4.933248816464168e-05, "Pretrain/Loss": 2.1424179077148438, "Pretrain/Loss (Raw)": 2.1294658184051514, "Pretrain/Step": 968, "Pretrain/Step Time": 11.574041847139597} +{"Pretrain/Learning Rate": 4.933053800685899e-05, "Pretrain/Loss": 2.143674373626709, "Pretrain/Loss (Raw)": 2.210380792617798, "Pretrain/Step": 969, "Pretrain/Step Time": 11.584981996566057} +{"Pretrain/Learning Rate": 4.932858504316401e-05, "Pretrain/Loss": 2.143294334411621, "Pretrain/Loss (Raw)": 2.042266368865967, "Pretrain/Step": 970, "Pretrain/Step Time": 11.649132054299116} +{"Pretrain/Learning Rate": 4.932662927378196e-05, "Pretrain/Loss": 2.1443333625793457, "Pretrain/Loss (Raw)": 2.1601319313049316, "Pretrain/Step": 971, "Pretrain/Step Time": 11.650272214785218} +{"Pretrain/Learning Rate": 4.93246706989384e-05, "Pretrain/Loss": 2.1469995975494385, "Pretrain/Loss (Raw)": 2.175734043121338, "Pretrain/Step": 972, "Pretrain/Step Time": 11.692134333774447} +{"Pretrain/Learning Rate": 4.932270931885918e-05, "Pretrain/Loss": 2.1421093940734863, "Pretrain/Loss (Raw)": 1.8152803182601929, "Pretrain/Step": 973, "Pretrain/Step Time": 11.688167048618197} +{"Pretrain/Learning Rate": 4.9320745133770524e-05, "Pretrain/Loss": 2.140983819961548, "Pretrain/Loss (Raw)": 2.046718120574951, "Pretrain/Step": 974, "Pretrain/Step Time": 11.738445008173585} +{"Pretrain/Learning Rate": 4.931877814389893e-05, "Pretrain/Loss": 2.141274929046631, "Pretrain/Loss (Raw)": 1.9967947006225586, "Pretrain/Step": 975, "Pretrain/Step Time": 11.679100964218378} +{"Pretrain/Learning Rate": 4.931680834947124e-05, "Pretrain/Loss": 2.141968250274658, "Pretrain/Loss (Raw)": 2.2952659130096436, "Pretrain/Step": 976, "Pretrain/Step Time": 11.678907161578536} +{"Pretrain/Learning Rate": 4.9314835750714635e-05, "Pretrain/Loss": 2.1414318084716797, "Pretrain/Loss (Raw)": 2.0606296062469482, "Pretrain/Step": 977, "Pretrain/Step Time": 11.596335565671325} +{"Pretrain/Learning Rate": 4.9312860347856595e-05, "Pretrain/Loss": 2.1384994983673096, "Pretrain/Loss (Raw)": 2.038564682006836, "Pretrain/Step": 978, "Pretrain/Step Time": 11.652116183191538} +{"Pretrain/Learning Rate": 4.931088214112494e-05, "Pretrain/Loss": 2.1385388374328613, "Pretrain/Loss (Raw)": 2.1027581691741943, "Pretrain/Step": 979, "Pretrain/Step Time": 11.62788218446076} +{"Pretrain/Learning Rate": 4.930890113074779e-05, "Pretrain/Loss": 2.1390466690063477, "Pretrain/Loss (Raw)": 2.138653516769409, "Pretrain/Step": 980, "Pretrain/Step Time": 11.679357135668397} +{"Pretrain/Learning Rate": 4.930691731695362e-05, "Pretrain/Loss": 2.1401424407958984, "Pretrain/Loss (Raw)": 2.198669910430908, "Pretrain/Step": 981, "Pretrain/Step Time": 11.626090977340937} +{"Pretrain/Learning Rate": 4.9304930699971194e-05, "Pretrain/Loss": 2.139573574066162, "Pretrain/Loss (Raw)": 2.010457754135132, "Pretrain/Step": 982, "Pretrain/Step Time": 11.627031920477748} +{"Pretrain/Learning Rate": 4.9302941280029645e-05, "Pretrain/Loss": 2.1395015716552734, "Pretrain/Loss (Raw)": 2.1429288387298584, "Pretrain/Step": 983, "Pretrain/Step Time": 11.580041542649269} +{"Pretrain/Learning Rate": 4.930094905735838e-05, "Pretrain/Loss": 2.140035629272461, "Pretrain/Loss (Raw)": 2.1433680057525635, "Pretrain/Step": 984, "Pretrain/Step Time": 11.672177286818624} +{"Pretrain/Learning Rate": 4.929895403218717e-05, "Pretrain/Loss": 2.137917995452881, "Pretrain/Loss (Raw)": 1.8426276445388794, "Pretrain/Step": 985, "Pretrain/Step Time": 11.603371679782867} +{"Pretrain/Learning Rate": 4.929695620474607e-05, "Pretrain/Loss": 2.1381804943084717, "Pretrain/Loss (Raw)": 2.0217697620391846, "Pretrain/Step": 986, "Pretrain/Step Time": 11.638408767059445} +{"Pretrain/Learning Rate": 4.9294955575265494e-05, "Pretrain/Loss": 2.1385042667388916, "Pretrain/Loss (Raw)": 2.1098756790161133, "Pretrain/Step": 987, "Pretrain/Step Time": 11.636183630675077} +{"Pretrain/Learning Rate": 4.929295214397616e-05, "Pretrain/Loss": 2.138762950897217, "Pretrain/Loss (Raw)": 2.0593526363372803, "Pretrain/Step": 988, "Pretrain/Step Time": 11.613118063658476} +{"Pretrain/Learning Rate": 4.929094591110911e-05, "Pretrain/Loss": 2.1398215293884277, "Pretrain/Loss (Raw)": 2.1423163414001465, "Pretrain/Step": 989, "Pretrain/Step Time": 11.588036132976413} +{"Pretrain/Learning Rate": 4.928893687689572e-05, "Pretrain/Loss": 2.1387100219726562, "Pretrain/Loss (Raw)": 2.0750293731689453, "Pretrain/Step": 990, "Pretrain/Step Time": 11.58285547979176} +{"Pretrain/Learning Rate": 4.928692504156767e-05, "Pretrain/Loss": 2.137911319732666, "Pretrain/Loss (Raw)": 2.0863003730773926, "Pretrain/Step": 991, "Pretrain/Step Time": 11.505365880206227} +{"Pretrain/Learning Rate": 4.928491040535699e-05, "Pretrain/Loss": 2.1374831199645996, "Pretrain/Loss (Raw)": 2.1361799240112305, "Pretrain/Step": 992, "Pretrain/Step Time": 11.512920057401061} +{"Pretrain/Learning Rate": 4.9282892968495995e-05, "Pretrain/Loss": 2.138500452041626, "Pretrain/Loss (Raw)": 2.201704502105713, "Pretrain/Step": 993, "Pretrain/Step Time": 11.531793048605323} +{"Pretrain/Learning Rate": 4.928087273121737e-05, "Pretrain/Loss": 2.136718511581421, "Pretrain/Loss (Raw)": 2.0431995391845703, "Pretrain/Step": 994, "Pretrain/Step Time": 11.610900774598122} +{"Pretrain/Learning Rate": 4.9278849693754076e-05, "Pretrain/Loss": 2.1359004974365234, "Pretrain/Loss (Raw)": 2.150165319442749, "Pretrain/Step": 995, "Pretrain/Step Time": 11.595967905595899} +{"Pretrain/Learning Rate": 4.927682385633944e-05, "Pretrain/Loss": 2.1368348598480225, "Pretrain/Loss (Raw)": 2.1804115772247314, "Pretrain/Step": 996, "Pretrain/Step Time": 11.609564181417227} +{"Pretrain/Learning Rate": 4.927479521920707e-05, "Pretrain/Loss": 2.1357665061950684, "Pretrain/Loss (Raw)": 2.0819242000579834, "Pretrain/Step": 997, "Pretrain/Step Time": 11.600578648969531} +{"Pretrain/Learning Rate": 4.927276378259094e-05, "Pretrain/Loss": 2.134481430053711, "Pretrain/Loss (Raw)": 2.1470859050750732, "Pretrain/Step": 998, "Pretrain/Step Time": 11.567618530243635} +{"Pretrain/Learning Rate": 4.9270729546725305e-05, "Pretrain/Loss": 2.1317903995513916, "Pretrain/Loss (Raw)": 1.9197207689285278, "Pretrain/Step": 999, "Pretrain/Step Time": 11.594323126599193} +{"Pretrain/Learning Rate": 4.9268692511844774e-05, "Pretrain/Loss": 2.133864402770996, "Pretrain/Loss (Raw)": 2.159238338470459, "Pretrain/Step": 1000, "Pretrain/Step Time": 11.623583754524589} +{"Pretrain/Learning Rate": 4.926665267818426e-05, "Pretrain/Loss": 2.133821964263916, "Pretrain/Loss (Raw)": 2.127819299697876, "Pretrain/Step": 1001, "Pretrain/Step Time": 11.607205433771014} +{"Pretrain/Learning Rate": 4.926461004597901e-05, "Pretrain/Loss": 2.134202480316162, "Pretrain/Loss (Raw)": 2.1850175857543945, "Pretrain/Step": 1002, "Pretrain/Step Time": 11.577265430241823} +{"Pretrain/Learning Rate": 4.92625646154646e-05, "Pretrain/Loss": 2.1306886672973633, "Pretrain/Loss (Raw)": 1.9717682600021362, "Pretrain/Step": 1003, "Pretrain/Step Time": 11.606362722814083} +{"Pretrain/Learning Rate": 4.926051638687691e-05, "Pretrain/Loss": 2.1317687034606934, "Pretrain/Loss (Raw)": 2.091238498687744, "Pretrain/Step": 1004, "Pretrain/Step Time": 11.54020837880671} +{"Pretrain/Learning Rate": 4.925846536045215e-05, "Pretrain/Loss": 2.1310291290283203, "Pretrain/Loss (Raw)": 2.095954656600952, "Pretrain/Step": 1005, "Pretrain/Step Time": 11.56207257695496} +{"Pretrain/Learning Rate": 4.925641153642684e-05, "Pretrain/Loss": 2.130467414855957, "Pretrain/Loss (Raw)": 2.2067816257476807, "Pretrain/Step": 1006, "Pretrain/Step Time": 11.496063129976392} +{"Pretrain/Learning Rate": 4.925435491503787e-05, "Pretrain/Loss": 2.1288645267486572, "Pretrain/Loss (Raw)": 2.1666033267974854, "Pretrain/Step": 1007, "Pretrain/Step Time": 11.51949936710298} +{"Pretrain/Learning Rate": 4.9252295496522395e-05, "Pretrain/Loss": 2.1310367584228516, "Pretrain/Loss (Raw)": 2.186974287033081, "Pretrain/Step": 1008, "Pretrain/Step Time": 11.50384820252657} +{"Pretrain/Learning Rate": 4.925023328111792e-05, "Pretrain/Loss": 2.1281027793884277, "Pretrain/Loss (Raw)": 1.9475115537643433, "Pretrain/Step": 1009, "Pretrain/Step Time": 11.556176573038101} +{"Pretrain/Learning Rate": 4.924816826906227e-05, "Pretrain/Loss": 2.1279802322387695, "Pretrain/Loss (Raw)": 2.1641945838928223, "Pretrain/Step": 1010, "Pretrain/Step Time": 11.481457037851214} +{"Pretrain/Learning Rate": 4.92461004605936e-05, "Pretrain/Loss": 2.1255083084106445, "Pretrain/Loss (Raw)": 2.015748977661133, "Pretrain/Step": 1011, "Pretrain/Step Time": 11.506527479737997} +{"Pretrain/Learning Rate": 4.924402985595037e-05, "Pretrain/Loss": 2.124682903289795, "Pretrain/Loss (Raw)": 2.1137948036193848, "Pretrain/Step": 1012, "Pretrain/Step Time": 11.491366252303123} +{"Pretrain/Learning Rate": 4.924195645537138e-05, "Pretrain/Loss": 2.1242291927337646, "Pretrain/Loss (Raw)": 2.114586353302002, "Pretrain/Step": 1013, "Pretrain/Step Time": 11.415467374026775} +{"Pretrain/Learning Rate": 4.923988025909574e-05, "Pretrain/Loss": 2.1246819496154785, "Pretrain/Loss (Raw)": 2.1164052486419678, "Pretrain/Step": 1014, "Pretrain/Step Time": 11.416191726922989} +{"Pretrain/Learning Rate": 4.923780126736288e-05, "Pretrain/Loss": 2.1263389587402344, "Pretrain/Loss (Raw)": 2.2445907592773438, "Pretrain/Step": 1015, "Pretrain/Step Time": 11.435694992542267} +{"Pretrain/Learning Rate": 4.923571948041257e-05, "Pretrain/Loss": 2.1249256134033203, "Pretrain/Loss (Raw)": 2.0430593490600586, "Pretrain/Step": 1016, "Pretrain/Step Time": 11.43596020154655} +{"Pretrain/Learning Rate": 4.923363489848489e-05, "Pretrain/Loss": 2.120917797088623, "Pretrain/Loss (Raw)": 1.7614072561264038, "Pretrain/Step": 1017, "Pretrain/Step Time": 11.402707746252418} +{"Pretrain/Learning Rate": 4.923154752182023e-05, "Pretrain/Loss": 2.1192147731781006, "Pretrain/Loss (Raw)": 2.280751943588257, "Pretrain/Step": 1018, "Pretrain/Step Time": 11.40113709680736} +{"Pretrain/Learning Rate": 4.922945735065934e-05, "Pretrain/Loss": 2.118075370788574, "Pretrain/Loss (Raw)": 1.9502042531967163, "Pretrain/Step": 1019, "Pretrain/Step Time": 11.378128807991743} +{"Pretrain/Learning Rate": 4.9227364385243246e-05, "Pretrain/Loss": 2.118701934814453, "Pretrain/Loss (Raw)": 2.0510504245758057, "Pretrain/Step": 1020, "Pretrain/Step Time": 11.372748106718063} +{"Pretrain/Learning Rate": 4.922526862581333e-05, "Pretrain/Loss": 2.1180219650268555, "Pretrain/Loss (Raw)": 2.1051533222198486, "Pretrain/Step": 1021, "Pretrain/Step Time": 11.36268037557602} +{"Pretrain/Learning Rate": 4.922317007261129e-05, "Pretrain/Loss": 2.117158889770508, "Pretrain/Loss (Raw)": 2.0502450466156006, "Pretrain/Step": 1022, "Pretrain/Step Time": 11.414151882752776} +{"Pretrain/Learning Rate": 4.922106872587913e-05, "Pretrain/Loss": 2.115201950073242, "Pretrain/Loss (Raw)": 2.329582929611206, "Pretrain/Step": 1023, "Pretrain/Step Time": 11.352603059262037} +{"Pretrain/Learning Rate": 4.921896458585919e-05, "Pretrain/Loss": 2.1142146587371826, "Pretrain/Loss (Raw)": 2.0096230506896973, "Pretrain/Step": 1024, "Pretrain/Step Time": 11.365791896358132} +{"Pretrain/Learning Rate": 4.9216857652794125e-05, "Pretrain/Loss": 2.113314151763916, "Pretrain/Loss (Raw)": 2.1802468299865723, "Pretrain/Step": 1025, "Pretrain/Step Time": 11.34399571083486} +{"Pretrain/Learning Rate": 4.921474792692692e-05, "Pretrain/Loss": 2.113499641418457, "Pretrain/Loss (Raw)": 2.251176595687866, "Pretrain/Step": 1026, "Pretrain/Step Time": 11.340424589812756} +{"Pretrain/Learning Rate": 4.921263540850089e-05, "Pretrain/Loss": 2.1120572090148926, "Pretrain/Loss (Raw)": 2.0549676418304443, "Pretrain/Step": 1027, "Pretrain/Step Time": 11.334998805075884} +{"Pretrain/Learning Rate": 4.921052009775965e-05, "Pretrain/Loss": 2.1126744747161865, "Pretrain/Loss (Raw)": 2.1479175090789795, "Pretrain/Step": 1028, "Pretrain/Step Time": 11.337897684425116} +{"Pretrain/Learning Rate": 4.9208401994947144e-05, "Pretrain/Loss": 2.1128063201904297, "Pretrain/Loss (Raw)": 2.1703600883483887, "Pretrain/Step": 1029, "Pretrain/Step Time": 11.331020193174481} +{"Pretrain/Learning Rate": 4.920628110030765e-05, "Pretrain/Loss": 2.113450527191162, "Pretrain/Loss (Raw)": 2.180098295211792, "Pretrain/Step": 1030, "Pretrain/Step Time": 11.322127824649215} +{"Pretrain/Learning Rate": 4.920415741408575e-05, "Pretrain/Loss": 2.113617420196533, "Pretrain/Loss (Raw)": 2.155397415161133, "Pretrain/Step": 1031, "Pretrain/Step Time": 11.319097850471735} +{"Pretrain/Learning Rate": 4.920203093652637e-05, "Pretrain/Loss": 2.113152503967285, "Pretrain/Loss (Raw)": 1.9978073835372925, "Pretrain/Step": 1032, "Pretrain/Step Time": 11.291629068553448} +{"Pretrain/Learning Rate": 4.919990166787474e-05, "Pretrain/Loss": 2.111931562423706, "Pretrain/Loss (Raw)": 1.986470341682434, "Pretrain/Step": 1033, "Pretrain/Step Time": 11.318697830662131} +{"Pretrain/Learning Rate": 4.919776960837641e-05, "Pretrain/Loss": 2.1117920875549316, "Pretrain/Loss (Raw)": 2.0882856845855713, "Pretrain/Step": 1034, "Pretrain/Step Time": 11.305781004950404} +{"Pretrain/Learning Rate": 4.9195634758277264e-05, "Pretrain/Loss": 2.1114397048950195, "Pretrain/Loss (Raw)": 2.108907461166382, "Pretrain/Step": 1035, "Pretrain/Step Time": 11.312973974272609} +{"Pretrain/Learning Rate": 4.919349711782351e-05, "Pretrain/Loss": 2.110260009765625, "Pretrain/Loss (Raw)": 2.019331932067871, "Pretrain/Step": 1036, "Pretrain/Step Time": 11.27375808916986} +{"Pretrain/Learning Rate": 4.919135668726167e-05, "Pretrain/Loss": 2.1091389656066895, "Pretrain/Loss (Raw)": 2.055565357208252, "Pretrain/Step": 1037, "Pretrain/Step Time": 11.317387543618679} +{"Pretrain/Learning Rate": 4.9189213466838565e-05, "Pretrain/Loss": 2.1086411476135254, "Pretrain/Loss (Raw)": 2.1390230655670166, "Pretrain/Step": 1038, "Pretrain/Step Time": 11.256885800510645} +{"Pretrain/Learning Rate": 4.91870674568014e-05, "Pretrain/Loss": 2.1093578338623047, "Pretrain/Loss (Raw)": 2.1612420082092285, "Pretrain/Step": 1039, "Pretrain/Step Time": 11.271521508693695} +{"Pretrain/Learning Rate": 4.9184918657397625e-05, "Pretrain/Loss": 2.109170436859131, "Pretrain/Loss (Raw)": 2.166844367980957, "Pretrain/Step": 1040, "Pretrain/Step Time": 11.253434823825955} +{"Pretrain/Learning Rate": 4.918276706887508e-05, "Pretrain/Loss": 2.10935115814209, "Pretrain/Loss (Raw)": 2.1479249000549316, "Pretrain/Step": 1041, "Pretrain/Step Time": 11.279940923675895} +{"Pretrain/Learning Rate": 4.918061269148187e-05, "Pretrain/Loss": 2.112461805343628, "Pretrain/Loss (Raw)": 1.987375259399414, "Pretrain/Step": 1042, "Pretrain/Step Time": 11.302431950345635} +{"Pretrain/Learning Rate": 4.9178455525466484e-05, "Pretrain/Loss": 2.113770008087158, "Pretrain/Loss (Raw)": 2.2038674354553223, "Pretrain/Step": 1043, "Pretrain/Step Time": 11.274469438940287} +{"Pretrain/Learning Rate": 4.9176295571077655e-05, "Pretrain/Loss": 2.1143808364868164, "Pretrain/Loss (Raw)": 2.277852773666382, "Pretrain/Step": 1044, "Pretrain/Step Time": 11.29887449555099} +{"Pretrain/Learning Rate": 4.917413282856451e-05, "Pretrain/Loss": 2.114189863204956, "Pretrain/Loss (Raw)": 2.111527442932129, "Pretrain/Step": 1045, "Pretrain/Step Time": 11.241520997136831} +{"Pretrain/Learning Rate": 4.917196729817645e-05, "Pretrain/Loss": 2.1154112815856934, "Pretrain/Loss (Raw)": 2.3302454948425293, "Pretrain/Step": 1046, "Pretrain/Step Time": 11.2506751883775} +{"Pretrain/Learning Rate": 4.9169798980163215e-05, "Pretrain/Loss": 2.1159818172454834, "Pretrain/Loss (Raw)": 2.12629771232605, "Pretrain/Step": 1047, "Pretrain/Step Time": 11.247807277366519} +{"Pretrain/Learning Rate": 4.916762787477487e-05, "Pretrain/Loss": 2.1175975799560547, "Pretrain/Loss (Raw)": 2.1859772205352783, "Pretrain/Step": 1048, "Pretrain/Step Time": 11.250251557677984} +{"Pretrain/Learning Rate": 4.91654539822618e-05, "Pretrain/Loss": 2.1188457012176514, "Pretrain/Loss (Raw)": 2.2401540279388428, "Pretrain/Step": 1049, "Pretrain/Step Time": 11.19559445232153} +{"Pretrain/Learning Rate": 4.916327730287471e-05, "Pretrain/Loss": 2.118455410003662, "Pretrain/Loss (Raw)": 2.0622408390045166, "Pretrain/Step": 1050, "Pretrain/Step Time": 11.192523561418056} +{"Pretrain/Learning Rate": 4.916109783686461e-05, "Pretrain/Loss": 2.117492198944092, "Pretrain/Loss (Raw)": 2.090785503387451, "Pretrain/Step": 1051, "Pretrain/Step Time": 11.173112411051989} +{"Pretrain/Learning Rate": 4.915891558448287e-05, "Pretrain/Loss": 2.1157853603363037, "Pretrain/Loss (Raw)": 2.0265374183654785, "Pretrain/Step": 1052, "Pretrain/Step Time": 11.185065474361181} +{"Pretrain/Learning Rate": 4.915673054598113e-05, "Pretrain/Loss": 2.114421844482422, "Pretrain/Loss (Raw)": 2.032711982727051, "Pretrain/Step": 1053, "Pretrain/Step Time": 11.15862081758678} +{"Pretrain/Learning Rate": 4.91545427216114e-05, "Pretrain/Loss": 2.113480567932129, "Pretrain/Loss (Raw)": 2.0880746841430664, "Pretrain/Step": 1054, "Pretrain/Step Time": 11.168885190039873} +{"Pretrain/Learning Rate": 4.915235211162599e-05, "Pretrain/Loss": 2.1113553047180176, "Pretrain/Loss (Raw)": 1.7987158298492432, "Pretrain/Step": 1055, "Pretrain/Step Time": 11.141389785334468} +{"Pretrain/Learning Rate": 4.9150158716277516e-05, "Pretrain/Loss": 2.1113216876983643, "Pretrain/Loss (Raw)": 2.1705949306488037, "Pretrain/Step": 1056, "Pretrain/Step Time": 11.161825649440289} +{"Pretrain/Learning Rate": 4.9147962535818935e-05, "Pretrain/Loss": 2.112180233001709, "Pretrain/Loss (Raw)": 2.1382453441619873, "Pretrain/Step": 1057, "Pretrain/Step Time": 11.153590232133865} +{"Pretrain/Learning Rate": 4.9145763570503536e-05, "Pretrain/Loss": 2.1119489669799805, "Pretrain/Loss (Raw)": 2.141843318939209, "Pretrain/Step": 1058, "Pretrain/Step Time": 11.209477994590998} +{"Pretrain/Learning Rate": 4.914356182058491e-05, "Pretrain/Loss": 2.1122541427612305, "Pretrain/Loss (Raw)": 1.9371682405471802, "Pretrain/Step": 1059, "Pretrain/Step Time": 11.179500309750438} +{"Pretrain/Learning Rate": 4.914135728631695e-05, "Pretrain/Loss": 2.1117870807647705, "Pretrain/Loss (Raw)": 1.978149652481079, "Pretrain/Step": 1060, "Pretrain/Step Time": 11.182866469025612} +{"Pretrain/Learning Rate": 4.913914996795391e-05, "Pretrain/Loss": 2.110914707183838, "Pretrain/Loss (Raw)": 2.0855298042297363, "Pretrain/Step": 1061, "Pretrain/Step Time": 11.136852903291583} +{"Pretrain/Learning Rate": 4.9136939865750357e-05, "Pretrain/Loss": 2.1095240116119385, "Pretrain/Loss (Raw)": 2.1593265533447266, "Pretrain/Step": 1062, "Pretrain/Step Time": 11.121948003768921} +{"Pretrain/Learning Rate": 4.913472697996116e-05, "Pretrain/Loss": 2.1109607219696045, "Pretrain/Loss (Raw)": 2.054943561553955, "Pretrain/Step": 1063, "Pretrain/Step Time": 11.106670809909701} +{"Pretrain/Learning Rate": 4.913251131084152e-05, "Pretrain/Loss": 2.1107513904571533, "Pretrain/Loss (Raw)": 2.079747438430786, "Pretrain/Step": 1064, "Pretrain/Step Time": 11.075368598103523} +{"Pretrain/Learning Rate": 4.9130292858646966e-05, "Pretrain/Loss": 2.111253261566162, "Pretrain/Loss (Raw)": 2.0842318534851074, "Pretrain/Step": 1065, "Pretrain/Step Time": 11.061858145520091} +{"Pretrain/Learning Rate": 4.912807162363332e-05, "Pretrain/Loss": 2.1114931106567383, "Pretrain/Loss (Raw)": 2.1353609561920166, "Pretrain/Step": 1066, "Pretrain/Step Time": 11.097512364387512} +{"Pretrain/Learning Rate": 4.912584760605677e-05, "Pretrain/Loss": 2.1105704307556152, "Pretrain/Loss (Raw)": 1.9308305978775024, "Pretrain/Step": 1067, "Pretrain/Step Time": 11.06908238120377} +{"Pretrain/Learning Rate": 4.9123620806173785e-05, "Pretrain/Loss": 2.111419916152954, "Pretrain/Loss (Raw)": 2.2150468826293945, "Pretrain/Step": 1068, "Pretrain/Step Time": 11.138861957937479} +{"Pretrain/Learning Rate": 4.9121391224241174e-05, "Pretrain/Loss": 2.1117501258850098, "Pretrain/Loss (Raw)": 2.159498929977417, "Pretrain/Step": 1069, "Pretrain/Step Time": 11.047054262831807} +{"Pretrain/Learning Rate": 4.9119158860516066e-05, "Pretrain/Loss": 2.1112008094787598, "Pretrain/Loss (Raw)": 2.1329524517059326, "Pretrain/Step": 1070, "Pretrain/Step Time": 11.053558636456728} +{"Pretrain/Learning Rate": 4.9116923715255905e-05, "Pretrain/Loss": 2.1106996536254883, "Pretrain/Loss (Raw)": 2.1278531551361084, "Pretrain/Step": 1071, "Pretrain/Step Time": 10.985976714640856} +{"Pretrain/Learning Rate": 4.9114685788718454e-05, "Pretrain/Loss": 2.1107943058013916, "Pretrain/Loss (Raw)": 2.2936947345733643, "Pretrain/Step": 1072, "Pretrain/Step Time": 11.057613641023636} +{"Pretrain/Learning Rate": 4.9112445081161813e-05, "Pretrain/Loss": 2.108015537261963, "Pretrain/Loss (Raw)": 1.9652318954467773, "Pretrain/Step": 1073, "Pretrain/Step Time": 11.033252701163292} +{"Pretrain/Learning Rate": 4.9110201592844376e-05, "Pretrain/Loss": 2.1069846153259277, "Pretrain/Loss (Raw)": 2.064777374267578, "Pretrain/Step": 1074, "Pretrain/Step Time": 11.037509387359023} +{"Pretrain/Learning Rate": 4.910795532402489e-05, "Pretrain/Loss": 2.1076302528381348, "Pretrain/Loss (Raw)": 2.244150161743164, "Pretrain/Step": 1075, "Pretrain/Step Time": 10.983465053141117} +{"Pretrain/Learning Rate": 4.910570627496239e-05, "Pretrain/Loss": 2.1088814735412598, "Pretrain/Loss (Raw)": 2.1675431728363037, "Pretrain/Step": 1076, "Pretrain/Step Time": 11.064707966521382} +{"Pretrain/Learning Rate": 4.9103454445916256e-05, "Pretrain/Loss": 2.110034942626953, "Pretrain/Loss (Raw)": 2.185311794281006, "Pretrain/Step": 1077, "Pretrain/Step Time": 11.065571507439017} +{"Pretrain/Learning Rate": 4.910119983714616e-05, "Pretrain/Loss": 2.1083219051361084, "Pretrain/Loss (Raw)": 1.9632625579833984, "Pretrain/Step": 1078, "Pretrain/Step Time": 11.082255283370614} +{"Pretrain/Learning Rate": 4.909894244891214e-05, "Pretrain/Loss": 2.109602928161621, "Pretrain/Loss (Raw)": 2.2511837482452393, "Pretrain/Step": 1079, "Pretrain/Step Time": 11.08267685957253} +{"Pretrain/Learning Rate": 4.909668228147453e-05, "Pretrain/Loss": 2.110752582550049, "Pretrain/Loss (Raw)": 2.3348634243011475, "Pretrain/Step": 1080, "Pretrain/Step Time": 11.044128350913525} +{"Pretrain/Learning Rate": 4.9094419335093966e-05, "Pretrain/Loss": 2.1108462810516357, "Pretrain/Loss (Raw)": 2.1359763145446777, "Pretrain/Step": 1081, "Pretrain/Step Time": 11.03980072401464} +{"Pretrain/Learning Rate": 4.909215361003142e-05, "Pretrain/Loss": 2.1105990409851074, "Pretrain/Loss (Raw)": 2.1369237899780273, "Pretrain/Step": 1082, "Pretrain/Step Time": 10.987087966874242} +{"Pretrain/Learning Rate": 4.90898851065482e-05, "Pretrain/Loss": 2.111888885498047, "Pretrain/Loss (Raw)": 2.0795016288757324, "Pretrain/Step": 1083, "Pretrain/Step Time": 10.984939835965633} +{"Pretrain/Learning Rate": 4.908761382490591e-05, "Pretrain/Loss": 2.111851930618286, "Pretrain/Loss (Raw)": 2.0403029918670654, "Pretrain/Step": 1084, "Pretrain/Step Time": 10.948439471423626} +{"Pretrain/Learning Rate": 4.908533976536649e-05, "Pretrain/Loss": 2.1091065406799316, "Pretrain/Loss (Raw)": 1.9259099960327148, "Pretrain/Step": 1085, "Pretrain/Step Time": 10.944800965487957} +{"Pretrain/Learning Rate": 4.90830629281922e-05, "Pretrain/Loss": 2.1073904037475586, "Pretrain/Loss (Raw)": 2.001513957977295, "Pretrain/Step": 1086, "Pretrain/Step Time": 10.943223556503654} +{"Pretrain/Learning Rate": 4.908078331364561e-05, "Pretrain/Loss": 2.108180046081543, "Pretrain/Loss (Raw)": 2.2447714805603027, "Pretrain/Step": 1087, "Pretrain/Step Time": 10.911908844485879} +{"Pretrain/Learning Rate": 4.907850092198961e-05, "Pretrain/Loss": 2.1053853034973145, "Pretrain/Loss (Raw)": 1.923813819885254, "Pretrain/Step": 1088, "Pretrain/Step Time": 10.911371406167746} +{"Pretrain/Learning Rate": 4.9076215753487425e-05, "Pretrain/Loss": 2.104586362838745, "Pretrain/Loss (Raw)": 2.0607285499572754, "Pretrain/Step": 1089, "Pretrain/Step Time": 10.878551995381713} +{"Pretrain/Learning Rate": 4.9073927808402585e-05, "Pretrain/Loss": 2.105830192565918, "Pretrain/Loss (Raw)": 2.154230833053589, "Pretrain/Step": 1090, "Pretrain/Step Time": 10.871211340650916} +{"Pretrain/Learning Rate": 4.907163708699896e-05, "Pretrain/Loss": 2.1050007343292236, "Pretrain/Loss (Raw)": 2.0896284580230713, "Pretrain/Step": 1091, "Pretrain/Step Time": 10.887846494093537} +{"Pretrain/Learning Rate": 4.9069343589540704e-05, "Pretrain/Loss": 2.1061975955963135, "Pretrain/Loss (Raw)": 2.267014503479004, "Pretrain/Step": 1092, "Pretrain/Step Time": 10.836772317066789} +{"Pretrain/Learning Rate": 4.906704731629233e-05, "Pretrain/Loss": 2.106266975402832, "Pretrain/Loss (Raw)": 2.1721832752227783, "Pretrain/Step": 1093, "Pretrain/Step Time": 10.835770834237337} +{"Pretrain/Learning Rate": 4.9064748267518656e-05, "Pretrain/Loss": 2.106001138687134, "Pretrain/Loss (Raw)": 2.196070432662964, "Pretrain/Step": 1094, "Pretrain/Step Time": 10.858475705608726} +{"Pretrain/Learning Rate": 4.9062446443484813e-05, "Pretrain/Loss": 2.10417103767395, "Pretrain/Loss (Raw)": 1.9350104331970215, "Pretrain/Step": 1095, "Pretrain/Step Time": 10.858948120847344} +{"Pretrain/Learning Rate": 4.9060141844456267e-05, "Pretrain/Loss": 2.1060338020324707, "Pretrain/Loss (Raw)": 2.3678739070892334, "Pretrain/Step": 1096, "Pretrain/Step Time": 10.842205699533224} +{"Pretrain/Learning Rate": 4.905783447069878e-05, "Pretrain/Loss": 2.1041712760925293, "Pretrain/Loss (Raw)": 1.9719874858856201, "Pretrain/Step": 1097, "Pretrain/Step Time": 10.838238758966327} +{"Pretrain/Learning Rate": 4.905552432247846e-05, "Pretrain/Loss": 2.1047544479370117, "Pretrain/Loss (Raw)": 2.1169204711914062, "Pretrain/Step": 1098, "Pretrain/Step Time": 10.71939466521144} +{"Pretrain/Learning Rate": 4.905321140006172e-05, "Pretrain/Loss": 2.104330062866211, "Pretrain/Loss (Raw)": 2.105820894241333, "Pretrain/Step": 1099, "Pretrain/Step Time": 10.769434509798884} +{"Pretrain/Learning Rate": 4.90508957037153e-05, "Pretrain/Loss": 2.1059298515319824, "Pretrain/Loss (Raw)": 2.3805103302001953, "Pretrain/Step": 1100, "Pretrain/Step Time": 10.707114577293396} +{"Pretrain/Learning Rate": 4.9048577233706264e-05, "Pretrain/Loss": 2.1090433597564697, "Pretrain/Loss (Raw)": 2.2138094902038574, "Pretrain/Step": 1101, "Pretrain/Step Time": 10.709116101264954} +{"Pretrain/Learning Rate": 4.9046255990301965e-05, "Pretrain/Loss": 2.109476089477539, "Pretrain/Loss (Raw)": 2.1020939350128174, "Pretrain/Step": 1102, "Pretrain/Step Time": 10.677069049328566} +{"Pretrain/Learning Rate": 4.904393197377012e-05, "Pretrain/Loss": 2.107837438583374, "Pretrain/Loss (Raw)": 1.7870713472366333, "Pretrain/Step": 1103, "Pretrain/Step Time": 10.670235129073262} +{"Pretrain/Learning Rate": 4.9041605184378746e-05, "Pretrain/Loss": 2.1086275577545166, "Pretrain/Loss (Raw)": 2.3963844776153564, "Pretrain/Step": 1104, "Pretrain/Step Time": 10.670323736965656} +{"Pretrain/Learning Rate": 4.903927562239617e-05, "Pretrain/Loss": 2.1085057258605957, "Pretrain/Loss (Raw)": 2.0450315475463867, "Pretrain/Step": 1105, "Pretrain/Step Time": 10.662119209766388} +{"Pretrain/Learning Rate": 4.9036943288091066e-05, "Pretrain/Loss": 2.109384059906006, "Pretrain/Loss (Raw)": 2.1510140895843506, "Pretrain/Step": 1106, "Pretrain/Step Time": 10.611399231478572} +{"Pretrain/Learning Rate": 4.903460818173238e-05, "Pretrain/Loss": 2.1100950241088867, "Pretrain/Loss (Raw)": 2.193763017654419, "Pretrain/Step": 1107, "Pretrain/Step Time": 10.61383394524455} +{"Pretrain/Learning Rate": 4.9032270303589435e-05, "Pretrain/Loss": 2.110046148300171, "Pretrain/Loss (Raw)": 2.1323788166046143, "Pretrain/Step": 1108, "Pretrain/Step Time": 10.576386969536543} +{"Pretrain/Learning Rate": 4.9029929653931826e-05, "Pretrain/Loss": 2.108168601989746, "Pretrain/Loss (Raw)": 1.958362102508545, "Pretrain/Step": 1109, "Pretrain/Step Time": 10.569527227431536} +{"Pretrain/Learning Rate": 4.90275862330295e-05, "Pretrain/Loss": 2.110403060913086, "Pretrain/Loss (Raw)": 2.2964625358581543, "Pretrain/Step": 1110, "Pretrain/Step Time": 10.5715700853616} +{"Pretrain/Learning Rate": 4.902524004115271e-05, "Pretrain/Loss": 2.1103062629699707, "Pretrain/Loss (Raw)": 2.1305196285247803, "Pretrain/Step": 1111, "Pretrain/Step Time": 10.568536737933755} +{"Pretrain/Learning Rate": 4.902289107857202e-05, "Pretrain/Loss": 2.110074043273926, "Pretrain/Loss (Raw)": 2.113630533218384, "Pretrain/Step": 1112, "Pretrain/Step Time": 10.517652345821261} +{"Pretrain/Learning Rate": 4.9020539345558335e-05, "Pretrain/Loss": 2.111356735229492, "Pretrain/Loss (Raw)": 2.006852626800537, "Pretrain/Step": 1113, "Pretrain/Step Time": 10.524751776829362} +{"Pretrain/Learning Rate": 4.9018184842382866e-05, "Pretrain/Loss": 2.1118831634521484, "Pretrain/Loss (Raw)": 2.0891273021698, "Pretrain/Step": 1114, "Pretrain/Step Time": 10.507572259753942} +{"Pretrain/Learning Rate": 4.901582756931715e-05, "Pretrain/Loss": 2.1109399795532227, "Pretrain/Loss (Raw)": 1.9891554117202759, "Pretrain/Step": 1115, "Pretrain/Step Time": 10.519092014059424} +{"Pretrain/Learning Rate": 4.901346752663302e-05, "Pretrain/Loss": 2.112060070037842, "Pretrain/Loss (Raw)": 2.202712297439575, "Pretrain/Step": 1116, "Pretrain/Step Time": 10.51159162633121} +{"Pretrain/Learning Rate": 4.9011104714602666e-05, "Pretrain/Loss": 2.1089794635772705, "Pretrain/Loss (Raw)": 1.7480014562606812, "Pretrain/Step": 1117, "Pretrain/Step Time": 10.509903386235237} +{"Pretrain/Learning Rate": 4.900873913349857e-05, "Pretrain/Loss": 2.1109566688537598, "Pretrain/Loss (Raw)": 2.3281211853027344, "Pretrain/Step": 1118, "Pretrain/Step Time": 10.510959092527628} +{"Pretrain/Learning Rate": 4.9006370783593544e-05, "Pretrain/Loss": 2.112272024154663, "Pretrain/Loss (Raw)": 2.2546637058258057, "Pretrain/Step": 1119, "Pretrain/Step Time": 10.508483892306685} +{"Pretrain/Learning Rate": 4.900399966516073e-05, "Pretrain/Loss": 2.1129379272460938, "Pretrain/Loss (Raw)": 2.221439838409424, "Pretrain/Step": 1120, "Pretrain/Step Time": 10.51403677277267} +{"Pretrain/Learning Rate": 4.900162577847355e-05, "Pretrain/Loss": 2.1138925552368164, "Pretrain/Loss (Raw)": 2.323848247528076, "Pretrain/Step": 1121, "Pretrain/Step Time": 10.501881519332528} +{"Pretrain/Learning Rate": 4.899924912380579e-05, "Pretrain/Loss": 2.1119823455810547, "Pretrain/Loss (Raw)": 1.7987377643585205, "Pretrain/Step": 1122, "Pretrain/Step Time": 10.41603784263134} +{"Pretrain/Learning Rate": 4.899686970143153e-05, "Pretrain/Loss": 2.111894130706787, "Pretrain/Loss (Raw)": 2.1388449668884277, "Pretrain/Step": 1123, "Pretrain/Step Time": 10.424009719863534} +{"Pretrain/Learning Rate": 4.8994487511625184e-05, "Pretrain/Loss": 2.1111831665039062, "Pretrain/Loss (Raw)": 2.089416265487671, "Pretrain/Step": 1124, "Pretrain/Step Time": 10.404135616496205} +{"Pretrain/Learning Rate": 4.899210255466147e-05, "Pretrain/Loss": 2.1117959022521973, "Pretrain/Loss (Raw)": 2.1603543758392334, "Pretrain/Step": 1125, "Pretrain/Step Time": 10.401398682966828} +{"Pretrain/Learning Rate": 4.898971483081543e-05, "Pretrain/Loss": 2.1111631393432617, "Pretrain/Loss (Raw)": 2.066087245941162, "Pretrain/Step": 1126, "Pretrain/Step Time": 10.394357094541192} +{"Pretrain/Learning Rate": 4.898732434036244e-05, "Pretrain/Loss": 2.1137895584106445, "Pretrain/Loss (Raw)": 2.2559006214141846, "Pretrain/Step": 1127, "Pretrain/Step Time": 10.36507135629654} +{"Pretrain/Learning Rate": 4.898493108357817e-05, "Pretrain/Loss": 2.1140127182006836, "Pretrain/Loss (Raw)": 2.1878116130828857, "Pretrain/Step": 1128, "Pretrain/Step Time": 10.33313175663352} +{"Pretrain/Learning Rate": 4.898253506073863e-05, "Pretrain/Loss": 2.1133058071136475, "Pretrain/Loss (Raw)": 2.037337064743042, "Pretrain/Step": 1129, "Pretrain/Step Time": 10.329202678054571} +{"Pretrain/Learning Rate": 4.8980136272120136e-05, "Pretrain/Loss": 2.1139726638793945, "Pretrain/Loss (Raw)": 2.2703797817230225, "Pretrain/Step": 1130, "Pretrain/Step Time": 10.314487669616938} +{"Pretrain/Learning Rate": 4.8977734717999326e-05, "Pretrain/Loss": 2.1155433654785156, "Pretrain/Loss (Raw)": 2.1728315353393555, "Pretrain/Step": 1131, "Pretrain/Step Time": 10.280096443369985} +{"Pretrain/Learning Rate": 4.8975330398653164e-05, "Pretrain/Loss": 2.115065813064575, "Pretrain/Loss (Raw)": 2.030095100402832, "Pretrain/Step": 1132, "Pretrain/Step Time": 10.280661733821034} +{"Pretrain/Learning Rate": 4.8972923314358934e-05, "Pretrain/Loss": 2.1172854900360107, "Pretrain/Loss (Raw)": 2.3800599575042725, "Pretrain/Step": 1133, "Pretrain/Step Time": 10.29769828170538} +{"Pretrain/Learning Rate": 4.8970513465394206e-05, "Pretrain/Loss": 2.11613130569458, "Pretrain/Loss (Raw)": 2.059074640274048, "Pretrain/Step": 1134, "Pretrain/Step Time": 10.29552105627954} +{"Pretrain/Learning Rate": 4.896810085203692e-05, "Pretrain/Loss": 2.1160120964050293, "Pretrain/Loss (Raw)": 2.151313304901123, "Pretrain/Step": 1135, "Pretrain/Step Time": 10.287990354001522} +{"Pretrain/Learning Rate": 4.896568547456531e-05, "Pretrain/Loss": 2.115446090698242, "Pretrain/Loss (Raw)": 2.114515781402588, "Pretrain/Step": 1136, "Pretrain/Step Time": 10.286426305770874} +{"Pretrain/Learning Rate": 4.896326733325791e-05, "Pretrain/Loss": 2.11633563041687, "Pretrain/Loss (Raw)": 2.0613858699798584, "Pretrain/Step": 1137, "Pretrain/Step Time": 10.24029085598886} +{"Pretrain/Learning Rate": 4.8960846428393615e-05, "Pretrain/Loss": 2.116239309310913, "Pretrain/Loss (Raw)": 2.1518642902374268, "Pretrain/Step": 1138, "Pretrain/Step Time": 10.234936632215977} +{"Pretrain/Learning Rate": 4.8958422760251585e-05, "Pretrain/Loss": 2.1184113025665283, "Pretrain/Loss (Raw)": 2.293766975402832, "Pretrain/Step": 1139, "Pretrain/Step Time": 10.19428269378841} +{"Pretrain/Learning Rate": 4.8955996329111364e-05, "Pretrain/Loss": 2.118875503540039, "Pretrain/Loss (Raw)": 2.173227310180664, "Pretrain/Step": 1140, "Pretrain/Step Time": 10.201059276238084} +{"Pretrain/Learning Rate": 4.895356713525275e-05, "Pretrain/Loss": 2.1169419288635254, "Pretrain/Loss (Raw)": 1.8670616149902344, "Pretrain/Step": 1141, "Pretrain/Step Time": 10.23687463440001} +{"Pretrain/Learning Rate": 4.895113517895591e-05, "Pretrain/Loss": 2.115354061126709, "Pretrain/Loss (Raw)": 1.9131662845611572, "Pretrain/Step": 1142, "Pretrain/Step Time": 10.238464150577784} +{"Pretrain/Learning Rate": 4.8948700460501294e-05, "Pretrain/Loss": 2.114534854888916, "Pretrain/Loss (Raw)": 2.1397340297698975, "Pretrain/Step": 1143, "Pretrain/Step Time": 10.261435203254223} +{"Pretrain/Learning Rate": 4.8946262980169686e-05, "Pretrain/Loss": 2.1155288219451904, "Pretrain/Loss (Raw)": 2.170295238494873, "Pretrain/Step": 1144, "Pretrain/Step Time": 10.268809294328094} +{"Pretrain/Learning Rate": 4.894382273824221e-05, "Pretrain/Loss": 2.1189029216766357, "Pretrain/Loss (Raw)": 2.1932976245880127, "Pretrain/Step": 1145, "Pretrain/Step Time": 10.241718230769038} +{"Pretrain/Learning Rate": 4.894137973500025e-05, "Pretrain/Loss": 2.118828773498535, "Pretrain/Loss (Raw)": 2.271228790283203, "Pretrain/Step": 1146, "Pretrain/Step Time": 10.248711548745632} +{"Pretrain/Learning Rate": 4.893893397072558e-05, "Pretrain/Loss": 2.12099552154541, "Pretrain/Loss (Raw)": 2.2275617122650146, "Pretrain/Step": 1147, "Pretrain/Step Time": 10.246917583048344} +{"Pretrain/Learning Rate": 4.893648544570022e-05, "Pretrain/Loss": 2.121081829071045, "Pretrain/Loss (Raw)": 2.0620994567871094, "Pretrain/Step": 1148, "Pretrain/Step Time": 10.252852816134691} +{"Pretrain/Learning Rate": 4.893403416020658e-05, "Pretrain/Loss": 2.1201331615448, "Pretrain/Loss (Raw)": 1.9837288856506348, "Pretrain/Step": 1149, "Pretrain/Step Time": 10.284799873828888} +{"Pretrain/Learning Rate": 4.893158011452734e-05, "Pretrain/Loss": 2.1214230060577393, "Pretrain/Loss (Raw)": 2.215362310409546, "Pretrain/Step": 1150, "Pretrain/Step Time": 10.231936091557145} +{"Pretrain/Learning Rate": 4.8929123308945505e-05, "Pretrain/Loss": 2.123213052749634, "Pretrain/Loss (Raw)": 2.558706521987915, "Pretrain/Step": 1151, "Pretrain/Step Time": 10.248498832806945} +{"Pretrain/Learning Rate": 4.8926663743744414e-05, "Pretrain/Loss": 2.1231088638305664, "Pretrain/Loss (Raw)": 1.9962722063064575, "Pretrain/Step": 1152, "Pretrain/Step Time": 10.232454758137465} +{"Pretrain/Learning Rate": 4.892420141920772e-05, "Pretrain/Loss": 2.122030019760132, "Pretrain/Loss (Raw)": 2.0421719551086426, "Pretrain/Step": 1153, "Pretrain/Step Time": 10.286442888900638} +{"Pretrain/Learning Rate": 4.8921736335619385e-05, "Pretrain/Loss": 2.12105131149292, "Pretrain/Loss (Raw)": 2.1258668899536133, "Pretrain/Step": 1154, "Pretrain/Step Time": 10.286514779552817} +{"Pretrain/Learning Rate": 4.8919268493263684e-05, "Pretrain/Loss": 2.1222620010375977, "Pretrain/Loss (Raw)": 2.2099449634552, "Pretrain/Step": 1155, "Pretrain/Step Time": 10.311845580115914} +{"Pretrain/Learning Rate": 4.891679789242524e-05, "Pretrain/Loss": 2.1219472885131836, "Pretrain/Loss (Raw)": 2.107675552368164, "Pretrain/Step": 1156, "Pretrain/Step Time": 10.310398038476706} +{"Pretrain/Learning Rate": 4.891432453338895e-05, "Pretrain/Loss": 2.1216564178466797, "Pretrain/Loss (Raw)": 2.133091688156128, "Pretrain/Step": 1157, "Pretrain/Step Time": 10.302947083488107} +{"Pretrain/Learning Rate": 4.8911848416440075e-05, "Pretrain/Loss": 2.1207473278045654, "Pretrain/Loss (Raw)": 2.0637383460998535, "Pretrain/Step": 1158, "Pretrain/Step Time": 10.30521154217422} +{"Pretrain/Learning Rate": 4.890936954186416e-05, "Pretrain/Loss": 2.12076473236084, "Pretrain/Loss (Raw)": 2.1576321125030518, "Pretrain/Step": 1159, "Pretrain/Step Time": 10.307482352480292} +{"Pretrain/Learning Rate": 4.890688790994709e-05, "Pretrain/Loss": 2.1219851970672607, "Pretrain/Loss (Raw)": 2.154026746749878, "Pretrain/Step": 1160, "Pretrain/Step Time": 10.280722739174962} +{"Pretrain/Learning Rate": 4.890440352097505e-05, "Pretrain/Loss": 2.1226134300231934, "Pretrain/Loss (Raw)": 2.0668742656707764, "Pretrain/Step": 1161, "Pretrain/Step Time": 10.288531385362148} +{"Pretrain/Learning Rate": 4.8901916375234556e-05, "Pretrain/Loss": 2.123312473297119, "Pretrain/Loss (Raw)": 2.177776575088501, "Pretrain/Step": 1162, "Pretrain/Step Time": 10.26596837490797} +{"Pretrain/Learning Rate": 4.889942647301243e-05, "Pretrain/Loss": 2.1235384941101074, "Pretrain/Loss (Raw)": 2.137822389602661, "Pretrain/Step": 1163, "Pretrain/Step Time": 10.328744413331151} +{"Pretrain/Learning Rate": 4.8896933814595834e-05, "Pretrain/Loss": 2.1246371269226074, "Pretrain/Loss (Raw)": 2.159970283508301, "Pretrain/Step": 1164, "Pretrain/Step Time": 10.316658921539783} +{"Pretrain/Learning Rate": 4.8894438400272224e-05, "Pretrain/Loss": 2.1235694885253906, "Pretrain/Loss (Raw)": 1.9188926219940186, "Pretrain/Step": 1165, "Pretrain/Step Time": 10.373374769464135} +{"Pretrain/Learning Rate": 4.889194023032938e-05, "Pretrain/Loss": 2.12390398979187, "Pretrain/Loss (Raw)": 2.1818556785583496, "Pretrain/Step": 1166, "Pretrain/Step Time": 10.380461970344186} +{"Pretrain/Learning Rate": 4.8889439305055406e-05, "Pretrain/Loss": 2.1247200965881348, "Pretrain/Loss (Raw)": 2.2657032012939453, "Pretrain/Step": 1167, "Pretrain/Step Time": 10.35248488932848} +{"Pretrain/Learning Rate": 4.8886935624738715e-05, "Pretrain/Loss": 2.1250691413879395, "Pretrain/Loss (Raw)": 2.2115321159362793, "Pretrain/Step": 1168, "Pretrain/Step Time": 10.342718968167901} +{"Pretrain/Learning Rate": 4.888442918966806e-05, "Pretrain/Loss": 2.1251792907714844, "Pretrain/Loss (Raw)": 2.1620023250579834, "Pretrain/Step": 1169, "Pretrain/Step Time": 10.316072655841708} +{"Pretrain/Learning Rate": 4.888192000013248e-05, "Pretrain/Loss": 2.1264162063598633, "Pretrain/Loss (Raw)": 2.1456997394561768, "Pretrain/Step": 1170, "Pretrain/Step Time": 10.29103009402752} +{"Pretrain/Learning Rate": 4.887940805642135e-05, "Pretrain/Loss": 2.125563621520996, "Pretrain/Loss (Raw)": 2.094766616821289, "Pretrain/Step": 1171, "Pretrain/Step Time": 10.28828071989119} +{"Pretrain/Learning Rate": 4.887689335882436e-05, "Pretrain/Loss": 2.1254520416259766, "Pretrain/Loss (Raw)": 2.2635369300842285, "Pretrain/Step": 1172, "Pretrain/Step Time": 10.269677067175508} +{"Pretrain/Learning Rate": 4.8874375907631506e-05, "Pretrain/Loss": 2.126894235610962, "Pretrain/Loss (Raw)": 2.2961487770080566, "Pretrain/Step": 1173, "Pretrain/Step Time": 10.258777199313045} +{"Pretrain/Learning Rate": 4.887185570313314e-05, "Pretrain/Loss": 2.1250433921813965, "Pretrain/Loss (Raw)": 2.0933241844177246, "Pretrain/Step": 1174, "Pretrain/Step Time": 10.32596462778747} +{"Pretrain/Learning Rate": 4.886933274561988e-05, "Pretrain/Loss": 2.126589775085449, "Pretrain/Loss (Raw)": 2.3242578506469727, "Pretrain/Step": 1175, "Pretrain/Step Time": 10.309680912643671} +{"Pretrain/Learning Rate": 4.886680703538269e-05, "Pretrain/Loss": 2.124831199645996, "Pretrain/Loss (Raw)": 1.9608367681503296, "Pretrain/Step": 1176, "Pretrain/Step Time": 10.341762078925967} +{"Pretrain/Learning Rate": 4.886427857271284e-05, "Pretrain/Loss": 2.12345552444458, "Pretrain/Loss (Raw)": 2.0641047954559326, "Pretrain/Step": 1177, "Pretrain/Step Time": 10.343567026779056} +{"Pretrain/Learning Rate": 4.886174735790194e-05, "Pretrain/Loss": 2.12376070022583, "Pretrain/Loss (Raw)": 2.101278781890869, "Pretrain/Step": 1178, "Pretrain/Step Time": 10.432478103786707} +{"Pretrain/Learning Rate": 4.88592133912419e-05, "Pretrain/Loss": 2.124454975128174, "Pretrain/Loss (Raw)": 2.1796655654907227, "Pretrain/Step": 1179, "Pretrain/Step Time": 10.42904756963253} +{"Pretrain/Learning Rate": 4.885667667302494e-05, "Pretrain/Loss": 2.1248292922973633, "Pretrain/Loss (Raw)": 2.0744504928588867, "Pretrain/Step": 1180, "Pretrain/Step Time": 10.441381819546223} +{"Pretrain/Learning Rate": 4.88541372035436e-05, "Pretrain/Loss": 2.1253864765167236, "Pretrain/Loss (Raw)": 2.1040360927581787, "Pretrain/Step": 1181, "Pretrain/Step Time": 10.439141176640987} +{"Pretrain/Learning Rate": 4.885159498309077e-05, "Pretrain/Loss": 2.1252052783966064, "Pretrain/Loss (Raw)": 2.064864158630371, "Pretrain/Step": 1182, "Pretrain/Step Time": 10.451507899910212} +{"Pretrain/Learning Rate": 4.884905001195961e-05, "Pretrain/Loss": 2.126744270324707, "Pretrain/Loss (Raw)": 1.995736837387085, "Pretrain/Step": 1183, "Pretrain/Step Time": 10.449640637263656} +{"Pretrain/Learning Rate": 4.884650229044361e-05, "Pretrain/Loss": 2.126221179962158, "Pretrain/Loss (Raw)": 2.1036415100097656, "Pretrain/Step": 1184, "Pretrain/Step Time": 10.417638760060072} +{"Pretrain/Learning Rate": 4.884395181883661e-05, "Pretrain/Loss": 2.1266937255859375, "Pretrain/Loss (Raw)": 2.198711633682251, "Pretrain/Step": 1185, "Pretrain/Step Time": 10.422626445069909} +{"Pretrain/Learning Rate": 4.8841398597432725e-05, "Pretrain/Loss": 2.1259827613830566, "Pretrain/Loss (Raw)": 2.0508410930633545, "Pretrain/Step": 1186, "Pretrain/Step Time": 10.371340764686465} +{"Pretrain/Learning Rate": 4.883884262652641e-05, "Pretrain/Loss": 2.1278021335601807, "Pretrain/Loss (Raw)": 2.1700611114501953, "Pretrain/Step": 1187, "Pretrain/Step Time": 10.374648466706276} +{"Pretrain/Learning Rate": 4.883628390641243e-05, "Pretrain/Loss": 2.13000750541687, "Pretrain/Loss (Raw)": 2.2604095935821533, "Pretrain/Step": 1188, "Pretrain/Step Time": 10.341175640001893} +{"Pretrain/Learning Rate": 4.883372243738588e-05, "Pretrain/Loss": 2.129988670349121, "Pretrain/Loss (Raw)": 2.0831384658813477, "Pretrain/Step": 1189, "Pretrain/Step Time": 10.331488529220223} +{"Pretrain/Learning Rate": 4.883115821974213e-05, "Pretrain/Loss": 2.128427028656006, "Pretrain/Loss (Raw)": 1.959430456161499, "Pretrain/Step": 1190, "Pretrain/Step Time": 10.375997146591544} +{"Pretrain/Learning Rate": 4.8828591253776937e-05, "Pretrain/Loss": 2.129279613494873, "Pretrain/Loss (Raw)": 2.1640470027923584, "Pretrain/Step": 1191, "Pretrain/Step Time": 10.375323627144098} +{"Pretrain/Learning Rate": 4.88260215397863e-05, "Pretrain/Loss": 2.128178119659424, "Pretrain/Loss (Raw)": 1.9387754201889038, "Pretrain/Step": 1192, "Pretrain/Step Time": 10.403241872787476} +{"Pretrain/Learning Rate": 4.882344907806659e-05, "Pretrain/Loss": 2.1279125213623047, "Pretrain/Loss (Raw)": 2.0502500534057617, "Pretrain/Step": 1193, "Pretrain/Step Time": 10.476536627858877} +{"Pretrain/Learning Rate": 4.882087386891448e-05, "Pretrain/Loss": 2.1276021003723145, "Pretrain/Loss (Raw)": 2.095627546310425, "Pretrain/Step": 1194, "Pretrain/Step Time": 10.447490688413382} +{"Pretrain/Learning Rate": 4.8818295912626955e-05, "Pretrain/Loss": 2.129211902618408, "Pretrain/Loss (Raw)": 2.1368746757507324, "Pretrain/Step": 1195, "Pretrain/Step Time": 10.450831975787878} +{"Pretrain/Learning Rate": 4.88157152095013e-05, "Pretrain/Loss": 2.128938674926758, "Pretrain/Loss (Raw)": 2.180079698562622, "Pretrain/Step": 1196, "Pretrain/Step Time": 10.383511671796441} +{"Pretrain/Learning Rate": 4.881313175983515e-05, "Pretrain/Loss": 2.128101348876953, "Pretrain/Loss (Raw)": 2.052323818206787, "Pretrain/Step": 1197, "Pretrain/Step Time": 10.393726041540504} +{"Pretrain/Learning Rate": 4.881054556392642e-05, "Pretrain/Loss": 2.1289443969726562, "Pretrain/Loss (Raw)": 2.2408337593078613, "Pretrain/Step": 1198, "Pretrain/Step Time": 10.382951797917485} +{"Pretrain/Learning Rate": 4.8807956622073394e-05, "Pretrain/Loss": 2.1292788982391357, "Pretrain/Loss (Raw)": 2.1707024574279785, "Pretrain/Step": 1199, "Pretrain/Step Time": 10.42785015143454} +{"Pretrain/Learning Rate": 4.880536493457461e-05, "Pretrain/Loss": 2.126760959625244, "Pretrain/Loss (Raw)": 1.9713605642318726, "Pretrain/Step": 1200, "Pretrain/Step Time": 10.356710569933057} +{"Pretrain/Learning Rate": 4.880277050172897e-05, "Pretrain/Loss": 2.1288015842437744, "Pretrain/Loss (Raw)": 2.2264726161956787, "Pretrain/Step": 1201, "Pretrain/Step Time": 10.510790707543492} +{"Pretrain/Learning Rate": 4.880017332383567e-05, "Pretrain/Loss": 2.1289281845092773, "Pretrain/Loss (Raw)": 2.0809576511383057, "Pretrain/Step": 1202, "Pretrain/Step Time": 10.507707310840487} +{"Pretrain/Learning Rate": 4.879757340119425e-05, "Pretrain/Loss": 2.127912998199463, "Pretrain/Loss (Raw)": 2.114240884780884, "Pretrain/Step": 1203, "Pretrain/Step Time": 10.506968230009079} +{"Pretrain/Learning Rate": 4.879497073410451e-05, "Pretrain/Loss": 2.1274197101593018, "Pretrain/Loss (Raw)": 2.10436749458313, "Pretrain/Step": 1204, "Pretrain/Step Time": 10.424337284639478} +{"Pretrain/Learning Rate": 4.8792365322866626e-05, "Pretrain/Loss": 2.125441074371338, "Pretrain/Loss (Raw)": 1.9320541620254517, "Pretrain/Step": 1205, "Pretrain/Step Time": 10.4245669785887} +{"Pretrain/Learning Rate": 4.878975716778106e-05, "Pretrain/Loss": 2.127011299133301, "Pretrain/Loss (Raw)": 2.1642367839813232, "Pretrain/Step": 1206, "Pretrain/Step Time": 10.397418268024921} +{"Pretrain/Learning Rate": 4.878714626914859e-05, "Pretrain/Loss": 2.1252150535583496, "Pretrain/Loss (Raw)": 2.02128529548645, "Pretrain/Step": 1207, "Pretrain/Step Time": 10.401865938678384} +{"Pretrain/Learning Rate": 4.878453262727033e-05, "Pretrain/Loss": 2.124157667160034, "Pretrain/Loss (Raw)": 2.1995246410369873, "Pretrain/Step": 1208, "Pretrain/Step Time": 10.401936223730445} +{"Pretrain/Learning Rate": 4.878191624244769e-05, "Pretrain/Loss": 2.1246349811553955, "Pretrain/Loss (Raw)": 2.1970629692077637, "Pretrain/Step": 1209, "Pretrain/Step Time": 10.399050014093518} +{"Pretrain/Learning Rate": 4.8779297114982406e-05, "Pretrain/Loss": 2.124680280685425, "Pretrain/Loss (Raw)": 2.142718553543091, "Pretrain/Step": 1210, "Pretrain/Step Time": 10.396081695333123} +{"Pretrain/Learning Rate": 4.877667524517652e-05, "Pretrain/Loss": 2.1234607696533203, "Pretrain/Loss (Raw)": 1.9233864545822144, "Pretrain/Step": 1211, "Pretrain/Step Time": 10.456236278638244} +{"Pretrain/Learning Rate": 4.877405063333241e-05, "Pretrain/Loss": 2.1273655891418457, "Pretrain/Loss (Raw)": 2.5401501655578613, "Pretrain/Step": 1212, "Pretrain/Step Time": 10.45740614272654} +{"Pretrain/Learning Rate": 4.877142327975276e-05, "Pretrain/Loss": 2.1290364265441895, "Pretrain/Loss (Raw)": 2.139758586883545, "Pretrain/Step": 1213, "Pretrain/Step Time": 10.494790179654956} +{"Pretrain/Learning Rate": 4.8768793184740556e-05, "Pretrain/Loss": 2.1300175189971924, "Pretrain/Loss (Raw)": 2.1270954608917236, "Pretrain/Step": 1214, "Pretrain/Step Time": 10.491845453158021} +{"Pretrain/Learning Rate": 4.8766160348599125e-05, "Pretrain/Loss": 2.128300666809082, "Pretrain/Loss (Raw)": 2.0250158309936523, "Pretrain/Step": 1215, "Pretrain/Step Time": 10.489380346611142} +{"Pretrain/Learning Rate": 4.876352477163209e-05, "Pretrain/Loss": 2.1301581859588623, "Pretrain/Loss (Raw)": 2.161567449569702, "Pretrain/Step": 1216, "Pretrain/Step Time": 10.511887976899743} +{"Pretrain/Learning Rate": 4.8760886454143394e-05, "Pretrain/Loss": 2.1321473121643066, "Pretrain/Loss (Raw)": 2.315351724624634, "Pretrain/Step": 1217, "Pretrain/Step Time": 10.502615675330162} +{"Pretrain/Learning Rate": 4.875824539643731e-05, "Pretrain/Loss": 2.1320080757141113, "Pretrain/Loss (Raw)": 2.136420488357544, "Pretrain/Step": 1218, "Pretrain/Step Time": 10.520077634602785} +{"Pretrain/Learning Rate": 4.8755601598818427e-05, "Pretrain/Loss": 2.132136821746826, "Pretrain/Loss (Raw)": 2.1060750484466553, "Pretrain/Step": 1219, "Pretrain/Step Time": 10.493449438363314} +{"Pretrain/Learning Rate": 4.875295506159161e-05, "Pretrain/Loss": 2.1324901580810547, "Pretrain/Loss (Raw)": 2.312255620956421, "Pretrain/Step": 1220, "Pretrain/Step Time": 10.477932525798678} +{"Pretrain/Learning Rate": 4.87503057850621e-05, "Pretrain/Loss": 2.131723403930664, "Pretrain/Loss (Raw)": 2.0740339756011963, "Pretrain/Step": 1221, "Pretrain/Step Time": 10.476304857060313} +{"Pretrain/Learning Rate": 4.874765376953541e-05, "Pretrain/Loss": 2.1313138008117676, "Pretrain/Loss (Raw)": 2.143669605255127, "Pretrain/Step": 1222, "Pretrain/Step Time": 10.473771395161748} +{"Pretrain/Learning Rate": 4.874499901531737e-05, "Pretrain/Loss": 2.133110523223877, "Pretrain/Loss (Raw)": 2.164952278137207, "Pretrain/Step": 1223, "Pretrain/Step Time": 10.469193909317255} +{"Pretrain/Learning Rate": 4.874234152271418e-05, "Pretrain/Loss": 2.1347098350524902, "Pretrain/Loss (Raw)": 2.5726187229156494, "Pretrain/Step": 1224, "Pretrain/Step Time": 10.470505906268954} +{"Pretrain/Learning Rate": 4.8739681292032266e-05, "Pretrain/Loss": 2.135787010192871, "Pretrain/Loss (Raw)": 2.109851598739624, "Pretrain/Step": 1225, "Pretrain/Step Time": 10.471138818189502} +{"Pretrain/Learning Rate": 4.8737018323578445e-05, "Pretrain/Loss": 2.1354541778564453, "Pretrain/Loss (Raw)": 2.074322462081909, "Pretrain/Step": 1226, "Pretrain/Step Time": 10.51244292408228} +{"Pretrain/Learning Rate": 4.873435261765982e-05, "Pretrain/Loss": 2.1349880695343018, "Pretrain/Loss (Raw)": 2.046149969100952, "Pretrain/Step": 1227, "Pretrain/Step Time": 10.47666304372251} +{"Pretrain/Learning Rate": 4.873168417458381e-05, "Pretrain/Loss": 2.1334621906280518, "Pretrain/Loss (Raw)": 2.1852071285247803, "Pretrain/Step": 1228, "Pretrain/Step Time": 10.477492105215788} +{"Pretrain/Learning Rate": 4.8729012994658166e-05, "Pretrain/Loss": 2.133617877960205, "Pretrain/Loss (Raw)": 2.233739137649536, "Pretrain/Step": 1229, "Pretrain/Step Time": 10.500264711678028} +{"Pretrain/Learning Rate": 4.8726339078190914e-05, "Pretrain/Loss": 2.132241725921631, "Pretrain/Loss (Raw)": 1.925960898399353, "Pretrain/Step": 1230, "Pretrain/Step Time": 10.468722876161337} +{"Pretrain/Learning Rate": 4.872366242549044e-05, "Pretrain/Loss": 2.134942054748535, "Pretrain/Loss (Raw)": 2.132683038711548, "Pretrain/Step": 1231, "Pretrain/Step Time": 10.467165566980839} +{"Pretrain/Learning Rate": 4.872098303686543e-05, "Pretrain/Loss": 2.132814884185791, "Pretrain/Loss (Raw)": 2.124096393585205, "Pretrain/Step": 1232, "Pretrain/Step Time": 10.486818941310048} +{"Pretrain/Learning Rate": 4.871830091262488e-05, "Pretrain/Loss": 2.133233070373535, "Pretrain/Loss (Raw)": 2.0985615253448486, "Pretrain/Step": 1233, "Pretrain/Step Time": 10.492233775556087} +{"Pretrain/Learning Rate": 4.8715616053078095e-05, "Pretrain/Loss": 2.131842613220215, "Pretrain/Loss (Raw)": 1.9730641841888428, "Pretrain/Step": 1234, "Pretrain/Step Time": 10.515846192836761} +{"Pretrain/Learning Rate": 4.871292845853472e-05, "Pretrain/Loss": 2.131432056427002, "Pretrain/Loss (Raw)": 2.1412041187286377, "Pretrain/Step": 1235, "Pretrain/Step Time": 10.5114741679281} +{"Pretrain/Learning Rate": 4.87102381293047e-05, "Pretrain/Loss": 2.130554676055908, "Pretrain/Loss (Raw)": 2.020075798034668, "Pretrain/Step": 1236, "Pretrain/Step Time": 10.567681431770325} +{"Pretrain/Learning Rate": 4.870754506569829e-05, "Pretrain/Loss": 2.1322288513183594, "Pretrain/Loss (Raw)": 2.172652244567871, "Pretrain/Step": 1237, "Pretrain/Step Time": 10.563707314431667} +{"Pretrain/Learning Rate": 4.870484926802606e-05, "Pretrain/Loss": 2.130284309387207, "Pretrain/Loss (Raw)": 2.0475776195526123, "Pretrain/Step": 1238, "Pretrain/Step Time": 10.556160660460591} +{"Pretrain/Learning Rate": 4.8702150736598925e-05, "Pretrain/Loss": 2.1296141147613525, "Pretrain/Loss (Raw)": 2.0447189807891846, "Pretrain/Step": 1239, "Pretrain/Step Time": 10.559827748686075} +{"Pretrain/Learning Rate": 4.8699449471728075e-05, "Pretrain/Loss": 2.129744291305542, "Pretrain/Loss (Raw)": 2.1302967071533203, "Pretrain/Step": 1240, "Pretrain/Step Time": 10.524579361081123} +{"Pretrain/Learning Rate": 4.869674547372504e-05, "Pretrain/Loss": 2.1308393478393555, "Pretrain/Loss (Raw)": 2.1470258235931396, "Pretrain/Step": 1241, "Pretrain/Step Time": 10.562324790284038} +{"Pretrain/Learning Rate": 4.8694038742901646e-05, "Pretrain/Loss": 2.132122039794922, "Pretrain/Loss (Raw)": 2.2533183097839355, "Pretrain/Step": 1242, "Pretrain/Step Time": 10.587052557617426} +{"Pretrain/Learning Rate": 4.869132927957007e-05, "Pretrain/Loss": 2.1327292919158936, "Pretrain/Loss (Raw)": 2.066880702972412, "Pretrain/Step": 1243, "Pretrain/Step Time": 10.604321520775557} +{"Pretrain/Learning Rate": 4.868861708404275e-05, "Pretrain/Loss": 2.132220506668091, "Pretrain/Loss (Raw)": 2.1375808715820312, "Pretrain/Step": 1244, "Pretrain/Step Time": 10.669535428285599} +{"Pretrain/Learning Rate": 4.868590215663248e-05, "Pretrain/Loss": 2.134556293487549, "Pretrain/Loss (Raw)": 2.0469915866851807, "Pretrain/Step": 1245, "Pretrain/Step Time": 10.666121950373054} +{"Pretrain/Learning Rate": 4.8683184497652366e-05, "Pretrain/Loss": 2.133976459503174, "Pretrain/Loss (Raw)": 2.253889560699463, "Pretrain/Step": 1246, "Pretrain/Step Time": 10.711771098896861} +{"Pretrain/Learning Rate": 4.868046410741582e-05, "Pretrain/Loss": 2.1332271099090576, "Pretrain/Loss (Raw)": 2.158745765686035, "Pretrain/Step": 1247, "Pretrain/Step Time": 10.71194376796484} +{"Pretrain/Learning Rate": 4.867774098623657e-05, "Pretrain/Loss": 2.1322031021118164, "Pretrain/Loss (Raw)": 2.090379476547241, "Pretrain/Step": 1248, "Pretrain/Step Time": 10.695511868223548} +{"Pretrain/Learning Rate": 4.8675015134428654e-05, "Pretrain/Loss": 2.1304550170898438, "Pretrain/Loss (Raw)": 2.100071907043457, "Pretrain/Step": 1249, "Pretrain/Step Time": 10.70220516435802} +{"Pretrain/Learning Rate": 4.867228655230643e-05, "Pretrain/Loss": 2.130129098892212, "Pretrain/Loss (Raw)": 1.7570133209228516, "Pretrain/Step": 1250, "Pretrain/Step Time": 10.732786629348993} +{"Pretrain/Learning Rate": 4.866955524018457e-05, "Pretrain/Loss": 2.129201889038086, "Pretrain/Loss (Raw)": 2.0202012062072754, "Pretrain/Step": 1251, "Pretrain/Step Time": 10.723545821383595} +{"Pretrain/Learning Rate": 4.866682119837807e-05, "Pretrain/Loss": 2.131146192550659, "Pretrain/Loss (Raw)": 2.338285446166992, "Pretrain/Step": 1252, "Pretrain/Step Time": 10.723768059164286} +{"Pretrain/Learning Rate": 4.866408442720223e-05, "Pretrain/Loss": 2.131760835647583, "Pretrain/Loss (Raw)": 2.239011526107788, "Pretrain/Step": 1253, "Pretrain/Step Time": 10.717874141409993} +{"Pretrain/Learning Rate": 4.8661344926972666e-05, "Pretrain/Loss": 2.132424831390381, "Pretrain/Loss (Raw)": 2.1510796546936035, "Pretrain/Step": 1254, "Pretrain/Step Time": 10.722165433689952} +{"Pretrain/Learning Rate": 4.8658602698005294e-05, "Pretrain/Loss": 2.129815101623535, "Pretrain/Loss (Raw)": 1.9218562841415405, "Pretrain/Step": 1255, "Pretrain/Step Time": 10.729567581787705} +{"Pretrain/Learning Rate": 4.8655857740616395e-05, "Pretrain/Loss": 2.1290743350982666, "Pretrain/Loss (Raw)": 2.0929765701293945, "Pretrain/Step": 1256, "Pretrain/Step Time": 10.732888834550977} +{"Pretrain/Learning Rate": 4.8653110055122496e-05, "Pretrain/Loss": 2.129154682159424, "Pretrain/Loss (Raw)": 2.047656297683716, "Pretrain/Step": 1257, "Pretrain/Step Time": 10.723241370171309} +{"Pretrain/Learning Rate": 4.8650359641840495e-05, "Pretrain/Loss": 2.1280157566070557, "Pretrain/Loss (Raw)": 2.1245737075805664, "Pretrain/Step": 1258, "Pretrain/Step Time": 10.725454289466143} +{"Pretrain/Learning Rate": 4.864760650108758e-05, "Pretrain/Loss": 2.1281962394714355, "Pretrain/Loss (Raw)": 2.195962905883789, "Pretrain/Step": 1259, "Pretrain/Step Time": 10.722163580358028} +{"Pretrain/Learning Rate": 4.864485063318125e-05, "Pretrain/Loss": 2.128382921218872, "Pretrain/Loss (Raw)": 2.053967237472534, "Pretrain/Step": 1260, "Pretrain/Step Time": 10.736651297658682} +{"Pretrain/Learning Rate": 4.864209203843932e-05, "Pretrain/Loss": 2.126302719116211, "Pretrain/Loss (Raw)": 2.1137800216674805, "Pretrain/Step": 1261, "Pretrain/Step Time": 10.783651558682323} +{"Pretrain/Learning Rate": 4.8639330717179946e-05, "Pretrain/Loss": 2.128612995147705, "Pretrain/Loss (Raw)": 2.354783058166504, "Pretrain/Step": 1262, "Pretrain/Step Time": 10.781176947057247} +{"Pretrain/Learning Rate": 4.863656666972154e-05, "Pretrain/Loss": 2.129765033721924, "Pretrain/Loss (Raw)": 2.298783779144287, "Pretrain/Step": 1263, "Pretrain/Step Time": 10.76712316647172} +{"Pretrain/Learning Rate": 4.86337998963829e-05, "Pretrain/Loss": 2.1299726963043213, "Pretrain/Loss (Raw)": 2.1410961151123047, "Pretrain/Step": 1264, "Pretrain/Step Time": 10.767349977046251} +{"Pretrain/Learning Rate": 4.863103039748309e-05, "Pretrain/Loss": 2.129737377166748, "Pretrain/Loss (Raw)": 2.031261444091797, "Pretrain/Step": 1265, "Pretrain/Step Time": 10.791739525273442} +{"Pretrain/Learning Rate": 4.86282581733415e-05, "Pretrain/Loss": 2.1294689178466797, "Pretrain/Loss (Raw)": 2.1175057888031006, "Pretrain/Step": 1266, "Pretrain/Step Time": 10.795364916324615} +{"Pretrain/Learning Rate": 4.8625483224277835e-05, "Pretrain/Loss": 2.1255431175231934, "Pretrain/Loss (Raw)": 1.7912538051605225, "Pretrain/Step": 1267, "Pretrain/Step Time": 10.874874897301197} +{"Pretrain/Learning Rate": 4.8622705550612126e-05, "Pretrain/Loss": 2.1257524490356445, "Pretrain/Loss (Raw)": 2.200061321258545, "Pretrain/Step": 1268, "Pretrain/Step Time": 10.867185162380338} +{"Pretrain/Learning Rate": 4.861992515266469e-05, "Pretrain/Loss": 2.1277103424072266, "Pretrain/Loss (Raw)": 2.1176469326019287, "Pretrain/Step": 1269, "Pretrain/Step Time": 10.82817761413753} +{"Pretrain/Learning Rate": 4.8617142030756194e-05, "Pretrain/Loss": 2.128537178039551, "Pretrain/Loss (Raw)": 2.0190048217773438, "Pretrain/Step": 1270, "Pretrain/Step Time": 10.83498135022819} +{"Pretrain/Learning Rate": 4.8614356185207575e-05, "Pretrain/Loss": 2.1281158924102783, "Pretrain/Loss (Raw)": 2.085803270339966, "Pretrain/Step": 1271, "Pretrain/Step Time": 10.82166002318263} +{"Pretrain/Learning Rate": 4.861156761634014e-05, "Pretrain/Loss": 2.127711057662964, "Pretrain/Loss (Raw)": 2.118468999862671, "Pretrain/Step": 1272, "Pretrain/Step Time": 10.815064186230302} +{"Pretrain/Learning Rate": 4.860877632447546e-05, "Pretrain/Loss": 2.127420663833618, "Pretrain/Loss (Raw)": 2.1561481952667236, "Pretrain/Step": 1273, "Pretrain/Step Time": 10.805620700120926} +{"Pretrain/Learning Rate": 4.8605982309935446e-05, "Pretrain/Loss": 2.126965045928955, "Pretrain/Loss (Raw)": 2.2128822803497314, "Pretrain/Step": 1274, "Pretrain/Step Time": 10.80217969417572} +{"Pretrain/Learning Rate": 4.860318557304232e-05, "Pretrain/Loss": 2.127695083618164, "Pretrain/Loss (Raw)": 2.3210229873657227, "Pretrain/Step": 1275, "Pretrain/Step Time": 10.812433397397399} +{"Pretrain/Learning Rate": 4.860038611411861e-05, "Pretrain/Loss": 2.129143476486206, "Pretrain/Loss (Raw)": 2.247497797012329, "Pretrain/Step": 1276, "Pretrain/Step Time": 10.810212882235646} +{"Pretrain/Learning Rate": 4.8597583933487165e-05, "Pretrain/Loss": 2.13085675239563, "Pretrain/Loss (Raw)": 2.2030398845672607, "Pretrain/Step": 1277, "Pretrain/Step Time": 10.815823182463646} +{"Pretrain/Learning Rate": 4.859477903147115e-05, "Pretrain/Loss": 2.13051700592041, "Pretrain/Loss (Raw)": 2.171858549118042, "Pretrain/Step": 1278, "Pretrain/Step Time": 10.814004205167294} +{"Pretrain/Learning Rate": 4.8591971408394034e-05, "Pretrain/Loss": 2.1295502185821533, "Pretrain/Loss (Raw)": 2.4349477291107178, "Pretrain/Step": 1279, "Pretrain/Step Time": 10.803606681525707} +{"Pretrain/Learning Rate": 4.85891610645796e-05, "Pretrain/Loss": 2.13266658782959, "Pretrain/Loss (Raw)": 2.3951609134674072, "Pretrain/Step": 1280, "Pretrain/Step Time": 10.805926175788045} +{"Pretrain/Learning Rate": 4.8586348000351956e-05, "Pretrain/Loss": 2.1293225288391113, "Pretrain/Loss (Raw)": 1.6141356229782104, "Pretrain/Step": 1281, "Pretrain/Step Time": 10.754524551331997} +{"Pretrain/Learning Rate": 4.8583532216035524e-05, "Pretrain/Loss": 2.127450466156006, "Pretrain/Loss (Raw)": 1.886244773864746, "Pretrain/Step": 1282, "Pretrain/Step Time": 10.779733579605818} +{"Pretrain/Learning Rate": 4.858071371195502e-05, "Pretrain/Loss": 2.128188133239746, "Pretrain/Loss (Raw)": 2.304353713989258, "Pretrain/Step": 1283, "Pretrain/Step Time": 10.726487211883068} +{"Pretrain/Learning Rate": 4.8577892488435504e-05, "Pretrain/Loss": 2.127734661102295, "Pretrain/Loss (Raw)": 2.0496623516082764, "Pretrain/Step": 1284, "Pretrain/Step Time": 10.732933716848493} +{"Pretrain/Learning Rate": 4.8575068545802316e-05, "Pretrain/Loss": 2.128146171569824, "Pretrain/Loss (Raw)": 2.185755729675293, "Pretrain/Step": 1285, "Pretrain/Step Time": 10.734081104397774} +{"Pretrain/Learning Rate": 4.8572241884381145e-05, "Pretrain/Loss": 2.1294593811035156, "Pretrain/Loss (Raw)": 2.2318532466888428, "Pretrain/Step": 1286, "Pretrain/Step Time": 10.73313101939857} +{"Pretrain/Learning Rate": 4.856941250449795e-05, "Pretrain/Loss": 2.1305880546569824, "Pretrain/Loss (Raw)": 2.3020870685577393, "Pretrain/Step": 1287, "Pretrain/Step Time": 10.739505659788847} +{"Pretrain/Learning Rate": 4.8566580406479045e-05, "Pretrain/Loss": 2.131237506866455, "Pretrain/Loss (Raw)": 2.2371625900268555, "Pretrain/Step": 1288, "Pretrain/Step Time": 10.749178668484092} +{"Pretrain/Learning Rate": 4.856374559065104e-05, "Pretrain/Loss": 2.1322131156921387, "Pretrain/Loss (Raw)": 2.1917479038238525, "Pretrain/Step": 1289, "Pretrain/Step Time": 10.7538628783077} +{"Pretrain/Learning Rate": 4.856090805734086e-05, "Pretrain/Loss": 2.1310617923736572, "Pretrain/Loss (Raw)": 2.0304017066955566, "Pretrain/Step": 1290, "Pretrain/Step Time": 10.746990542858839} +{"Pretrain/Learning Rate": 4.855806780687574e-05, "Pretrain/Loss": 2.131580352783203, "Pretrain/Loss (Raw)": 2.204183340072632, "Pretrain/Step": 1291, "Pretrain/Step Time": 10.681791380047798} +{"Pretrain/Learning Rate": 4.8555224839583236e-05, "Pretrain/Loss": 2.1314632892608643, "Pretrain/Loss (Raw)": 2.1449930667877197, "Pretrain/Step": 1292, "Pretrain/Step Time": 10.704617312178016} +{"Pretrain/Learning Rate": 4.8552379155791194e-05, "Pretrain/Loss": 2.1331417560577393, "Pretrain/Loss (Raw)": 2.133742094039917, "Pretrain/Step": 1293, "Pretrain/Step Time": 10.606156520545483} +{"Pretrain/Learning Rate": 4.854953075582782e-05, "Pretrain/Loss": 2.131521224975586, "Pretrain/Loss (Raw)": 1.9744322299957275, "Pretrain/Step": 1294, "Pretrain/Step Time": 10.639119846746325} +{"Pretrain/Learning Rate": 4.854667964002158e-05, "Pretrain/Loss": 2.1281142234802246, "Pretrain/Loss (Raw)": 1.8295973539352417, "Pretrain/Step": 1295, "Pretrain/Step Time": 10.643235169351101} +{"Pretrain/Learning Rate": 4.8543825808701294e-05, "Pretrain/Loss": 2.126596450805664, "Pretrain/Loss (Raw)": 2.017239570617676, "Pretrain/Step": 1296, "Pretrain/Step Time": 10.650702415034175} +{"Pretrain/Learning Rate": 4.854096926219607e-05, "Pretrain/Loss": 2.1260905265808105, "Pretrain/Loss (Raw)": 2.097262144088745, "Pretrain/Step": 1297, "Pretrain/Step Time": 10.645083932206035} +{"Pretrain/Learning Rate": 4.853811000083535e-05, "Pretrain/Loss": 2.126756191253662, "Pretrain/Loss (Raw)": 2.230929136276245, "Pretrain/Step": 1298, "Pretrain/Step Time": 10.648995101451874} +{"Pretrain/Learning Rate": 4.8535248024948854e-05, "Pretrain/Loss": 2.126791000366211, "Pretrain/Loss (Raw)": 2.0992090702056885, "Pretrain/Step": 1299, "Pretrain/Step Time": 10.662004442885518} +{"Pretrain/Learning Rate": 4.853238333486666e-05, "Pretrain/Loss": 2.1264841556549072, "Pretrain/Loss (Raw)": 2.2242562770843506, "Pretrain/Step": 1300, "Pretrain/Step Time": 10.679449040442705} +{"Pretrain/Learning Rate": 4.852951593091914e-05, "Pretrain/Loss": 2.12553071975708, "Pretrain/Loss (Raw)": 2.1741111278533936, "Pretrain/Step": 1301, "Pretrain/Step Time": 10.68388189561665} +{"Pretrain/Learning Rate": 4.852664581343696e-05, "Pretrain/Loss": 2.1266403198242188, "Pretrain/Loss (Raw)": 2.235344409942627, "Pretrain/Step": 1302, "Pretrain/Step Time": 10.66636847704649} +{"Pretrain/Learning Rate": 4.852377298275113e-05, "Pretrain/Loss": 2.1262035369873047, "Pretrain/Loss (Raw)": 2.2683496475219727, "Pretrain/Step": 1303, "Pretrain/Step Time": 10.669054552912712} +{"Pretrain/Learning Rate": 4.852089743919295e-05, "Pretrain/Loss": 2.127542495727539, "Pretrain/Loss (Raw)": 2.1322453022003174, "Pretrain/Step": 1304, "Pretrain/Step Time": 10.634431766346097} +{"Pretrain/Learning Rate": 4.851801918309403e-05, "Pretrain/Loss": 2.1268727779388428, "Pretrain/Loss (Raw)": 1.978369116783142, "Pretrain/Step": 1305, "Pretrain/Step Time": 10.626126825809479} +{"Pretrain/Learning Rate": 4.8515138214786335e-05, "Pretrain/Loss": 2.127664089202881, "Pretrain/Loss (Raw)": 2.202563524246216, "Pretrain/Step": 1306, "Pretrain/Step Time": 10.538051532581449} +{"Pretrain/Learning Rate": 4.851225453460209e-05, "Pretrain/Loss": 2.127042293548584, "Pretrain/Loss (Raw)": 2.100062847137451, "Pretrain/Step": 1307, "Pretrain/Step Time": 10.534153498709202} +{"Pretrain/Learning Rate": 4.850936814287386e-05, "Pretrain/Loss": 2.1268179416656494, "Pretrain/Loss (Raw)": 2.0457537174224854, "Pretrain/Step": 1308, "Pretrain/Step Time": 10.565101245418191} +{"Pretrain/Learning Rate": 4.85064790399345e-05, "Pretrain/Loss": 2.1266233921051025, "Pretrain/Loss (Raw)": 2.079110622406006, "Pretrain/Step": 1309, "Pretrain/Step Time": 10.568290334194899} +{"Pretrain/Learning Rate": 4.850358722611723e-05, "Pretrain/Loss": 2.127943754196167, "Pretrain/Loss (Raw)": 2.2338814735412598, "Pretrain/Step": 1310, "Pretrain/Step Time": 10.56280162371695} +{"Pretrain/Learning Rate": 4.850069270175552e-05, "Pretrain/Loss": 2.1290862560272217, "Pretrain/Loss (Raw)": 2.141974925994873, "Pretrain/Step": 1311, "Pretrain/Step Time": 10.567032061517239} +{"Pretrain/Learning Rate": 4.849779546718319e-05, "Pretrain/Loss": 2.128427505493164, "Pretrain/Loss (Raw)": 2.01930832862854, "Pretrain/Step": 1312, "Pretrain/Step Time": 10.614778310060501} +{"Pretrain/Learning Rate": 4.8494895522734364e-05, "Pretrain/Loss": 2.1289730072021484, "Pretrain/Loss (Raw)": 2.26853609085083, "Pretrain/Step": 1313, "Pretrain/Step Time": 10.611950371414423} +{"Pretrain/Learning Rate": 4.849199286874347e-05, "Pretrain/Loss": 2.129971504211426, "Pretrain/Loss (Raw)": 2.1786856651306152, "Pretrain/Step": 1314, "Pretrain/Step Time": 10.604094427078962} +{"Pretrain/Learning Rate": 4.8489087505545266e-05, "Pretrain/Loss": 2.129197120666504, "Pretrain/Loss (Raw)": 2.0708978176116943, "Pretrain/Step": 1315, "Pretrain/Step Time": 10.601561052724719} +{"Pretrain/Learning Rate": 4.84861794334748e-05, "Pretrain/Loss": 2.126715898513794, "Pretrain/Loss (Raw)": 1.9428472518920898, "Pretrain/Step": 1316, "Pretrain/Step Time": 10.649968748912215} +{"Pretrain/Learning Rate": 4.848326865286746e-05, "Pretrain/Loss": 2.1269302368164062, "Pretrain/Loss (Raw)": 2.1105425357818604, "Pretrain/Step": 1317, "Pretrain/Step Time": 10.652048107236624} +{"Pretrain/Learning Rate": 4.848035516405892e-05, "Pretrain/Loss": 2.128833770751953, "Pretrain/Loss (Raw)": 2.2031197547912598, "Pretrain/Step": 1318, "Pretrain/Step Time": 10.616616703569889} +{"Pretrain/Learning Rate": 4.847743896738517e-05, "Pretrain/Loss": 2.1290202140808105, "Pretrain/Loss (Raw)": 2.187880277633667, "Pretrain/Step": 1319, "Pretrain/Step Time": 10.613658292219043} +{"Pretrain/Learning Rate": 4.847452006318254e-05, "Pretrain/Loss": 2.132964611053467, "Pretrain/Loss (Raw)": 2.4436933994293213, "Pretrain/Step": 1320, "Pretrain/Step Time": 10.639726173132658} +{"Pretrain/Learning Rate": 4.8471598451787635e-05, "Pretrain/Loss": 2.1348226070404053, "Pretrain/Loss (Raw)": 2.288050413131714, "Pretrain/Step": 1321, "Pretrain/Step Time": 10.564959656447172} +{"Pretrain/Learning Rate": 4.8468674133537395e-05, "Pretrain/Loss": 2.1346426010131836, "Pretrain/Loss (Raw)": 2.072618246078491, "Pretrain/Step": 1322, "Pretrain/Step Time": 10.592528970912099} +{"Pretrain/Learning Rate": 4.846574710876907e-05, "Pretrain/Loss": 2.135491371154785, "Pretrain/Loss (Raw)": 2.2454922199249268, "Pretrain/Step": 1323, "Pretrain/Step Time": 10.592854937538505} +{"Pretrain/Learning Rate": 4.846281737782021e-05, "Pretrain/Loss": 2.135340690612793, "Pretrain/Loss (Raw)": 2.160781145095825, "Pretrain/Step": 1324, "Pretrain/Step Time": 10.61757287941873} +{"Pretrain/Learning Rate": 4.845988494102869e-05, "Pretrain/Loss": 2.135788679122925, "Pretrain/Loss (Raw)": 2.1096556186676025, "Pretrain/Step": 1325, "Pretrain/Step Time": 10.608988244086504} +{"Pretrain/Learning Rate": 4.845694979873269e-05, "Pretrain/Loss": 2.1350507736206055, "Pretrain/Loss (Raw)": 2.146392345428467, "Pretrain/Step": 1326, "Pretrain/Step Time": 10.66349902562797} +{"Pretrain/Learning Rate": 4.845401195127071e-05, "Pretrain/Loss": 2.133793830871582, "Pretrain/Loss (Raw)": 2.0098347663879395, "Pretrain/Step": 1327, "Pretrain/Step Time": 10.625933995470405} +{"Pretrain/Learning Rate": 4.845107139898155e-05, "Pretrain/Loss": 2.134944438934326, "Pretrain/Loss (Raw)": 2.118647575378418, "Pretrain/Step": 1328, "Pretrain/Step Time": 10.637275844812393} +{"Pretrain/Learning Rate": 4.8448128142204334e-05, "Pretrain/Loss": 2.133875846862793, "Pretrain/Loss (Raw)": 2.089674472808838, "Pretrain/Step": 1329, "Pretrain/Step Time": 10.47872424684465} +{"Pretrain/Learning Rate": 4.8445182181278494e-05, "Pretrain/Loss": 2.1341419219970703, "Pretrain/Loss (Raw)": 2.115043878555298, "Pretrain/Step": 1330, "Pretrain/Step Time": 10.507256688550115} +{"Pretrain/Learning Rate": 4.8442233516543756e-05, "Pretrain/Loss": 2.133828639984131, "Pretrain/Loss (Raw)": 2.0741281509399414, "Pretrain/Step": 1331, "Pretrain/Step Time": 10.50703363865614} +{"Pretrain/Learning Rate": 4.8439282148340195e-05, "Pretrain/Loss": 2.1330368518829346, "Pretrain/Loss (Raw)": 2.0030040740966797, "Pretrain/Step": 1332, "Pretrain/Step Time": 10.522243153303862} +{"Pretrain/Learning Rate": 4.843632807700816e-05, "Pretrain/Loss": 2.13517689704895, "Pretrain/Loss (Raw)": 2.2059671878814697, "Pretrain/Step": 1333, "Pretrain/Step Time": 10.525073168799281} +{"Pretrain/Learning Rate": 4.843337130288834e-05, "Pretrain/Loss": 2.1346240043640137, "Pretrain/Loss (Raw)": 2.093473196029663, "Pretrain/Step": 1334, "Pretrain/Step Time": 10.612967671826482} +{"Pretrain/Learning Rate": 4.843041182632172e-05, "Pretrain/Loss": 2.1356260776519775, "Pretrain/Loss (Raw)": 2.149545431137085, "Pretrain/Step": 1335, "Pretrain/Step Time": 10.608058411628008} +{"Pretrain/Learning Rate": 4.84274496476496e-05, "Pretrain/Loss": 2.1346545219421387, "Pretrain/Loss (Raw)": 2.0751705169677734, "Pretrain/Step": 1336, "Pretrain/Step Time": 10.617246486246586} +{"Pretrain/Learning Rate": 4.84244847672136e-05, "Pretrain/Loss": 2.131314992904663, "Pretrain/Loss (Raw)": 1.7696155309677124, "Pretrain/Step": 1337, "Pretrain/Step Time": 10.617326360195875} +{"Pretrain/Learning Rate": 4.842151718535563e-05, "Pretrain/Loss": 2.1315948963165283, "Pretrain/Loss (Raw)": 2.1785359382629395, "Pretrain/Step": 1338, "Pretrain/Step Time": 10.666007321327925} +{"Pretrain/Learning Rate": 4.841854690241793e-05, "Pretrain/Loss": 2.133244037628174, "Pretrain/Loss (Raw)": 2.1344640254974365, "Pretrain/Step": 1339, "Pretrain/Step Time": 10.606368463486433} +{"Pretrain/Learning Rate": 4.841557391874304e-05, "Pretrain/Loss": 2.1290931701660156, "Pretrain/Loss (Raw)": 2.008854866027832, "Pretrain/Step": 1340, "Pretrain/Step Time": 10.62069328688085} +{"Pretrain/Learning Rate": 4.8412598234673845e-05, "Pretrain/Loss": 2.1286697387695312, "Pretrain/Loss (Raw)": 2.0855472087860107, "Pretrain/Step": 1341, "Pretrain/Step Time": 10.587504960596561} +{"Pretrain/Learning Rate": 4.840961985055349e-05, "Pretrain/Loss": 2.1280245780944824, "Pretrain/Loss (Raw)": 2.0445332527160645, "Pretrain/Step": 1342, "Pretrain/Step Time": 10.60116896405816} +{"Pretrain/Learning Rate": 4.8406638766725464e-05, "Pretrain/Loss": 2.1284289360046387, "Pretrain/Loss (Raw)": 2.0767548084259033, "Pretrain/Step": 1343, "Pretrain/Step Time": 10.591668920591474} +{"Pretrain/Learning Rate": 4.840365498353357e-05, "Pretrain/Loss": 2.129128932952881, "Pretrain/Loss (Raw)": 2.2511751651763916, "Pretrain/Step": 1344, "Pretrain/Step Time": 10.569624781608582} +{"Pretrain/Learning Rate": 4.840066850132189e-05, "Pretrain/Loss": 2.1271488666534424, "Pretrain/Loss (Raw)": 2.0619068145751953, "Pretrain/Step": 1345, "Pretrain/Step Time": 10.571552835404873} +{"Pretrain/Learning Rate": 4.839767932043485e-05, "Pretrain/Loss": 2.1277122497558594, "Pretrain/Loss (Raw)": 2.2085561752319336, "Pretrain/Step": 1346, "Pretrain/Step Time": 10.552391475066543} +{"Pretrain/Learning Rate": 4.839468744121718e-05, "Pretrain/Loss": 2.128864049911499, "Pretrain/Loss (Raw)": 2.2534797191619873, "Pretrain/Step": 1347, "Pretrain/Step Time": 10.543702172115445} +{"Pretrain/Learning Rate": 4.8391692864013916e-05, "Pretrain/Loss": 2.127857208251953, "Pretrain/Loss (Raw)": 2.1833789348602295, "Pretrain/Step": 1348, "Pretrain/Step Time": 10.578883718699217} +{"Pretrain/Learning Rate": 4.838869558917041e-05, "Pretrain/Loss": 2.127683639526367, "Pretrain/Loss (Raw)": 2.0518126487731934, "Pretrain/Step": 1349, "Pretrain/Step Time": 10.58879311196506} +{"Pretrain/Learning Rate": 4.838569561703231e-05, "Pretrain/Loss": 2.127537250518799, "Pretrain/Loss (Raw)": 2.1249241828918457, "Pretrain/Step": 1350, "Pretrain/Step Time": 10.573996322229505} +{"Pretrain/Learning Rate": 4.83826929479456e-05, "Pretrain/Loss": 2.1262593269348145, "Pretrain/Loss (Raw)": 2.0013749599456787, "Pretrain/Step": 1351, "Pretrain/Step Time": 10.579024216160178} +{"Pretrain/Learning Rate": 4.837968758225655e-05, "Pretrain/Loss": 2.122553825378418, "Pretrain/Loss (Raw)": 2.0983450412750244, "Pretrain/Step": 1352, "Pretrain/Step Time": 10.578563777729869} +{"Pretrain/Learning Rate": 4.837667952031176e-05, "Pretrain/Loss": 2.123551607131958, "Pretrain/Loss (Raw)": 2.237565517425537, "Pretrain/Step": 1353, "Pretrain/Step Time": 10.584015354514122} +{"Pretrain/Learning Rate": 4.8373668762458144e-05, "Pretrain/Loss": 2.123013973236084, "Pretrain/Loss (Raw)": 2.0055181980133057, "Pretrain/Step": 1354, "Pretrain/Step Time": 10.541470177471638} +{"Pretrain/Learning Rate": 4.8370655309042896e-05, "Pretrain/Loss": 2.124119997024536, "Pretrain/Loss (Raw)": 2.1876816749572754, "Pretrain/Step": 1355, "Pretrain/Step Time": 10.535302734002471} +{"Pretrain/Learning Rate": 4.8367639160413553e-05, "Pretrain/Loss": 2.1246531009674072, "Pretrain/Loss (Raw)": 2.253450870513916, "Pretrain/Step": 1356, "Pretrain/Step Time": 10.530720112845302} +{"Pretrain/Learning Rate": 4.8364620316917956e-05, "Pretrain/Loss": 2.124795436859131, "Pretrain/Loss (Raw)": 2.251950979232788, "Pretrain/Step": 1357, "Pretrain/Step Time": 10.542212933301926} +{"Pretrain/Learning Rate": 4.836159877890424e-05, "Pretrain/Loss": 2.1276469230651855, "Pretrain/Loss (Raw)": 2.2909798622131348, "Pretrain/Step": 1358, "Pretrain/Step Time": 10.53266822360456} +{"Pretrain/Learning Rate": 4.835857454672087e-05, "Pretrain/Loss": 2.1276938915252686, "Pretrain/Loss (Raw)": 2.1386756896972656, "Pretrain/Step": 1359, "Pretrain/Step Time": 10.537014776840806} +{"Pretrain/Learning Rate": 4.835554762071661e-05, "Pretrain/Loss": 2.122267961502075, "Pretrain/Loss (Raw)": 1.4295732975006104, "Pretrain/Step": 1360, "Pretrain/Step Time": 10.52032002992928} +{"Pretrain/Learning Rate": 4.8352518001240555e-05, "Pretrain/Loss": 2.123784065246582, "Pretrain/Loss (Raw)": 2.292644500732422, "Pretrain/Step": 1361, "Pretrain/Step Time": 10.559486635029316} +{"Pretrain/Learning Rate": 4.834948568864207e-05, "Pretrain/Loss": 2.1236696243286133, "Pretrain/Loss (Raw)": 1.9584180116653442, "Pretrain/Step": 1362, "Pretrain/Step Time": 10.53359255939722} +{"Pretrain/Learning Rate": 4.8346450683270875e-05, "Pretrain/Loss": 2.122363567352295, "Pretrain/Loss (Raw)": 1.9739961624145508, "Pretrain/Step": 1363, "Pretrain/Step Time": 10.547314817085862} +{"Pretrain/Learning Rate": 4.8343412985476974e-05, "Pretrain/Loss": 2.1237292289733887, "Pretrain/Loss (Raw)": 2.1948983669281006, "Pretrain/Step": 1364, "Pretrain/Step Time": 10.483929695561528} +{"Pretrain/Learning Rate": 4.83403725956107e-05, "Pretrain/Loss": 2.1223974227905273, "Pretrain/Loss (Raw)": 2.0021817684173584, "Pretrain/Step": 1365, "Pretrain/Step Time": 10.488546939566731} +{"Pretrain/Learning Rate": 4.8337329514022664e-05, "Pretrain/Loss": 2.121875047683716, "Pretrain/Loss (Raw)": 1.9806946516036987, "Pretrain/Step": 1366, "Pretrain/Step Time": 10.492925239726901} +{"Pretrain/Learning Rate": 4.833428374106382e-05, "Pretrain/Loss": 2.121890068054199, "Pretrain/Loss (Raw)": 2.0466599464416504, "Pretrain/Step": 1367, "Pretrain/Step Time": 10.518737295642495} +{"Pretrain/Learning Rate": 4.833123527708542e-05, "Pretrain/Loss": 2.1221530437469482, "Pretrain/Loss (Raw)": 2.163968324661255, "Pretrain/Step": 1368, "Pretrain/Step Time": 10.552567472681403} +{"Pretrain/Learning Rate": 4.832818412243904e-05, "Pretrain/Loss": 2.121880531311035, "Pretrain/Loss (Raw)": 2.112144708633423, "Pretrain/Step": 1369, "Pretrain/Step Time": 10.512272344902158} +{"Pretrain/Learning Rate": 4.8325130277476526e-05, "Pretrain/Loss": 2.1217598915100098, "Pretrain/Loss (Raw)": 2.237863302230835, "Pretrain/Step": 1370, "Pretrain/Step Time": 10.469577489420772} +{"Pretrain/Learning Rate": 4.832207374255008e-05, "Pretrain/Loss": 2.122753381729126, "Pretrain/Loss (Raw)": 2.1940419673919678, "Pretrain/Step": 1371, "Pretrain/Step Time": 10.442438691854477} +{"Pretrain/Learning Rate": 4.8319014518012195e-05, "Pretrain/Loss": 2.122000217437744, "Pretrain/Loss (Raw)": 2.041187286376953, "Pretrain/Step": 1372, "Pretrain/Step Time": 10.373260838910937} +{"Pretrain/Learning Rate": 4.831595260421567e-05, "Pretrain/Loss": 2.1231093406677246, "Pretrain/Loss (Raw)": 2.188929319381714, "Pretrain/Step": 1373, "Pretrain/Step Time": 10.378312991932034} +{"Pretrain/Learning Rate": 4.8312888001513624e-05, "Pretrain/Loss": 2.1228294372558594, "Pretrain/Loss (Raw)": 2.2180819511413574, "Pretrain/Step": 1374, "Pretrain/Step Time": 10.346015512943268} +{"Pretrain/Learning Rate": 4.830982071025948e-05, "Pretrain/Loss": 2.121455192565918, "Pretrain/Loss (Raw)": 1.9828436374664307, "Pretrain/Step": 1375, "Pretrain/Step Time": 10.348350759595633} +{"Pretrain/Learning Rate": 4.830675073080697e-05, "Pretrain/Loss": 2.118518352508545, "Pretrain/Loss (Raw)": 1.7144566774368286, "Pretrain/Step": 1376, "Pretrain/Step Time": 10.370335379615426} +{"Pretrain/Learning Rate": 4.830367806351015e-05, "Pretrain/Loss": 2.117777109146118, "Pretrain/Loss (Raw)": 2.0052101612091064, "Pretrain/Step": 1377, "Pretrain/Step Time": 10.363660883158445} +{"Pretrain/Learning Rate": 4.830060270872335e-05, "Pretrain/Loss": 2.119962692260742, "Pretrain/Loss (Raw)": 2.0367720127105713, "Pretrain/Step": 1378, "Pretrain/Step Time": 10.33200266957283} +{"Pretrain/Learning Rate": 4.8297524666801265e-05, "Pretrain/Loss": 2.1188058853149414, "Pretrain/Loss (Raw)": 1.8720992803573608, "Pretrain/Step": 1379, "Pretrain/Step Time": 10.33414783142507} +{"Pretrain/Learning Rate": 4.829444393809884e-05, "Pretrain/Loss": 2.117441415786743, "Pretrain/Loss (Raw)": 2.1636526584625244, "Pretrain/Step": 1380, "Pretrain/Step Time": 10.368441676720977} +{"Pretrain/Learning Rate": 4.829136052297138e-05, "Pretrain/Loss": 2.1170334815979004, "Pretrain/Loss (Raw)": 2.1867940425872803, "Pretrain/Step": 1381, "Pretrain/Step Time": 10.370901264250278} +{"Pretrain/Learning Rate": 4.828827442177447e-05, "Pretrain/Loss": 2.118454933166504, "Pretrain/Loss (Raw)": 2.333014965057373, "Pretrain/Step": 1382, "Pretrain/Step Time": 10.376899493858218} +{"Pretrain/Learning Rate": 4.8285185634864024e-05, "Pretrain/Loss": 2.117647409439087, "Pretrain/Loss (Raw)": 1.8185230493545532, "Pretrain/Step": 1383, "Pretrain/Step Time": 10.366846598684788} +{"Pretrain/Learning Rate": 4.8282094162596235e-05, "Pretrain/Loss": 2.1172425746917725, "Pretrain/Loss (Raw)": 2.04114031791687, "Pretrain/Step": 1384, "Pretrain/Step Time": 10.360137522220612} +{"Pretrain/Learning Rate": 4.8279000005327644e-05, "Pretrain/Loss": 2.1175498962402344, "Pretrain/Loss (Raw)": 2.0869884490966797, "Pretrain/Step": 1385, "Pretrain/Step Time": 10.375893732532859} +{"Pretrain/Learning Rate": 4.827590316341508e-05, "Pretrain/Loss": 2.117117166519165, "Pretrain/Loss (Raw)": 2.0691921710968018, "Pretrain/Step": 1386, "Pretrain/Step Time": 10.375127485021949} +{"Pretrain/Learning Rate": 4.827280363721568e-05, "Pretrain/Loss": 2.1162607669830322, "Pretrain/Loss (Raw)": 2.086343765258789, "Pretrain/Step": 1387, "Pretrain/Step Time": 10.394932996481657} +{"Pretrain/Learning Rate": 4.82697014270869e-05, "Pretrain/Loss": 2.1164865493774414, "Pretrain/Loss (Raw)": 2.0828728675842285, "Pretrain/Step": 1388, "Pretrain/Step Time": 10.380698166787624} +{"Pretrain/Learning Rate": 4.8266596533386505e-05, "Pretrain/Loss": 2.116072177886963, "Pretrain/Loss (Raw)": 2.0607385635375977, "Pretrain/Step": 1389, "Pretrain/Step Time": 10.326519103720784} +{"Pretrain/Learning Rate": 4.8263488956472555e-05, "Pretrain/Loss": 2.112490653991699, "Pretrain/Loss (Raw)": 1.8963453769683838, "Pretrain/Step": 1390, "Pretrain/Step Time": 10.3317657597363} +{"Pretrain/Learning Rate": 4.826037869670345e-05, "Pretrain/Loss": 2.1115617752075195, "Pretrain/Loss (Raw)": 2.1798946857452393, "Pretrain/Step": 1391, "Pretrain/Step Time": 10.353123713284731} +{"Pretrain/Learning Rate": 4.8257265754437854e-05, "Pretrain/Loss": 2.111135721206665, "Pretrain/Loss (Raw)": 2.086559772491455, "Pretrain/Step": 1392, "Pretrain/Step Time": 10.354659920558333} +{"Pretrain/Learning Rate": 4.825415013003478e-05, "Pretrain/Loss": 2.111382007598877, "Pretrain/Loss (Raw)": 2.0628042221069336, "Pretrain/Step": 1393, "Pretrain/Step Time": 10.327834179624915} +{"Pretrain/Learning Rate": 4.8251031823853546e-05, "Pretrain/Loss": 2.11099910736084, "Pretrain/Loss (Raw)": 2.06847882270813, "Pretrain/Step": 1394, "Pretrain/Step Time": 10.334607454016805} +{"Pretrain/Learning Rate": 4.824791083625375e-05, "Pretrain/Loss": 2.1135036945343018, "Pretrain/Loss (Raw)": 2.1118288040161133, "Pretrain/Step": 1395, "Pretrain/Step Time": 10.25351920351386} +{"Pretrain/Learning Rate": 4.8244787167595335e-05, "Pretrain/Loss": 2.1135692596435547, "Pretrain/Loss (Raw)": 2.2084434032440186, "Pretrain/Step": 1396, "Pretrain/Step Time": 10.255825011059642} +{"Pretrain/Learning Rate": 4.824166081823853e-05, "Pretrain/Loss": 2.1122958660125732, "Pretrain/Loss (Raw)": 1.9546648263931274, "Pretrain/Step": 1397, "Pretrain/Step Time": 10.252791678532958} +{"Pretrain/Learning Rate": 4.823853178854387e-05, "Pretrain/Loss": 2.1141042709350586, "Pretrain/Loss (Raw)": 2.2504613399505615, "Pretrain/Step": 1398, "Pretrain/Step Time": 10.249459441751242} +{"Pretrain/Learning Rate": 4.8235400078872234e-05, "Pretrain/Loss": 2.113654136657715, "Pretrain/Loss (Raw)": 2.028233051300049, "Pretrain/Step": 1399, "Pretrain/Step Time": 10.218354128301144} +{"Pretrain/Learning Rate": 4.823226568958477e-05, "Pretrain/Loss": 2.1149253845214844, "Pretrain/Loss (Raw)": 2.281153440475464, "Pretrain/Step": 1400, "Pretrain/Step Time": 10.224640354514122} +{"Pretrain/Learning Rate": 4.822912862104295e-05, "Pretrain/Loss": 2.113032341003418, "Pretrain/Loss (Raw)": 1.913846731185913, "Pretrain/Step": 1401, "Pretrain/Step Time": 10.21426410600543} +{"Pretrain/Learning Rate": 4.8225988873608554e-05, "Pretrain/Loss": 2.111855983734131, "Pretrain/Loss (Raw)": 2.0622754096984863, "Pretrain/Step": 1402, "Pretrain/Step Time": 10.247064288705587} +{"Pretrain/Learning Rate": 4.8222846447643686e-05, "Pretrain/Loss": 2.1107020378112793, "Pretrain/Loss (Raw)": 2.1733524799346924, "Pretrain/Step": 1403, "Pretrain/Step Time": 10.21627608127892} +{"Pretrain/Learning Rate": 4.8219701343510727e-05, "Pretrain/Loss": 2.108955144882202, "Pretrain/Loss (Raw)": 2.0238893032073975, "Pretrain/Step": 1404, "Pretrain/Step Time": 10.221076481044292} +{"Pretrain/Learning Rate": 4.8216553561572395e-05, "Pretrain/Loss": 2.108466148376465, "Pretrain/Loss (Raw)": 2.140474796295166, "Pretrain/Step": 1405, "Pretrain/Step Time": 10.173552358523011} +{"Pretrain/Learning Rate": 4.821340310219171e-05, "Pretrain/Loss": 2.1061482429504395, "Pretrain/Loss (Raw)": 1.8751463890075684, "Pretrain/Step": 1406, "Pretrain/Step Time": 10.18262036703527} +{"Pretrain/Learning Rate": 4.8210249965732e-05, "Pretrain/Loss": 2.1053099632263184, "Pretrain/Loss (Raw)": 2.3276360034942627, "Pretrain/Step": 1407, "Pretrain/Step Time": 10.166725801303983} +{"Pretrain/Learning Rate": 4.8207094152556886e-05, "Pretrain/Loss": 2.1030828952789307, "Pretrain/Loss (Raw)": 2.1101293563842773, "Pretrain/Step": 1408, "Pretrain/Step Time": 10.166604405269027} +{"Pretrain/Learning Rate": 4.820393566303032e-05, "Pretrain/Loss": 2.106718063354492, "Pretrain/Loss (Raw)": 2.079432964324951, "Pretrain/Step": 1409, "Pretrain/Step Time": 10.184065910056233} +{"Pretrain/Learning Rate": 4.8200774497516555e-05, "Pretrain/Loss": 2.1084423065185547, "Pretrain/Loss (Raw)": 2.1069376468658447, "Pretrain/Step": 1410, "Pretrain/Step Time": 10.151251297444105} +{"Pretrain/Learning Rate": 4.8197610656380144e-05, "Pretrain/Loss": 2.1057515144348145, "Pretrain/Loss (Raw)": 1.9599361419677734, "Pretrain/Step": 1411, "Pretrain/Step Time": 10.175139877945185} +{"Pretrain/Learning Rate": 4.8194444139985965e-05, "Pretrain/Loss": 2.106694221496582, "Pretrain/Loss (Raw)": 2.1703431606292725, "Pretrain/Step": 1412, "Pretrain/Step Time": 10.171726891770959} +{"Pretrain/Learning Rate": 4.81912749486992e-05, "Pretrain/Loss": 2.1095285415649414, "Pretrain/Loss (Raw)": 2.548496723175049, "Pretrain/Step": 1413, "Pretrain/Step Time": 10.175829140469432} +{"Pretrain/Learning Rate": 4.818810308288531e-05, "Pretrain/Loss": 2.1095619201660156, "Pretrain/Loss (Raw)": 2.236126661300659, "Pretrain/Step": 1414, "Pretrain/Step Time": 10.195777863264084} +{"Pretrain/Learning Rate": 4.818492854291012e-05, "Pretrain/Loss": 2.108616828918457, "Pretrain/Loss (Raw)": 2.181117057800293, "Pretrain/Step": 1415, "Pretrain/Step Time": 10.22825494222343} +{"Pretrain/Learning Rate": 4.818175132913971e-05, "Pretrain/Loss": 2.106779098510742, "Pretrain/Loss (Raw)": 2.001967668533325, "Pretrain/Step": 1416, "Pretrain/Step Time": 10.214059680700302} +{"Pretrain/Learning Rate": 4.817857144194051e-05, "Pretrain/Loss": 2.1046149730682373, "Pretrain/Loss (Raw)": 1.9147294759750366, "Pretrain/Step": 1417, "Pretrain/Step Time": 10.17937825806439} +{"Pretrain/Learning Rate": 4.817538888167923e-05, "Pretrain/Loss": 2.1059587001800537, "Pretrain/Loss (Raw)": 2.202397108078003, "Pretrain/Step": 1418, "Pretrain/Step Time": 10.180879471823573} +{"Pretrain/Learning Rate": 4.817220364872289e-05, "Pretrain/Loss": 2.105480194091797, "Pretrain/Loss (Raw)": 2.142932415008545, "Pretrain/Step": 1419, "Pretrain/Step Time": 10.181709442287683} +{"Pretrain/Learning Rate": 4.816901574343884e-05, "Pretrain/Loss": 2.1054067611694336, "Pretrain/Loss (Raw)": 2.1356053352355957, "Pretrain/Step": 1420, "Pretrain/Step Time": 10.189251182600856} +{"Pretrain/Learning Rate": 4.816582516619471e-05, "Pretrain/Loss": 2.104567050933838, "Pretrain/Loss (Raw)": 2.0262482166290283, "Pretrain/Step": 1421, "Pretrain/Step Time": 10.193407341837883} +{"Pretrain/Learning Rate": 4.816263191735847e-05, "Pretrain/Loss": 2.105231523513794, "Pretrain/Loss (Raw)": 2.0594937801361084, "Pretrain/Step": 1422, "Pretrain/Step Time": 10.201370129361749} +{"Pretrain/Learning Rate": 4.8159435997298375e-05, "Pretrain/Loss": 2.105564594268799, "Pretrain/Loss (Raw)": 1.8722286224365234, "Pretrain/Step": 1423, "Pretrain/Step Time": 10.194420509040356} +{"Pretrain/Learning Rate": 4.8156237406382975e-05, "Pretrain/Loss": 2.1061549186706543, "Pretrain/Loss (Raw)": 2.092808961868286, "Pretrain/Step": 1424, "Pretrain/Step Time": 10.19520597718656} +{"Pretrain/Learning Rate": 4.815303614498118e-05, "Pretrain/Loss": 2.1063427925109863, "Pretrain/Loss (Raw)": 2.1212892532348633, "Pretrain/Step": 1425, "Pretrain/Step Time": 10.195243317633867} +{"Pretrain/Learning Rate": 4.814983221346214e-05, "Pretrain/Loss": 2.1060428619384766, "Pretrain/Loss (Raw)": 2.1925570964813232, "Pretrain/Step": 1426, "Pretrain/Step Time": 10.181880509480834} +{"Pretrain/Learning Rate": 4.814662561219537e-05, "Pretrain/Loss": 2.10652494430542, "Pretrain/Loss (Raw)": 2.160909414291382, "Pretrain/Step": 1427, "Pretrain/Step Time": 10.170625351369381} +{"Pretrain/Learning Rate": 4.814341634155066e-05, "Pretrain/Loss": 2.1059651374816895, "Pretrain/Loss (Raw)": 2.1525986194610596, "Pretrain/Step": 1428, "Pretrain/Step Time": 10.144310371950269} +{"Pretrain/Learning Rate": 4.8140204401898134e-05, "Pretrain/Loss": 2.1038875579833984, "Pretrain/Loss (Raw)": 1.908189058303833, "Pretrain/Step": 1429, "Pretrain/Step Time": 10.162603411823511} +{"Pretrain/Learning Rate": 4.813698979360819e-05, "Pretrain/Loss": 2.102898120880127, "Pretrain/Loss (Raw)": 2.108717918395996, "Pretrain/Step": 1430, "Pretrain/Step Time": 10.117511978372931} +{"Pretrain/Learning Rate": 4.813377251705156e-05, "Pretrain/Loss": 2.1024043560028076, "Pretrain/Loss (Raw)": 2.2050940990448, "Pretrain/Step": 1431, "Pretrain/Step Time": 10.130597529932857} +{"Pretrain/Learning Rate": 4.8130552572599265e-05, "Pretrain/Loss": 2.1022047996520996, "Pretrain/Loss (Raw)": 2.1067216396331787, "Pretrain/Step": 1432, "Pretrain/Step Time": 10.141609391197562} +{"Pretrain/Learning Rate": 4.8127329960622656e-05, "Pretrain/Loss": 2.102351665496826, "Pretrain/Loss (Raw)": 1.9971486330032349, "Pretrain/Step": 1433, "Pretrain/Step Time": 10.13963207602501} +{"Pretrain/Learning Rate": 4.8124104681493375e-05, "Pretrain/Loss": 2.101017951965332, "Pretrain/Loss (Raw)": 2.0318899154663086, "Pretrain/Step": 1434, "Pretrain/Step Time": 10.139053413644433} +{"Pretrain/Learning Rate": 4.8120876735583384e-05, "Pretrain/Loss": 2.1003825664520264, "Pretrain/Loss (Raw)": 2.0186994075775146, "Pretrain/Step": 1435, "Pretrain/Step Time": 10.152508109807968} +{"Pretrain/Learning Rate": 4.811764612326493e-05, "Pretrain/Loss": 2.1020712852478027, "Pretrain/Loss (Raw)": 2.2619004249572754, "Pretrain/Step": 1436, "Pretrain/Step Time": 10.140834648162127} +{"Pretrain/Learning Rate": 4.8114412844910595e-05, "Pretrain/Loss": 2.1027560234069824, "Pretrain/Loss (Raw)": 2.166750431060791, "Pretrain/Step": 1437, "Pretrain/Step Time": 10.138051584362984} +{"Pretrain/Learning Rate": 4.8111176900893254e-05, "Pretrain/Loss": 2.1023473739624023, "Pretrain/Loss (Raw)": 2.1816177368164062, "Pretrain/Step": 1438, "Pretrain/Step Time": 10.121468482539058} +{"Pretrain/Learning Rate": 4.810793829158609e-05, "Pretrain/Loss": 2.100813388824463, "Pretrain/Loss (Raw)": 1.9455878734588623, "Pretrain/Step": 1439, "Pretrain/Step Time": 10.128617132082582} +{"Pretrain/Learning Rate": 4.8104697017362595e-05, "Pretrain/Loss": 2.1025257110595703, "Pretrain/Loss (Raw)": 2.2385165691375732, "Pretrain/Step": 1440, "Pretrain/Step Time": 10.08496716991067} +{"Pretrain/Learning Rate": 4.8101453078596565e-05, "Pretrain/Loss": 2.1020514965057373, "Pretrain/Loss (Raw)": 2.2078146934509277, "Pretrain/Step": 1441, "Pretrain/Step Time": 10.082663597539067} +{"Pretrain/Learning Rate": 4.809820647566211e-05, "Pretrain/Loss": 2.1017978191375732, "Pretrain/Loss (Raw)": 2.1462514400482178, "Pretrain/Step": 1442, "Pretrain/Step Time": 10.071994522586465} +{"Pretrain/Learning Rate": 4.8094957208933635e-05, "Pretrain/Loss": 2.1034059524536133, "Pretrain/Loss (Raw)": 2.276721954345703, "Pretrain/Step": 1443, "Pretrain/Step Time": 10.078432008624077} +{"Pretrain/Learning Rate": 4.809170527878587e-05, "Pretrain/Loss": 2.1043834686279297, "Pretrain/Loss (Raw)": 2.0679547786712646, "Pretrain/Step": 1444, "Pretrain/Step Time": 10.030164118856192} +{"Pretrain/Learning Rate": 4.808845068559384e-05, "Pretrain/Loss": 2.106139659881592, "Pretrain/Loss (Raw)": 2.335315465927124, "Pretrain/Step": 1445, "Pretrain/Step Time": 10.031966080889106} +{"Pretrain/Learning Rate": 4.808519342973289e-05, "Pretrain/Loss": 2.105794906616211, "Pretrain/Loss (Raw)": 2.1590192317962646, "Pretrain/Step": 1446, "Pretrain/Step Time": 10.06926904246211} +{"Pretrain/Learning Rate": 4.808193351157865e-05, "Pretrain/Loss": 2.1084823608398438, "Pretrain/Loss (Raw)": 2.5318522453308105, "Pretrain/Step": 1447, "Pretrain/Step Time": 10.068108705803752} +{"Pretrain/Learning Rate": 4.8078670931507064e-05, "Pretrain/Loss": 2.105494499206543, "Pretrain/Loss (Raw)": 2.0612549781799316, "Pretrain/Step": 1448, "Pretrain/Step Time": 10.019351800903678} +{"Pretrain/Learning Rate": 4.80754056898944e-05, "Pretrain/Loss": 2.105672597885132, "Pretrain/Loss (Raw)": 2.3108599185943604, "Pretrain/Step": 1449, "Pretrain/Step Time": 10.019237224012613} +{"Pretrain/Learning Rate": 4.807213778711722e-05, "Pretrain/Loss": 2.1072044372558594, "Pretrain/Loss (Raw)": 2.268693447113037, "Pretrain/Step": 1450, "Pretrain/Step Time": 9.99059029109776} +{"Pretrain/Learning Rate": 4.8068867223552384e-05, "Pretrain/Loss": 2.106309652328491, "Pretrain/Loss (Raw)": 2.1309611797332764, "Pretrain/Step": 1451, "Pretrain/Step Time": 10.004512470215559} +{"Pretrain/Learning Rate": 4.8065593999577086e-05, "Pretrain/Loss": 2.105006217956543, "Pretrain/Loss (Raw)": 1.9939355850219727, "Pretrain/Step": 1452, "Pretrain/Step Time": 9.978130461648107} +{"Pretrain/Learning Rate": 4.806231811556879e-05, "Pretrain/Loss": 2.1047496795654297, "Pretrain/Loss (Raw)": 2.0767993927001953, "Pretrain/Step": 1453, "Pretrain/Step Time": 9.979289768263698} +{"Pretrain/Learning Rate": 4.80590395719053e-05, "Pretrain/Loss": 2.1048388481140137, "Pretrain/Loss (Raw)": 2.157839775085449, "Pretrain/Step": 1454, "Pretrain/Step Time": 9.959805835038424} +{"Pretrain/Learning Rate": 4.805575836896471e-05, "Pretrain/Loss": 2.1060311794281006, "Pretrain/Loss (Raw)": 2.162444591522217, "Pretrain/Step": 1455, "Pretrain/Step Time": 9.96140960790217} +{"Pretrain/Learning Rate": 4.805247450712542e-05, "Pretrain/Loss": 2.1063737869262695, "Pretrain/Loss (Raw)": 2.1625118255615234, "Pretrain/Step": 1456, "Pretrain/Step Time": 9.948766775429249} +{"Pretrain/Learning Rate": 4.804918798676614e-05, "Pretrain/Loss": 2.105257987976074, "Pretrain/Loss (Raw)": 1.9468365907669067, "Pretrain/Step": 1457, "Pretrain/Step Time": 9.957041658461094} +{"Pretrain/Learning Rate": 4.804589880826589e-05, "Pretrain/Loss": 2.1053872108459473, "Pretrain/Loss (Raw)": 2.131582260131836, "Pretrain/Step": 1458, "Pretrain/Step Time": 9.924986889585853} +{"Pretrain/Learning Rate": 4.8042606972004e-05, "Pretrain/Loss": 2.103773593902588, "Pretrain/Loss (Raw)": 1.8676095008850098, "Pretrain/Step": 1459, "Pretrain/Step Time": 9.930986428633332} +{"Pretrain/Learning Rate": 4.803931247836009e-05, "Pretrain/Loss": 2.1042184829711914, "Pretrain/Loss (Raw)": 2.059932231903076, "Pretrain/Step": 1460, "Pretrain/Step Time": 9.92242949269712} +{"Pretrain/Learning Rate": 4.80360153277141e-05, "Pretrain/Loss": 2.1026244163513184, "Pretrain/Loss (Raw)": 2.001924753189087, "Pretrain/Step": 1461, "Pretrain/Step Time": 9.918246250599623} +{"Pretrain/Learning Rate": 4.8032715520446275e-05, "Pretrain/Loss": 2.103544235229492, "Pretrain/Loss (Raw)": 2.211223840713501, "Pretrain/Step": 1462, "Pretrain/Step Time": 9.859185652807355} +{"Pretrain/Learning Rate": 4.802941305693716e-05, "Pretrain/Loss": 2.1044366359710693, "Pretrain/Loss (Raw)": 2.2637715339660645, "Pretrain/Step": 1463, "Pretrain/Step Time": 9.8624711856246} +{"Pretrain/Learning Rate": 4.802610793756761e-05, "Pretrain/Loss": 2.1016268730163574, "Pretrain/Loss (Raw)": 1.7155121564865112, "Pretrain/Step": 1464, "Pretrain/Step Time": 9.89228005707264} +{"Pretrain/Learning Rate": 4.8022800162718794e-05, "Pretrain/Loss": 2.1041574478149414, "Pretrain/Loss (Raw)": 2.0935146808624268, "Pretrain/Step": 1465, "Pretrain/Step Time": 9.894215665757656} +{"Pretrain/Learning Rate": 4.801948973277218e-05, "Pretrain/Loss": 2.098522424697876, "Pretrain/Loss (Raw)": 1.4572560787200928, "Pretrain/Step": 1466, "Pretrain/Step Time": 9.846243964508176} +{"Pretrain/Learning Rate": 4.8016176648109534e-05, "Pretrain/Loss": 2.098318099975586, "Pretrain/Loss (Raw)": 2.108318567276001, "Pretrain/Step": 1467, "Pretrain/Step Time": 9.84595056809485} +{"Pretrain/Learning Rate": 4.801286090911295e-05, "Pretrain/Loss": 2.098942756652832, "Pretrain/Loss (Raw)": 2.0887956619262695, "Pretrain/Step": 1468, "Pretrain/Step Time": 9.837931610643864} +{"Pretrain/Learning Rate": 4.80095425161648e-05, "Pretrain/Loss": 2.0983200073242188, "Pretrain/Loss (Raw)": 2.0058326721191406, "Pretrain/Step": 1469, "Pretrain/Step Time": 9.832370691001415} +{"Pretrain/Learning Rate": 4.800622146964777e-05, "Pretrain/Loss": 2.0986275672912598, "Pretrain/Loss (Raw)": 2.083916425704956, "Pretrain/Step": 1470, "Pretrain/Step Time": 9.829064210876822} +{"Pretrain/Learning Rate": 4.8002897769944885e-05, "Pretrain/Loss": 2.099616050720215, "Pretrain/Loss (Raw)": 2.203284740447998, "Pretrain/Step": 1471, "Pretrain/Step Time": 9.826830038800836} +{"Pretrain/Learning Rate": 4.799957141743944e-05, "Pretrain/Loss": 2.097208023071289, "Pretrain/Loss (Raw)": 1.942932367324829, "Pretrain/Step": 1472, "Pretrain/Step Time": 9.822115257382393} +{"Pretrain/Learning Rate": 4.799624241251502e-05, "Pretrain/Loss": 2.098098039627075, "Pretrain/Loss (Raw)": 2.175849199295044, "Pretrain/Step": 1473, "Pretrain/Step Time": 9.819551829248667} +{"Pretrain/Learning Rate": 4.7992910755555584e-05, "Pretrain/Loss": 2.0989174842834473, "Pretrain/Loss (Raw)": 2.313462734222412, "Pretrain/Step": 1474, "Pretrain/Step Time": 9.820564713329077} +{"Pretrain/Learning Rate": 4.798957644694533e-05, "Pretrain/Loss": 2.098278284072876, "Pretrain/Loss (Raw)": 2.1716487407684326, "Pretrain/Step": 1475, "Pretrain/Step Time": 9.827917590737343} +{"Pretrain/Learning Rate": 4.7986239487068785e-05, "Pretrain/Loss": 2.097381591796875, "Pretrain/Loss (Raw)": 2.068596124649048, "Pretrain/Step": 1476, "Pretrain/Step Time": 9.79046586714685} +{"Pretrain/Learning Rate": 4.798289987631079e-05, "Pretrain/Loss": 2.0990796089172363, "Pretrain/Loss (Raw)": 2.269148111343384, "Pretrain/Step": 1477, "Pretrain/Step Time": 9.773121885955334} +{"Pretrain/Learning Rate": 4.797955761505648e-05, "Pretrain/Loss": 2.0983238220214844, "Pretrain/Loss (Raw)": 2.0281710624694824, "Pretrain/Step": 1478, "Pretrain/Step Time": 9.763896856456995} +{"Pretrain/Learning Rate": 4.7976212703691306e-05, "Pretrain/Loss": 2.09794282913208, "Pretrain/Loss (Raw)": 1.9526212215423584, "Pretrain/Step": 1479, "Pretrain/Step Time": 9.75141055881977} +{"Pretrain/Learning Rate": 4.797286514260101e-05, "Pretrain/Loss": 2.0968177318573, "Pretrain/Loss (Raw)": 1.9543464183807373, "Pretrain/Step": 1480, "Pretrain/Step Time": 9.75082828477025} +{"Pretrain/Learning Rate": 4.7969514932171665e-05, "Pretrain/Loss": 2.095421314239502, "Pretrain/Loss (Raw)": 2.058824300765991, "Pretrain/Step": 1481, "Pretrain/Step Time": 9.738101780414581} +{"Pretrain/Learning Rate": 4.796616207278961e-05, "Pretrain/Loss": 2.0974979400634766, "Pretrain/Loss (Raw)": 2.2713308334350586, "Pretrain/Step": 1482, "Pretrain/Step Time": 9.739534178748727} +{"Pretrain/Learning Rate": 4.796280656484153e-05, "Pretrain/Loss": 2.09649395942688, "Pretrain/Loss (Raw)": 2.0591506958007812, "Pretrain/Step": 1483, "Pretrain/Step Time": 9.730285722762346} +{"Pretrain/Learning Rate": 4.795944840871439e-05, "Pretrain/Loss": 2.094353199005127, "Pretrain/Loss (Raw)": 1.979425072669983, "Pretrain/Step": 1484, "Pretrain/Step Time": 9.744268158450723} +{"Pretrain/Learning Rate": 4.7956087604795474e-05, "Pretrain/Loss": 2.093228816986084, "Pretrain/Loss (Raw)": 2.1080334186553955, "Pretrain/Step": 1485, "Pretrain/Step Time": 9.713866846635938} +{"Pretrain/Learning Rate": 4.7952724153472366e-05, "Pretrain/Loss": 2.091907262802124, "Pretrain/Loss (Raw)": 2.121821165084839, "Pretrain/Step": 1486, "Pretrain/Step Time": 9.730011420324445} +{"Pretrain/Learning Rate": 4.7949358055132945e-05, "Pretrain/Loss": 2.090884208679199, "Pretrain/Loss (Raw)": 2.0077362060546875, "Pretrain/Step": 1487, "Pretrain/Step Time": 9.728553973138332} +{"Pretrain/Learning Rate": 4.7945989310165415e-05, "Pretrain/Loss": 2.0992891788482666, "Pretrain/Loss (Raw)": 2.5054070949554443, "Pretrain/Step": 1488, "Pretrain/Step Time": 9.813475236296654} +{"Pretrain/Learning Rate": 4.794261791895828e-05, "Pretrain/Loss": 2.098445177078247, "Pretrain/Loss (Raw)": 2.1846230030059814, "Pretrain/Step": 1489, "Pretrain/Step Time": 9.767966855317354} +{"Pretrain/Learning Rate": 4.793924388190033e-05, "Pretrain/Loss": 2.099581241607666, "Pretrain/Loss (Raw)": 2.103825569152832, "Pretrain/Step": 1490, "Pretrain/Step Time": 9.7679672986269} +{"Pretrain/Learning Rate": 4.793586719938068e-05, "Pretrain/Loss": 2.100968837738037, "Pretrain/Loss (Raw)": 2.1516151428222656, "Pretrain/Step": 1491, "Pretrain/Step Time": 9.762323366478086} +{"Pretrain/Learning Rate": 4.7932487871788746e-05, "Pretrain/Loss": 2.1007585525512695, "Pretrain/Loss (Raw)": 2.167968273162842, "Pretrain/Step": 1492, "Pretrain/Step Time": 9.753505777567625} +{"Pretrain/Learning Rate": 4.792910589951426e-05, "Pretrain/Loss": 2.09995174407959, "Pretrain/Loss (Raw)": 1.8989272117614746, "Pretrain/Step": 1493, "Pretrain/Step Time": 9.775256333872676} +{"Pretrain/Learning Rate": 4.792572128294722e-05, "Pretrain/Loss": 2.098867893218994, "Pretrain/Loss (Raw)": 1.8419525623321533, "Pretrain/Step": 1494, "Pretrain/Step Time": 9.773952197283506} +{"Pretrain/Learning Rate": 4.792233402247799e-05, "Pretrain/Loss": 2.1002020835876465, "Pretrain/Loss (Raw)": 2.217451333999634, "Pretrain/Step": 1495, "Pretrain/Step Time": 9.78434069827199} +{"Pretrain/Learning Rate": 4.791894411849718e-05, "Pretrain/Loss": 2.0995235443115234, "Pretrain/Loss (Raw)": 2.0771169662475586, "Pretrain/Step": 1496, "Pretrain/Step Time": 9.744067199528217} +{"Pretrain/Learning Rate": 4.7915551571395726e-05, "Pretrain/Loss": 2.099529266357422, "Pretrain/Loss (Raw)": 2.1128592491149902, "Pretrain/Step": 1497, "Pretrain/Step Time": 9.75232084095478} +{"Pretrain/Learning Rate": 4.79121563815649e-05, "Pretrain/Loss": 2.0986952781677246, "Pretrain/Loss (Raw)": 2.1311442852020264, "Pretrain/Step": 1498, "Pretrain/Step Time": 9.828068876639009} +{"Pretrain/Learning Rate": 4.790875854939622e-05, "Pretrain/Loss": 2.098546028137207, "Pretrain/Loss (Raw)": 2.1749207973480225, "Pretrain/Step": 1499, "Pretrain/Step Time": 9.827722124755383} +{"Pretrain/Learning Rate": 4.790535807528156e-05, "Pretrain/Loss": 2.0977513790130615, "Pretrain/Loss (Raw)": 1.939477801322937, "Pretrain/Step": 1500, "Pretrain/Step Time": 9.83329014852643} +{"Pretrain/Learning Rate": 4.7901954959613076e-05, "Pretrain/Loss": 2.0967025756835938, "Pretrain/Loss (Raw)": 2.054669141769409, "Pretrain/Step": 1501, "Pretrain/Step Time": 9.831218376755714} +{"Pretrain/Learning Rate": 4.789854920278323e-05, "Pretrain/Loss": 2.0955419540405273, "Pretrain/Loss (Raw)": 2.0695102214813232, "Pretrain/Step": 1502, "Pretrain/Step Time": 9.81579820252955} +{"Pretrain/Learning Rate": 4.789514080518478e-05, "Pretrain/Loss": 2.096686840057373, "Pretrain/Loss (Raw)": 2.129404306411743, "Pretrain/Step": 1503, "Pretrain/Step Time": 9.81725930608809} +{"Pretrain/Learning Rate": 4.789172976721081e-05, "Pretrain/Loss": 2.0978426933288574, "Pretrain/Loss (Raw)": 1.862402081489563, "Pretrain/Step": 1504, "Pretrain/Step Time": 9.837410103529692} +{"Pretrain/Learning Rate": 4.7888316089254705e-05, "Pretrain/Loss": 2.0989999771118164, "Pretrain/Loss (Raw)": 2.153327465057373, "Pretrain/Step": 1505, "Pretrain/Step Time": 9.834827024489641} +{"Pretrain/Learning Rate": 4.7884899771710126e-05, "Pretrain/Loss": 2.0990099906921387, "Pretrain/Loss (Raw)": 2.0380520820617676, "Pretrain/Step": 1506, "Pretrain/Step Time": 9.84011721983552} +{"Pretrain/Learning Rate": 4.788148081497106e-05, "Pretrain/Loss": 2.102830410003662, "Pretrain/Loss (Raw)": 2.361152410507202, "Pretrain/Step": 1507, "Pretrain/Step Time": 9.842060692608356} +{"Pretrain/Learning Rate": 4.787805921943181e-05, "Pretrain/Loss": 2.1011910438537598, "Pretrain/Loss (Raw)": 1.953774333000183, "Pretrain/Step": 1508, "Pretrain/Step Time": 9.809433724731207} +{"Pretrain/Learning Rate": 4.787463498548698e-05, "Pretrain/Loss": 2.1013784408569336, "Pretrain/Loss (Raw)": 2.210803270339966, "Pretrain/Step": 1509, "Pretrain/Step Time": 9.811032641679049} +{"Pretrain/Learning Rate": 4.787120811353144e-05, "Pretrain/Loss": 2.1006810665130615, "Pretrain/Loss (Raw)": 2.243753433227539, "Pretrain/Step": 1510, "Pretrain/Step Time": 9.810286849737167} +{"Pretrain/Learning Rate": 4.786777860396041e-05, "Pretrain/Loss": 2.1013245582580566, "Pretrain/Loss (Raw)": 1.9008721113204956, "Pretrain/Step": 1511, "Pretrain/Step Time": 9.856216045096517} +{"Pretrain/Learning Rate": 4.78643464571694e-05, "Pretrain/Loss": 2.102627992630005, "Pretrain/Loss (Raw)": 2.207984209060669, "Pretrain/Step": 1512, "Pretrain/Step Time": 9.854078372940421} +{"Pretrain/Learning Rate": 4.786091167355421e-05, "Pretrain/Loss": 2.10258150100708, "Pretrain/Loss (Raw)": 2.081045627593994, "Pretrain/Step": 1513, "Pretrain/Step Time": 9.899436388164759} +{"Pretrain/Learning Rate": 4.785747425351097e-05, "Pretrain/Loss": 2.1037039756774902, "Pretrain/Loss (Raw)": 2.212883472442627, "Pretrain/Step": 1514, "Pretrain/Step Time": 9.891123179346323} +{"Pretrain/Learning Rate": 4.785403419743608e-05, "Pretrain/Loss": 2.1012237071990967, "Pretrain/Loss (Raw)": 1.7688536643981934, "Pretrain/Step": 1515, "Pretrain/Step Time": 9.90723924152553} +{"Pretrain/Learning Rate": 4.785059150572628e-05, "Pretrain/Loss": 2.1020100116729736, "Pretrain/Loss (Raw)": 2.1835267543792725, "Pretrain/Step": 1516, "Pretrain/Step Time": 9.90021831728518} +{"Pretrain/Learning Rate": 4.784714617877859e-05, "Pretrain/Loss": 2.102132558822632, "Pretrain/Loss (Raw)": 2.0764222145080566, "Pretrain/Step": 1517, "Pretrain/Step Time": 9.88345355540514} +{"Pretrain/Learning Rate": 4.784369821699035e-05, "Pretrain/Loss": 2.1038432121276855, "Pretrain/Loss (Raw)": 2.1153032779693604, "Pretrain/Step": 1518, "Pretrain/Step Time": 9.916603634133935} +{"Pretrain/Learning Rate": 4.784024762075918e-05, "Pretrain/Loss": 2.1018238067626953, "Pretrain/Loss (Raw)": 1.9213861227035522, "Pretrain/Step": 1519, "Pretrain/Step Time": 9.897158544510603} +{"Pretrain/Learning Rate": 4.7836794390483035e-05, "Pretrain/Loss": 2.102396249771118, "Pretrain/Loss (Raw)": 2.159834146499634, "Pretrain/Step": 1520, "Pretrain/Step Time": 9.93037585169077} +{"Pretrain/Learning Rate": 4.7833338526560145e-05, "Pretrain/Loss": 2.10208797454834, "Pretrain/Loss (Raw)": 2.0233850479125977, "Pretrain/Step": 1521, "Pretrain/Step Time": 9.926062263548374} +{"Pretrain/Learning Rate": 4.782988002938907e-05, "Pretrain/Loss": 2.1038990020751953, "Pretrain/Loss (Raw)": 2.3002724647521973, "Pretrain/Step": 1522, "Pretrain/Step Time": 9.933281352743506} +{"Pretrain/Learning Rate": 4.782641889936864e-05, "Pretrain/Loss": 2.103248357772827, "Pretrain/Loss (Raw)": 2.028550624847412, "Pretrain/Step": 1523, "Pretrain/Step Time": 9.9357694927603} +{"Pretrain/Learning Rate": 4.782295513689803e-05, "Pretrain/Loss": 2.103177547454834, "Pretrain/Loss (Raw)": 2.199350595474243, "Pretrain/Step": 1524, "Pretrain/Step Time": 9.95668458379805} +{"Pretrain/Learning Rate": 4.7819488742376686e-05, "Pretrain/Loss": 2.1020805835723877, "Pretrain/Loss (Raw)": 1.8142945766448975, "Pretrain/Step": 1525, "Pretrain/Step Time": 9.951805055141449} +{"Pretrain/Learning Rate": 4.7816019716204375e-05, "Pretrain/Loss": 2.101069450378418, "Pretrain/Loss (Raw)": 2.1210293769836426, "Pretrain/Step": 1526, "Pretrain/Step Time": 9.984064428135753} +{"Pretrain/Learning Rate": 4.781254805878115e-05, "Pretrain/Loss": 2.101111888885498, "Pretrain/Loss (Raw)": 2.033660411834717, "Pretrain/Step": 1527, "Pretrain/Step Time": 9.98917431384325} +{"Pretrain/Learning Rate": 4.780907377050739e-05, "Pretrain/Loss": 2.099766731262207, "Pretrain/Loss (Raw)": 2.1089320182800293, "Pretrain/Step": 1528, "Pretrain/Step Time": 10.001127680763602} +{"Pretrain/Learning Rate": 4.780559685178376e-05, "Pretrain/Loss": 2.1008570194244385, "Pretrain/Loss (Raw)": 2.0534374713897705, "Pretrain/Step": 1529, "Pretrain/Step Time": 10.014686284586787} +{"Pretrain/Learning Rate": 4.780211730301124e-05, "Pretrain/Loss": 2.100797176361084, "Pretrain/Loss (Raw)": 2.054609537124634, "Pretrain/Step": 1530, "Pretrain/Step Time": 10.013202017173171} +{"Pretrain/Learning Rate": 4.779863512459111e-05, "Pretrain/Loss": 2.100235939025879, "Pretrain/Loss (Raw)": 2.1015288829803467, "Pretrain/Step": 1531, "Pretrain/Step Time": 10.005939420312643} +{"Pretrain/Learning Rate": 4.779515031692494e-05, "Pretrain/Loss": 2.101071357727051, "Pretrain/Loss (Raw)": 2.1308043003082275, "Pretrain/Step": 1532, "Pretrain/Step Time": 9.99187414161861} +{"Pretrain/Learning Rate": 4.7791662880414625e-05, "Pretrain/Loss": 2.1011412143707275, "Pretrain/Loss (Raw)": 2.149433135986328, "Pretrain/Step": 1533, "Pretrain/Step Time": 10.009631900116801} +{"Pretrain/Learning Rate": 4.778817281546235e-05, "Pretrain/Loss": 2.105400800704956, "Pretrain/Loss (Raw)": 2.420379400253296, "Pretrain/Step": 1534, "Pretrain/Step Time": 10.059512117877603} +{"Pretrain/Learning Rate": 4.7784680122470605e-05, "Pretrain/Loss": 2.1030185222625732, "Pretrain/Loss (Raw)": 2.022681713104248, "Pretrain/Step": 1535, "Pretrain/Step Time": 10.085763527080417} +{"Pretrain/Learning Rate": 4.778118480184218e-05, "Pretrain/Loss": 2.1049985885620117, "Pretrain/Loss (Raw)": 2.3635966777801514, "Pretrain/Step": 1536, "Pretrain/Step Time": 10.07787693850696} +{"Pretrain/Learning Rate": 4.777768685398017e-05, "Pretrain/Loss": 2.1048460006713867, "Pretrain/Loss (Raw)": 2.05989933013916, "Pretrain/Step": 1537, "Pretrain/Step Time": 10.069436712190509} +{"Pretrain/Learning Rate": 4.777418627928799e-05, "Pretrain/Loss": 2.1052563190460205, "Pretrain/Loss (Raw)": 2.159452438354492, "Pretrain/Step": 1538, "Pretrain/Step Time": 10.078860955312848} +{"Pretrain/Learning Rate": 4.777068307816932e-05, "Pretrain/Loss": 2.1049556732177734, "Pretrain/Loss (Raw)": 1.9214779138565063, "Pretrain/Step": 1539, "Pretrain/Step Time": 10.079377623274922} +{"Pretrain/Learning Rate": 4.776717725102819e-05, "Pretrain/Loss": 2.104152202606201, "Pretrain/Loss (Raw)": 2.0674734115600586, "Pretrain/Step": 1540, "Pretrain/Step Time": 10.077249251306057} +{"Pretrain/Learning Rate": 4.77636687982689e-05, "Pretrain/Loss": 2.0999021530151367, "Pretrain/Loss (Raw)": 2.0044896602630615, "Pretrain/Step": 1541, "Pretrain/Step Time": 10.071940956637263} +{"Pretrain/Learning Rate": 4.776015772029605e-05, "Pretrain/Loss": 2.099358558654785, "Pretrain/Loss (Raw)": 2.1665198802948, "Pretrain/Step": 1542, "Pretrain/Step Time": 10.05207352526486} +{"Pretrain/Learning Rate": 4.7756644017514564e-05, "Pretrain/Loss": 2.0984647274017334, "Pretrain/Loss (Raw)": 2.0667214393615723, "Pretrain/Step": 1543, "Pretrain/Step Time": 10.013510663062334} +{"Pretrain/Learning Rate": 4.775312769032966e-05, "Pretrain/Loss": 2.100475788116455, "Pretrain/Loss (Raw)": 2.2593817710876465, "Pretrain/Step": 1544, "Pretrain/Step Time": 10.01573914475739} +{"Pretrain/Learning Rate": 4.774960873914685e-05, "Pretrain/Loss": 2.1017208099365234, "Pretrain/Loss (Raw)": 2.074108362197876, "Pretrain/Step": 1545, "Pretrain/Step Time": 10.029225977137685} +{"Pretrain/Learning Rate": 4.774608716437196e-05, "Pretrain/Loss": 2.1000847816467285, "Pretrain/Loss (Raw)": 1.9929512739181519, "Pretrain/Step": 1546, "Pretrain/Step Time": 10.028649801388383} +{"Pretrain/Learning Rate": 4.7742562966411117e-05, "Pretrain/Loss": 2.099128246307373, "Pretrain/Loss (Raw)": 2.0205347537994385, "Pretrain/Step": 1547, "Pretrain/Step Time": 10.04458331130445} +{"Pretrain/Learning Rate": 4.7739036145670744e-05, "Pretrain/Loss": 2.0983541011810303, "Pretrain/Loss (Raw)": 2.036501407623291, "Pretrain/Step": 1548, "Pretrain/Step Time": 10.017466992139816} +{"Pretrain/Learning Rate": 4.773550670255758e-05, "Pretrain/Loss": 2.096676826477051, "Pretrain/Loss (Raw)": 1.8115661144256592, "Pretrain/Step": 1549, "Pretrain/Step Time": 10.044971158728004} +{"Pretrain/Learning Rate": 4.773197463747865e-05, "Pretrain/Loss": 2.0974650382995605, "Pretrain/Loss (Raw)": 2.160390615463257, "Pretrain/Step": 1550, "Pretrain/Step Time": 10.002170545980334} +{"Pretrain/Learning Rate": 4.772843995084128e-05, "Pretrain/Loss": 2.0997934341430664, "Pretrain/Loss (Raw)": 2.170238971710205, "Pretrain/Step": 1551, "Pretrain/Step Time": 10.000595692545176} +{"Pretrain/Learning Rate": 4.7724902643053116e-05, "Pretrain/Loss": 2.09946870803833, "Pretrain/Loss (Raw)": 2.051281690597534, "Pretrain/Step": 1552, "Pretrain/Step Time": 10.03544040210545} +{"Pretrain/Learning Rate": 4.77213627145221e-05, "Pretrain/Loss": 2.0989999771118164, "Pretrain/Loss (Raw)": 2.0612690448760986, "Pretrain/Step": 1553, "Pretrain/Step Time": 10.037871709093451} +{"Pretrain/Learning Rate": 4.771782016565647e-05, "Pretrain/Loss": 2.0997185707092285, "Pretrain/Loss (Raw)": 2.2845311164855957, "Pretrain/Step": 1554, "Pretrain/Step Time": 10.041260855272412} +{"Pretrain/Learning Rate": 4.771427499686477e-05, "Pretrain/Loss": 2.0984699726104736, "Pretrain/Loss (Raw)": 2.0011062622070312, "Pretrain/Step": 1555, "Pretrain/Step Time": 10.037662649527192} +{"Pretrain/Learning Rate": 4.771072720855584e-05, "Pretrain/Loss": 2.0982158184051514, "Pretrain/Loss (Raw)": 2.1200716495513916, "Pretrain/Step": 1556, "Pretrain/Step Time": 10.0476680919528} +{"Pretrain/Learning Rate": 4.770717680113883e-05, "Pretrain/Loss": 2.098644256591797, "Pretrain/Loss (Raw)": 1.9630132913589478, "Pretrain/Step": 1557, "Pretrain/Step Time": 10.062798572704196} +{"Pretrain/Learning Rate": 4.770362377502319e-05, "Pretrain/Loss": 2.099010467529297, "Pretrain/Loss (Raw)": 2.155576467514038, "Pretrain/Step": 1558, "Pretrain/Step Time": 10.038509171456099} +{"Pretrain/Learning Rate": 4.770006813061868e-05, "Pretrain/Loss": 2.0991806983947754, "Pretrain/Loss (Raw)": 2.2268974781036377, "Pretrain/Step": 1559, "Pretrain/Step Time": 10.02143026329577} +{"Pretrain/Learning Rate": 4.769650986833535e-05, "Pretrain/Loss": 2.0995066165924072, "Pretrain/Loss (Raw)": 2.1484434604644775, "Pretrain/Step": 1560, "Pretrain/Step Time": 10.009751690551639} +{"Pretrain/Learning Rate": 4.769294898858354e-05, "Pretrain/Loss": 2.100999116897583, "Pretrain/Loss (Raw)": 2.188196897506714, "Pretrain/Step": 1561, "Pretrain/Step Time": 10.014526132494211} +{"Pretrain/Learning Rate": 4.768938549177393e-05, "Pretrain/Loss": 2.102536916732788, "Pretrain/Loss (Raw)": 2.22871994972229, "Pretrain/Step": 1562, "Pretrain/Step Time": 10.019927762448788} +{"Pretrain/Learning Rate": 4.768581937831746e-05, "Pretrain/Loss": 2.1032466888427734, "Pretrain/Loss (Raw)": 2.10954213142395, "Pretrain/Step": 1563, "Pretrain/Step Time": 10.019545605406165} +{"Pretrain/Learning Rate": 4.768225064862541e-05, "Pretrain/Loss": 2.102962017059326, "Pretrain/Loss (Raw)": 2.2254862785339355, "Pretrain/Step": 1564, "Pretrain/Step Time": 10.00358777306974} +{"Pretrain/Learning Rate": 4.767867930310933e-05, "Pretrain/Loss": 2.1029202938079834, "Pretrain/Loss (Raw)": 2.1613929271698, "Pretrain/Step": 1565, "Pretrain/Step Time": 10.00654891692102} +{"Pretrain/Learning Rate": 4.7675105342181084e-05, "Pretrain/Loss": 2.101144313812256, "Pretrain/Loss (Raw)": 1.9543055295944214, "Pretrain/Step": 1566, "Pretrain/Step Time": 10.003907985985279} +{"Pretrain/Learning Rate": 4.767152876625285e-05, "Pretrain/Loss": 2.1023473739624023, "Pretrain/Loss (Raw)": 2.0995800495147705, "Pretrain/Step": 1567, "Pretrain/Step Time": 9.996654523536563} +{"Pretrain/Learning Rate": 4.766794957573708e-05, "Pretrain/Loss": 2.100659132003784, "Pretrain/Loss (Raw)": 2.0224225521087646, "Pretrain/Step": 1568, "Pretrain/Step Time": 9.99386783130467} +{"Pretrain/Learning Rate": 4.766436777104655e-05, "Pretrain/Loss": 2.099997043609619, "Pretrain/Loss (Raw)": 2.123027801513672, "Pretrain/Step": 1569, "Pretrain/Step Time": 9.991346856579185} +{"Pretrain/Learning Rate": 4.766078335259433e-05, "Pretrain/Loss": 2.0989840030670166, "Pretrain/Loss (Raw)": 2.0166094303131104, "Pretrain/Step": 1570, "Pretrain/Step Time": 9.994091022759676} +{"Pretrain/Learning Rate": 4.76571963207938e-05, "Pretrain/Loss": 2.096250057220459, "Pretrain/Loss (Raw)": 1.9267791509628296, "Pretrain/Step": 1571, "Pretrain/Step Time": 10.025496697053313} +{"Pretrain/Learning Rate": 4.765360667605861e-05, "Pretrain/Loss": 2.0949928760528564, "Pretrain/Loss (Raw)": 1.9070326089859009, "Pretrain/Step": 1572, "Pretrain/Step Time": 10.028545405715704} +{"Pretrain/Learning Rate": 4.765001441880276e-05, "Pretrain/Loss": 2.092222213745117, "Pretrain/Loss (Raw)": 1.9806712865829468, "Pretrain/Step": 1573, "Pretrain/Step Time": 10.034010734409094} +{"Pretrain/Learning Rate": 4.764641954944052e-05, "Pretrain/Loss": 2.0917677879333496, "Pretrain/Loss (Raw)": 2.10085129737854, "Pretrain/Step": 1574, "Pretrain/Step Time": 9.984115567058325} +{"Pretrain/Learning Rate": 4.764282206838646e-05, "Pretrain/Loss": 2.089202880859375, "Pretrain/Loss (Raw)": 2.2035601139068604, "Pretrain/Step": 1575, "Pretrain/Step Time": 10.017006624490023} +{"Pretrain/Learning Rate": 4.763922197605547e-05, "Pretrain/Loss": 2.0901384353637695, "Pretrain/Loss (Raw)": 2.180992364883423, "Pretrain/Step": 1576, "Pretrain/Step Time": 10.005318539217114} +{"Pretrain/Learning Rate": 4.763561927286271e-05, "Pretrain/Loss": 2.0851426124572754, "Pretrain/Loss (Raw)": 1.6714106798171997, "Pretrain/Step": 1577, "Pretrain/Step Time": 10.024436580017209} +{"Pretrain/Learning Rate": 4.7632013959223684e-05, "Pretrain/Loss": 2.083799362182617, "Pretrain/Loss (Raw)": 2.0967659950256348, "Pretrain/Step": 1578, "Pretrain/Step Time": 10.025532454252243} +{"Pretrain/Learning Rate": 4.7628406035554156e-05, "Pretrain/Loss": 2.0825259685516357, "Pretrain/Loss (Raw)": 1.9679372310638428, "Pretrain/Step": 1579, "Pretrain/Step Time": 10.010983940213919} +{"Pretrain/Learning Rate": 4.762479550227022e-05, "Pretrain/Loss": 2.082101821899414, "Pretrain/Loss (Raw)": 1.9396576881408691, "Pretrain/Step": 1580, "Pretrain/Step Time": 10.02560767158866} +{"Pretrain/Learning Rate": 4.762118235978825e-05, "Pretrain/Loss": 2.0815422534942627, "Pretrain/Loss (Raw)": 2.005164384841919, "Pretrain/Step": 1581, "Pretrain/Step Time": 10.031046312302351} +{"Pretrain/Learning Rate": 4.7617566608524946e-05, "Pretrain/Loss": 2.0817437171936035, "Pretrain/Loss (Raw)": 2.1836304664611816, "Pretrain/Step": 1582, "Pretrain/Step Time": 10.000699140131474} +{"Pretrain/Learning Rate": 4.761394824889727e-05, "Pretrain/Loss": 2.0812039375305176, "Pretrain/Loss (Raw)": 2.0933375358581543, "Pretrain/Step": 1583, "Pretrain/Step Time": 10.004567379131913} +{"Pretrain/Learning Rate": 4.761032728132253e-05, "Pretrain/Loss": 2.079308271408081, "Pretrain/Loss (Raw)": 1.919892430305481, "Pretrain/Step": 1584, "Pretrain/Step Time": 10.027411190792918} +{"Pretrain/Learning Rate": 4.76067037062183e-05, "Pretrain/Loss": 2.0804715156555176, "Pretrain/Loss (Raw)": 2.0957107543945312, "Pretrain/Step": 1585, "Pretrain/Step Time": 10.017022639513016} +{"Pretrain/Learning Rate": 4.7603077524002474e-05, "Pretrain/Loss": 2.0804829597473145, "Pretrain/Loss (Raw)": 2.133082389831543, "Pretrain/Step": 1586, "Pretrain/Step Time": 10.100327413529158} +{"Pretrain/Learning Rate": 4.759944873509324e-05, "Pretrain/Loss": 2.0824215412139893, "Pretrain/Loss (Raw)": 2.115705966949463, "Pretrain/Step": 1587, "Pretrain/Step Time": 10.093234641477466} +{"Pretrain/Learning Rate": 4.7595817339909086e-05, "Pretrain/Loss": 2.081758737564087, "Pretrain/Loss (Raw)": 1.9751039743423462, "Pretrain/Step": 1588, "Pretrain/Step Time": 10.092038683593273} +{"Pretrain/Learning Rate": 4.75921833388688e-05, "Pretrain/Loss": 2.081827402114868, "Pretrain/Loss (Raw)": 2.010709762573242, "Pretrain/Step": 1589, "Pretrain/Step Time": 10.092877751216292} +{"Pretrain/Learning Rate": 4.758854673239147e-05, "Pretrain/Loss": 2.08205246925354, "Pretrain/Loss (Raw)": 2.24004864692688, "Pretrain/Step": 1590, "Pretrain/Step Time": 10.071104584261775} +{"Pretrain/Learning Rate": 4.7584907520896495e-05, "Pretrain/Loss": 2.079829216003418, "Pretrain/Loss (Raw)": 1.9792108535766602, "Pretrain/Step": 1591, "Pretrain/Step Time": 10.074760438874364} +{"Pretrain/Learning Rate": 4.7581265704803554e-05, "Pretrain/Loss": 2.082942485809326, "Pretrain/Loss (Raw)": 2.1140034198760986, "Pretrain/Step": 1592, "Pretrain/Step Time": 10.03142385929823} +{"Pretrain/Learning Rate": 4.757762128453266e-05, "Pretrain/Loss": 2.0828604698181152, "Pretrain/Loss (Raw)": 2.082993745803833, "Pretrain/Step": 1593, "Pretrain/Step Time": 10.036035235971212} +{"Pretrain/Learning Rate": 4.757397426050408e-05, "Pretrain/Loss": 2.089282751083374, "Pretrain/Loss (Raw)": 2.2793076038360596, "Pretrain/Step": 1594, "Pretrain/Step Time": 10.036912586539984} +{"Pretrain/Learning Rate": 4.757032463313842e-05, "Pretrain/Loss": 2.089632511138916, "Pretrain/Loss (Raw)": 2.1530818939208984, "Pretrain/Step": 1595, "Pretrain/Step Time": 10.055182540789247} +{"Pretrain/Learning Rate": 4.756667240285656e-05, "Pretrain/Loss": 2.0917389392852783, "Pretrain/Loss (Raw)": 2.3584258556365967, "Pretrain/Step": 1596, "Pretrain/Step Time": 10.050562703981996} +{"Pretrain/Learning Rate": 4.756301757007971e-05, "Pretrain/Loss": 2.094526767730713, "Pretrain/Loss (Raw)": 2.3626575469970703, "Pretrain/Step": 1597, "Pretrain/Step Time": 10.06630620919168} +{"Pretrain/Learning Rate": 4.755936013522935e-05, "Pretrain/Loss": 2.094902992248535, "Pretrain/Loss (Raw)": 2.132082462310791, "Pretrain/Step": 1598, "Pretrain/Step Time": 10.05941423214972} +{"Pretrain/Learning Rate": 4.7555700098727276e-05, "Pretrain/Loss": 2.0941402912139893, "Pretrain/Loss (Raw)": 2.1056737899780273, "Pretrain/Step": 1599, "Pretrain/Step Time": 10.099739393219352} +{"Pretrain/Learning Rate": 4.755203746099558e-05, "Pretrain/Loss": 2.0949015617370605, "Pretrain/Loss (Raw)": 2.040391206741333, "Pretrain/Step": 1600, "Pretrain/Step Time": 10.104599023237824} +{"Pretrain/Learning Rate": 4.754837222245666e-05, "Pretrain/Loss": 2.0938291549682617, "Pretrain/Loss (Raw)": 2.038567066192627, "Pretrain/Step": 1601, "Pretrain/Step Time": 10.101339302957058} +{"Pretrain/Learning Rate": 4.75447043835332e-05, "Pretrain/Loss": 2.092778205871582, "Pretrain/Loss (Raw)": 2.178946018218994, "Pretrain/Step": 1602, "Pretrain/Step Time": 10.094296637922525} +{"Pretrain/Learning Rate": 4.75410339446482e-05, "Pretrain/Loss": 2.094069480895996, "Pretrain/Loss (Raw)": 2.3369245529174805, "Pretrain/Step": 1603, "Pretrain/Step Time": 10.0888930875808} +{"Pretrain/Learning Rate": 4.753736090622494e-05, "Pretrain/Loss": 2.0931217670440674, "Pretrain/Loss (Raw)": 1.9472943544387817, "Pretrain/Step": 1604, "Pretrain/Step Time": 10.089045083150268} +{"Pretrain/Learning Rate": 4.753368526868703e-05, "Pretrain/Loss": 2.090928316116333, "Pretrain/Loss (Raw)": 1.9883784055709839, "Pretrain/Step": 1605, "Pretrain/Step Time": 10.094529563561082} +{"Pretrain/Learning Rate": 4.753000703245834e-05, "Pretrain/Loss": 2.0913877487182617, "Pretrain/Loss (Raw)": 2.0869998931884766, "Pretrain/Step": 1606, "Pretrain/Step Time": 10.097317807376385} +{"Pretrain/Learning Rate": 4.752632619796309e-05, "Pretrain/Loss": 2.0931625366210938, "Pretrain/Loss (Raw)": 2.179797649383545, "Pretrain/Step": 1607, "Pretrain/Step Time": 10.105865575373173} +{"Pretrain/Learning Rate": 4.752264276562575e-05, "Pretrain/Loss": 2.0945253372192383, "Pretrain/Loss (Raw)": 2.128779172897339, "Pretrain/Step": 1608, "Pretrain/Step Time": 10.099664514884353} +{"Pretrain/Learning Rate": 4.751895673587111e-05, "Pretrain/Loss": 2.0955824851989746, "Pretrain/Loss (Raw)": 2.194132089614868, "Pretrain/Step": 1609, "Pretrain/Step Time": 10.104668317362666} +{"Pretrain/Learning Rate": 4.751526810912427e-05, "Pretrain/Loss": 2.0931684970855713, "Pretrain/Loss (Raw)": 1.9623260498046875, "Pretrain/Step": 1610, "Pretrain/Step Time": 10.10050299949944} +{"Pretrain/Learning Rate": 4.751157688581062e-05, "Pretrain/Loss": 2.0934700965881348, "Pretrain/Loss (Raw)": 2.097752571105957, "Pretrain/Step": 1611, "Pretrain/Step Time": 10.130150180310011} +{"Pretrain/Learning Rate": 4.750788306635584e-05, "Pretrain/Loss": 2.095179557800293, "Pretrain/Loss (Raw)": 2.1982481479644775, "Pretrain/Step": 1612, "Pretrain/Step Time": 10.145009342581034} +{"Pretrain/Learning Rate": 4.7504186651185926e-05, "Pretrain/Loss": 2.0956149101257324, "Pretrain/Loss (Raw)": 2.163736581802368, "Pretrain/Step": 1613, "Pretrain/Step Time": 10.158948885276914} +{"Pretrain/Learning Rate": 4.7500487640727165e-05, "Pretrain/Loss": 2.0955376625061035, "Pretrain/Loss (Raw)": 2.1119420528411865, "Pretrain/Step": 1614, "Pretrain/Step Time": 10.152104329317808} +{"Pretrain/Learning Rate": 4.7496786035406144e-05, "Pretrain/Loss": 2.096538543701172, "Pretrain/Loss (Raw)": 2.135868549346924, "Pretrain/Step": 1615, "Pretrain/Step Time": 10.159693049266934} +{"Pretrain/Learning Rate": 4.749308183564974e-05, "Pretrain/Loss": 2.0936975479125977, "Pretrain/Loss (Raw)": 2.1417887210845947, "Pretrain/Step": 1616, "Pretrain/Step Time": 10.115440601482987} +{"Pretrain/Learning Rate": 4.748937504188517e-05, "Pretrain/Loss": 2.093303680419922, "Pretrain/Loss (Raw)": 2.134167432785034, "Pretrain/Step": 1617, "Pretrain/Step Time": 10.124759742990136} +{"Pretrain/Learning Rate": 4.748566565453988e-05, "Pretrain/Loss": 2.0928244590759277, "Pretrain/Loss (Raw)": 2.0425007343292236, "Pretrain/Step": 1618, "Pretrain/Step Time": 10.129572045058012} +{"Pretrain/Learning Rate": 4.748195367404167e-05, "Pretrain/Loss": 2.0932674407958984, "Pretrain/Loss (Raw)": 2.2083215713500977, "Pretrain/Step": 1619, "Pretrain/Step Time": 10.126555582508445} +{"Pretrain/Learning Rate": 4.747823910081863e-05, "Pretrain/Loss": 2.0925066471099854, "Pretrain/Loss (Raw)": 2.070570468902588, "Pretrain/Step": 1620, "Pretrain/Step Time": 10.137317968532443} +{"Pretrain/Learning Rate": 4.747452193529913e-05, "Pretrain/Loss": 2.093106269836426, "Pretrain/Loss (Raw)": 1.9756853580474854, "Pretrain/Step": 1621, "Pretrain/Step Time": 10.117126842960715} +{"Pretrain/Learning Rate": 4.747080217791187e-05, "Pretrain/Loss": 2.0951149463653564, "Pretrain/Loss (Raw)": 2.099050998687744, "Pretrain/Step": 1622, "Pretrain/Step Time": 10.160065507516265} +{"Pretrain/Learning Rate": 4.7467079829085804e-05, "Pretrain/Loss": 2.0938167572021484, "Pretrain/Loss (Raw)": 2.0513126850128174, "Pretrain/Step": 1623, "Pretrain/Step Time": 10.123363710939884} +{"Pretrain/Learning Rate": 4.746335488925022e-05, "Pretrain/Loss": 2.0961084365844727, "Pretrain/Loss (Raw)": 2.3704259395599365, "Pretrain/Step": 1624, "Pretrain/Step Time": 10.123132567852736} +{"Pretrain/Learning Rate": 4.7459627358834716e-05, "Pretrain/Loss": 2.0964980125427246, "Pretrain/Loss (Raw)": 2.162703514099121, "Pretrain/Step": 1625, "Pretrain/Step Time": 10.116499641910195} +{"Pretrain/Learning Rate": 4.7455897238269134e-05, "Pretrain/Loss": 2.096353769302368, "Pretrain/Loss (Raw)": 2.112701416015625, "Pretrain/Step": 1626, "Pretrain/Step Time": 10.042382821440697} +{"Pretrain/Learning Rate": 4.745216452798368e-05, "Pretrain/Loss": 2.095871686935425, "Pretrain/Loss (Raw)": 2.1132051944732666, "Pretrain/Step": 1627, "Pretrain/Step Time": 10.040826369076967} +{"Pretrain/Learning Rate": 4.744842922840881e-05, "Pretrain/Loss": 2.0972702503204346, "Pretrain/Loss (Raw)": 2.118509292602539, "Pretrain/Step": 1628, "Pretrain/Step Time": 10.051411215215921} +{"Pretrain/Learning Rate": 4.74446913399753e-05, "Pretrain/Loss": 2.09709095954895, "Pretrain/Loss (Raw)": 2.0317132472991943, "Pretrain/Step": 1629, "Pretrain/Step Time": 10.05831854045391} +{"Pretrain/Learning Rate": 4.744095086311422e-05, "Pretrain/Loss": 2.0977978706359863, "Pretrain/Loss (Raw)": 2.160003423690796, "Pretrain/Step": 1630, "Pretrain/Step Time": 10.064835404977202} +{"Pretrain/Learning Rate": 4.743720779825694e-05, "Pretrain/Loss": 2.095092296600342, "Pretrain/Loss (Raw)": 1.7830647230148315, "Pretrain/Step": 1631, "Pretrain/Step Time": 10.065369015559554} +{"Pretrain/Learning Rate": 4.743346214583514e-05, "Pretrain/Loss": 2.096686363220215, "Pretrain/Loss (Raw)": 2.0664761066436768, "Pretrain/Step": 1632, "Pretrain/Step Time": 10.018472000956535} +{"Pretrain/Learning Rate": 4.742971390628076e-05, "Pretrain/Loss": 2.094666004180908, "Pretrain/Loss (Raw)": 1.8947168588638306, "Pretrain/Step": 1633, "Pretrain/Step Time": 10.092133106663823} +{"Pretrain/Learning Rate": 4.742596308002609e-05, "Pretrain/Loss": 2.0965566635131836, "Pretrain/Loss (Raw)": 2.2800447940826416, "Pretrain/Step": 1634, "Pretrain/Step Time": 10.088771039620042} +{"Pretrain/Learning Rate": 4.742220966750368e-05, "Pretrain/Loss": 2.0920424461364746, "Pretrain/Loss (Raw)": 1.7833410501480103, "Pretrain/Step": 1635, "Pretrain/Step Time": 10.110681096091866} +{"Pretrain/Learning Rate": 4.7418453669146404e-05, "Pretrain/Loss": 2.093153953552246, "Pretrain/Loss (Raw)": 2.0960545539855957, "Pretrain/Step": 1636, "Pretrain/Step Time": 10.107022324576974} +{"Pretrain/Learning Rate": 4.74146950853874e-05, "Pretrain/Loss": 2.091675281524658, "Pretrain/Loss (Raw)": 2.021545648574829, "Pretrain/Step": 1637, "Pretrain/Step Time": 10.113739540800452} +{"Pretrain/Learning Rate": 4.741093391666014e-05, "Pretrain/Loss": 2.089761972427368, "Pretrain/Loss (Raw)": 1.9988206624984741, "Pretrain/Step": 1638, "Pretrain/Step Time": 10.098779866471887} +{"Pretrain/Learning Rate": 4.7407170163398375e-05, "Pretrain/Loss": 2.0891823768615723, "Pretrain/Loss (Raw)": 1.826702356338501, "Pretrain/Step": 1639, "Pretrain/Step Time": 10.056394850835204} +{"Pretrain/Learning Rate": 4.740340382603616e-05, "Pretrain/Loss": 2.086963176727295, "Pretrain/Loss (Raw)": 1.9239039421081543, "Pretrain/Step": 1640, "Pretrain/Step Time": 10.120873231440783} +{"Pretrain/Learning Rate": 4.739963490500785e-05, "Pretrain/Loss": 2.087106704711914, "Pretrain/Loss (Raw)": 2.0994479656219482, "Pretrain/Step": 1641, "Pretrain/Step Time": 10.058824399486184} +{"Pretrain/Learning Rate": 4.7395863400748096e-05, "Pretrain/Loss": 2.0871500968933105, "Pretrain/Loss (Raw)": 2.218423843383789, "Pretrain/Step": 1642, "Pretrain/Step Time": 10.063971439376473} +{"Pretrain/Learning Rate": 4.7392089313691835e-05, "Pretrain/Loss": 2.0883119106292725, "Pretrain/Loss (Raw)": 1.9175384044647217, "Pretrain/Step": 1643, "Pretrain/Step Time": 10.030309099704027} +{"Pretrain/Learning Rate": 4.738831264427432e-05, "Pretrain/Loss": 2.0868358612060547, "Pretrain/Loss (Raw)": 1.994604229927063, "Pretrain/Step": 1644, "Pretrain/Step Time": 10.034556036815047} +{"Pretrain/Learning Rate": 4.73845333929311e-05, "Pretrain/Loss": 2.0880863666534424, "Pretrain/Loss (Raw)": 2.236482858657837, "Pretrain/Step": 1645, "Pretrain/Step Time": 10.011545438319445} +{"Pretrain/Learning Rate": 4.738075156009801e-05, "Pretrain/Loss": 2.0882973670959473, "Pretrain/Loss (Raw)": 2.142326831817627, "Pretrain/Step": 1646, "Pretrain/Step Time": 9.979476088657975} +{"Pretrain/Learning Rate": 4.737696714621118e-05, "Pretrain/Loss": 2.088348627090454, "Pretrain/Loss (Raw)": 1.9279277324676514, "Pretrain/Step": 1647, "Pretrain/Step Time": 9.983393108472228} +{"Pretrain/Learning Rate": 4.7373180151707065e-05, "Pretrain/Loss": 2.087496757507324, "Pretrain/Loss (Raw)": 2.050816297531128, "Pretrain/Step": 1648, "Pretrain/Step Time": 9.95415977947414} +{"Pretrain/Learning Rate": 4.7369390577022385e-05, "Pretrain/Loss": 2.0881199836730957, "Pretrain/Loss (Raw)": 2.1031665802001953, "Pretrain/Step": 1649, "Pretrain/Step Time": 9.96215339191258} +{"Pretrain/Learning Rate": 4.736559842259417e-05, "Pretrain/Loss": 2.085505485534668, "Pretrain/Loss (Raw)": 1.965591549873352, "Pretrain/Step": 1650, "Pretrain/Step Time": 9.948532450944185} +{"Pretrain/Learning Rate": 4.736180368885976e-05, "Pretrain/Loss": 2.085999011993408, "Pretrain/Loss (Raw)": 2.091747522354126, "Pretrain/Step": 1651, "Pretrain/Step Time": 10.012303667142987} +{"Pretrain/Learning Rate": 4.735800637625678e-05, "Pretrain/Loss": 2.085692882537842, "Pretrain/Loss (Raw)": 2.160182237625122, "Pretrain/Step": 1652, "Pretrain/Step Time": 9.987699998542666} +{"Pretrain/Learning Rate": 4.735420648522314e-05, "Pretrain/Loss": 2.083667278289795, "Pretrain/Loss (Raw)": 1.5550036430358887, "Pretrain/Step": 1653, "Pretrain/Step Time": 9.991354087367654} +{"Pretrain/Learning Rate": 4.7350404016197083e-05, "Pretrain/Loss": 2.083759307861328, "Pretrain/Loss (Raw)": 2.1328072547912598, "Pretrain/Step": 1654, "Pretrain/Step Time": 9.953297685831785} +{"Pretrain/Learning Rate": 4.734659896961711e-05, "Pretrain/Loss": 2.085348129272461, "Pretrain/Loss (Raw)": 2.2370214462280273, "Pretrain/Step": 1655, "Pretrain/Step Time": 9.954899739474058} +{"Pretrain/Learning Rate": 4.734279134592204e-05, "Pretrain/Loss": 2.0835447311401367, "Pretrain/Loss (Raw)": 1.8781119585037231, "Pretrain/Step": 1656, "Pretrain/Step Time": 9.934849869459867} +{"Pretrain/Learning Rate": 4.7338981145550994e-05, "Pretrain/Loss": 2.083651065826416, "Pretrain/Loss (Raw)": 2.0670292377471924, "Pretrain/Step": 1657, "Pretrain/Step Time": 9.929899094626307} +{"Pretrain/Learning Rate": 4.7335168368943374e-05, "Pretrain/Loss": 2.0830793380737305, "Pretrain/Loss (Raw)": 1.981424331665039, "Pretrain/Step": 1658, "Pretrain/Step Time": 9.92425812035799} +{"Pretrain/Learning Rate": 4.733135301653889e-05, "Pretrain/Loss": 2.083739995956421, "Pretrain/Loss (Raw)": 2.186087131500244, "Pretrain/Step": 1659, "Pretrain/Step Time": 9.923842841759324} +{"Pretrain/Learning Rate": 4.732753508877755e-05, "Pretrain/Loss": 2.0834949016571045, "Pretrain/Loss (Raw)": 2.0994296073913574, "Pretrain/Step": 1660, "Pretrain/Step Time": 9.923265201970935} +{"Pretrain/Learning Rate": 4.732371458609966e-05, "Pretrain/Loss": 2.083035469055176, "Pretrain/Loss (Raw)": 2.090640068054199, "Pretrain/Step": 1661, "Pretrain/Step Time": 9.908305071294308} +{"Pretrain/Learning Rate": 4.73198915089458e-05, "Pretrain/Loss": 2.081228017807007, "Pretrain/Loss (Raw)": 2.1890110969543457, "Pretrain/Step": 1662, "Pretrain/Step Time": 9.854066098108888} +{"Pretrain/Learning Rate": 4.731606585775689e-05, "Pretrain/Loss": 2.081611156463623, "Pretrain/Loss (Raw)": 2.071712017059326, "Pretrain/Step": 1663, "Pretrain/Step Time": 9.832776352763176} +{"Pretrain/Learning Rate": 4.731223763297409e-05, "Pretrain/Loss": 2.0800561904907227, "Pretrain/Loss (Raw)": 2.1646032333374023, "Pretrain/Step": 1664, "Pretrain/Step Time": 9.858895279467106} +{"Pretrain/Learning Rate": 4.730840683503892e-05, "Pretrain/Loss": 2.080585479736328, "Pretrain/Loss (Raw)": 2.1276135444641113, "Pretrain/Step": 1665, "Pretrain/Step Time": 9.843074638396502} +{"Pretrain/Learning Rate": 4.730457346439315e-05, "Pretrain/Loss": 2.0789895057678223, "Pretrain/Loss (Raw)": 1.955161213874817, "Pretrain/Step": 1666, "Pretrain/Step Time": 9.836118971928954} +{"Pretrain/Learning Rate": 4.7300737521478863e-05, "Pretrain/Loss": 2.0805537700653076, "Pretrain/Loss (Raw)": 2.121715545654297, "Pretrain/Step": 1667, "Pretrain/Step Time": 9.821520933881402} +{"Pretrain/Learning Rate": 4.729689900673845e-05, "Pretrain/Loss": 2.08260440826416, "Pretrain/Loss (Raw)": 2.329967737197876, "Pretrain/Step": 1668, "Pretrain/Step Time": 9.838999034836888} +{"Pretrain/Learning Rate": 4.729305792061457e-05, "Pretrain/Loss": 2.084714651107788, "Pretrain/Loss (Raw)": 2.274580478668213, "Pretrain/Step": 1669, "Pretrain/Step Time": 9.8373520988971} +{"Pretrain/Learning Rate": 4.72892142635502e-05, "Pretrain/Loss": 2.084095001220703, "Pretrain/Loss (Raw)": 2.0872154235839844, "Pretrain/Step": 1670, "Pretrain/Step Time": 9.916355587542057} +{"Pretrain/Learning Rate": 4.728536803598862e-05, "Pretrain/Loss": 2.0857434272766113, "Pretrain/Loss (Raw)": 2.2777135372161865, "Pretrain/Step": 1671, "Pretrain/Step Time": 9.912570228800178} +{"Pretrain/Learning Rate": 4.728151923837337e-05, "Pretrain/Loss": 2.084467887878418, "Pretrain/Loss (Raw)": 2.0961461067199707, "Pretrain/Step": 1672, "Pretrain/Step Time": 9.91512481123209} +{"Pretrain/Learning Rate": 4.727766787114835e-05, "Pretrain/Loss": 2.0856049060821533, "Pretrain/Loss (Raw)": 2.2196202278137207, "Pretrain/Step": 1673, "Pretrain/Step Time": 9.887948712334037} +{"Pretrain/Learning Rate": 4.727381393475767e-05, "Pretrain/Loss": 2.087751865386963, "Pretrain/Loss (Raw)": 2.2677602767944336, "Pretrain/Step": 1674, "Pretrain/Step Time": 9.88538196310401} +{"Pretrain/Learning Rate": 4.726995742964583e-05, "Pretrain/Loss": 2.0881850719451904, "Pretrain/Loss (Raw)": 2.0759928226470947, "Pretrain/Step": 1675, "Pretrain/Step Time": 9.864170480519533} +{"Pretrain/Learning Rate": 4.726609835625755e-05, "Pretrain/Loss": 2.0877137184143066, "Pretrain/Loss (Raw)": 1.9761719703674316, "Pretrain/Step": 1676, "Pretrain/Step Time": 9.86286674439907} +{"Pretrain/Learning Rate": 4.726223671503789e-05, "Pretrain/Loss": 2.0902109146118164, "Pretrain/Loss (Raw)": 2.131187915802002, "Pretrain/Step": 1677, "Pretrain/Step Time": 9.831658804789186} +{"Pretrain/Learning Rate": 4.725837250643218e-05, "Pretrain/Loss": 2.0896029472351074, "Pretrain/Loss (Raw)": 2.082587718963623, "Pretrain/Step": 1678, "Pretrain/Step Time": 9.837834035977721} +{"Pretrain/Learning Rate": 4.7254505730886075e-05, "Pretrain/Loss": 2.0898876190185547, "Pretrain/Loss (Raw)": 2.2066547870635986, "Pretrain/Step": 1679, "Pretrain/Step Time": 9.841019470244646} +{"Pretrain/Learning Rate": 4.725063638884551e-05, "Pretrain/Loss": 2.090216636657715, "Pretrain/Loss (Raw)": 2.093425750732422, "Pretrain/Step": 1680, "Pretrain/Step Time": 9.796217178925872} +{"Pretrain/Learning Rate": 4.724676448075669e-05, "Pretrain/Loss": 2.08829927444458, "Pretrain/Loss (Raw)": 1.8158154487609863, "Pretrain/Step": 1681, "Pretrain/Step Time": 9.83756647631526} +{"Pretrain/Learning Rate": 4.724289000706617e-05, "Pretrain/Loss": 2.0853638648986816, "Pretrain/Loss (Raw)": 1.9087944030761719, "Pretrain/Step": 1682, "Pretrain/Step Time": 9.83916006051004} +{"Pretrain/Learning Rate": 4.723901296822076e-05, "Pretrain/Loss": 2.0869088172912598, "Pretrain/Loss (Raw)": 2.1988701820373535, "Pretrain/Step": 1683, "Pretrain/Step Time": 9.848457716405392} +{"Pretrain/Learning Rate": 4.723513336466759e-05, "Pretrain/Loss": 2.086016893386841, "Pretrain/Loss (Raw)": 2.005913257598877, "Pretrain/Step": 1684, "Pretrain/Step Time": 9.838578628376126} +{"Pretrain/Learning Rate": 4.723125119685405e-05, "Pretrain/Loss": 2.086819648742676, "Pretrain/Loss (Raw)": 2.065762758255005, "Pretrain/Step": 1685, "Pretrain/Step Time": 9.809730971232057} +{"Pretrain/Learning Rate": 4.722736646522788e-05, "Pretrain/Loss": 2.0852487087249756, "Pretrain/Loss (Raw)": 1.9545049667358398, "Pretrain/Step": 1686, "Pretrain/Step Time": 9.811676638200879} +{"Pretrain/Learning Rate": 4.722347917023706e-05, "Pretrain/Loss": 2.0841424465179443, "Pretrain/Loss (Raw)": 2.0853140354156494, "Pretrain/Step": 1687, "Pretrain/Step Time": 9.838147204369307} +{"Pretrain/Learning Rate": 4.72195893123299e-05, "Pretrain/Loss": 2.0839290618896484, "Pretrain/Loss (Raw)": 2.1211087703704834, "Pretrain/Step": 1688, "Pretrain/Step Time": 9.838506244122982} +{"Pretrain/Learning Rate": 4.7215696891955006e-05, "Pretrain/Loss": 2.083481788635254, "Pretrain/Loss (Raw)": 2.130936861038208, "Pretrain/Step": 1689, "Pretrain/Step Time": 9.843449153006077} +{"Pretrain/Learning Rate": 4.721180190956126e-05, "Pretrain/Loss": 2.082432270050049, "Pretrain/Loss (Raw)": 2.0944063663482666, "Pretrain/Step": 1690, "Pretrain/Step Time": 9.842865450307727} +{"Pretrain/Learning Rate": 4.7207904365597855e-05, "Pretrain/Loss": 2.083263874053955, "Pretrain/Loss (Raw)": 2.2159805297851562, "Pretrain/Step": 1691, "Pretrain/Step Time": 9.83183722756803} +{"Pretrain/Learning Rate": 4.720400426051427e-05, "Pretrain/Loss": 2.081982135772705, "Pretrain/Loss (Raw)": 2.0613934993743896, "Pretrain/Step": 1692, "Pretrain/Step Time": 9.802724603563547} +{"Pretrain/Learning Rate": 4.720010159476028e-05, "Pretrain/Loss": 2.0818634033203125, "Pretrain/Loss (Raw)": 2.146195650100708, "Pretrain/Step": 1693, "Pretrain/Step Time": 9.803003596141934} +{"Pretrain/Learning Rate": 4.719619636878597e-05, "Pretrain/Loss": 2.081003427505493, "Pretrain/Loss (Raw)": 1.8442463874816895, "Pretrain/Step": 1694, "Pretrain/Step Time": 9.798812599852681} +{"Pretrain/Learning Rate": 4.71922885830417e-05, "Pretrain/Loss": 2.0804967880249023, "Pretrain/Loss (Raw)": 2.0347468852996826, "Pretrain/Step": 1695, "Pretrain/Step Time": 9.796113640069962} +{"Pretrain/Learning Rate": 4.718837823797814e-05, "Pretrain/Loss": 2.0812854766845703, "Pretrain/Loss (Raw)": 2.123352289199829, "Pretrain/Step": 1696, "Pretrain/Step Time": 9.815308591350913} +{"Pretrain/Learning Rate": 4.7184465334046246e-05, "Pretrain/Loss": 2.0815348625183105, "Pretrain/Loss (Raw)": 2.1549720764160156, "Pretrain/Step": 1697, "Pretrain/Step Time": 9.8285065703094} +{"Pretrain/Learning Rate": 4.718054987169727e-05, "Pretrain/Loss": 2.081272602081299, "Pretrain/Loss (Raw)": 1.983038306236267, "Pretrain/Step": 1698, "Pretrain/Step Time": 9.843758799135685} +{"Pretrain/Learning Rate": 4.717663185138276e-05, "Pretrain/Loss": 2.0812342166900635, "Pretrain/Loss (Raw)": 1.9218602180480957, "Pretrain/Step": 1699, "Pretrain/Step Time": 9.807233167812228} +{"Pretrain/Learning Rate": 4.7172711273554576e-05, "Pretrain/Loss": 2.083148717880249, "Pretrain/Loss (Raw)": 2.152094841003418, "Pretrain/Step": 1700, "Pretrain/Step Time": 9.804921125993133} +{"Pretrain/Learning Rate": 4.7168788138664845e-05, "Pretrain/Loss": 2.084061622619629, "Pretrain/Loss (Raw)": 2.0975170135498047, "Pretrain/Step": 1701, "Pretrain/Step Time": 9.83510061725974} +{"Pretrain/Learning Rate": 4.7164862447165995e-05, "Pretrain/Loss": 2.085474967956543, "Pretrain/Loss (Raw)": 2.2817487716674805, "Pretrain/Step": 1702, "Pretrain/Step Time": 9.841027557849884} +{"Pretrain/Learning Rate": 4.716093419951077e-05, "Pretrain/Loss": 2.086808204650879, "Pretrain/Loss (Raw)": 2.374239444732666, "Pretrain/Step": 1703, "Pretrain/Step Time": 9.810477364808321} +{"Pretrain/Learning Rate": 4.7157003396152184e-05, "Pretrain/Loss": 2.086409091949463, "Pretrain/Loss (Raw)": 2.1298811435699463, "Pretrain/Step": 1704, "Pretrain/Step Time": 9.814036440104246} +{"Pretrain/Learning Rate": 4.715307003754356e-05, "Pretrain/Loss": 2.0875403881073, "Pretrain/Loss (Raw)": 1.8162263631820679, "Pretrain/Step": 1705, "Pretrain/Step Time": 9.793461550027132} +{"Pretrain/Learning Rate": 4.714913412413851e-05, "Pretrain/Loss": 2.087026596069336, "Pretrain/Loss (Raw)": 2.031001329421997, "Pretrain/Step": 1706, "Pretrain/Step Time": 9.81304282695055} +{"Pretrain/Learning Rate": 4.714519565639095e-05, "Pretrain/Loss": 2.087636947631836, "Pretrain/Loss (Raw)": 2.0460574626922607, "Pretrain/Step": 1707, "Pretrain/Step Time": 9.810194697231054} +{"Pretrain/Learning Rate": 4.714125463475506e-05, "Pretrain/Loss": 2.0887622833251953, "Pretrain/Loss (Raw)": 2.0837090015411377, "Pretrain/Step": 1708, "Pretrain/Step Time": 9.799721088260412} +{"Pretrain/Learning Rate": 4.713731105968536e-05, "Pretrain/Loss": 2.0904390811920166, "Pretrain/Loss (Raw)": 2.219790458679199, "Pretrain/Step": 1709, "Pretrain/Step Time": 9.795838870108128} +{"Pretrain/Learning Rate": 4.7133364931636644e-05, "Pretrain/Loss": 2.0879175662994385, "Pretrain/Loss (Raw)": 1.8608670234680176, "Pretrain/Step": 1710, "Pretrain/Step Time": 9.793714320287108} +{"Pretrain/Learning Rate": 4.712941625106398e-05, "Pretrain/Loss": 2.0896854400634766, "Pretrain/Loss (Raw)": 2.3196332454681396, "Pretrain/Step": 1711, "Pretrain/Step Time": 9.782787958160043} +{"Pretrain/Learning Rate": 4.7125465018422755e-05, "Pretrain/Loss": 2.0921802520751953, "Pretrain/Loss (Raw)": 2.2392170429229736, "Pretrain/Step": 1712, "Pretrain/Step Time": 9.768002178519964} +{"Pretrain/Learning Rate": 4.7121511234168644e-05, "Pretrain/Loss": 2.0925443172454834, "Pretrain/Loss (Raw)": 2.142329692840576, "Pretrain/Step": 1713, "Pretrain/Step Time": 9.777843227609992} +{"Pretrain/Learning Rate": 4.711755489875762e-05, "Pretrain/Loss": 2.0938243865966797, "Pretrain/Loss (Raw)": 2.296905994415283, "Pretrain/Step": 1714, "Pretrain/Step Time": 9.694209340959787} +{"Pretrain/Learning Rate": 4.711359601264594e-05, "Pretrain/Loss": 2.0945847034454346, "Pretrain/Loss (Raw)": 2.213052749633789, "Pretrain/Step": 1715, "Pretrain/Step Time": 9.69970765709877} +{"Pretrain/Learning Rate": 4.7109634576290175e-05, "Pretrain/Loss": 2.0969176292419434, "Pretrain/Loss (Raw)": 2.2737300395965576, "Pretrain/Step": 1716, "Pretrain/Step Time": 9.69884418696165} +{"Pretrain/Learning Rate": 4.710567059014716e-05, "Pretrain/Loss": 2.096064329147339, "Pretrain/Loss (Raw)": 1.9014641046524048, "Pretrain/Step": 1717, "Pretrain/Step Time": 9.705950409173965} +{"Pretrain/Learning Rate": 4.710170405467405e-05, "Pretrain/Loss": 2.0970091819763184, "Pretrain/Loss (Raw)": 2.360970973968506, "Pretrain/Step": 1718, "Pretrain/Step Time": 9.70100019685924} +{"Pretrain/Learning Rate": 4.709773497032828e-05, "Pretrain/Loss": 2.0984108448028564, "Pretrain/Loss (Raw)": 2.1586523056030273, "Pretrain/Step": 1719, "Pretrain/Step Time": 9.697608398273587} +{"Pretrain/Learning Rate": 4.7093763337567585e-05, "Pretrain/Loss": 2.0986270904541016, "Pretrain/Loss (Raw)": 2.1416873931884766, "Pretrain/Step": 1720, "Pretrain/Step Time": 9.699440520256758} +{"Pretrain/Learning Rate": 4.708978915685e-05, "Pretrain/Loss": 2.0984652042388916, "Pretrain/Loss (Raw)": 2.062260627746582, "Pretrain/Step": 1721, "Pretrain/Step Time": 9.700736586004496} +{"Pretrain/Learning Rate": 4.708581242863382e-05, "Pretrain/Loss": 2.096125841140747, "Pretrain/Loss (Raw)": 1.9798575639724731, "Pretrain/Step": 1722, "Pretrain/Step Time": 9.71372176706791} +{"Pretrain/Learning Rate": 4.7081833153377694e-05, "Pretrain/Loss": 2.0954318046569824, "Pretrain/Loss (Raw)": 2.0642707347869873, "Pretrain/Step": 1723, "Pretrain/Step Time": 9.706410743296146} +{"Pretrain/Learning Rate": 4.707785133154051e-05, "Pretrain/Loss": 2.0922250747680664, "Pretrain/Loss (Raw)": 1.947932481765747, "Pretrain/Step": 1724, "Pretrain/Step Time": 9.706804463639855} +{"Pretrain/Learning Rate": 4.707386696358148e-05, "Pretrain/Loss": 2.0901412963867188, "Pretrain/Loss (Raw)": 2.095977783203125, "Pretrain/Step": 1725, "Pretrain/Step Time": 9.691487157717347} +{"Pretrain/Learning Rate": 4.7069880049960104e-05, "Pretrain/Loss": 2.090178966522217, "Pretrain/Loss (Raw)": 2.136892318725586, "Pretrain/Step": 1726, "Pretrain/Step Time": 9.688528016209602} +{"Pretrain/Learning Rate": 4.7065890591136154e-05, "Pretrain/Loss": 2.0912158489227295, "Pretrain/Loss (Raw)": 2.2383840084075928, "Pretrain/Step": 1727, "Pretrain/Step Time": 9.651423126459122} +{"Pretrain/Learning Rate": 4.706189858756972e-05, "Pretrain/Loss": 2.091489791870117, "Pretrain/Loss (Raw)": 2.0754733085632324, "Pretrain/Step": 1728, "Pretrain/Step Time": 9.669196953997016} +{"Pretrain/Learning Rate": 4.705790403972119e-05, "Pretrain/Loss": 2.0928542613983154, "Pretrain/Loss (Raw)": 2.213198184967041, "Pretrain/Step": 1729, "Pretrain/Step Time": 9.674601757898927} +{"Pretrain/Learning Rate": 4.705390694805122e-05, "Pretrain/Loss": 2.090761661529541, "Pretrain/Loss (Raw)": 1.911120057106018, "Pretrain/Step": 1730, "Pretrain/Step Time": 9.676571691408753} +{"Pretrain/Learning Rate": 4.704990731302078e-05, "Pretrain/Loss": 2.088905096054077, "Pretrain/Loss (Raw)": 2.099263906478882, "Pretrain/Step": 1731, "Pretrain/Step Time": 9.6789111495018} +{"Pretrain/Learning Rate": 4.7045905135091126e-05, "Pretrain/Loss": 2.09023380279541, "Pretrain/Loss (Raw)": 2.117354154586792, "Pretrain/Step": 1732, "Pretrain/Step Time": 9.706437543034554} +{"Pretrain/Learning Rate": 4.704190041472381e-05, "Pretrain/Loss": 2.0913898944854736, "Pretrain/Loss (Raw)": 2.1363792419433594, "Pretrain/Step": 1733, "Pretrain/Step Time": 9.702587144449353} +{"Pretrain/Learning Rate": 4.703789315238067e-05, "Pretrain/Loss": 2.0920419692993164, "Pretrain/Loss (Raw)": 2.170444965362549, "Pretrain/Step": 1734, "Pretrain/Step Time": 9.73753722384572} +{"Pretrain/Learning Rate": 4.703388334852385e-05, "Pretrain/Loss": 2.0899651050567627, "Pretrain/Loss (Raw)": 1.913952350616455, "Pretrain/Step": 1735, "Pretrain/Step Time": 9.729937870055437} +{"Pretrain/Learning Rate": 4.7029871003615776e-05, "Pretrain/Loss": 2.0908851623535156, "Pretrain/Loss (Raw)": 2.2465803623199463, "Pretrain/Step": 1736, "Pretrain/Step Time": 9.734071617946029} +{"Pretrain/Learning Rate": 4.7025856118119164e-05, "Pretrain/Loss": 2.0905137062072754, "Pretrain/Loss (Raw)": 2.146566152572632, "Pretrain/Step": 1737, "Pretrain/Step Time": 9.724899677559733} +{"Pretrain/Learning Rate": 4.7021838692497046e-05, "Pretrain/Loss": 2.090095281600952, "Pretrain/Loss (Raw)": 1.9087657928466797, "Pretrain/Step": 1738, "Pretrain/Step Time": 9.735097279772162} +{"Pretrain/Learning Rate": 4.70178187272127e-05, "Pretrain/Loss": 2.090877056121826, "Pretrain/Loss (Raw)": 2.1978437900543213, "Pretrain/Step": 1739, "Pretrain/Step Time": 9.703038604930043} +{"Pretrain/Learning Rate": 4.701379622272977e-05, "Pretrain/Loss": 2.090391159057617, "Pretrain/Loss (Raw)": 2.1360340118408203, "Pretrain/Step": 1740, "Pretrain/Step Time": 9.681898459792137} +{"Pretrain/Learning Rate": 4.700977117951211e-05, "Pretrain/Loss": 2.089989185333252, "Pretrain/Loss (Raw)": 2.112298011779785, "Pretrain/Step": 1741, "Pretrain/Step Time": 9.668151760473847} +{"Pretrain/Learning Rate": 4.700574359802393e-05, "Pretrain/Loss": 2.0894956588745117, "Pretrain/Loss (Raw)": 2.048778533935547, "Pretrain/Step": 1742, "Pretrain/Step Time": 9.663240237161517} +{"Pretrain/Learning Rate": 4.700171347872971e-05, "Pretrain/Loss": 2.0901377201080322, "Pretrain/Loss (Raw)": 2.2180213928222656, "Pretrain/Step": 1743, "Pretrain/Step Time": 9.667943481355906} +{"Pretrain/Learning Rate": 4.699768082209421e-05, "Pretrain/Loss": 2.089005947113037, "Pretrain/Loss (Raw)": 1.9969522953033447, "Pretrain/Step": 1744, "Pretrain/Step Time": 9.628194451332092} +{"Pretrain/Learning Rate": 4.69936456285825e-05, "Pretrain/Loss": 2.0887460708618164, "Pretrain/Loss (Raw)": 2.100860118865967, "Pretrain/Step": 1745, "Pretrain/Step Time": 9.622138064354658} +{"Pretrain/Learning Rate": 4.698960789865994e-05, "Pretrain/Loss": 2.088240146636963, "Pretrain/Loss (Raw)": 1.977763295173645, "Pretrain/Step": 1746, "Pretrain/Step Time": 9.624900123104453} +{"Pretrain/Learning Rate": 4.698556763279218e-05, "Pretrain/Loss": 2.085742712020874, "Pretrain/Loss (Raw)": 1.8886358737945557, "Pretrain/Step": 1747, "Pretrain/Step Time": 9.626575611531734} +{"Pretrain/Learning Rate": 4.698152483144516e-05, "Pretrain/Loss": 2.084660291671753, "Pretrain/Loss (Raw)": 1.932035207748413, "Pretrain/Step": 1748, "Pretrain/Step Time": 9.615767503157258} +{"Pretrain/Learning Rate": 4.697747949508512e-05, "Pretrain/Loss": 2.085984230041504, "Pretrain/Loss (Raw)": 2.145143747329712, "Pretrain/Step": 1749, "Pretrain/Step Time": 9.610889069736004} +{"Pretrain/Learning Rate": 4.697343162417858e-05, "Pretrain/Loss": 2.085942268371582, "Pretrain/Loss (Raw)": 2.0936973094940186, "Pretrain/Step": 1750, "Pretrain/Step Time": 9.572494415566325} +{"Pretrain/Learning Rate": 4.696938121919235e-05, "Pretrain/Loss": 2.087082624435425, "Pretrain/Loss (Raw)": 2.1972475051879883, "Pretrain/Step": 1751, "Pretrain/Step Time": 9.568731775507331} +{"Pretrain/Learning Rate": 4.696532828059358e-05, "Pretrain/Loss": 2.0840201377868652, "Pretrain/Loss (Raw)": 1.9784480333328247, "Pretrain/Step": 1752, "Pretrain/Step Time": 9.57237753085792} +{"Pretrain/Learning Rate": 4.6961272808849634e-05, "Pretrain/Loss": 2.0833191871643066, "Pretrain/Loss (Raw)": 2.07297945022583, "Pretrain/Step": 1753, "Pretrain/Step Time": 9.568760972470045} +{"Pretrain/Learning Rate": 4.6957214804428217e-05, "Pretrain/Loss": 2.083418846130371, "Pretrain/Loss (Raw)": 2.1254608631134033, "Pretrain/Step": 1754, "Pretrain/Step Time": 9.573224503546953} +{"Pretrain/Learning Rate": 4.695315426779734e-05, "Pretrain/Loss": 2.0835940837860107, "Pretrain/Loss (Raw)": 2.1356396675109863, "Pretrain/Step": 1755, "Pretrain/Step Time": 9.573265176266432} +{"Pretrain/Learning Rate": 4.694909119942526e-05, "Pretrain/Loss": 2.082763671875, "Pretrain/Loss (Raw)": 2.0122015476226807, "Pretrain/Step": 1756, "Pretrain/Step Time": 9.559383507817984} +{"Pretrain/Learning Rate": 4.694502559978055e-05, "Pretrain/Loss": 2.0817160606384277, "Pretrain/Loss (Raw)": 1.8976112604141235, "Pretrain/Step": 1757, "Pretrain/Step Time": 9.555284909904003} +{"Pretrain/Learning Rate": 4.694095746933208e-05, "Pretrain/Loss": 2.0825698375701904, "Pretrain/Loss (Raw)": 2.269303560256958, "Pretrain/Step": 1758, "Pretrain/Step Time": 9.571511382237077} +{"Pretrain/Learning Rate": 4.6936886808549004e-05, "Pretrain/Loss": 2.08610200881958, "Pretrain/Loss (Raw)": 2.2351725101470947, "Pretrain/Step": 1759, "Pretrain/Step Time": 9.574130022898316} +{"Pretrain/Learning Rate": 4.693281361790077e-05, "Pretrain/Loss": 2.087617874145508, "Pretrain/Loss (Raw)": 2.260525941848755, "Pretrain/Step": 1760, "Pretrain/Step Time": 9.575818145647645} +{"Pretrain/Learning Rate": 4.6928737897857124e-05, "Pretrain/Loss": 2.0880048274993896, "Pretrain/Loss (Raw)": 1.9442349672317505, "Pretrain/Step": 1761, "Pretrain/Step Time": 9.50019370391965} +{"Pretrain/Learning Rate": 4.692465964888809e-05, "Pretrain/Loss": 2.0874106884002686, "Pretrain/Loss (Raw)": 2.203988790512085, "Pretrain/Step": 1762, "Pretrain/Step Time": 9.497996462509036} +{"Pretrain/Learning Rate": 4.692057887146399e-05, "Pretrain/Loss": 2.089965581893921, "Pretrain/Loss (Raw)": 2.110368490219116, "Pretrain/Step": 1763, "Pretrain/Step Time": 9.489077020436525} +{"Pretrain/Learning Rate": 4.691649556605545e-05, "Pretrain/Loss": 2.090178966522217, "Pretrain/Loss (Raw)": 2.1233978271484375, "Pretrain/Step": 1764, "Pretrain/Step Time": 9.49777714163065} +{"Pretrain/Learning Rate": 4.691240973313337e-05, "Pretrain/Loss": 2.091721773147583, "Pretrain/Loss (Raw)": 2.2190046310424805, "Pretrain/Step": 1765, "Pretrain/Step Time": 9.494473537430167} +{"Pretrain/Learning Rate": 4.690832137316893e-05, "Pretrain/Loss": 2.091930389404297, "Pretrain/Loss (Raw)": 2.025521993637085, "Pretrain/Step": 1766, "Pretrain/Step Time": 9.535923462361097} +{"Pretrain/Learning Rate": 4.690423048663364e-05, "Pretrain/Loss": 2.094527006149292, "Pretrain/Loss (Raw)": 2.1590652465820312, "Pretrain/Step": 1767, "Pretrain/Step Time": 9.534479919821024} +{"Pretrain/Learning Rate": 4.690013707399928e-05, "Pretrain/Loss": 2.094604969024658, "Pretrain/Loss (Raw)": 1.9338760375976562, "Pretrain/Step": 1768, "Pretrain/Step Time": 9.470942538231611} +{"Pretrain/Learning Rate": 4.689604113573791e-05, "Pretrain/Loss": 2.0949339866638184, "Pretrain/Loss (Raw)": 2.1415884494781494, "Pretrain/Step": 1769, "Pretrain/Step Time": 9.475821290165186} +{"Pretrain/Learning Rate": 4.68919426723219e-05, "Pretrain/Loss": 2.0936439037323, "Pretrain/Loss (Raw)": 2.0532636642456055, "Pretrain/Step": 1770, "Pretrain/Step Time": 9.47945517860353} +{"Pretrain/Learning Rate": 4.6887841684223905e-05, "Pretrain/Loss": 2.095292091369629, "Pretrain/Loss (Raw)": 2.128541946411133, "Pretrain/Step": 1771, "Pretrain/Step Time": 9.47790889814496} +{"Pretrain/Learning Rate": 4.688373817191687e-05, "Pretrain/Loss": 2.0948901176452637, "Pretrain/Loss (Raw)": 1.9431103467941284, "Pretrain/Step": 1772, "Pretrain/Step Time": 9.487633466720581} +{"Pretrain/Learning Rate": 4.687963213587402e-05, "Pretrain/Loss": 2.093329429626465, "Pretrain/Loss (Raw)": 2.0367226600646973, "Pretrain/Step": 1773, "Pretrain/Step Time": 9.493881735950708} +{"Pretrain/Learning Rate": 4.6875523576568895e-05, "Pretrain/Loss": 2.0934958457946777, "Pretrain/Loss (Raw)": 2.1636266708374023, "Pretrain/Step": 1774, "Pretrain/Step Time": 9.489283118396997} +{"Pretrain/Learning Rate": 4.6871412494475316e-05, "Pretrain/Loss": 2.093402862548828, "Pretrain/Loss (Raw)": 1.9160162210464478, "Pretrain/Step": 1775, "Pretrain/Step Time": 9.481324438005686} +{"Pretrain/Learning Rate": 4.6867298890067377e-05, "Pretrain/Loss": 2.09529709815979, "Pretrain/Loss (Raw)": 2.2932891845703125, "Pretrain/Step": 1776, "Pretrain/Step Time": 9.47486524283886} +{"Pretrain/Learning Rate": 4.68631827638195e-05, "Pretrain/Loss": 2.095492124557495, "Pretrain/Loss (Raw)": 2.128138780593872, "Pretrain/Step": 1777, "Pretrain/Step Time": 9.466477625072002} +{"Pretrain/Learning Rate": 4.6859064116206356e-05, "Pretrain/Loss": 2.0963892936706543, "Pretrain/Loss (Raw)": 2.080416202545166, "Pretrain/Step": 1778, "Pretrain/Step Time": 9.46398319490254} +{"Pretrain/Learning Rate": 4.685494294770294e-05, "Pretrain/Loss": 2.0959508419036865, "Pretrain/Loss (Raw)": 2.0356345176696777, "Pretrain/Step": 1779, "Pretrain/Step Time": 9.40334833227098} +{"Pretrain/Learning Rate": 4.685081925878452e-05, "Pretrain/Loss": 2.0956969261169434, "Pretrain/Loss (Raw)": 2.1276986598968506, "Pretrain/Step": 1780, "Pretrain/Step Time": 9.412542961537838} +{"Pretrain/Learning Rate": 4.684669304992665e-05, "Pretrain/Loss": 2.1006906032562256, "Pretrain/Loss (Raw)": 2.1941893100738525, "Pretrain/Step": 1781, "Pretrain/Step Time": 9.413782527670264} +{"Pretrain/Learning Rate": 4.6842564321605196e-05, "Pretrain/Loss": 2.0969810485839844, "Pretrain/Loss (Raw)": 1.6579645872116089, "Pretrain/Step": 1782, "Pretrain/Step Time": 9.41214096173644} +{"Pretrain/Learning Rate": 4.683843307429631e-05, "Pretrain/Loss": 2.0970804691314697, "Pretrain/Loss (Raw)": 2.249763250350952, "Pretrain/Step": 1783, "Pretrain/Step Time": 9.414850493893027} +{"Pretrain/Learning Rate": 4.68342993084764e-05, "Pretrain/Loss": 2.098886728286743, "Pretrain/Loss (Raw)": 2.10929799079895, "Pretrain/Step": 1784, "Pretrain/Step Time": 9.419800579547882} +{"Pretrain/Learning Rate": 4.683016302462221e-05, "Pretrain/Loss": 2.0993733406066895, "Pretrain/Loss (Raw)": 2.129329204559326, "Pretrain/Step": 1785, "Pretrain/Step Time": 9.41232231259346} +{"Pretrain/Learning Rate": 4.682602422321076e-05, "Pretrain/Loss": 2.0977210998535156, "Pretrain/Loss (Raw)": 1.7699394226074219, "Pretrain/Step": 1786, "Pretrain/Step Time": 9.395372522994876} +{"Pretrain/Learning Rate": 4.6821882904719344e-05, "Pretrain/Loss": 2.0952820777893066, "Pretrain/Loss (Raw)": 1.8739057779312134, "Pretrain/Step": 1787, "Pretrain/Step Time": 9.417354328557849} +{"Pretrain/Learning Rate": 4.6817739069625563e-05, "Pretrain/Loss": 2.096186876296997, "Pretrain/Loss (Raw)": 2.21520733833313, "Pretrain/Step": 1788, "Pretrain/Step Time": 9.419145060703158} +{"Pretrain/Learning Rate": 4.681359271840731e-05, "Pretrain/Loss": 2.0958855152130127, "Pretrain/Loss (Raw)": 2.0520830154418945, "Pretrain/Step": 1789, "Pretrain/Step Time": 9.414321349933743} +{"Pretrain/Learning Rate": 4.6809443851542744e-05, "Pretrain/Loss": 2.094994306564331, "Pretrain/Loss (Raw)": 2.074944496154785, "Pretrain/Step": 1790, "Pretrain/Step Time": 9.421970661729574} +{"Pretrain/Learning Rate": 4.680529246951035e-05, "Pretrain/Loss": 2.095466375350952, "Pretrain/Loss (Raw)": 2.132122039794922, "Pretrain/Step": 1791, "Pretrain/Step Time": 9.447895104065537} +{"Pretrain/Learning Rate": 4.6801138572788885e-05, "Pretrain/Loss": 2.0943007469177246, "Pretrain/Loss (Raw)": 2.0154056549072266, "Pretrain/Step": 1792, "Pretrain/Step Time": 9.424184989184141} +{"Pretrain/Learning Rate": 4.679698216185738e-05, "Pretrain/Loss": 2.091653347015381, "Pretrain/Loss (Raw)": 1.7887505292892456, "Pretrain/Step": 1793, "Pretrain/Step Time": 9.425422532483935} +{"Pretrain/Learning Rate": 4.6792823237195185e-05, "Pretrain/Loss": 2.0926709175109863, "Pretrain/Loss (Raw)": 2.0854012966156006, "Pretrain/Step": 1794, "Pretrain/Step Time": 9.423390202224255} +{"Pretrain/Learning Rate": 4.678866179928193e-05, "Pretrain/Loss": 2.0922837257385254, "Pretrain/Loss (Raw)": 2.0721399784088135, "Pretrain/Step": 1795, "Pretrain/Step Time": 9.411424463614821} +{"Pretrain/Learning Rate": 4.6784497848597516e-05, "Pretrain/Loss": 2.09035325050354, "Pretrain/Loss (Raw)": 2.0828940868377686, "Pretrain/Step": 1796, "Pretrain/Step Time": 9.407864959910512} +{"Pretrain/Learning Rate": 4.678033138562216e-05, "Pretrain/Loss": 2.089733123779297, "Pretrain/Loss (Raw)": 2.195190906524658, "Pretrain/Step": 1797, "Pretrain/Step Time": 9.407050341367722} +{"Pretrain/Learning Rate": 4.6776162410836354e-05, "Pretrain/Loss": 2.0906143188476562, "Pretrain/Loss (Raw)": 2.2000234127044678, "Pretrain/Step": 1798, "Pretrain/Step Time": 9.3291250243783} +{"Pretrain/Learning Rate": 4.677199092472089e-05, "Pretrain/Loss": 2.088871955871582, "Pretrain/Loss (Raw)": 2.054694890975952, "Pretrain/Step": 1799, "Pretrain/Step Time": 9.332621544599533} +{"Pretrain/Learning Rate": 4.6767816927756834e-05, "Pretrain/Loss": 2.088561773300171, "Pretrain/Loss (Raw)": 2.0564377307891846, "Pretrain/Step": 1800, "Pretrain/Step Time": 9.331823388114572} +{"Pretrain/Learning Rate": 4.6763640420425566e-05, "Pretrain/Loss": 2.087453603744507, "Pretrain/Loss (Raw)": 2.0777747631073, "Pretrain/Step": 1801, "Pretrain/Step Time": 9.337645733729005} +{"Pretrain/Learning Rate": 4.675946140320873e-05, "Pretrain/Loss": 2.08622407913208, "Pretrain/Loss (Raw)": 2.1103615760803223, "Pretrain/Step": 1802, "Pretrain/Step Time": 9.343752078711987} +{"Pretrain/Learning Rate": 4.6755279876588256e-05, "Pretrain/Loss": 2.0881409645080566, "Pretrain/Loss (Raw)": 2.32135272026062, "Pretrain/Step": 1803, "Pretrain/Step Time": 9.34241801686585} +{"Pretrain/Learning Rate": 4.67510958410464e-05, "Pretrain/Loss": 2.0887186527252197, "Pretrain/Loss (Raw)": 2.050135612487793, "Pretrain/Step": 1804, "Pretrain/Step Time": 9.338994486257434} +{"Pretrain/Learning Rate": 4.6746909297065685e-05, "Pretrain/Loss": 2.0885119438171387, "Pretrain/Loss (Raw)": 2.1047468185424805, "Pretrain/Step": 1805, "Pretrain/Step Time": 9.338004134595394} +{"Pretrain/Learning Rate": 4.674272024512891e-05, "Pretrain/Loss": 2.088514804840088, "Pretrain/Loss (Raw)": 2.0829522609710693, "Pretrain/Step": 1806, "Pretrain/Step Time": 9.363931139931083} +{"Pretrain/Learning Rate": 4.6738528685719185e-05, "Pretrain/Loss": 2.088718891143799, "Pretrain/Loss (Raw)": 2.2327399253845215, "Pretrain/Step": 1807, "Pretrain/Step Time": 9.36325049214065} +{"Pretrain/Learning Rate": 4.673433461931989e-05, "Pretrain/Loss": 2.087735176086426, "Pretrain/Loss (Raw)": 1.967529296875, "Pretrain/Step": 1808, "Pretrain/Step Time": 9.365827972069383} +{"Pretrain/Learning Rate": 4.6730138046414714e-05, "Pretrain/Loss": 2.0905966758728027, "Pretrain/Loss (Raw)": 2.182089328765869, "Pretrain/Step": 1809, "Pretrain/Step Time": 9.325411971658468} +{"Pretrain/Learning Rate": 4.672593896748763e-05, "Pretrain/Loss": 2.092461585998535, "Pretrain/Loss (Raw)": 2.1474995613098145, "Pretrain/Step": 1810, "Pretrain/Step Time": 9.319733202457428} +{"Pretrain/Learning Rate": 4.6721737383022876e-05, "Pretrain/Loss": 2.091750144958496, "Pretrain/Loss (Raw)": 2.1077873706817627, "Pretrain/Step": 1811, "Pretrain/Step Time": 9.313229570165277} +{"Pretrain/Learning Rate": 4.671753329350502e-05, "Pretrain/Loss": 2.092031955718994, "Pretrain/Loss (Raw)": 2.0419914722442627, "Pretrain/Step": 1812, "Pretrain/Step Time": 9.315308464691043} +{"Pretrain/Learning Rate": 4.671332669941888e-05, "Pretrain/Loss": 2.091503381729126, "Pretrain/Loss (Raw)": 1.9981095790863037, "Pretrain/Step": 1813, "Pretrain/Step Time": 9.30879383534193} +{"Pretrain/Learning Rate": 4.6709117601249596e-05, "Pretrain/Loss": 2.091688871383667, "Pretrain/Loss (Raw)": 1.9782700538635254, "Pretrain/Step": 1814, "Pretrain/Step Time": 9.307594811543822} +{"Pretrain/Learning Rate": 4.6704905999482575e-05, "Pretrain/Loss": 2.0936851501464844, "Pretrain/Loss (Raw)": 2.3408455848693848, "Pretrain/Step": 1815, "Pretrain/Step Time": 9.309360874816775} +{"Pretrain/Learning Rate": 4.670069189460351e-05, "Pretrain/Loss": 2.092357635498047, "Pretrain/Loss (Raw)": 1.9511553049087524, "Pretrain/Step": 1816, "Pretrain/Step Time": 9.317824585363269} +{"Pretrain/Learning Rate": 4.6696475287098396e-05, "Pretrain/Loss": 2.0935702323913574, "Pretrain/Loss (Raw)": 2.2861483097076416, "Pretrain/Step": 1817, "Pretrain/Step Time": 9.312883155420423} +{"Pretrain/Learning Rate": 4.669225617745352e-05, "Pretrain/Loss": 2.093914031982422, "Pretrain/Loss (Raw)": 2.138411045074463, "Pretrain/Step": 1818, "Pretrain/Step Time": 9.308548534289002} +{"Pretrain/Learning Rate": 4.668803456615545e-05, "Pretrain/Loss": 2.0910229682922363, "Pretrain/Loss (Raw)": 1.8459272384643555, "Pretrain/Step": 1819, "Pretrain/Step Time": 9.310111671686172} +{"Pretrain/Learning Rate": 4.668381045369102e-05, "Pretrain/Loss": 2.091637134552002, "Pretrain/Loss (Raw)": 2.1400349140167236, "Pretrain/Step": 1820, "Pretrain/Step Time": 9.310843335464597} +{"Pretrain/Learning Rate": 4.6679583840547405e-05, "Pretrain/Loss": 2.090832233428955, "Pretrain/Loss (Raw)": 2.0431694984436035, "Pretrain/Step": 1821, "Pretrain/Step Time": 9.305497542023659} +{"Pretrain/Learning Rate": 4.667535472721203e-05, "Pretrain/Loss": 2.0935754776000977, "Pretrain/Loss (Raw)": 2.1953351497650146, "Pretrain/Step": 1822, "Pretrain/Step Time": 9.30564220994711} +{"Pretrain/Learning Rate": 4.66711231141726e-05, "Pretrain/Loss": 2.0934576988220215, "Pretrain/Loss (Raw)": 2.0197038650512695, "Pretrain/Step": 1823, "Pretrain/Step Time": 9.309588976204395} +{"Pretrain/Learning Rate": 4.6666889001917136e-05, "Pretrain/Loss": 2.0925278663635254, "Pretrain/Loss (Raw)": 2.0043349266052246, "Pretrain/Step": 1824, "Pretrain/Step Time": 9.292294768616557} +{"Pretrain/Learning Rate": 4.666265239093393e-05, "Pretrain/Loss": 2.092867612838745, "Pretrain/Loss (Raw)": 2.1984384059906006, "Pretrain/Step": 1825, "Pretrain/Step Time": 9.287100221961737} +{"Pretrain/Learning Rate": 4.665841328171158e-05, "Pretrain/Loss": 2.092710494995117, "Pretrain/Loss (Raw)": 1.9629491567611694, "Pretrain/Step": 1826, "Pretrain/Step Time": 9.265564814209938} +{"Pretrain/Learning Rate": 4.665417167473894e-05, "Pretrain/Loss": 2.0948984622955322, "Pretrain/Loss (Raw)": 2.2019197940826416, "Pretrain/Step": 1827, "Pretrain/Step Time": 9.267120320349932} +{"Pretrain/Learning Rate": 4.66499275705052e-05, "Pretrain/Loss": 2.093724012374878, "Pretrain/Loss (Raw)": 2.0017590522766113, "Pretrain/Step": 1828, "Pretrain/Step Time": 9.268074987456203} +{"Pretrain/Learning Rate": 4.6645680969499795e-05, "Pretrain/Loss": 2.094374179840088, "Pretrain/Loss (Raw)": 2.18070912361145, "Pretrain/Step": 1829, "Pretrain/Step Time": 9.232224186882377} +{"Pretrain/Learning Rate": 4.664143187221245e-05, "Pretrain/Loss": 2.092658042907715, "Pretrain/Loss (Raw)": 2.062119245529175, "Pretrain/Step": 1830, "Pretrain/Step Time": 9.225014870986342} +{"Pretrain/Learning Rate": 4.6637180279133216e-05, "Pretrain/Loss": 2.090867280960083, "Pretrain/Loss (Raw)": 2.145019769668579, "Pretrain/Step": 1831, "Pretrain/Step Time": 9.22528393752873} +{"Pretrain/Learning Rate": 4.6632926190752385e-05, "Pretrain/Loss": 2.0907859802246094, "Pretrain/Loss (Raw)": 2.1194896697998047, "Pretrain/Step": 1832, "Pretrain/Step Time": 9.223980063572526} +{"Pretrain/Learning Rate": 4.662866960756057e-05, "Pretrain/Loss": 2.093824863433838, "Pretrain/Loss (Raw)": 2.2051658630371094, "Pretrain/Step": 1833, "Pretrain/Step Time": 9.220845991745591} +{"Pretrain/Learning Rate": 4.662441053004866e-05, "Pretrain/Loss": 2.0933356285095215, "Pretrain/Loss (Raw)": 1.9683741331100464, "Pretrain/Step": 1834, "Pretrain/Step Time": 9.198965607210994} +{"Pretrain/Learning Rate": 4.6620148958707833e-05, "Pretrain/Loss": 2.094472646713257, "Pretrain/Loss (Raw)": 2.191627025604248, "Pretrain/Step": 1835, "Pretrain/Step Time": 9.198279052972794} +{"Pretrain/Learning Rate": 4.661588489402955e-05, "Pretrain/Loss": 2.094417095184326, "Pretrain/Loss (Raw)": 2.076566696166992, "Pretrain/Step": 1836, "Pretrain/Step Time": 9.190517058596015} +{"Pretrain/Learning Rate": 4.661161833650556e-05, "Pretrain/Loss": 2.094222068786621, "Pretrain/Loss (Raw)": 2.1948440074920654, "Pretrain/Step": 1837, "Pretrain/Step Time": 9.194175204262137} +{"Pretrain/Learning Rate": 4.660734928662791e-05, "Pretrain/Loss": 2.0958096981048584, "Pretrain/Loss (Raw)": 2.064084053039551, "Pretrain/Step": 1838, "Pretrain/Step Time": 9.1915018055588} +{"Pretrain/Learning Rate": 4.660307774488892e-05, "Pretrain/Loss": 2.0932345390319824, "Pretrain/Loss (Raw)": 1.990052580833435, "Pretrain/Step": 1839, "Pretrain/Step Time": 9.189355889335275} +{"Pretrain/Learning Rate": 4.65988037117812e-05, "Pretrain/Loss": 2.092231273651123, "Pretrain/Loss (Raw)": 2.1107382774353027, "Pretrain/Step": 1840, "Pretrain/Step Time": 9.181430030614138} +{"Pretrain/Learning Rate": 4.659452718779768e-05, "Pretrain/Loss": 2.092602252960205, "Pretrain/Loss (Raw)": 2.189829111099243, "Pretrain/Step": 1841, "Pretrain/Step Time": 9.177427290007472} +{"Pretrain/Learning Rate": 4.6590248173431505e-05, "Pretrain/Loss": 2.0914855003356934, "Pretrain/Loss (Raw)": 2.1539549827575684, "Pretrain/Step": 1842, "Pretrain/Step Time": 9.17863697372377} +{"Pretrain/Learning Rate": 4.6585966669176186e-05, "Pretrain/Loss": 2.091399669647217, "Pretrain/Loss (Raw)": 2.2020912170410156, "Pretrain/Step": 1843, "Pretrain/Step Time": 9.17456540465355} +{"Pretrain/Learning Rate": 4.658168267552547e-05, "Pretrain/Loss": 2.0890347957611084, "Pretrain/Loss (Raw)": 1.9710310697555542, "Pretrain/Step": 1844, "Pretrain/Step Time": 9.172558471560478} +{"Pretrain/Learning Rate": 4.657739619297342e-05, "Pretrain/Loss": 2.0914466381073, "Pretrain/Loss (Raw)": 2.210174083709717, "Pretrain/Step": 1845, "Pretrain/Step Time": 9.171855198219419} +{"Pretrain/Learning Rate": 4.657310722201436e-05, "Pretrain/Loss": 2.0893259048461914, "Pretrain/Loss (Raw)": 2.0895278453826904, "Pretrain/Step": 1846, "Pretrain/Step Time": 9.170402616262436} +{"Pretrain/Learning Rate": 4.6568815763142914e-05, "Pretrain/Loss": 2.088111162185669, "Pretrain/Loss (Raw)": 2.003160238265991, "Pretrain/Step": 1847, "Pretrain/Step Time": 9.171901278197765} +{"Pretrain/Learning Rate": 4.6564521816854e-05, "Pretrain/Loss": 2.0893898010253906, "Pretrain/Loss (Raw)": 2.305351972579956, "Pretrain/Step": 1848, "Pretrain/Step Time": 9.170760156586766} +{"Pretrain/Learning Rate": 4.656022538364282e-05, "Pretrain/Loss": 2.09009051322937, "Pretrain/Loss (Raw)": 2.1519410610198975, "Pretrain/Step": 1849, "Pretrain/Step Time": 9.167431024834514} +{"Pretrain/Learning Rate": 4.655592646400485e-05, "Pretrain/Loss": 2.0918002128601074, "Pretrain/Loss (Raw)": 2.1986916065216064, "Pretrain/Step": 1850, "Pretrain/Step Time": 9.15587998367846} +{"Pretrain/Learning Rate": 4.6551625058435866e-05, "Pretrain/Loss": 2.091358184814453, "Pretrain/Loss (Raw)": 2.0076887607574463, "Pretrain/Step": 1851, "Pretrain/Step Time": 9.146173123270273} +{"Pretrain/Learning Rate": 4.654732116743194e-05, "Pretrain/Loss": 2.09194278717041, "Pretrain/Loss (Raw)": 2.0227677822113037, "Pretrain/Step": 1852, "Pretrain/Step Time": 9.143162796273828} +{"Pretrain/Learning Rate": 4.654301479148938e-05, "Pretrain/Loss": 2.0921125411987305, "Pretrain/Loss (Raw)": 2.1177356243133545, "Pretrain/Step": 1853, "Pretrain/Step Time": 9.14377685636282} +{"Pretrain/Learning Rate": 4.653870593110485e-05, "Pretrain/Loss": 2.0911121368408203, "Pretrain/Loss (Raw)": 2.008814811706543, "Pretrain/Step": 1854, "Pretrain/Step Time": 9.143756603822112} +{"Pretrain/Learning Rate": 4.6534394586775254e-05, "Pretrain/Loss": 2.089542865753174, "Pretrain/Loss (Raw)": 2.0375266075134277, "Pretrain/Step": 1855, "Pretrain/Step Time": 9.144508395344019} +{"Pretrain/Learning Rate": 4.653008075899781e-05, "Pretrain/Loss": 2.0883867740631104, "Pretrain/Loss (Raw)": 1.9274832010269165, "Pretrain/Step": 1856, "Pretrain/Step Time": 9.121764283627272} +{"Pretrain/Learning Rate": 4.652576444826999e-05, "Pretrain/Loss": 2.087527275085449, "Pretrain/Loss (Raw)": 2.1031901836395264, "Pretrain/Step": 1857, "Pretrain/Step Time": 9.121147867292166} +{"Pretrain/Learning Rate": 4.652144565508959e-05, "Pretrain/Loss": 2.0901927947998047, "Pretrain/Loss (Raw)": 2.2523069381713867, "Pretrain/Step": 1858, "Pretrain/Step Time": 9.130496840924025} +{"Pretrain/Learning Rate": 4.6517124379954655e-05, "Pretrain/Loss": 2.089968204498291, "Pretrain/Loss (Raw)": 2.070512294769287, "Pretrain/Step": 1859, "Pretrain/Step Time": 9.132154677063227} +{"Pretrain/Learning Rate": 4.651280062336355e-05, "Pretrain/Loss": 2.0905113220214844, "Pretrain/Loss (Raw)": 2.186901092529297, "Pretrain/Step": 1860, "Pretrain/Step Time": 9.095260124653578} +{"Pretrain/Learning Rate": 4.65084743858149e-05, "Pretrain/Loss": 2.089841842651367, "Pretrain/Loss (Raw)": 2.050640106201172, "Pretrain/Step": 1861, "Pretrain/Step Time": 9.098672470077872} +{"Pretrain/Learning Rate": 4.6504145667807644e-05, "Pretrain/Loss": 2.089386224746704, "Pretrain/Loss (Raw)": 2.1121551990509033, "Pretrain/Step": 1862, "Pretrain/Step Time": 9.065358832478523} +{"Pretrain/Learning Rate": 4.649981446984097e-05, "Pretrain/Loss": 2.0914292335510254, "Pretrain/Loss (Raw)": 2.175438642501831, "Pretrain/Step": 1863, "Pretrain/Step Time": 9.069006694480777} +{"Pretrain/Learning Rate": 4.649548079241438e-05, "Pretrain/Loss": 2.090395212173462, "Pretrain/Loss (Raw)": 2.1142451763153076, "Pretrain/Step": 1864, "Pretrain/Step Time": 9.06893582828343} +{"Pretrain/Learning Rate": 4.649114463602766e-05, "Pretrain/Loss": 2.090341567993164, "Pretrain/Loss (Raw)": 2.139678716659546, "Pretrain/Step": 1865, "Pretrain/Step Time": 9.080107562243938} +{"Pretrain/Learning Rate": 4.648680600118087e-05, "Pretrain/Loss": 2.092895984649658, "Pretrain/Loss (Raw)": 2.2357192039489746, "Pretrain/Step": 1866, "Pretrain/Step Time": 9.071350738406181} +{"Pretrain/Learning Rate": 4.6482464888374365e-05, "Pretrain/Loss": 2.0923094749450684, "Pretrain/Loss (Raw)": 2.122811794281006, "Pretrain/Step": 1867, "Pretrain/Step Time": 9.074863886460662} +{"Pretrain/Learning Rate": 4.6478121298108776e-05, "Pretrain/Loss": 2.0918471813201904, "Pretrain/Loss (Raw)": 2.076840877532959, "Pretrain/Step": 1868, "Pretrain/Step Time": 9.094936022534966} +{"Pretrain/Learning Rate": 4.647377523088503e-05, "Pretrain/Loss": 2.09181547164917, "Pretrain/Loss (Raw)": 2.1082191467285156, "Pretrain/Step": 1869, "Pretrain/Step Time": 9.091178562492132} +{"Pretrain/Learning Rate": 4.6469426687204346e-05, "Pretrain/Loss": 2.0924301147460938, "Pretrain/Loss (Raw)": 2.1274828910827637, "Pretrain/Step": 1870, "Pretrain/Step Time": 9.14542805030942} +{"Pretrain/Learning Rate": 4.646507566756819e-05, "Pretrain/Loss": 2.092586040496826, "Pretrain/Loss (Raw)": 2.2379846572875977, "Pretrain/Step": 1871, "Pretrain/Step Time": 9.135172566398978} +{"Pretrain/Learning Rate": 4.646072217247838e-05, "Pretrain/Loss": 2.094547748565674, "Pretrain/Loss (Raw)": 2.2480270862579346, "Pretrain/Step": 1872, "Pretrain/Step Time": 9.134455377236009} +{"Pretrain/Learning Rate": 4.645636620243695e-05, "Pretrain/Loss": 2.094275951385498, "Pretrain/Loss (Raw)": 2.066079616546631, "Pretrain/Step": 1873, "Pretrain/Step Time": 9.137918153777719} +{"Pretrain/Learning Rate": 4.645200775794628e-05, "Pretrain/Loss": 2.095975875854492, "Pretrain/Loss (Raw)": 2.195369243621826, "Pretrain/Step": 1874, "Pretrain/Step Time": 9.135765761137009} +{"Pretrain/Learning Rate": 4.6447646839508975e-05, "Pretrain/Loss": 2.096527338027954, "Pretrain/Loss (Raw)": 1.9592022895812988, "Pretrain/Step": 1875, "Pretrain/Step Time": 9.13619077578187} +{"Pretrain/Learning Rate": 4.6443283447627974e-05, "Pretrain/Loss": 2.0979037284851074, "Pretrain/Loss (Raw)": 2.1082308292388916, "Pretrain/Step": 1876, "Pretrain/Step Time": 9.14620209299028} +{"Pretrain/Learning Rate": 4.643891758280649e-05, "Pretrain/Loss": 2.098400592803955, "Pretrain/Loss (Raw)": 2.2087204456329346, "Pretrain/Step": 1877, "Pretrain/Step Time": 9.153076799586415} +{"Pretrain/Learning Rate": 4.6434549245548e-05, "Pretrain/Loss": 2.0998828411102295, "Pretrain/Loss (Raw)": 2.2834227085113525, "Pretrain/Step": 1878, "Pretrain/Step Time": 9.144522432237864} +{"Pretrain/Learning Rate": 4.643017843635629e-05, "Pretrain/Loss": 2.100498676300049, "Pretrain/Loss (Raw)": 2.2760889530181885, "Pretrain/Step": 1879, "Pretrain/Step Time": 9.152985671535134} +{"Pretrain/Learning Rate": 4.6425805155735416e-05, "Pretrain/Loss": 2.101632595062256, "Pretrain/Loss (Raw)": 2.123579263687134, "Pretrain/Step": 1880, "Pretrain/Step Time": 9.15447179414332} +{"Pretrain/Learning Rate": 4.642142940418973e-05, "Pretrain/Loss": 2.103156805038452, "Pretrain/Loss (Raw)": 2.2680764198303223, "Pretrain/Step": 1881, "Pretrain/Step Time": 9.162167321890593} +{"Pretrain/Learning Rate": 4.641705118222387e-05, "Pretrain/Loss": 2.103238582611084, "Pretrain/Loss (Raw)": 2.135927677154541, "Pretrain/Step": 1882, "Pretrain/Step Time": 9.157370403409004} +{"Pretrain/Learning Rate": 4.6412670490342747e-05, "Pretrain/Loss": 2.1026463508605957, "Pretrain/Loss (Raw)": 2.0598645210266113, "Pretrain/Step": 1883, "Pretrain/Step Time": 9.160999963060021} +{"Pretrain/Learning Rate": 4.6408287329051556e-05, "Pretrain/Loss": 2.103048086166382, "Pretrain/Loss (Raw)": 2.0636184215545654, "Pretrain/Step": 1884, "Pretrain/Step Time": 9.167025927454233} +{"Pretrain/Learning Rate": 4.64039016988558e-05, "Pretrain/Loss": 2.10465669631958, "Pretrain/Loss (Raw)": 2.103515148162842, "Pretrain/Step": 1885, "Pretrain/Step Time": 9.158194739371538} +{"Pretrain/Learning Rate": 4.639951360026123e-05, "Pretrain/Loss": 2.1020865440368652, "Pretrain/Loss (Raw)": 1.9403314590454102, "Pretrain/Step": 1886, "Pretrain/Step Time": 9.142687857151031} +{"Pretrain/Learning Rate": 4.639512303377393e-05, "Pretrain/Loss": 2.1009864807128906, "Pretrain/Loss (Raw)": 2.0943193435668945, "Pretrain/Step": 1887, "Pretrain/Step Time": 9.141347849741578} +{"Pretrain/Learning Rate": 4.639072999990022e-05, "Pretrain/Loss": 2.101496696472168, "Pretrain/Loss (Raw)": 2.325873851776123, "Pretrain/Step": 1888, "Pretrain/Step Time": 9.142593758180737} +{"Pretrain/Learning Rate": 4.6386334499146724e-05, "Pretrain/Loss": 2.1023831367492676, "Pretrain/Loss (Raw)": 2.0576632022857666, "Pretrain/Step": 1889, "Pretrain/Step Time": 9.149600291624665} +{"Pretrain/Learning Rate": 4.638193653202035e-05, "Pretrain/Loss": 2.102822780609131, "Pretrain/Loss (Raw)": 2.2602436542510986, "Pretrain/Step": 1890, "Pretrain/Step Time": 9.156377730891109} +{"Pretrain/Learning Rate": 4.6377536099028315e-05, "Pretrain/Loss": 2.101862668991089, "Pretrain/Loss (Raw)": 1.987507939338684, "Pretrain/Step": 1891, "Pretrain/Step Time": 9.148025248199701} +{"Pretrain/Learning Rate": 4.637313320067808e-05, "Pretrain/Loss": 2.1017818450927734, "Pretrain/Loss (Raw)": 2.113070011138916, "Pretrain/Step": 1892, "Pretrain/Step Time": 9.15103298611939} +{"Pretrain/Learning Rate": 4.636872783747741e-05, "Pretrain/Loss": 2.099029064178467, "Pretrain/Loss (Raw)": 1.8666203022003174, "Pretrain/Step": 1893, "Pretrain/Step Time": 9.143053399398923} +{"Pretrain/Learning Rate": 4.636432000993435e-05, "Pretrain/Loss": 2.10037899017334, "Pretrain/Loss (Raw)": 2.1983234882354736, "Pretrain/Step": 1894, "Pretrain/Step Time": 9.104948414489627} +{"Pretrain/Learning Rate": 4.635990971855724e-05, "Pretrain/Loss": 2.0995404720306396, "Pretrain/Loss (Raw)": 2.051745653152466, "Pretrain/Step": 1895, "Pretrain/Step Time": 9.11233601346612} +{"Pretrain/Learning Rate": 4.6355496963854684e-05, "Pretrain/Loss": 2.1001675128936768, "Pretrain/Loss (Raw)": 2.014126777648926, "Pretrain/Step": 1896, "Pretrain/Step Time": 9.110718410462141} +{"Pretrain/Learning Rate": 4.635108174633559e-05, "Pretrain/Loss": 2.0988736152648926, "Pretrain/Loss (Raw)": 1.975968360900879, "Pretrain/Step": 1897, "Pretrain/Step Time": 9.168403232470155} +{"Pretrain/Learning Rate": 4.634666406650914e-05, "Pretrain/Loss": 2.098555564880371, "Pretrain/Loss (Raw)": 2.0125350952148438, "Pretrain/Step": 1898, "Pretrain/Step Time": 9.167378535494208} +{"Pretrain/Learning Rate": 4.63422439248848e-05, "Pretrain/Loss": 2.0980496406555176, "Pretrain/Loss (Raw)": 2.0638182163238525, "Pretrain/Step": 1899, "Pretrain/Step Time": 9.173122242093086} +{"Pretrain/Learning Rate": 4.633782132197232e-05, "Pretrain/Loss": 2.099775791168213, "Pretrain/Loss (Raw)": 2.1640429496765137, "Pretrain/Step": 1900, "Pretrain/Step Time": 9.162146165966988} +{"Pretrain/Learning Rate": 4.633339625828173e-05, "Pretrain/Loss": 2.100071430206299, "Pretrain/Loss (Raw)": 2.0745561122894287, "Pretrain/Step": 1901, "Pretrain/Step Time": 9.16436879709363} +{"Pretrain/Learning Rate": 4.632896873432338e-05, "Pretrain/Loss": 2.099457263946533, "Pretrain/Loss (Raw)": 2.085026741027832, "Pretrain/Step": 1902, "Pretrain/Step Time": 9.171162880957127} +{"Pretrain/Learning Rate": 4.632453875060784e-05, "Pretrain/Loss": 2.100813388824463, "Pretrain/Loss (Raw)": 2.089599847793579, "Pretrain/Step": 1903, "Pretrain/Step Time": 9.185539856553078} +{"Pretrain/Learning Rate": 4.6320106307646e-05, "Pretrain/Loss": 2.098374843597412, "Pretrain/Loss (Raw)": 1.9811500310897827, "Pretrain/Step": 1904, "Pretrain/Step Time": 9.209418296813965} +{"Pretrain/Learning Rate": 4.6315671405949046e-05, "Pretrain/Loss": 2.099006414413452, "Pretrain/Loss (Raw)": 2.208969831466675, "Pretrain/Step": 1905, "Pretrain/Step Time": 9.25038829818368} +{"Pretrain/Learning Rate": 4.631123404602842e-05, "Pretrain/Loss": 2.0997841358184814, "Pretrain/Loss (Raw)": 2.1799559593200684, "Pretrain/Step": 1906, "Pretrain/Step Time": 9.249984439462423} +{"Pretrain/Learning Rate": 4.630679422839585e-05, "Pretrain/Loss": 2.1011674404144287, "Pretrain/Loss (Raw)": 2.2127320766448975, "Pretrain/Step": 1907, "Pretrain/Step Time": 9.29839750751853} +{"Pretrain/Learning Rate": 4.6302351953563385e-05, "Pretrain/Loss": 2.1029446125030518, "Pretrain/Loss (Raw)": 2.355164051055908, "Pretrain/Step": 1908, "Pretrain/Step Time": 9.297197418287396} +{"Pretrain/Learning Rate": 4.629790722204331e-05, "Pretrain/Loss": 2.102827310562134, "Pretrain/Loss (Raw)": 2.1791646480560303, "Pretrain/Step": 1909, "Pretrain/Step Time": 9.303257875144482} +{"Pretrain/Learning Rate": 4.629346003434821e-05, "Pretrain/Loss": 2.1061878204345703, "Pretrain/Loss (Raw)": 2.088123083114624, "Pretrain/Step": 1910, "Pretrain/Step Time": 9.306018475443125} +{"Pretrain/Learning Rate": 4.628901039099096e-05, "Pretrain/Loss": 2.1043171882629395, "Pretrain/Loss (Raw)": 2.010307788848877, "Pretrain/Step": 1911, "Pretrain/Step Time": 9.302111687138677} +{"Pretrain/Learning Rate": 4.6284558292484724e-05, "Pretrain/Loss": 2.1056580543518066, "Pretrain/Loss (Raw)": 2.2809252738952637, "Pretrain/Step": 1912, "Pretrain/Step Time": 9.30024172179401} +{"Pretrain/Learning Rate": 4.628010373934292e-05, "Pretrain/Loss": 2.104004144668579, "Pretrain/Loss (Raw)": 1.9176335334777832, "Pretrain/Step": 1913, "Pretrain/Step Time": 9.304190956056118} +{"Pretrain/Learning Rate": 4.627564673207928e-05, "Pretrain/Loss": 2.1057205200195312, "Pretrain/Loss (Raw)": 1.9896278381347656, "Pretrain/Step": 1914, "Pretrain/Step Time": 9.297093274071813} +{"Pretrain/Learning Rate": 4.62711872712078e-05, "Pretrain/Loss": 2.106593132019043, "Pretrain/Loss (Raw)": 1.9855979681015015, "Pretrain/Step": 1915, "Pretrain/Step Time": 9.302755480632186} +{"Pretrain/Learning Rate": 4.626672535724278e-05, "Pretrain/Loss": 2.105400800704956, "Pretrain/Loss (Raw)": 2.0626001358032227, "Pretrain/Step": 1916, "Pretrain/Step Time": 9.305167902261019} +{"Pretrain/Learning Rate": 4.626226099069878e-05, "Pretrain/Loss": 2.1048057079315186, "Pretrain/Loss (Raw)": 1.9758996963500977, "Pretrain/Step": 1917, "Pretrain/Step Time": 9.318317515775561} +{"Pretrain/Learning Rate": 4.625779417209065e-05, "Pretrain/Loss": 2.1061787605285645, "Pretrain/Loss (Raw)": 2.2507095336914062, "Pretrain/Step": 1918, "Pretrain/Step Time": 9.309321703389287} +{"Pretrain/Learning Rate": 4.625332490193352e-05, "Pretrain/Loss": 2.1046762466430664, "Pretrain/Loss (Raw)": 1.9398236274719238, "Pretrain/Step": 1919, "Pretrain/Step Time": 9.28164791315794} +{"Pretrain/Learning Rate": 4.624885318074282e-05, "Pretrain/Loss": 2.10538649559021, "Pretrain/Loss (Raw)": 2.1062934398651123, "Pretrain/Step": 1920, "Pretrain/Step Time": 9.288785917684436} +{"Pretrain/Learning Rate": 4.624437900903424e-05, "Pretrain/Loss": 2.109147071838379, "Pretrain/Loss (Raw)": 2.2701022624969482, "Pretrain/Step": 1921, "Pretrain/Step Time": 9.285872599110007} +{"Pretrain/Learning Rate": 4.623990238732376e-05, "Pretrain/Loss": 2.108949899673462, "Pretrain/Loss (Raw)": 2.060173511505127, "Pretrain/Step": 1922, "Pretrain/Step Time": 9.288013169541955} +{"Pretrain/Learning Rate": 4.6235423316127655e-05, "Pretrain/Loss": 2.110262393951416, "Pretrain/Loss (Raw)": 2.2401390075683594, "Pretrain/Step": 1923, "Pretrain/Step Time": 9.293840138241649} +{"Pretrain/Learning Rate": 4.623094179596248e-05, "Pretrain/Loss": 2.110457420349121, "Pretrain/Loss (Raw)": 2.107848644256592, "Pretrain/Step": 1924, "Pretrain/Step Time": 9.283855378627777} +{"Pretrain/Learning Rate": 4.622645782734504e-05, "Pretrain/Loss": 2.1098928451538086, "Pretrain/Loss (Raw)": 2.1229310035705566, "Pretrain/Step": 1925, "Pretrain/Step Time": 9.28607377037406} +{"Pretrain/Learning Rate": 4.6221971410792466e-05, "Pretrain/Loss": 2.1089744567871094, "Pretrain/Loss (Raw)": 2.0824873447418213, "Pretrain/Step": 1926, "Pretrain/Step Time": 9.287051847204566} +{"Pretrain/Learning Rate": 4.621748254682214e-05, "Pretrain/Loss": 2.1070175170898438, "Pretrain/Loss (Raw)": 1.8041962385177612, "Pretrain/Step": 1927, "Pretrain/Step Time": 9.304145459085703} +{"Pretrain/Learning Rate": 4.621299123595176e-05, "Pretrain/Loss": 2.10687255859375, "Pretrain/Loss (Raw)": 2.037874937057495, "Pretrain/Step": 1928, "Pretrain/Step Time": 9.30278211273253} +{"Pretrain/Learning Rate": 4.620849747869926e-05, "Pretrain/Loss": 2.107341766357422, "Pretrain/Loss (Raw)": 2.1378512382507324, "Pretrain/Step": 1929, "Pretrain/Step Time": 9.30042109452188} +{"Pretrain/Learning Rate": 4.6204001275582904e-05, "Pretrain/Loss": 2.1048407554626465, "Pretrain/Loss (Raw)": 1.790211796760559, "Pretrain/Step": 1930, "Pretrain/Step Time": 9.337969651445746} +{"Pretrain/Learning Rate": 4.61995026271212e-05, "Pretrain/Loss": 2.102593421936035, "Pretrain/Loss (Raw)": 2.0337181091308594, "Pretrain/Step": 1931, "Pretrain/Step Time": 9.337126601487398} +{"Pretrain/Learning Rate": 4.619500153383296e-05, "Pretrain/Loss": 2.103520154953003, "Pretrain/Loss (Raw)": 2.168750762939453, "Pretrain/Step": 1932, "Pretrain/Step Time": 9.341993160545826} +{"Pretrain/Learning Rate": 4.619049799623726e-05, "Pretrain/Loss": 2.1030538082122803, "Pretrain/Loss (Raw)": 2.0450360774993896, "Pretrain/Step": 1933, "Pretrain/Step Time": 9.34315045364201} +{"Pretrain/Learning Rate": 4.618599201485349e-05, "Pretrain/Loss": 2.102548599243164, "Pretrain/Loss (Raw)": 2.0182647705078125, "Pretrain/Step": 1934, "Pretrain/Step Time": 9.310825284570456} +{"Pretrain/Learning Rate": 4.618148359020128e-05, "Pretrain/Loss": 2.101929187774658, "Pretrain/Loss (Raw)": 2.153486728668213, "Pretrain/Step": 1935, "Pretrain/Step Time": 9.30949936248362} +{"Pretrain/Learning Rate": 4.617697272280057e-05, "Pretrain/Loss": 2.101926326751709, "Pretrain/Loss (Raw)": 1.9671425819396973, "Pretrain/Step": 1936, "Pretrain/Step Time": 9.304714011028409} +{"Pretrain/Learning Rate": 4.6172459413171586e-05, "Pretrain/Loss": 2.100780963897705, "Pretrain/Loss (Raw)": 2.0355138778686523, "Pretrain/Step": 1937, "Pretrain/Step Time": 9.3094223998487} +{"Pretrain/Learning Rate": 4.616794366183481e-05, "Pretrain/Loss": 2.100503921508789, "Pretrain/Loss (Raw)": 2.112015724182129, "Pretrain/Step": 1938, "Pretrain/Step Time": 9.304856711998582} +{"Pretrain/Learning Rate": 4.616342546931102e-05, "Pretrain/Loss": 2.099726915359497, "Pretrain/Loss (Raw)": 2.008335828781128, "Pretrain/Step": 1939, "Pretrain/Step Time": 9.311910063028336} +{"Pretrain/Learning Rate": 4.6158904836121286e-05, "Pretrain/Loss": 2.099714994430542, "Pretrain/Loss (Raw)": 2.040468215942383, "Pretrain/Step": 1940, "Pretrain/Step Time": 9.315232114866376} +{"Pretrain/Learning Rate": 4.6154381762786936e-05, "Pretrain/Loss": 2.102165460586548, "Pretrain/Loss (Raw)": 2.3117685317993164, "Pretrain/Step": 1941, "Pretrain/Step Time": 9.31538381613791} +{"Pretrain/Learning Rate": 4.6149856249829606e-05, "Pretrain/Loss": 2.1028332710266113, "Pretrain/Loss (Raw)": 2.063725233078003, "Pretrain/Step": 1942, "Pretrain/Step Time": 9.31952497549355} +{"Pretrain/Learning Rate": 4.6145328297771183e-05, "Pretrain/Loss": 2.103018283843994, "Pretrain/Loss (Raw)": 2.364553451538086, "Pretrain/Step": 1943, "Pretrain/Step Time": 9.293252827599645} +{"Pretrain/Learning Rate": 4.614079790713387e-05, "Pretrain/Loss": 2.1050631999969482, "Pretrain/Loss (Raw)": 2.2129008769989014, "Pretrain/Step": 1944, "Pretrain/Step Time": 9.29621521010995} +{"Pretrain/Learning Rate": 4.613626507844012e-05, "Pretrain/Loss": 2.1036086082458496, "Pretrain/Loss (Raw)": 2.099963665008545, "Pretrain/Step": 1945, "Pretrain/Step Time": 9.29785049147904} +{"Pretrain/Learning Rate": 4.613172981221268e-05, "Pretrain/Loss": 2.103005886077881, "Pretrain/Loss (Raw)": 2.0612854957580566, "Pretrain/Step": 1946, "Pretrain/Step Time": 9.32423821091652} +{"Pretrain/Learning Rate": 4.612719210897459e-05, "Pretrain/Loss": 2.1025390625, "Pretrain/Loss (Raw)": 1.7861355543136597, "Pretrain/Step": 1947, "Pretrain/Step Time": 9.327277328819036} +{"Pretrain/Learning Rate": 4.612265196924914e-05, "Pretrain/Loss": 2.1022720336914062, "Pretrain/Loss (Raw)": 2.105888843536377, "Pretrain/Step": 1948, "Pretrain/Step Time": 9.323472553864121} +{"Pretrain/Learning Rate": 4.611810939355995e-05, "Pretrain/Loss": 2.1027135848999023, "Pretrain/Loss (Raw)": 2.099652051925659, "Pretrain/Step": 1949, "Pretrain/Step Time": 9.327859226614237} +{"Pretrain/Learning Rate": 4.611356438243085e-05, "Pretrain/Loss": 2.102634906768799, "Pretrain/Loss (Raw)": 2.185251474380493, "Pretrain/Step": 1950, "Pretrain/Step Time": 9.37340173125267} +{"Pretrain/Learning Rate": 4.610901693638603e-05, "Pretrain/Loss": 2.1017165184020996, "Pretrain/Loss (Raw)": 1.902185320854187, "Pretrain/Step": 1951, "Pretrain/Step Time": 9.388040039688349} +{"Pretrain/Learning Rate": 4.610446705594991e-05, "Pretrain/Loss": 2.1024556159973145, "Pretrain/Loss (Raw)": 2.098928689956665, "Pretrain/Step": 1952, "Pretrain/Step Time": 9.385154264047742} +{"Pretrain/Learning Rate": 4.6099914741647196e-05, "Pretrain/Loss": 2.101940393447876, "Pretrain/Loss (Raw)": 2.1324875354766846, "Pretrain/Step": 1953, "Pretrain/Step Time": 9.377346633002162} +{"Pretrain/Learning Rate": 4.609535999400289e-05, "Pretrain/Loss": 2.1025145053863525, "Pretrain/Loss (Raw)": 2.0364418029785156, "Pretrain/Step": 1954, "Pretrain/Step Time": 9.392184654250741} +{"Pretrain/Learning Rate": 4.6090802813542255e-05, "Pretrain/Loss": 2.1007657051086426, "Pretrain/Loss (Raw)": 1.978063702583313, "Pretrain/Step": 1955, "Pretrain/Step Time": 9.393473912030458} +{"Pretrain/Learning Rate": 4.608624320079087e-05, "Pretrain/Loss": 2.101919174194336, "Pretrain/Loss (Raw)": 2.1494181156158447, "Pretrain/Step": 1956, "Pretrain/Step Time": 9.39300873503089} +{"Pretrain/Learning Rate": 4.608168115627455e-05, "Pretrain/Loss": 2.101024627685547, "Pretrain/Loss (Raw)": 2.0661890506744385, "Pretrain/Step": 1957, "Pretrain/Step Time": 9.398713819682598} +{"Pretrain/Learning Rate": 4.607711668051942e-05, "Pretrain/Loss": 2.1044421195983887, "Pretrain/Loss (Raw)": 2.4995765686035156, "Pretrain/Step": 1958, "Pretrain/Step Time": 9.401431690901518} +{"Pretrain/Learning Rate": 4.6072549774051874e-05, "Pretrain/Loss": 2.1050639152526855, "Pretrain/Loss (Raw)": 2.224606990814209, "Pretrain/Step": 1959, "Pretrain/Step Time": 9.397877955809236} +{"Pretrain/Learning Rate": 4.60679804373986e-05, "Pretrain/Loss": 2.1051876544952393, "Pretrain/Loss (Raw)": 2.1353378295898438, "Pretrain/Step": 1960, "Pretrain/Step Time": 9.39616996049881} +{"Pretrain/Learning Rate": 4.606340867108653e-05, "Pretrain/Loss": 2.1045374870300293, "Pretrain/Loss (Raw)": 2.1219482421875, "Pretrain/Step": 1961, "Pretrain/Step Time": 9.402024697512388} +{"Pretrain/Learning Rate": 4.605883447564293e-05, "Pretrain/Loss": 2.105255603790283, "Pretrain/Loss (Raw)": 2.060289144515991, "Pretrain/Step": 1962, "Pretrain/Step Time": 9.401649463921785} +{"Pretrain/Learning Rate": 4.6054257851595303e-05, "Pretrain/Loss": 2.1040902137756348, "Pretrain/Loss (Raw)": 2.042417287826538, "Pretrain/Step": 1963, "Pretrain/Step Time": 9.446285212412477} +{"Pretrain/Learning Rate": 4.604967879947145e-05, "Pretrain/Loss": 2.104192018508911, "Pretrain/Loss (Raw)": 2.0896310806274414, "Pretrain/Step": 1964, "Pretrain/Step Time": 9.455300353467464} +{"Pretrain/Learning Rate": 4.6045097319799447e-05, "Pretrain/Loss": 2.104060173034668, "Pretrain/Loss (Raw)": 2.177971124649048, "Pretrain/Step": 1965, "Pretrain/Step Time": 9.461055414751172} +{"Pretrain/Learning Rate": 4.6040513413107655e-05, "Pretrain/Loss": 2.103663921356201, "Pretrain/Loss (Raw)": 2.01336669921875, "Pretrain/Step": 1966, "Pretrain/Step Time": 9.459830041974783} +{"Pretrain/Learning Rate": 4.603592707992471e-05, "Pretrain/Loss": 2.104642629623413, "Pretrain/Loss (Raw)": 2.1153225898742676, "Pretrain/Step": 1967, "Pretrain/Step Time": 9.470404578372836} +{"Pretrain/Learning Rate": 4.6031338320779534e-05, "Pretrain/Loss": 2.104464054107666, "Pretrain/Loss (Raw)": 2.0878655910491943, "Pretrain/Step": 1968, "Pretrain/Step Time": 9.473393285647035} +{"Pretrain/Learning Rate": 4.602674713620131e-05, "Pretrain/Loss": 2.1040539741516113, "Pretrain/Loss (Raw)": 2.1373581886291504, "Pretrain/Step": 1969, "Pretrain/Step Time": 9.469390513375401} +{"Pretrain/Learning Rate": 4.6022153526719536e-05, "Pretrain/Loss": 2.1034088134765625, "Pretrain/Loss (Raw)": 2.0713961124420166, "Pretrain/Step": 1970, "Pretrain/Step Time": 9.46938574127853} +{"Pretrain/Learning Rate": 4.601755749286395e-05, "Pretrain/Loss": 2.103006601333618, "Pretrain/Loss (Raw)": 2.15057373046875, "Pretrain/Step": 1971, "Pretrain/Step Time": 9.481554828584194} +{"Pretrain/Learning Rate": 4.6012959035164596e-05, "Pretrain/Loss": 2.104870319366455, "Pretrain/Loss (Raw)": 2.209609031677246, "Pretrain/Step": 1972, "Pretrain/Step Time": 9.479739317670465} +{"Pretrain/Learning Rate": 4.6008358154151794e-05, "Pretrain/Loss": 2.103039264678955, "Pretrain/Loss (Raw)": 1.9757635593414307, "Pretrain/Step": 1973, "Pretrain/Step Time": 9.492543110623956} +{"Pretrain/Learning Rate": 4.600375485035613e-05, "Pretrain/Loss": 2.1027753353118896, "Pretrain/Loss (Raw)": 2.0557665824890137, "Pretrain/Step": 1974, "Pretrain/Step Time": 9.49644667468965} +{"Pretrain/Learning Rate": 4.599914912430849e-05, "Pretrain/Loss": 2.1039369106292725, "Pretrain/Loss (Raw)": 2.1518359184265137, "Pretrain/Step": 1975, "Pretrain/Step Time": 9.49494599737227} +{"Pretrain/Learning Rate": 4.5994540976540013e-05, "Pretrain/Loss": 2.1014556884765625, "Pretrain/Loss (Raw)": 1.987765908241272, "Pretrain/Step": 1976, "Pretrain/Step Time": 9.497807033360004} +{"Pretrain/Learning Rate": 4.598993040758215e-05, "Pretrain/Loss": 2.099839925765991, "Pretrain/Loss (Raw)": 1.9451191425323486, "Pretrain/Step": 1977, "Pretrain/Step Time": 9.522172950208187} +{"Pretrain/Learning Rate": 4.59853174179666e-05, "Pretrain/Loss": 2.0983824729919434, "Pretrain/Loss (Raw)": 2.0121140480041504, "Pretrain/Step": 1978, "Pretrain/Step Time": 9.519548701122403} +{"Pretrain/Learning Rate": 4.5980702008225365e-05, "Pretrain/Loss": 2.1002724170684814, "Pretrain/Loss (Raw)": 2.24961256980896, "Pretrain/Step": 1979, "Pretrain/Step Time": 9.518794825300574} +{"Pretrain/Learning Rate": 4.59760841788907e-05, "Pretrain/Loss": 2.101301908493042, "Pretrain/Loss (Raw)": 2.154564380645752, "Pretrain/Step": 1980, "Pretrain/Step Time": 9.518135465681553} +{"Pretrain/Learning Rate": 4.597146393049517e-05, "Pretrain/Loss": 2.101212501525879, "Pretrain/Loss (Raw)": 2.1062989234924316, "Pretrain/Step": 1981, "Pretrain/Step Time": 9.526637328788638} +{"Pretrain/Learning Rate": 4.59668412635716e-05, "Pretrain/Loss": 2.1022305488586426, "Pretrain/Loss (Raw)": 2.1390929222106934, "Pretrain/Step": 1982, "Pretrain/Step Time": 9.53969189710915} +{"Pretrain/Learning Rate": 4.5962216178653095e-05, "Pretrain/Loss": 2.101973056793213, "Pretrain/Loss (Raw)": 2.0045952796936035, "Pretrain/Step": 1983, "Pretrain/Step Time": 9.555021675303578} +{"Pretrain/Learning Rate": 4.5957588676273046e-05, "Pretrain/Loss": 2.1022934913635254, "Pretrain/Loss (Raw)": 1.9685001373291016, "Pretrain/Step": 1984, "Pretrain/Step Time": 9.554957056418061} +{"Pretrain/Learning Rate": 4.595295875696511e-05, "Pretrain/Loss": 2.1017587184906006, "Pretrain/Loss (Raw)": 2.0347254276275635, "Pretrain/Step": 1985, "Pretrain/Step Time": 9.557032635435462} +{"Pretrain/Learning Rate": 4.5948326421263244e-05, "Pretrain/Loss": 2.1005797386169434, "Pretrain/Loss (Raw)": 2.1013777256011963, "Pretrain/Step": 1986, "Pretrain/Step Time": 9.54723098129034} +{"Pretrain/Learning Rate": 4.5943691669701654e-05, "Pretrain/Loss": 2.1012840270996094, "Pretrain/Loss (Raw)": 2.1606621742248535, "Pretrain/Step": 1987, "Pretrain/Step Time": 9.54187823086977} +{"Pretrain/Learning Rate": 4.593905450281486e-05, "Pretrain/Loss": 2.100353717803955, "Pretrain/Loss (Raw)": 2.0678341388702393, "Pretrain/Step": 1988, "Pretrain/Step Time": 9.59716479666531} +{"Pretrain/Learning Rate": 4.593441492113763e-05, "Pretrain/Loss": 2.0998425483703613, "Pretrain/Loss (Raw)": 1.9852252006530762, "Pretrain/Step": 1989, "Pretrain/Step Time": 9.597227931022644} +{"Pretrain/Learning Rate": 4.5929772925205014e-05, "Pretrain/Loss": 2.0989999771118164, "Pretrain/Loss (Raw)": 2.004310131072998, "Pretrain/Step": 1990, "Pretrain/Step Time": 9.614523276686668} +{"Pretrain/Learning Rate": 4.592512851555237e-05, "Pretrain/Loss": 2.098001480102539, "Pretrain/Loss (Raw)": 2.0476014614105225, "Pretrain/Step": 1991, "Pretrain/Step Time": 9.615097425878048} +{"Pretrain/Learning Rate": 4.592048169271531e-05, "Pretrain/Loss": 2.095773220062256, "Pretrain/Loss (Raw)": 1.8290361166000366, "Pretrain/Step": 1992, "Pretrain/Step Time": 9.614582331851125} +{"Pretrain/Learning Rate": 4.591583245722971e-05, "Pretrain/Loss": 2.095533609390259, "Pretrain/Loss (Raw)": 2.1090011596679688, "Pretrain/Step": 1993, "Pretrain/Step Time": 9.605338171124458} +{"Pretrain/Learning Rate": 4.591118080963176e-05, "Pretrain/Loss": 2.0963521003723145, "Pretrain/Loss (Raw)": 2.3404877185821533, "Pretrain/Step": 1994, "Pretrain/Step Time": 9.609345803037286} +{"Pretrain/Learning Rate": 4.590652675045789e-05, "Pretrain/Loss": 2.0963711738586426, "Pretrain/Loss (Raw)": 2.125281572341919, "Pretrain/Step": 1995, "Pretrain/Step Time": 9.61082917638123} +{"Pretrain/Learning Rate": 4.5901870280244855e-05, "Pretrain/Loss": 2.097172260284424, "Pretrain/Loss (Raw)": 2.1793768405914307, "Pretrain/Step": 1996, "Pretrain/Step Time": 9.582369165495038} +{"Pretrain/Learning Rate": 4.589721139952964e-05, "Pretrain/Loss": 2.0974974632263184, "Pretrain/Loss (Raw)": 2.1498162746429443, "Pretrain/Step": 1997, "Pretrain/Step Time": 9.581170532852411} +{"Pretrain/Learning Rate": 4.589255010884953e-05, "Pretrain/Loss": 2.097357749938965, "Pretrain/Loss (Raw)": 2.109614849090576, "Pretrain/Step": 1998, "Pretrain/Step Time": 9.527713440358639} +{"Pretrain/Learning Rate": 4.58878864087421e-05, "Pretrain/Loss": 2.0944485664367676, "Pretrain/Loss (Raw)": 1.8656193017959595, "Pretrain/Step": 1999, "Pretrain/Step Time": 9.523989045992494} +{"Pretrain/Learning Rate": 4.5883220299745176e-05, "Pretrain/Loss": 2.0932199954986572, "Pretrain/Loss (Raw)": 2.090763568878174, "Pretrain/Step": 2000, "Pretrain/Step Time": 9.52746357396245} +{"Pretrain/Learning Rate": 4.587855178239689e-05, "Pretrain/Loss": 2.09470272064209, "Pretrain/Loss (Raw)": 2.2558445930480957, "Pretrain/Step": 2001, "Pretrain/Step Time": 9.529382336884737} +{"Pretrain/Learning Rate": 4.587388085723562e-05, "Pretrain/Loss": 2.0937042236328125, "Pretrain/Loss (Raw)": 2.0675549507141113, "Pretrain/Step": 2002, "Pretrain/Step Time": 9.520220343023539} +{"Pretrain/Learning Rate": 4.586920752480006e-05, "Pretrain/Loss": 2.094527006149292, "Pretrain/Loss (Raw)": 2.0645341873168945, "Pretrain/Step": 2003, "Pretrain/Step Time": 9.515580005943775} +{"Pretrain/Learning Rate": 4.5864531785629136e-05, "Pretrain/Loss": 2.093419075012207, "Pretrain/Loss (Raw)": 1.9664223194122314, "Pretrain/Step": 2004, "Pretrain/Step Time": 9.517085153609514} +{"Pretrain/Learning Rate": 4.5859853640262104e-05, "Pretrain/Loss": 2.093289852142334, "Pretrain/Loss (Raw)": 2.1922030448913574, "Pretrain/Step": 2005, "Pretrain/Step Time": 9.508312407881021} +{"Pretrain/Learning Rate": 4.5855173089238445e-05, "Pretrain/Loss": 2.092365264892578, "Pretrain/Loss (Raw)": 2.165064573287964, "Pretrain/Step": 2006, "Pretrain/Step Time": 9.513421768322587} +{"Pretrain/Learning Rate": 4.5850490133097957e-05, "Pretrain/Loss": 2.0925745964050293, "Pretrain/Loss (Raw)": 2.3028619289398193, "Pretrain/Step": 2007, "Pretrain/Step Time": 9.506205782294273} +{"Pretrain/Learning Rate": 4.584580477238069e-05, "Pretrain/Loss": 2.093458652496338, "Pretrain/Loss (Raw)": 2.2367289066314697, "Pretrain/Step": 2008, "Pretrain/Step Time": 9.515661638230085} +{"Pretrain/Learning Rate": 4.5841117007627e-05, "Pretrain/Loss": 2.09100079536438, "Pretrain/Loss (Raw)": 1.9534703493118286, "Pretrain/Step": 2009, "Pretrain/Step Time": 9.510213781148195} +{"Pretrain/Learning Rate": 4.583642683937748e-05, "Pretrain/Loss": 2.0921027660369873, "Pretrain/Loss (Raw)": 2.276988983154297, "Pretrain/Step": 2010, "Pretrain/Step Time": 9.515134572982788} +{"Pretrain/Learning Rate": 4.583173426817304e-05, "Pretrain/Loss": 2.0917177200317383, "Pretrain/Loss (Raw)": 2.010591745376587, "Pretrain/Step": 2011, "Pretrain/Step Time": 9.51540500111878} +{"Pretrain/Learning Rate": 4.5827039294554833e-05, "Pretrain/Loss": 2.091038465499878, "Pretrain/Loss (Raw)": 1.976676106452942, "Pretrain/Step": 2012, "Pretrain/Step Time": 9.513098038733006} +{"Pretrain/Learning Rate": 4.582234191906432e-05, "Pretrain/Loss": 2.09169864654541, "Pretrain/Loss (Raw)": 2.1880006790161133, "Pretrain/Step": 2013, "Pretrain/Step Time": 9.53259314224124} +{"Pretrain/Learning Rate": 4.581764214224322e-05, "Pretrain/Loss": 2.089874267578125, "Pretrain/Loss (Raw)": 1.7068411111831665, "Pretrain/Step": 2014, "Pretrain/Step Time": 9.52959149517119} +{"Pretrain/Learning Rate": 4.581293996463353e-05, "Pretrain/Loss": 2.090932607650757, "Pretrain/Loss (Raw)": 2.2297723293304443, "Pretrain/Step": 2015, "Pretrain/Step Time": 9.52651841007173} +{"Pretrain/Learning Rate": 4.580823538677753e-05, "Pretrain/Loss": 2.0907483100891113, "Pretrain/Loss (Raw)": 2.3022701740264893, "Pretrain/Step": 2016, "Pretrain/Step Time": 9.54235690832138} +{"Pretrain/Learning Rate": 4.580352840921777e-05, "Pretrain/Loss": 2.091904401779175, "Pretrain/Loss (Raw)": 2.205651044845581, "Pretrain/Step": 2017, "Pretrain/Step Time": 9.564822221174836} +{"Pretrain/Learning Rate": 4.579881903249709e-05, "Pretrain/Loss": 2.090146064758301, "Pretrain/Loss (Raw)": 2.035173177719116, "Pretrain/Step": 2018, "Pretrain/Step Time": 9.55988055281341} +{"Pretrain/Learning Rate": 4.5794107257158595e-05, "Pretrain/Loss": 2.090892791748047, "Pretrain/Loss (Raw)": 2.0830821990966797, "Pretrain/Step": 2019, "Pretrain/Step Time": 9.561445573344827} +{"Pretrain/Learning Rate": 4.578939308374566e-05, "Pretrain/Loss": 2.090378761291504, "Pretrain/Loss (Raw)": 2.0472846031188965, "Pretrain/Step": 2020, "Pretrain/Step Time": 9.551606742665172} +{"Pretrain/Learning Rate": 4.578467651280195e-05, "Pretrain/Loss": 2.0921082496643066, "Pretrain/Loss (Raw)": 2.0879788398742676, "Pretrain/Step": 2021, "Pretrain/Step Time": 9.563286429271102} +{"Pretrain/Learning Rate": 4.57799575448714e-05, "Pretrain/Loss": 2.092630386352539, "Pretrain/Loss (Raw)": 2.2652008533477783, "Pretrain/Step": 2022, "Pretrain/Step Time": 9.572539921849966} +{"Pretrain/Learning Rate": 4.5775236180498235e-05, "Pretrain/Loss": 2.0930538177490234, "Pretrain/Loss (Raw)": 2.105909585952759, "Pretrain/Step": 2023, "Pretrain/Step Time": 9.57487989589572} +{"Pretrain/Learning Rate": 4.5770512420226934e-05, "Pretrain/Loss": 2.094529628753662, "Pretrain/Loss (Raw)": 2.2030551433563232, "Pretrain/Step": 2024, "Pretrain/Step Time": 9.574768235906959} +{"Pretrain/Learning Rate": 4.5765786264602274e-05, "Pretrain/Loss": 2.0952765941619873, "Pretrain/Loss (Raw)": 2.071549892425537, "Pretrain/Step": 2025, "Pretrain/Step Time": 9.514881733804941} +{"Pretrain/Learning Rate": 4.5761057714169284e-05, "Pretrain/Loss": 2.095219612121582, "Pretrain/Loss (Raw)": 2.0052363872528076, "Pretrain/Step": 2026, "Pretrain/Step Time": 9.509676583111286} +{"Pretrain/Learning Rate": 4.575632676947329e-05, "Pretrain/Loss": 2.094921112060547, "Pretrain/Loss (Raw)": 2.025616407394409, "Pretrain/Step": 2027, "Pretrain/Step Time": 9.502379527315497} +{"Pretrain/Learning Rate": 4.575159343105988e-05, "Pretrain/Loss": 2.093052864074707, "Pretrain/Loss (Raw)": 1.9249193668365479, "Pretrain/Step": 2028, "Pretrain/Step Time": 9.507478188723326} +{"Pretrain/Learning Rate": 4.5746857699474946e-05, "Pretrain/Loss": 2.0923874378204346, "Pretrain/Loss (Raw)": 1.9893758296966553, "Pretrain/Step": 2029, "Pretrain/Step Time": 9.511883571743965} +{"Pretrain/Learning Rate": 4.574211957526461e-05, "Pretrain/Loss": 2.092909336090088, "Pretrain/Loss (Raw)": 2.1518218517303467, "Pretrain/Step": 2030, "Pretrain/Step Time": 9.505968110635877} +{"Pretrain/Learning Rate": 4.57373790589753e-05, "Pretrain/Loss": 2.092508316040039, "Pretrain/Loss (Raw)": 2.038297176361084, "Pretrain/Step": 2031, "Pretrain/Step Time": 9.551715459674597} +{"Pretrain/Learning Rate": 4.573263615115372e-05, "Pretrain/Loss": 2.0927834510803223, "Pretrain/Loss (Raw)": 2.016357183456421, "Pretrain/Step": 2032, "Pretrain/Step Time": 9.531117057427764} +{"Pretrain/Learning Rate": 4.572789085234686e-05, "Pretrain/Loss": 2.0931596755981445, "Pretrain/Loss (Raw)": 2.257122039794922, "Pretrain/Step": 2033, "Pretrain/Step Time": 9.503668399527669} +{"Pretrain/Learning Rate": 4.5723143163101934e-05, "Pretrain/Loss": 2.095932960510254, "Pretrain/Loss (Raw)": 2.5349245071411133, "Pretrain/Step": 2034, "Pretrain/Step Time": 9.514839405193925} +{"Pretrain/Learning Rate": 4.571839308396649e-05, "Pretrain/Loss": 2.0961387157440186, "Pretrain/Loss (Raw)": 2.239074230194092, "Pretrain/Step": 2035, "Pretrain/Step Time": 9.470793416723609} +{"Pretrain/Learning Rate": 4.571364061548834e-05, "Pretrain/Loss": 2.0935628414154053, "Pretrain/Loss (Raw)": 2.02546763420105, "Pretrain/Step": 2036, "Pretrain/Step Time": 9.466003211215138} +{"Pretrain/Learning Rate": 4.5708885758215543e-05, "Pretrain/Loss": 2.0925331115722656, "Pretrain/Loss (Raw)": 2.0473670959472656, "Pretrain/Step": 2037, "Pretrain/Step Time": 9.459250096231699} +{"Pretrain/Learning Rate": 4.570412851269645e-05, "Pretrain/Loss": 2.0930371284484863, "Pretrain/Loss (Raw)": 2.152615785598755, "Pretrain/Step": 2038, "Pretrain/Step Time": 9.456623489037156} +{"Pretrain/Learning Rate": 4.56993688794797e-05, "Pretrain/Loss": 2.0954232215881348, "Pretrain/Loss (Raw)": 2.3157355785369873, "Pretrain/Step": 2039, "Pretrain/Step Time": 9.454725932329893} +{"Pretrain/Learning Rate": 4.5694606859114196e-05, "Pretrain/Loss": 2.093562602996826, "Pretrain/Loss (Raw)": 2.042757749557495, "Pretrain/Step": 2040, "Pretrain/Step Time": 9.452795177698135} +{"Pretrain/Learning Rate": 4.5689842452149114e-05, "Pretrain/Loss": 2.0957703590393066, "Pretrain/Loss (Raw)": 2.2002339363098145, "Pretrain/Step": 2041, "Pretrain/Step Time": 9.44946994446218} +{"Pretrain/Learning Rate": 4.56850756591339e-05, "Pretrain/Loss": 2.096900701522827, "Pretrain/Loss (Raw)": 2.1343162059783936, "Pretrain/Step": 2042, "Pretrain/Step Time": 9.444872645661235} +{"Pretrain/Learning Rate": 4.56803064806183e-05, "Pretrain/Loss": 2.098055362701416, "Pretrain/Loss (Raw)": 2.13337779045105, "Pretrain/Step": 2043, "Pretrain/Step Time": 9.415713876485825} +{"Pretrain/Learning Rate": 4.567553491715229e-05, "Pretrain/Loss": 2.096184730529785, "Pretrain/Loss (Raw)": 1.8231632709503174, "Pretrain/Step": 2044, "Pretrain/Step Time": 9.416083199903369} +{"Pretrain/Learning Rate": 4.567076096928618e-05, "Pretrain/Loss": 2.097141981124878, "Pretrain/Loss (Raw)": 2.0984408855438232, "Pretrain/Step": 2045, "Pretrain/Step Time": 9.404032796621323} +{"Pretrain/Learning Rate": 4.566598463757051e-05, "Pretrain/Loss": 2.094545602798462, "Pretrain/Loss (Raw)": 1.9183772802352905, "Pretrain/Step": 2046, "Pretrain/Step Time": 9.40668679960072} +{"Pretrain/Learning Rate": 4.56612059225561e-05, "Pretrain/Loss": 2.095552682876587, "Pretrain/Loss (Raw)": 2.068725347518921, "Pretrain/Step": 2047, "Pretrain/Step Time": 9.400098400190473} +{"Pretrain/Learning Rate": 4.565642482479408e-05, "Pretrain/Loss": 2.094653606414795, "Pretrain/Loss (Raw)": 1.991206407546997, "Pretrain/Step": 2048, "Pretrain/Step Time": 9.400084175169468} +{"Pretrain/Learning Rate": 4.565164134483581e-05, "Pretrain/Loss": 2.094041347503662, "Pretrain/Loss (Raw)": 2.191711902618408, "Pretrain/Step": 2049, "Pretrain/Step Time": 9.401428394019604} +{"Pretrain/Learning Rate": 4.5646855483232935e-05, "Pretrain/Loss": 2.0934529304504395, "Pretrain/Loss (Raw)": 1.9848695993423462, "Pretrain/Step": 2050, "Pretrain/Step Time": 9.397977404296398} +{"Pretrain/Learning Rate": 4.56420672405374e-05, "Pretrain/Loss": 2.094468832015991, "Pretrain/Loss (Raw)": 2.3701727390289307, "Pretrain/Step": 2051, "Pretrain/Step Time": 9.395503679290414} +{"Pretrain/Learning Rate": 4.563727661730141e-05, "Pretrain/Loss": 2.0953903198242188, "Pretrain/Loss (Raw)": 2.225830316543579, "Pretrain/Step": 2052, "Pretrain/Step Time": 9.39392938837409} +{"Pretrain/Learning Rate": 4.563248361407743e-05, "Pretrain/Loss": 2.095388412475586, "Pretrain/Loss (Raw)": 2.122636079788208, "Pretrain/Step": 2053, "Pretrain/Step Time": 9.399482667446136} +{"Pretrain/Learning Rate": 4.562768823141821e-05, "Pretrain/Loss": 2.096719741821289, "Pretrain/Loss (Raw)": 2.252945899963379, "Pretrain/Step": 2054, "Pretrain/Step Time": 9.394962752237916} +{"Pretrain/Learning Rate": 4.562289046987679e-05, "Pretrain/Loss": 2.097299814224243, "Pretrain/Loss (Raw)": 1.8784223794937134, "Pretrain/Step": 2055, "Pretrain/Step Time": 9.381115213036537} +{"Pretrain/Learning Rate": 4.561809033000646e-05, "Pretrain/Loss": 2.097982406616211, "Pretrain/Loss (Raw)": 2.1252570152282715, "Pretrain/Step": 2056, "Pretrain/Step Time": 9.386434722691774} +{"Pretrain/Learning Rate": 4.5613287812360796e-05, "Pretrain/Loss": 2.0971901416778564, "Pretrain/Loss (Raw)": 2.0364279747009277, "Pretrain/Step": 2057, "Pretrain/Step Time": 9.387916577979922} +{"Pretrain/Learning Rate": 4.560848291749365e-05, "Pretrain/Loss": 2.0984604358673096, "Pretrain/Loss (Raw)": 1.9528075456619263, "Pretrain/Step": 2058, "Pretrain/Step Time": 9.346053797751665} +{"Pretrain/Learning Rate": 4.560367564595914e-05, "Pretrain/Loss": 2.097407579421997, "Pretrain/Loss (Raw)": 1.8989423513412476, "Pretrain/Step": 2059, "Pretrain/Step Time": 9.34861308708787} +{"Pretrain/Learning Rate": 4.559886599831167e-05, "Pretrain/Loss": 2.095707893371582, "Pretrain/Loss (Raw)": 1.9512115716934204, "Pretrain/Step": 2060, "Pretrain/Step Time": 9.362168153747916} +{"Pretrain/Learning Rate": 4.559405397510591e-05, "Pretrain/Loss": 2.0955851078033447, "Pretrain/Loss (Raw)": 2.0293188095092773, "Pretrain/Step": 2061, "Pretrain/Step Time": 9.362887782976031} +{"Pretrain/Learning Rate": 4.55892395768968e-05, "Pretrain/Loss": 2.0953354835510254, "Pretrain/Loss (Raw)": 1.986336588859558, "Pretrain/Step": 2062, "Pretrain/Step Time": 9.4074247777462} +{"Pretrain/Learning Rate": 4.5584422804239566e-05, "Pretrain/Loss": 2.095770835876465, "Pretrain/Loss (Raw)": 2.209182024002075, "Pretrain/Step": 2063, "Pretrain/Step Time": 9.441085558384657} +{"Pretrain/Learning Rate": 4.55796036576897e-05, "Pretrain/Loss": 2.0971665382385254, "Pretrain/Loss (Raw)": 2.1458120346069336, "Pretrain/Step": 2064, "Pretrain/Step Time": 9.444884289056063} +{"Pretrain/Learning Rate": 4.557478213780295e-05, "Pretrain/Loss": 2.099048137664795, "Pretrain/Loss (Raw)": 2.2763307094573975, "Pretrain/Step": 2065, "Pretrain/Step Time": 9.440234996378422} +{"Pretrain/Learning Rate": 4.556995824513539e-05, "Pretrain/Loss": 2.0987653732299805, "Pretrain/Loss (Raw)": 2.0758206844329834, "Pretrain/Step": 2066, "Pretrain/Step Time": 9.439622819423676} +{"Pretrain/Learning Rate": 4.5565131980243305e-05, "Pretrain/Loss": 2.099522352218628, "Pretrain/Loss (Raw)": 2.1052420139312744, "Pretrain/Step": 2067, "Pretrain/Step Time": 9.449047207832336} +{"Pretrain/Learning Rate": 4.55603033436833e-05, "Pretrain/Loss": 2.099376678466797, "Pretrain/Loss (Raw)": 2.021821975708008, "Pretrain/Step": 2068, "Pretrain/Step Time": 9.445032354444265} +{"Pretrain/Learning Rate": 4.555547233601223e-05, "Pretrain/Loss": 2.0978126525878906, "Pretrain/Loss (Raw)": 2.1115589141845703, "Pretrain/Step": 2069, "Pretrain/Step Time": 9.440960418432951} +{"Pretrain/Learning Rate": 4.555063895778723e-05, "Pretrain/Loss": 2.097790241241455, "Pretrain/Loss (Raw)": 2.060880661010742, "Pretrain/Step": 2070, "Pretrain/Step Time": 9.439499147236347} +{"Pretrain/Learning Rate": 4.5545803209565704e-05, "Pretrain/Loss": 2.0949630737304688, "Pretrain/Loss (Raw)": 2.0026590824127197, "Pretrain/Step": 2071, "Pretrain/Step Time": 9.44374187104404} +{"Pretrain/Learning Rate": 4.554096509190534e-05, "Pretrain/Loss": 2.095071315765381, "Pretrain/Loss (Raw)": 2.2267653942108154, "Pretrain/Step": 2072, "Pretrain/Step Time": 9.432813066989183} +{"Pretrain/Learning Rate": 4.5536124605364085e-05, "Pretrain/Loss": 2.0954298973083496, "Pretrain/Loss (Raw)": 2.145859956741333, "Pretrain/Step": 2073, "Pretrain/Step Time": 9.429778505116701} +{"Pretrain/Learning Rate": 4.553128175050018e-05, "Pretrain/Loss": 2.0942788124084473, "Pretrain/Loss (Raw)": 1.9139487743377686, "Pretrain/Step": 2074, "Pretrain/Step Time": 9.400636674836278} +{"Pretrain/Learning Rate": 4.552643652787211e-05, "Pretrain/Loss": 2.0960516929626465, "Pretrain/Loss (Raw)": 2.013036012649536, "Pretrain/Step": 2075, "Pretrain/Step Time": 9.397835357114673} +{"Pretrain/Learning Rate": 4.552158893803865e-05, "Pretrain/Loss": 2.095794200897217, "Pretrain/Loss (Raw)": 2.0729658603668213, "Pretrain/Step": 2076, "Pretrain/Step Time": 9.396617395803332} +{"Pretrain/Learning Rate": 4.551673898155886e-05, "Pretrain/Loss": 2.095418691635132, "Pretrain/Loss (Raw)": 2.0515739917755127, "Pretrain/Step": 2077, "Pretrain/Step Time": 9.395822102203965} +{"Pretrain/Learning Rate": 4.5511886658992055e-05, "Pretrain/Loss": 2.0944995880126953, "Pretrain/Loss (Raw)": 2.067633867263794, "Pretrain/Step": 2078, "Pretrain/Step Time": 9.354703199118376} +{"Pretrain/Learning Rate": 4.550703197089782e-05, "Pretrain/Loss": 2.0948877334594727, "Pretrain/Loss (Raw)": 1.9518591165542603, "Pretrain/Step": 2079, "Pretrain/Step Time": 9.341471761465073} +{"Pretrain/Learning Rate": 4.550217491783603e-05, "Pretrain/Loss": 2.0960166454315186, "Pretrain/Loss (Raw)": 2.2434146404266357, "Pretrain/Step": 2080, "Pretrain/Step Time": 9.345629129558802} +{"Pretrain/Learning Rate": 4.549731550036682e-05, "Pretrain/Loss": 2.094855785369873, "Pretrain/Loss (Raw)": 1.9838908910751343, "Pretrain/Step": 2081, "Pretrain/Step Time": 9.348081957548857} +{"Pretrain/Learning Rate": 4.5492453719050596e-05, "Pretrain/Loss": 2.094935417175293, "Pretrain/Loss (Raw)": 2.046642303466797, "Pretrain/Step": 2082, "Pretrain/Step Time": 9.339424336329103} +{"Pretrain/Learning Rate": 4.5487589574448046e-05, "Pretrain/Loss": 2.096737861633301, "Pretrain/Loss (Raw)": 2.20876407623291, "Pretrain/Step": 2083, "Pretrain/Step Time": 9.34010966308415} +{"Pretrain/Learning Rate": 4.5482723067120124e-05, "Pretrain/Loss": 2.097404956817627, "Pretrain/Loss (Raw)": 2.2348039150238037, "Pretrain/Step": 2084, "Pretrain/Step Time": 9.33818613179028} +{"Pretrain/Learning Rate": 4.547785419762807e-05, "Pretrain/Loss": 2.0978097915649414, "Pretrain/Loss (Raw)": 2.11801815032959, "Pretrain/Step": 2085, "Pretrain/Step Time": 9.327822618186474} +{"Pretrain/Learning Rate": 4.547298296653336e-05, "Pretrain/Loss": 2.0953595638275146, "Pretrain/Loss (Raw)": 2.185941696166992, "Pretrain/Step": 2086, "Pretrain/Step Time": 9.33086202479899} +{"Pretrain/Learning Rate": 4.5468109374397796e-05, "Pretrain/Loss": 2.092252016067505, "Pretrain/Loss (Raw)": 1.8268438577651978, "Pretrain/Step": 2087, "Pretrain/Step Time": 9.333273719996214} +{"Pretrain/Learning Rate": 4.54632334217834e-05, "Pretrain/Loss": 2.0923895835876465, "Pretrain/Loss (Raw)": 2.152974843978882, "Pretrain/Step": 2088, "Pretrain/Step Time": 9.333739768713713} +{"Pretrain/Learning Rate": 4.545835510925251e-05, "Pretrain/Loss": 2.0924770832061768, "Pretrain/Loss (Raw)": 2.133131980895996, "Pretrain/Step": 2089, "Pretrain/Step Time": 9.334541372954845} +{"Pretrain/Learning Rate": 4.5453474437367695e-05, "Pretrain/Loss": 2.0938329696655273, "Pretrain/Loss (Raw)": 2.233858585357666, "Pretrain/Step": 2090, "Pretrain/Step Time": 9.336426101624966} +{"Pretrain/Learning Rate": 4.544859140669183e-05, "Pretrain/Loss": 2.092665672302246, "Pretrain/Loss (Raw)": 1.8929678201675415, "Pretrain/Step": 2091, "Pretrain/Step Time": 9.298760848119855} +{"Pretrain/Learning Rate": 4.5443706017788054e-05, "Pretrain/Loss": 2.0929152965545654, "Pretrain/Loss (Raw)": 2.121591091156006, "Pretrain/Step": 2092, "Pretrain/Step Time": 9.292384635657072} +{"Pretrain/Learning Rate": 4.5438818271219765e-05, "Pretrain/Loss": 2.0899219512939453, "Pretrain/Loss (Raw)": 1.7948415279388428, "Pretrain/Step": 2093, "Pretrain/Step Time": 9.279667235910892} +{"Pretrain/Learning Rate": 4.5433928167550634e-05, "Pretrain/Loss": 2.0924673080444336, "Pretrain/Loss (Raw)": 2.3391690254211426, "Pretrain/Step": 2094, "Pretrain/Step Time": 9.285656671971083} +{"Pretrain/Learning Rate": 4.542903570734463e-05, "Pretrain/Loss": 2.092928886413574, "Pretrain/Loss (Raw)": 2.174367904663086, "Pretrain/Step": 2095, "Pretrain/Step Time": 9.274790361523628} +{"Pretrain/Learning Rate": 4.542414089116595e-05, "Pretrain/Loss": 2.0936765670776367, "Pretrain/Loss (Raw)": 2.183581829071045, "Pretrain/Step": 2096, "Pretrain/Step Time": 9.276470242068172} +{"Pretrain/Learning Rate": 4.541924371957911e-05, "Pretrain/Loss": 2.091218948364258, "Pretrain/Loss (Raw)": 1.8227760791778564, "Pretrain/Step": 2097, "Pretrain/Step Time": 9.292928386479616} +{"Pretrain/Learning Rate": 4.5414344193148866e-05, "Pretrain/Loss": 2.088646650314331, "Pretrain/Loss (Raw)": 1.7421625852584839, "Pretrain/Step": 2098, "Pretrain/Step Time": 9.30135658197105} +{"Pretrain/Learning Rate": 4.540944231244025e-05, "Pretrain/Loss": 2.0885980129241943, "Pretrain/Loss (Raw)": 2.14432430267334, "Pretrain/Step": 2099, "Pretrain/Step Time": 9.302508169785142} +{"Pretrain/Learning Rate": 4.540453807801858e-05, "Pretrain/Loss": 2.088352680206299, "Pretrain/Loss (Raw)": 2.178227424621582, "Pretrain/Step": 2100, "Pretrain/Step Time": 9.302405629307032} +{"Pretrain/Learning Rate": 4.539963149044943e-05, "Pretrain/Loss": 2.088298797607422, "Pretrain/Loss (Raw)": 1.9688671827316284, "Pretrain/Step": 2101, "Pretrain/Step Time": 9.290869552642107} +{"Pretrain/Learning Rate": 4.539472255029864e-05, "Pretrain/Loss": 2.088965892791748, "Pretrain/Loss (Raw)": 2.141141176223755, "Pretrain/Step": 2102, "Pretrain/Step Time": 9.28657135926187} +{"Pretrain/Learning Rate": 4.538981125813235e-05, "Pretrain/Loss": 2.0877914428710938, "Pretrain/Loss (Raw)": 2.0014991760253906, "Pretrain/Step": 2103, "Pretrain/Step Time": 9.286280559375882} +{"Pretrain/Learning Rate": 4.538489761451694e-05, "Pretrain/Loss": 2.0882911682128906, "Pretrain/Loss (Raw)": 2.0517585277557373, "Pretrain/Step": 2104, "Pretrain/Step Time": 9.28443761728704} +{"Pretrain/Learning Rate": 4.537998162001909e-05, "Pretrain/Loss": 2.087149143218994, "Pretrain/Loss (Raw)": 1.798907995223999, "Pretrain/Step": 2105, "Pretrain/Step Time": 9.261031730100513} +{"Pretrain/Learning Rate": 4.537506327520571e-05, "Pretrain/Loss": 2.087512969970703, "Pretrain/Loss (Raw)": 2.058713912963867, "Pretrain/Step": 2106, "Pretrain/Step Time": 9.258639140054584} +{"Pretrain/Learning Rate": 4.5370142580644036e-05, "Pretrain/Loss": 2.086332321166992, "Pretrain/Loss (Raw)": 2.098478078842163, "Pretrain/Step": 2107, "Pretrain/Step Time": 9.259616805240512} +{"Pretrain/Learning Rate": 4.536521953690153e-05, "Pretrain/Loss": 2.0863823890686035, "Pretrain/Loss (Raw)": 2.160980463027954, "Pretrain/Step": 2108, "Pretrain/Step Time": 9.263045383617282} +{"Pretrain/Learning Rate": 4.5360294144545946e-05, "Pretrain/Loss": 2.087371826171875, "Pretrain/Loss (Raw)": 2.2329177856445312, "Pretrain/Step": 2109, "Pretrain/Step Time": 9.254940874874592} +{"Pretrain/Learning Rate": 4.5355366404145294e-05, "Pretrain/Loss": 2.0862162113189697, "Pretrain/Loss (Raw)": 1.991219401359558, "Pretrain/Step": 2110, "Pretrain/Step Time": 9.246247589588165} +{"Pretrain/Learning Rate": 4.5350436316267876e-05, "Pretrain/Loss": 2.085618495941162, "Pretrain/Loss (Raw)": 1.9280451536178589, "Pretrain/Step": 2111, "Pretrain/Step Time": 9.22585548646748} +{"Pretrain/Learning Rate": 4.534550388148224e-05, "Pretrain/Loss": 2.0870120525360107, "Pretrain/Loss (Raw)": 2.146890878677368, "Pretrain/Step": 2112, "Pretrain/Step Time": 9.230536412447691} +{"Pretrain/Learning Rate": 4.5340569100357235e-05, "Pretrain/Loss": 2.0873003005981445, "Pretrain/Loss (Raw)": 2.0716395378112793, "Pretrain/Step": 2113, "Pretrain/Step Time": 9.225193500518799} +{"Pretrain/Learning Rate": 4.5335631973461944e-05, "Pretrain/Loss": 2.0885438919067383, "Pretrain/Loss (Raw)": 2.2605597972869873, "Pretrain/Step": 2114, "Pretrain/Step Time": 9.227959331125021} +{"Pretrain/Learning Rate": 4.5330692501365755e-05, "Pretrain/Loss": 2.0893797874450684, "Pretrain/Loss (Raw)": 2.267612934112549, "Pretrain/Step": 2115, "Pretrain/Step Time": 9.233864825218916} +{"Pretrain/Learning Rate": 4.532575068463831e-05, "Pretrain/Loss": 2.090872287750244, "Pretrain/Loss (Raw)": 2.258887529373169, "Pretrain/Step": 2116, "Pretrain/Step Time": 9.177808698266745} +{"Pretrain/Learning Rate": 4.532080652384951e-05, "Pretrain/Loss": 2.090010166168213, "Pretrain/Loss (Raw)": 1.8749008178710938, "Pretrain/Step": 2117, "Pretrain/Step Time": 9.178513104096055} +{"Pretrain/Learning Rate": 4.5315860019569546e-05, "Pretrain/Loss": 2.090684175491333, "Pretrain/Loss (Raw)": 2.090555191040039, "Pretrain/Step": 2118, "Pretrain/Step Time": 9.250601448118687} +{"Pretrain/Learning Rate": 4.531091117236888e-05, "Pretrain/Loss": 2.0913429260253906, "Pretrain/Loss (Raw)": 2.131943464279175, "Pretrain/Step": 2119, "Pretrain/Step Time": 9.245966549962759} +{"Pretrain/Learning Rate": 4.530595998281822e-05, "Pretrain/Loss": 2.0919225215911865, "Pretrain/Loss (Raw)": 1.903221607208252, "Pretrain/Step": 2120, "Pretrain/Step Time": 9.247633066028357} +{"Pretrain/Learning Rate": 4.530100645148858e-05, "Pretrain/Loss": 2.0932135581970215, "Pretrain/Loss (Raw)": 2.2742526531219482, "Pretrain/Step": 2121, "Pretrain/Step Time": 9.250019771978259} +{"Pretrain/Learning Rate": 4.529605057895121e-05, "Pretrain/Loss": 2.0912914276123047, "Pretrain/Loss (Raw)": 2.0944392681121826, "Pretrain/Step": 2122, "Pretrain/Step Time": 9.244588263332844} +{"Pretrain/Learning Rate": 4.529109236577764e-05, "Pretrain/Loss": 2.0909180641174316, "Pretrain/Loss (Raw)": 2.077481508255005, "Pretrain/Step": 2123, "Pretrain/Step Time": 9.239698911085725} +{"Pretrain/Learning Rate": 4.5286131812539704e-05, "Pretrain/Loss": 2.0839731693267822, "Pretrain/Loss (Raw)": 1.2904595136642456, "Pretrain/Step": 2124, "Pretrain/Step Time": 9.249043026939034} +{"Pretrain/Learning Rate": 4.5281168919809444e-05, "Pretrain/Loss": 2.083540678024292, "Pretrain/Loss (Raw)": 2.0944406986236572, "Pretrain/Step": 2125, "Pretrain/Step Time": 9.249899830669165} +{"Pretrain/Learning Rate": 4.527620368815921e-05, "Pretrain/Loss": 2.084869146347046, "Pretrain/Loss (Raw)": 2.2796802520751953, "Pretrain/Step": 2126, "Pretrain/Step Time": 9.242966499179602} +{"Pretrain/Learning Rate": 4.527123611816163e-05, "Pretrain/Loss": 2.0873360633850098, "Pretrain/Loss (Raw)": 2.1813857555389404, "Pretrain/Step": 2127, "Pretrain/Step Time": 9.24088742211461} +{"Pretrain/Learning Rate": 4.526626621038958e-05, "Pretrain/Loss": 2.0867209434509277, "Pretrain/Loss (Raw)": 2.0120046138763428, "Pretrain/Step": 2128, "Pretrain/Step Time": 9.240736903622746} +{"Pretrain/Learning Rate": 4.526129396541621e-05, "Pretrain/Loss": 2.086480140686035, "Pretrain/Loss (Raw)": 2.2250306606292725, "Pretrain/Step": 2129, "Pretrain/Step Time": 9.232788501307368} +{"Pretrain/Learning Rate": 4.525631938381495e-05, "Pretrain/Loss": 2.0848684310913086, "Pretrain/Loss (Raw)": 1.8612773418426514, "Pretrain/Step": 2130, "Pretrain/Step Time": 9.234192375093699} +{"Pretrain/Learning Rate": 4.5251342466159487e-05, "Pretrain/Loss": 2.085092544555664, "Pretrain/Loss (Raw)": 2.0932083129882812, "Pretrain/Step": 2131, "Pretrain/Step Time": 9.240025090053678} +{"Pretrain/Learning Rate": 4.524636321302378e-05, "Pretrain/Loss": 2.0822839736938477, "Pretrain/Loss (Raw)": 1.6069412231445312, "Pretrain/Step": 2132, "Pretrain/Step Time": 9.23068224452436} +{"Pretrain/Learning Rate": 4.524138162498206e-05, "Pretrain/Loss": 2.080254554748535, "Pretrain/Loss (Raw)": 1.9324175119400024, "Pretrain/Step": 2133, "Pretrain/Step Time": 9.241423351690173} +{"Pretrain/Learning Rate": 4.5236397702608833e-05, "Pretrain/Loss": 2.0804758071899414, "Pretrain/Loss (Raw)": 2.193392515182495, "Pretrain/Step": 2134, "Pretrain/Step Time": 9.235662842169404} +{"Pretrain/Learning Rate": 4.5231411446478865e-05, "Pretrain/Loss": 2.0810842514038086, "Pretrain/Loss (Raw)": 2.3807461261749268, "Pretrain/Step": 2135, "Pretrain/Step Time": 9.239263765513897} +{"Pretrain/Learning Rate": 4.5226422857167207e-05, "Pretrain/Loss": 2.0818514823913574, "Pretrain/Loss (Raw)": 2.3349130153656006, "Pretrain/Step": 2136, "Pretrain/Step Time": 9.224076133221388} +{"Pretrain/Learning Rate": 4.5221431935249144e-05, "Pretrain/Loss": 2.078765869140625, "Pretrain/Loss (Raw)": 1.5585201978683472, "Pretrain/Step": 2137, "Pretrain/Step Time": 9.220652900636196} +{"Pretrain/Learning Rate": 4.5216438681300265e-05, "Pretrain/Loss": 2.076685905456543, "Pretrain/Loss (Raw)": 2.0107572078704834, "Pretrain/Step": 2138, "Pretrain/Step Time": 9.223856255412102} +{"Pretrain/Learning Rate": 4.521144309589641e-05, "Pretrain/Loss": 2.0754644870758057, "Pretrain/Loss (Raw)": 1.8542542457580566, "Pretrain/Step": 2139, "Pretrain/Step Time": 9.228793531656265} +{"Pretrain/Learning Rate": 4.520644517961371e-05, "Pretrain/Loss": 2.0778493881225586, "Pretrain/Loss (Raw)": 2.2819435596466064, "Pretrain/Step": 2140, "Pretrain/Step Time": 9.23370587080717} +{"Pretrain/Learning Rate": 4.520144493302853e-05, "Pretrain/Loss": 2.076000928878784, "Pretrain/Loss (Raw)": 1.9513802528381348, "Pretrain/Step": 2141, "Pretrain/Step Time": 9.216391555964947} +{"Pretrain/Learning Rate": 4.519644235671752e-05, "Pretrain/Loss": 2.0781188011169434, "Pretrain/Loss (Raw)": 1.9779490232467651, "Pretrain/Step": 2142, "Pretrain/Step Time": 9.211247831583023} +{"Pretrain/Learning Rate": 4.519143745125762e-05, "Pretrain/Loss": 2.076683521270752, "Pretrain/Loss (Raw)": 2.046037197113037, "Pretrain/Step": 2143, "Pretrain/Step Time": 9.21224475838244} +{"Pretrain/Learning Rate": 4.5186430217226004e-05, "Pretrain/Loss": 2.0750017166137695, "Pretrain/Loss (Raw)": 2.0869877338409424, "Pretrain/Step": 2144, "Pretrain/Step Time": 9.196364322677255} +{"Pretrain/Learning Rate": 4.518142065520013e-05, "Pretrain/Loss": 2.072427749633789, "Pretrain/Loss (Raw)": 1.8762027025222778, "Pretrain/Step": 2145, "Pretrain/Step Time": 9.172648524865508} +{"Pretrain/Learning Rate": 4.5176408765757736e-05, "Pretrain/Loss": 2.073108196258545, "Pretrain/Loss (Raw)": 2.1222777366638184, "Pretrain/Step": 2146, "Pretrain/Step Time": 9.172136060893536} +{"Pretrain/Learning Rate": 4.5171394549476794e-05, "Pretrain/Loss": 2.073319911956787, "Pretrain/Loss (Raw)": 2.1101608276367188, "Pretrain/Step": 2147, "Pretrain/Step Time": 9.172721967101097} +{"Pretrain/Learning Rate": 4.5166378006935595e-05, "Pretrain/Loss": 2.0737667083740234, "Pretrain/Loss (Raw)": 2.104501485824585, "Pretrain/Step": 2148, "Pretrain/Step Time": 9.174258586019278} +{"Pretrain/Learning Rate": 4.5161359138712655e-05, "Pretrain/Loss": 2.0734124183654785, "Pretrain/Loss (Raw)": 2.042583465576172, "Pretrain/Step": 2149, "Pretrain/Step Time": 9.160800151526928} +{"Pretrain/Learning Rate": 4.5156337945386775e-05, "Pretrain/Loss": 2.0718588829040527, "Pretrain/Loss (Raw)": 2.066404104232788, "Pretrain/Step": 2150, "Pretrain/Step Time": 9.149285091087222} +{"Pretrain/Learning Rate": 4.515131442753703e-05, "Pretrain/Loss": 2.0715999603271484, "Pretrain/Loss (Raw)": 2.072756290435791, "Pretrain/Step": 2151, "Pretrain/Step Time": 9.139494970440865} +{"Pretrain/Learning Rate": 4.5146288585742737e-05, "Pretrain/Loss": 2.0705149173736572, "Pretrain/Loss (Raw)": 2.064152479171753, "Pretrain/Step": 2152, "Pretrain/Step Time": 9.137252459302545} +{"Pretrain/Learning Rate": 4.514126042058352e-05, "Pretrain/Loss": 2.0710928440093994, "Pretrain/Loss (Raw)": 2.1455488204956055, "Pretrain/Step": 2153, "Pretrain/Step Time": 9.144602725282311} +{"Pretrain/Learning Rate": 4.513622993263924e-05, "Pretrain/Loss": 2.071974039077759, "Pretrain/Loss (Raw)": 2.1180310249328613, "Pretrain/Step": 2154, "Pretrain/Step Time": 9.14556397497654} +{"Pretrain/Learning Rate": 4.5131197122490035e-05, "Pretrain/Loss": 2.072175979614258, "Pretrain/Loss (Raw)": 2.0514769554138184, "Pretrain/Step": 2155, "Pretrain/Step Time": 9.151700926944613} +{"Pretrain/Learning Rate": 4.512616199071632e-05, "Pretrain/Loss": 2.073045253753662, "Pretrain/Loss (Raw)": 2.0361294746398926, "Pretrain/Step": 2156, "Pretrain/Step Time": 9.152587303891778} +{"Pretrain/Learning Rate": 4.512112453789877e-05, "Pretrain/Loss": 2.0728871822357178, "Pretrain/Loss (Raw)": 1.9691654443740845, "Pretrain/Step": 2157, "Pretrain/Step Time": 9.142743745818734} +{"Pretrain/Learning Rate": 4.5116084764618325e-05, "Pretrain/Loss": 2.072528600692749, "Pretrain/Loss (Raw)": 2.1059510707855225, "Pretrain/Step": 2158, "Pretrain/Step Time": 9.14649848267436} +{"Pretrain/Learning Rate": 4.511104267145618e-05, "Pretrain/Loss": 2.0731568336486816, "Pretrain/Loss (Raw)": 2.118671417236328, "Pretrain/Step": 2159, "Pretrain/Step Time": 9.086760900914669} +{"Pretrain/Learning Rate": 4.510599825899384e-05, "Pretrain/Loss": 2.071418523788452, "Pretrain/Loss (Raw)": 1.7938594818115234, "Pretrain/Step": 2160, "Pretrain/Step Time": 9.09774593822658} +{"Pretrain/Learning Rate": 4.510095152781304e-05, "Pretrain/Loss": 2.070784330368042, "Pretrain/Loss (Raw)": 2.1759650707244873, "Pretrain/Step": 2161, "Pretrain/Step Time": 9.087418643757701} +{"Pretrain/Learning Rate": 4.509590247849579e-05, "Pretrain/Loss": 2.0674805641174316, "Pretrain/Loss (Raw)": 2.112034559249878, "Pretrain/Step": 2162, "Pretrain/Step Time": 9.075718965381384} +{"Pretrain/Learning Rate": 4.509085111162437e-05, "Pretrain/Loss": 2.0665230751037598, "Pretrain/Loss (Raw)": 2.1164958477020264, "Pretrain/Step": 2163, "Pretrain/Step Time": 9.072039453312755} +{"Pretrain/Learning Rate": 4.508579742778133e-05, "Pretrain/Loss": 2.0668540000915527, "Pretrain/Loss (Raw)": 2.067814588546753, "Pretrain/Step": 2164, "Pretrain/Step Time": 9.071284148842096} +{"Pretrain/Learning Rate": 4.508074142754948e-05, "Pretrain/Loss": 2.0657358169555664, "Pretrain/Loss (Raw)": 1.9042617082595825, "Pretrain/Step": 2165, "Pretrain/Step Time": 9.080895068123937} +{"Pretrain/Learning Rate": 4.507568311151191e-05, "Pretrain/Loss": 2.0654170513153076, "Pretrain/Loss (Raw)": 2.1118364334106445, "Pretrain/Step": 2166, "Pretrain/Step Time": 9.089103404432535} +{"Pretrain/Learning Rate": 4.5070622480251955e-05, "Pretrain/Loss": 2.064201593399048, "Pretrain/Loss (Raw)": 2.1601450443267822, "Pretrain/Step": 2167, "Pretrain/Step Time": 9.105227176100016} +{"Pretrain/Learning Rate": 4.506555953435324e-05, "Pretrain/Loss": 2.063237190246582, "Pretrain/Loss (Raw)": 1.9192936420440674, "Pretrain/Step": 2168, "Pretrain/Step Time": 9.102110896259546} +{"Pretrain/Learning Rate": 4.5060494274399654e-05, "Pretrain/Loss": 2.062582015991211, "Pretrain/Loss (Raw)": 2.1164045333862305, "Pretrain/Step": 2169, "Pretrain/Step Time": 9.10585006326437} +{"Pretrain/Learning Rate": 4.505542670097534e-05, "Pretrain/Loss": 2.0620601177215576, "Pretrain/Loss (Raw)": 2.067511796951294, "Pretrain/Step": 2170, "Pretrain/Step Time": 9.107520354911685} +{"Pretrain/Learning Rate": 4.505035681466472e-05, "Pretrain/Loss": 2.0602810382843018, "Pretrain/Loss (Raw)": 1.9056620597839355, "Pretrain/Step": 2171, "Pretrain/Step Time": 9.114656113088131} +{"Pretrain/Learning Rate": 4.504528461605247e-05, "Pretrain/Loss": 2.061969518661499, "Pretrain/Loss (Raw)": 2.039250135421753, "Pretrain/Step": 2172, "Pretrain/Step Time": 9.116069167852402} +{"Pretrain/Learning Rate": 4.5040210105723525e-05, "Pretrain/Loss": 2.0613183975219727, "Pretrain/Loss (Raw)": 2.015126943588257, "Pretrain/Step": 2173, "Pretrain/Step Time": 9.116524040699005} +{"Pretrain/Learning Rate": 4.5035133284263134e-05, "Pretrain/Loss": 2.0625903606414795, "Pretrain/Loss (Raw)": 2.081183910369873, "Pretrain/Step": 2174, "Pretrain/Step Time": 9.118965741246939} +{"Pretrain/Learning Rate": 4.5030054152256756e-05, "Pretrain/Loss": 2.0623793601989746, "Pretrain/Loss (Raw)": 2.041719436645508, "Pretrain/Step": 2175, "Pretrain/Step Time": 9.124401144683361} +{"Pretrain/Learning Rate": 4.502497271029015e-05, "Pretrain/Loss": 2.064011573791504, "Pretrain/Loss (Raw)": 2.2001283168792725, "Pretrain/Step": 2176, "Pretrain/Step Time": 9.125023737549782} +{"Pretrain/Learning Rate": 4.501988895894933e-05, "Pretrain/Loss": 2.0628321170806885, "Pretrain/Loss (Raw)": 2.0407397747039795, "Pretrain/Step": 2177, "Pretrain/Step Time": 9.122960833832622} +{"Pretrain/Learning Rate": 4.501480289882058e-05, "Pretrain/Loss": 2.06418514251709, "Pretrain/Loss (Raw)": 2.158055067062378, "Pretrain/Step": 2178, "Pretrain/Step Time": 9.128368312492967} +{"Pretrain/Learning Rate": 4.5009714530490455e-05, "Pretrain/Loss": 2.0594544410705566, "Pretrain/Loss (Raw)": 1.7646507024765015, "Pretrain/Step": 2179, "Pretrain/Step Time": 9.126453500241041} +{"Pretrain/Learning Rate": 4.5004623854545746e-05, "Pretrain/Loss": 2.0597825050354004, "Pretrain/Loss (Raw)": 2.267784357070923, "Pretrain/Step": 2180, "Pretrain/Step Time": 9.123709546402097} +{"Pretrain/Learning Rate": 4.4999530871573556e-05, "Pretrain/Loss": 2.0599660873413086, "Pretrain/Loss (Raw)": 2.1461570262908936, "Pretrain/Step": 2181, "Pretrain/Step Time": 9.12174753844738} +{"Pretrain/Learning Rate": 4.499443558216123e-05, "Pretrain/Loss": 2.059326171875, "Pretrain/Loss (Raw)": 2.1710476875305176, "Pretrain/Step": 2182, "Pretrain/Step Time": 9.126681432127953} +{"Pretrain/Learning Rate": 4.498933798689638e-05, "Pretrain/Loss": 2.0596041679382324, "Pretrain/Loss (Raw)": 1.9139889478683472, "Pretrain/Step": 2183, "Pretrain/Step Time": 9.119896054267883} +{"Pretrain/Learning Rate": 4.498423808636687e-05, "Pretrain/Loss": 2.0585031509399414, "Pretrain/Loss (Raw)": 1.9843508005142212, "Pretrain/Step": 2184, "Pretrain/Step Time": 9.1154073625803} +{"Pretrain/Learning Rate": 4.497913588116085e-05, "Pretrain/Loss": 2.0580825805664062, "Pretrain/Loss (Raw)": 1.9825921058654785, "Pretrain/Step": 2185, "Pretrain/Step Time": 9.114243047311902} +{"Pretrain/Learning Rate": 4.497403137186674e-05, "Pretrain/Loss": 2.059436321258545, "Pretrain/Loss (Raw)": 2.1261048316955566, "Pretrain/Step": 2186, "Pretrain/Step Time": 9.10863122716546} +{"Pretrain/Learning Rate": 4.496892455907322e-05, "Pretrain/Loss": 2.061286449432373, "Pretrain/Loss (Raw)": 2.1357271671295166, "Pretrain/Step": 2187, "Pretrain/Step Time": 9.146078148856759} +{"Pretrain/Learning Rate": 4.496381544336922e-05, "Pretrain/Loss": 2.063403844833374, "Pretrain/Loss (Raw)": 2.222229242324829, "Pretrain/Step": 2188, "Pretrain/Step Time": 9.131867747753859} +{"Pretrain/Learning Rate": 4.495870402534394e-05, "Pretrain/Loss": 2.0652847290039062, "Pretrain/Loss (Raw)": 2.2701034545898438, "Pretrain/Step": 2189, "Pretrain/Step Time": 9.13561062514782} +{"Pretrain/Learning Rate": 4.495359030558688e-05, "Pretrain/Loss": 2.0656356811523438, "Pretrain/Loss (Raw)": 2.0312516689300537, "Pretrain/Step": 2190, "Pretrain/Step Time": 9.086401600390673} +{"Pretrain/Learning Rate": 4.494847428468775e-05, "Pretrain/Loss": 2.064077377319336, "Pretrain/Loss (Raw)": 2.0097317695617676, "Pretrain/Step": 2191, "Pretrain/Step Time": 9.054191237315536} +{"Pretrain/Learning Rate": 4.494335596323657e-05, "Pretrain/Loss": 2.062753677368164, "Pretrain/Loss (Raw)": 1.9763364791870117, "Pretrain/Step": 2192, "Pretrain/Step Time": 9.052018955349922} +{"Pretrain/Learning Rate": 4.49382353418236e-05, "Pretrain/Loss": 2.0611486434936523, "Pretrain/Loss (Raw)": 2.0709149837493896, "Pretrain/Step": 2193, "Pretrain/Step Time": 9.049759954214096} +{"Pretrain/Learning Rate": 4.493311242103938e-05, "Pretrain/Loss": 2.062922716140747, "Pretrain/Loss (Raw)": 2.302886962890625, "Pretrain/Step": 2194, "Pretrain/Step Time": 9.052505385130644} +{"Pretrain/Learning Rate": 4.4927987201474707e-05, "Pretrain/Loss": 2.06231427192688, "Pretrain/Loss (Raw)": 2.0273733139038086, "Pretrain/Step": 2195, "Pretrain/Step Time": 9.035779977217317} +{"Pretrain/Learning Rate": 4.492285968372065e-05, "Pretrain/Loss": 2.0622754096984863, "Pretrain/Loss (Raw)": 2.0168445110321045, "Pretrain/Step": 2196, "Pretrain/Step Time": 9.034842483699322} +{"Pretrain/Learning Rate": 4.491772986836853e-05, "Pretrain/Loss": 2.0615715980529785, "Pretrain/Loss (Raw)": 2.021474599838257, "Pretrain/Step": 2197, "Pretrain/Step Time": 9.03433307632804} +{"Pretrain/Learning Rate": 4.4912597756009946e-05, "Pretrain/Loss": 2.0613784790039062, "Pretrain/Loss (Raw)": 2.0361733436584473, "Pretrain/Step": 2198, "Pretrain/Step Time": 9.033160103484988} +{"Pretrain/Learning Rate": 4.490746334723677e-05, "Pretrain/Loss": 2.061192750930786, "Pretrain/Loss (Raw)": 1.978865623474121, "Pretrain/Step": 2199, "Pretrain/Step Time": 9.027750510722399} +{"Pretrain/Learning Rate": 4.4902326642641095e-05, "Pretrain/Loss": 2.059659719467163, "Pretrain/Loss (Raw)": 2.0305335521698, "Pretrain/Step": 2200, "Pretrain/Step Time": 9.035595025867224} +{"Pretrain/Learning Rate": 4.489718764281534e-05, "Pretrain/Loss": 2.059312343597412, "Pretrain/Loss (Raw)": 2.1014010906219482, "Pretrain/Step": 2201, "Pretrain/Step Time": 9.038064064458013} +{"Pretrain/Learning Rate": 4.489204634835215e-05, "Pretrain/Loss": 2.059426784515381, "Pretrain/Loss (Raw)": 1.9285717010498047, "Pretrain/Step": 2202, "Pretrain/Step Time": 9.042104545980692} +{"Pretrain/Learning Rate": 4.488690275984443e-05, "Pretrain/Loss": 2.059215545654297, "Pretrain/Loss (Raw)": 1.986039638519287, "Pretrain/Step": 2203, "Pretrain/Step Time": 9.04785511083901} +{"Pretrain/Learning Rate": 4.488175687788538e-05, "Pretrain/Loss": 2.058832883834839, "Pretrain/Loss (Raw)": 2.0239498615264893, "Pretrain/Step": 2204, "Pretrain/Step Time": 9.055661857128143} +{"Pretrain/Learning Rate": 4.4876608703068434e-05, "Pretrain/Loss": 2.0582618713378906, "Pretrain/Loss (Raw)": 1.9785118103027344, "Pretrain/Step": 2205, "Pretrain/Step Time": 9.061880223453045} +{"Pretrain/Learning Rate": 4.487145823598732e-05, "Pretrain/Loss": 2.056879758834839, "Pretrain/Loss (Raw)": 1.8907291889190674, "Pretrain/Step": 2206, "Pretrain/Step Time": 9.059609027579427} +{"Pretrain/Learning Rate": 4.4866305477236e-05, "Pretrain/Loss": 2.0598561763763428, "Pretrain/Loss (Raw)": 2.3328158855438232, "Pretrain/Step": 2207, "Pretrain/Step Time": 9.056842036545277} +{"Pretrain/Learning Rate": 4.486115042740872e-05, "Pretrain/Loss": 2.0583548545837402, "Pretrain/Loss (Raw)": 2.0512564182281494, "Pretrain/Step": 2208, "Pretrain/Step Time": 9.049594877287745} +{"Pretrain/Learning Rate": 4.4855993087099984e-05, "Pretrain/Loss": 2.0594801902770996, "Pretrain/Loss (Raw)": 2.1279401779174805, "Pretrain/Step": 2209, "Pretrain/Step Time": 9.052653139457107} +{"Pretrain/Learning Rate": 4.485083345690456e-05, "Pretrain/Loss": 2.0605669021606445, "Pretrain/Loss (Raw)": 2.185722827911377, "Pretrain/Step": 2210, "Pretrain/Step Time": 9.059380780905485} +{"Pretrain/Learning Rate": 4.4845671537417486e-05, "Pretrain/Loss": 2.0580883026123047, "Pretrain/Loss (Raw)": 1.8914932012557983, "Pretrain/Step": 2211, "Pretrain/Step Time": 9.051760548725724} +{"Pretrain/Learning Rate": 4.484050732923405e-05, "Pretrain/Loss": 2.056898832321167, "Pretrain/Loss (Raw)": 2.0825724601745605, "Pretrain/Step": 2212, "Pretrain/Step Time": 9.057017398998141} +{"Pretrain/Learning Rate": 4.483534083294982e-05, "Pretrain/Loss": 2.0547730922698975, "Pretrain/Loss (Raw)": 1.8459217548370361, "Pretrain/Step": 2213, "Pretrain/Step Time": 9.057605806738138} +{"Pretrain/Learning Rate": 4.483017204916061e-05, "Pretrain/Loss": 2.0544114112854004, "Pretrain/Loss (Raw)": 2.1396398544311523, "Pretrain/Step": 2214, "Pretrain/Step Time": 9.05828638188541} +{"Pretrain/Learning Rate": 4.482500097846253e-05, "Pretrain/Loss": 2.055908203125, "Pretrain/Loss (Raw)": 2.018433094024658, "Pretrain/Step": 2215, "Pretrain/Step Time": 9.058858998119831} +{"Pretrain/Learning Rate": 4.4819827621451906e-05, "Pretrain/Loss": 2.054746627807617, "Pretrain/Loss (Raw)": 2.00430965423584, "Pretrain/Step": 2216, "Pretrain/Step Time": 9.056058308109641} +{"Pretrain/Learning Rate": 4.481465197872538e-05, "Pretrain/Loss": 2.0540733337402344, "Pretrain/Loss (Raw)": 2.046933650970459, "Pretrain/Step": 2217, "Pretrain/Step Time": 9.05190452747047} +{"Pretrain/Learning Rate": 4.4809474050879806e-05, "Pretrain/Loss": 2.051762104034424, "Pretrain/Loss (Raw)": 1.9380258321762085, "Pretrain/Step": 2218, "Pretrain/Step Time": 9.051632773131132} +{"Pretrain/Learning Rate": 4.4804293838512346e-05, "Pretrain/Loss": 2.0524606704711914, "Pretrain/Loss (Raw)": 1.9823986291885376, "Pretrain/Step": 2219, "Pretrain/Step Time": 9.05017812922597} +{"Pretrain/Learning Rate": 4.47991113422204e-05, "Pretrain/Loss": 2.0523903369903564, "Pretrain/Loss (Raw)": 2.1125614643096924, "Pretrain/Step": 2220, "Pretrain/Step Time": 9.046761155128479} +{"Pretrain/Learning Rate": 4.479392656260163e-05, "Pretrain/Loss": 2.0549421310424805, "Pretrain/Loss (Raw)": 2.1214773654937744, "Pretrain/Step": 2221, "Pretrain/Step Time": 9.051598034799099} +{"Pretrain/Learning Rate": 4.4788739500253986e-05, "Pretrain/Loss": 2.0527215003967285, "Pretrain/Loss (Raw)": 2.054941177368164, "Pretrain/Step": 2222, "Pretrain/Step Time": 9.049633637070656} +{"Pretrain/Learning Rate": 4.4783550155775647e-05, "Pretrain/Loss": 2.0519864559173584, "Pretrain/Loss (Raw)": 2.080270767211914, "Pretrain/Step": 2223, "Pretrain/Step Time": 9.055836096405983} +{"Pretrain/Learning Rate": 4.4778358529765085e-05, "Pretrain/Loss": 2.0504438877105713, "Pretrain/Loss (Raw)": 1.986138939857483, "Pretrain/Step": 2224, "Pretrain/Step Time": 9.059175971895456} +{"Pretrain/Learning Rate": 4.477316462282102e-05, "Pretrain/Loss": 2.0522429943084717, "Pretrain/Loss (Raw)": 2.0530731678009033, "Pretrain/Step": 2225, "Pretrain/Step Time": 9.04030848108232} +{"Pretrain/Learning Rate": 4.476796843554243e-05, "Pretrain/Loss": 2.053349018096924, "Pretrain/Loss (Raw)": 1.8837251663208008, "Pretrain/Step": 2226, "Pretrain/Step Time": 9.036468658596277} +{"Pretrain/Learning Rate": 4.4762769968528575e-05, "Pretrain/Loss": 2.0533742904663086, "Pretrain/Loss (Raw)": 2.147535562515259, "Pretrain/Step": 2227, "Pretrain/Step Time": 9.023799316957593} +{"Pretrain/Learning Rate": 4.475756922237896e-05, "Pretrain/Loss": 2.0514633655548096, "Pretrain/Loss (Raw)": 1.9336539506912231, "Pretrain/Step": 2228, "Pretrain/Step Time": 9.02591560781002} +{"Pretrain/Learning Rate": 4.4752366197693365e-05, "Pretrain/Loss": 2.052741765975952, "Pretrain/Loss (Raw)": 2.1324844360351562, "Pretrain/Step": 2229, "Pretrain/Step Time": 9.02183010801673} +{"Pretrain/Learning Rate": 4.474716089507182e-05, "Pretrain/Loss": 2.0516347885131836, "Pretrain/Loss (Raw)": 1.9994624853134155, "Pretrain/Step": 2230, "Pretrain/Step Time": 9.019113022834063} +{"Pretrain/Learning Rate": 4.474195331511464e-05, "Pretrain/Loss": 2.0516114234924316, "Pretrain/Loss (Raw)": 1.9985219240188599, "Pretrain/Step": 2231, "Pretrain/Step Time": 9.019048880785704} +{"Pretrain/Learning Rate": 4.473674345842236e-05, "Pretrain/Loss": 2.05157470703125, "Pretrain/Loss (Raw)": 2.0470542907714844, "Pretrain/Step": 2232, "Pretrain/Step Time": 9.020989952608943} +{"Pretrain/Learning Rate": 4.4731531325595835e-05, "Pretrain/Loss": 2.0551676750183105, "Pretrain/Loss (Raw)": 2.258798360824585, "Pretrain/Step": 2233, "Pretrain/Step Time": 9.014648236334324} +{"Pretrain/Learning Rate": 4.472631691723613e-05, "Pretrain/Loss": 2.055124282836914, "Pretrain/Loss (Raw)": 2.0531625747680664, "Pretrain/Step": 2234, "Pretrain/Step Time": 9.021844703704119} +{"Pretrain/Learning Rate": 4.4721100233944606e-05, "Pretrain/Loss": 2.0554184913635254, "Pretrain/Loss (Raw)": 2.1361613273620605, "Pretrain/Step": 2235, "Pretrain/Step Time": 9.024534186348319} +{"Pretrain/Learning Rate": 4.471588127632288e-05, "Pretrain/Loss": 2.0550646781921387, "Pretrain/Loss (Raw)": 2.1156423091888428, "Pretrain/Step": 2236, "Pretrain/Step Time": 9.023828269913793} +{"Pretrain/Learning Rate": 4.471066004497282e-05, "Pretrain/Loss": 2.0559659004211426, "Pretrain/Loss (Raw)": 2.348275899887085, "Pretrain/Step": 2237, "Pretrain/Step Time": 9.020901218056679} +{"Pretrain/Learning Rate": 4.470543654049656e-05, "Pretrain/Loss": 2.057044506072998, "Pretrain/Loss (Raw)": 2.1293182373046875, "Pretrain/Step": 2238, "Pretrain/Step Time": 9.026877827942371} +{"Pretrain/Learning Rate": 4.47002107634965e-05, "Pretrain/Loss": 2.0582704544067383, "Pretrain/Loss (Raw)": 2.084970474243164, "Pretrain/Step": 2239, "Pretrain/Step Time": 9.025873869657516} +{"Pretrain/Learning Rate": 4.469498271457531e-05, "Pretrain/Loss": 2.0583462715148926, "Pretrain/Loss (Raw)": 2.1565561294555664, "Pretrain/Step": 2240, "Pretrain/Step Time": 9.044072987511754} +{"Pretrain/Learning Rate": 4.468975239433591e-05, "Pretrain/Loss": 2.0584511756896973, "Pretrain/Loss (Raw)": 2.0851101875305176, "Pretrain/Step": 2241, "Pretrain/Step Time": 9.050079867243767} +{"Pretrain/Learning Rate": 4.468451980338148e-05, "Pretrain/Loss": 2.056476593017578, "Pretrain/Loss (Raw)": 2.0078125, "Pretrain/Step": 2242, "Pretrain/Step Time": 9.047351151704788} +{"Pretrain/Learning Rate": 4.467928494231547e-05, "Pretrain/Loss": 2.0560379028320312, "Pretrain/Loss (Raw)": 2.2114291191101074, "Pretrain/Step": 2243, "Pretrain/Step Time": 9.04898925498128} +{"Pretrain/Learning Rate": 4.4674047811741585e-05, "Pretrain/Loss": 2.0560810565948486, "Pretrain/Loss (Raw)": 2.264413833618164, "Pretrain/Step": 2244, "Pretrain/Step Time": 9.052402142435312} +{"Pretrain/Learning Rate": 4.466880841226381e-05, "Pretrain/Loss": 2.058377742767334, "Pretrain/Loss (Raw)": 2.1688671112060547, "Pretrain/Step": 2245, "Pretrain/Step Time": 9.048983437940478} +{"Pretrain/Learning Rate": 4.466356674448635e-05, "Pretrain/Loss": 2.0580685138702393, "Pretrain/Loss (Raw)": 2.051008939743042, "Pretrain/Step": 2246, "Pretrain/Step Time": 8.956501632928848} +{"Pretrain/Learning Rate": 4.4658322809013723e-05, "Pretrain/Loss": 2.058650016784668, "Pretrain/Loss (Raw)": 2.2063605785369873, "Pretrain/Step": 2247, "Pretrain/Step Time": 8.9612622782588} +{"Pretrain/Learning Rate": 4.465307660645068e-05, "Pretrain/Loss": 2.058471441268921, "Pretrain/Loss (Raw)": 1.8803564310073853, "Pretrain/Step": 2248, "Pretrain/Step Time": 8.959355980157852} +{"Pretrain/Learning Rate": 4.464782813740223e-05, "Pretrain/Loss": 2.0569911003112793, "Pretrain/Loss (Raw)": 2.084791421890259, "Pretrain/Step": 2249, "Pretrain/Step Time": 8.968345446512103} +{"Pretrain/Learning Rate": 4.464257740247366e-05, "Pretrain/Loss": 2.0552356243133545, "Pretrain/Loss (Raw)": 1.869716763496399, "Pretrain/Step": 2250, "Pretrain/Step Time": 8.974756559357047} +{"Pretrain/Learning Rate": 4.4637324402270495e-05, "Pretrain/Loss": 2.0543994903564453, "Pretrain/Loss (Raw)": 1.970451831817627, "Pretrain/Step": 2251, "Pretrain/Step Time": 8.974846966564655} +{"Pretrain/Learning Rate": 4.463206913739856e-05, "Pretrain/Loss": 2.0611162185668945, "Pretrain/Loss (Raw)": 2.1502182483673096, "Pretrain/Step": 2252, "Pretrain/Step Time": 8.966509018093348} +{"Pretrain/Learning Rate": 4.462681160846389e-05, "Pretrain/Loss": 2.060885429382324, "Pretrain/Loss (Raw)": 2.0649006366729736, "Pretrain/Step": 2253, "Pretrain/Step Time": 8.965609550476074} +{"Pretrain/Learning Rate": 4.4621551816072835e-05, "Pretrain/Loss": 2.060429096221924, "Pretrain/Loss (Raw)": 2.2212605476379395, "Pretrain/Step": 2254, "Pretrain/Step Time": 8.962551321834326} +{"Pretrain/Learning Rate": 4.4616289760831954e-05, "Pretrain/Loss": 2.0570664405822754, "Pretrain/Loss (Raw)": 1.7509609460830688, "Pretrain/Step": 2255, "Pretrain/Step Time": 8.963149448856711} +{"Pretrain/Learning Rate": 4.46110254433481e-05, "Pretrain/Loss": 2.0575342178344727, "Pretrain/Loss (Raw)": 2.071871280670166, "Pretrain/Step": 2256, "Pretrain/Step Time": 8.957329532131553} +{"Pretrain/Learning Rate": 4.4605758864228384e-05, "Pretrain/Loss": 2.058262586593628, "Pretrain/Loss (Raw)": 2.318282127380371, "Pretrain/Step": 2257, "Pretrain/Step Time": 8.957538379356265} +{"Pretrain/Learning Rate": 4.460049002408018e-05, "Pretrain/Loss": 2.0590739250183105, "Pretrain/Loss (Raw)": 1.965147614479065, "Pretrain/Step": 2258, "Pretrain/Step Time": 8.959514508023858} +{"Pretrain/Learning Rate": 4.45952189235111e-05, "Pretrain/Loss": 2.0595240592956543, "Pretrain/Loss (Raw)": 2.150799512863159, "Pretrain/Step": 2259, "Pretrain/Step Time": 8.963094966486096} +{"Pretrain/Learning Rate": 4.458994556312903e-05, "Pretrain/Loss": 2.0625507831573486, "Pretrain/Loss (Raw)": 1.9943619966506958, "Pretrain/Step": 2260, "Pretrain/Step Time": 8.96929575316608} +{"Pretrain/Learning Rate": 4.458466994354214e-05, "Pretrain/Loss": 2.0624337196350098, "Pretrain/Loss (Raw)": 1.917433261871338, "Pretrain/Step": 2261, "Pretrain/Step Time": 8.971157886087894} +{"Pretrain/Learning Rate": 4.457939206535882e-05, "Pretrain/Loss": 2.061102867126465, "Pretrain/Loss (Raw)": 2.0230400562286377, "Pretrain/Step": 2262, "Pretrain/Step Time": 8.97529462724924} +{"Pretrain/Learning Rate": 4.4574111929187744e-05, "Pretrain/Loss": 2.0589447021484375, "Pretrain/Loss (Raw)": 2.104520320892334, "Pretrain/Step": 2263, "Pretrain/Step Time": 8.98698703199625} +{"Pretrain/Learning Rate": 4.4568829535637844e-05, "Pretrain/Loss": 2.055999994277954, "Pretrain/Loss (Raw)": 1.9579613208770752, "Pretrain/Step": 2264, "Pretrain/Step Time": 8.990168685093522} +{"Pretrain/Learning Rate": 4.456354488531832e-05, "Pretrain/Loss": 2.0610570907592773, "Pretrain/Loss (Raw)": 2.2058541774749756, "Pretrain/Step": 2265, "Pretrain/Step Time": 8.989032035693526} +{"Pretrain/Learning Rate": 4.4558257978838605e-05, "Pretrain/Loss": 2.0629806518554688, "Pretrain/Loss (Raw)": 2.2569496631622314, "Pretrain/Step": 2266, "Pretrain/Step Time": 8.978766998276114} +{"Pretrain/Learning Rate": 4.455296881680842e-05, "Pretrain/Loss": 2.0639333724975586, "Pretrain/Loss (Raw)": 1.9762272834777832, "Pretrain/Step": 2267, "Pretrain/Step Time": 8.974361767992377} +{"Pretrain/Learning Rate": 4.4547677399837726e-05, "Pretrain/Loss": 2.063153028488159, "Pretrain/Loss (Raw)": 2.1820428371429443, "Pretrain/Step": 2268, "Pretrain/Step Time": 8.965864015743136} +{"Pretrain/Learning Rate": 4.4542383728536774e-05, "Pretrain/Loss": 2.062081813812256, "Pretrain/Loss (Raw)": 1.814295768737793, "Pretrain/Step": 2269, "Pretrain/Step Time": 8.967797501012683} +{"Pretrain/Learning Rate": 4.453708780351604e-05, "Pretrain/Loss": 2.062232732772827, "Pretrain/Loss (Raw)": 1.9972366094589233, "Pretrain/Step": 2270, "Pretrain/Step Time": 8.968853693455458} +{"Pretrain/Learning Rate": 4.4531789625386274e-05, "Pretrain/Loss": 2.0629396438598633, "Pretrain/Loss (Raw)": 2.1365432739257812, "Pretrain/Step": 2271, "Pretrain/Step Time": 8.979201301932335} +{"Pretrain/Learning Rate": 4.45264891947585e-05, "Pretrain/Loss": 2.0623297691345215, "Pretrain/Loss (Raw)": 2.0089151859283447, "Pretrain/Step": 2272, "Pretrain/Step Time": 8.990444414317608} +{"Pretrain/Learning Rate": 4.452118651224398e-05, "Pretrain/Loss": 2.062486171722412, "Pretrain/Loss (Raw)": 1.8961917161941528, "Pretrain/Step": 2273, "Pretrain/Step Time": 8.99509048089385} +{"Pretrain/Learning Rate": 4.451588157845424e-05, "Pretrain/Loss": 2.0621070861816406, "Pretrain/Loss (Raw)": 2.0737712383270264, "Pretrain/Step": 2274, "Pretrain/Step Time": 9.028248526155949} +{"Pretrain/Learning Rate": 4.451057439400108e-05, "Pretrain/Loss": 2.0629827976226807, "Pretrain/Loss (Raw)": 2.2222654819488525, "Pretrain/Step": 2275, "Pretrain/Step Time": 9.032654298469424} +{"Pretrain/Learning Rate": 4.450526495949653e-05, "Pretrain/Loss": 2.0637738704681396, "Pretrain/Loss (Raw)": 2.2057549953460693, "Pretrain/Step": 2276, "Pretrain/Step Time": 9.033007193356752} +{"Pretrain/Learning Rate": 4.449995327555293e-05, "Pretrain/Loss": 2.062511444091797, "Pretrain/Loss (Raw)": 1.8809787034988403, "Pretrain/Step": 2277, "Pretrain/Step Time": 9.058082530274987} +{"Pretrain/Learning Rate": 4.449463934278282e-05, "Pretrain/Loss": 2.06223201751709, "Pretrain/Loss (Raw)": 2.0306618213653564, "Pretrain/Step": 2278, "Pretrain/Step Time": 9.057081101462245} +{"Pretrain/Learning Rate": 4.4489323161799045e-05, "Pretrain/Loss": 2.0591721534729004, "Pretrain/Loss (Raw)": 1.6811120510101318, "Pretrain/Step": 2279, "Pretrain/Step Time": 9.055183051154017} +{"Pretrain/Learning Rate": 4.4484004733214685e-05, "Pretrain/Loss": 2.059467315673828, "Pretrain/Loss (Raw)": 2.1018757820129395, "Pretrain/Step": 2280, "Pretrain/Step Time": 9.0656005050987} +{"Pretrain/Learning Rate": 4.447868405764309e-05, "Pretrain/Loss": 2.0566177368164062, "Pretrain/Loss (Raw)": 1.7808188199996948, "Pretrain/Step": 2281, "Pretrain/Step Time": 9.114652175456285} +{"Pretrain/Learning Rate": 4.4473361135697856e-05, "Pretrain/Loss": 2.0555579662323, "Pretrain/Loss (Raw)": 1.982366681098938, "Pretrain/Step": 2282, "Pretrain/Step Time": 9.122080393135548} +{"Pretrain/Learning Rate": 4.446803596799286e-05, "Pretrain/Loss": 2.05173397064209, "Pretrain/Loss (Raw)": 1.562038779258728, "Pretrain/Step": 2283, "Pretrain/Step Time": 9.137453379109502} +{"Pretrain/Learning Rate": 4.446270855514222e-05, "Pretrain/Loss": 2.052722215652466, "Pretrain/Loss (Raw)": 2.1626052856445312, "Pretrain/Step": 2284, "Pretrain/Step Time": 9.132225401699543} +{"Pretrain/Learning Rate": 4.445737889776031e-05, "Pretrain/Loss": 2.052598714828491, "Pretrain/Loss (Raw)": 1.9533722400665283, "Pretrain/Step": 2285, "Pretrain/Step Time": 9.152754174545407} +{"Pretrain/Learning Rate": 4.44520469964618e-05, "Pretrain/Loss": 2.0534539222717285, "Pretrain/Loss (Raw)": 2.2154271602630615, "Pretrain/Step": 2286, "Pretrain/Step Time": 9.146241132169962} +{"Pretrain/Learning Rate": 4.444671285186155e-05, "Pretrain/Loss": 2.054027557373047, "Pretrain/Loss (Raw)": 2.1920807361602783, "Pretrain/Step": 2287, "Pretrain/Step Time": 9.155212031677365} +{"Pretrain/Learning Rate": 4.444137646457474e-05, "Pretrain/Loss": 2.056058883666992, "Pretrain/Loss (Raw)": 2.0538859367370605, "Pretrain/Step": 2288, "Pretrain/Step Time": 9.140309922397137} +{"Pretrain/Learning Rate": 4.4436037835216784e-05, "Pretrain/Loss": 2.0558695793151855, "Pretrain/Loss (Raw)": 2.1517152786254883, "Pretrain/Step": 2289, "Pretrain/Step Time": 9.139483416453004} +{"Pretrain/Learning Rate": 4.4430696964403366e-05, "Pretrain/Loss": 2.055405378341675, "Pretrain/Loss (Raw)": 2.052600860595703, "Pretrain/Step": 2290, "Pretrain/Step Time": 9.140431553125381} +{"Pretrain/Learning Rate": 4.4425353852750414e-05, "Pretrain/Loss": 2.0551810264587402, "Pretrain/Loss (Raw)": 2.087786912918091, "Pretrain/Step": 2291, "Pretrain/Step Time": 9.13638462498784} +{"Pretrain/Learning Rate": 4.4420008500874116e-05, "Pretrain/Loss": 2.054288148880005, "Pretrain/Loss (Raw)": 1.9535315036773682, "Pretrain/Step": 2292, "Pretrain/Step Time": 9.13895384222269} +{"Pretrain/Learning Rate": 4.441466090939093e-05, "Pretrain/Loss": 2.0544943809509277, "Pretrain/Loss (Raw)": 1.930657982826233, "Pretrain/Step": 2293, "Pretrain/Step Time": 9.132749415934086} +{"Pretrain/Learning Rate": 4.440931107891756e-05, "Pretrain/Loss": 2.0546412467956543, "Pretrain/Loss (Raw)": 2.1306498050689697, "Pretrain/Step": 2294, "Pretrain/Step Time": 9.128774266690016} +{"Pretrain/Learning Rate": 4.440395901007098e-05, "Pretrain/Loss": 2.054067611694336, "Pretrain/Loss (Raw)": 2.086740255355835, "Pretrain/Step": 2295, "Pretrain/Step Time": 9.109641920775175} +{"Pretrain/Learning Rate": 4.4398604703468415e-05, "Pretrain/Loss": 2.052781581878662, "Pretrain/Loss (Raw)": 1.7546576261520386, "Pretrain/Step": 2296, "Pretrain/Step Time": 9.11944772861898} +{"Pretrain/Learning Rate": 4.439324815972734e-05, "Pretrain/Loss": 2.0514960289001465, "Pretrain/Loss (Raw)": 1.9518519639968872, "Pretrain/Step": 2297, "Pretrain/Step Time": 9.148340255022049} +{"Pretrain/Learning Rate": 4.438788937946551e-05, "Pretrain/Loss": 2.0530483722686768, "Pretrain/Loss (Raw)": 2.266195058822632, "Pretrain/Step": 2298, "Pretrain/Step Time": 9.15005400404334} +{"Pretrain/Learning Rate": 4.4382528363300916e-05, "Pretrain/Loss": 2.053746223449707, "Pretrain/Loss (Raw)": 1.995008111000061, "Pretrain/Step": 2299, "Pretrain/Step Time": 9.153687581419945} +{"Pretrain/Learning Rate": 4.437716511185181e-05, "Pretrain/Loss": 2.053618907928467, "Pretrain/Loss (Raw)": 2.0229310989379883, "Pretrain/Step": 2300, "Pretrain/Step Time": 9.148409619927406} +{"Pretrain/Learning Rate": 4.437179962573672e-05, "Pretrain/Loss": 2.0545663833618164, "Pretrain/Loss (Raw)": 2.1364145278930664, "Pretrain/Step": 2301, "Pretrain/Step Time": 9.147780450060964} +{"Pretrain/Learning Rate": 4.436643190557441e-05, "Pretrain/Loss": 2.054614782333374, "Pretrain/Loss (Raw)": 2.087381601333618, "Pretrain/Step": 2302, "Pretrain/Step Time": 9.145131137222052} +{"Pretrain/Learning Rate": 4.4361061951983925e-05, "Pretrain/Loss": 2.0558109283447266, "Pretrain/Loss (Raw)": 2.1948184967041016, "Pretrain/Step": 2303, "Pretrain/Step Time": 9.144491715356708} +{"Pretrain/Learning Rate": 4.435568976558454e-05, "Pretrain/Loss": 2.0543246269226074, "Pretrain/Loss (Raw)": 2.0099053382873535, "Pretrain/Step": 2304, "Pretrain/Step Time": 9.138217998668551} +{"Pretrain/Learning Rate": 4.4350315346995804e-05, "Pretrain/Loss": 2.0517001152038574, "Pretrain/Loss (Raw)": 1.704768180847168, "Pretrain/Step": 2305, "Pretrain/Step Time": 9.148499125614762} +{"Pretrain/Learning Rate": 4.434493869683752e-05, "Pretrain/Loss": 2.0515544414520264, "Pretrain/Loss (Raw)": 2.1394124031066895, "Pretrain/Step": 2306, "Pretrain/Step Time": 9.148433117195964} +{"Pretrain/Learning Rate": 4.4339559815729746e-05, "Pretrain/Loss": 2.052173137664795, "Pretrain/Loss (Raw)": 1.8438708782196045, "Pretrain/Step": 2307, "Pretrain/Step Time": 9.150296676903963} +{"Pretrain/Learning Rate": 4.4334178704292805e-05, "Pretrain/Loss": 2.0515685081481934, "Pretrain/Loss (Raw)": 2.1903889179229736, "Pretrain/Step": 2308, "Pretrain/Step Time": 9.151536030694842} +{"Pretrain/Learning Rate": 4.432879536314727e-05, "Pretrain/Loss": 2.0517337322235107, "Pretrain/Loss (Raw)": 2.1673154830932617, "Pretrain/Step": 2309, "Pretrain/Step Time": 9.145191276445985} +{"Pretrain/Learning Rate": 4.4323409792913974e-05, "Pretrain/Loss": 2.052299976348877, "Pretrain/Loss (Raw)": 2.243523597717285, "Pretrain/Step": 2310, "Pretrain/Step Time": 9.162120899185538} +{"Pretrain/Learning Rate": 4.431802199421401e-05, "Pretrain/Loss": 2.053250789642334, "Pretrain/Loss (Raw)": 2.0357019901275635, "Pretrain/Step": 2311, "Pretrain/Step Time": 9.164175312966108} +{"Pretrain/Learning Rate": 4.431263196766872e-05, "Pretrain/Loss": 2.055039882659912, "Pretrain/Loss (Raw)": 2.2133419513702393, "Pretrain/Step": 2312, "Pretrain/Step Time": 9.190732842311263} +{"Pretrain/Learning Rate": 4.43072397138997e-05, "Pretrain/Loss": 2.0556235313415527, "Pretrain/Loss (Raw)": 2.0572636127471924, "Pretrain/Step": 2313, "Pretrain/Step Time": 9.192680099979043} +{"Pretrain/Learning Rate": 4.430184523352881e-05, "Pretrain/Loss": 2.0538740158081055, "Pretrain/Loss (Raw)": 1.9021762609481812, "Pretrain/Step": 2314, "Pretrain/Step Time": 9.200426865369081} +{"Pretrain/Learning Rate": 4.429644852717819e-05, "Pretrain/Loss": 2.0539801120758057, "Pretrain/Loss (Raw)": 2.149324893951416, "Pretrain/Step": 2315, "Pretrain/Step Time": 9.164498658850789} +{"Pretrain/Learning Rate": 4.4291049595470193e-05, "Pretrain/Loss": 2.052563190460205, "Pretrain/Loss (Raw)": 2.0408663749694824, "Pretrain/Step": 2316, "Pretrain/Step Time": 9.162975408136845} +{"Pretrain/Learning Rate": 4.428564843902746e-05, "Pretrain/Loss": 2.051313877105713, "Pretrain/Loss (Raw)": 2.110175132751465, "Pretrain/Step": 2317, "Pretrain/Step Time": 9.171644799411297} +{"Pretrain/Learning Rate": 4.4280245058472866e-05, "Pretrain/Loss": 2.0514392852783203, "Pretrain/Loss (Raw)": 2.047297716140747, "Pretrain/Step": 2318, "Pretrain/Step Time": 9.170390587300062} +{"Pretrain/Learning Rate": 4.427483945442956e-05, "Pretrain/Loss": 2.050137996673584, "Pretrain/Loss (Raw)": 1.843170404434204, "Pretrain/Step": 2319, "Pretrain/Step Time": 9.206353634595871} +{"Pretrain/Learning Rate": 4.426943162752094e-05, "Pretrain/Loss": 2.0506651401519775, "Pretrain/Loss (Raw)": 2.0438179969787598, "Pretrain/Step": 2320, "Pretrain/Step Time": 9.211246196180582} +{"Pretrain/Learning Rate": 4.426402157837067e-05, "Pretrain/Loss": 2.050126314163208, "Pretrain/Loss (Raw)": 2.0019397735595703, "Pretrain/Step": 2321, "Pretrain/Step Time": 9.21047756075859} +{"Pretrain/Learning Rate": 4.425860930760265e-05, "Pretrain/Loss": 2.048326015472412, "Pretrain/Loss (Raw)": 2.072437286376953, "Pretrain/Step": 2322, "Pretrain/Step Time": 9.209494449198246} +{"Pretrain/Learning Rate": 4.4253194815841056e-05, "Pretrain/Loss": 2.0480477809906006, "Pretrain/Loss (Raw)": 1.9917757511138916, "Pretrain/Step": 2323, "Pretrain/Step Time": 9.210921354591846} +{"Pretrain/Learning Rate": 4.424777810371032e-05, "Pretrain/Loss": 2.049099922180176, "Pretrain/Loss (Raw)": 2.1515393257141113, "Pretrain/Step": 2324, "Pretrain/Step Time": 9.211989561095834} +{"Pretrain/Learning Rate": 4.424235917183511e-05, "Pretrain/Loss": 2.0495080947875977, "Pretrain/Loss (Raw)": 2.073711395263672, "Pretrain/Step": 2325, "Pretrain/Step Time": 9.217169791460037} +{"Pretrain/Learning Rate": 4.4236938020840365e-05, "Pretrain/Loss": 2.0485658645629883, "Pretrain/Loss (Raw)": 1.9155786037445068, "Pretrain/Step": 2326, "Pretrain/Step Time": 9.214938122779131} +{"Pretrain/Learning Rate": 4.423151465135128e-05, "Pretrain/Loss": 2.04819917678833, "Pretrain/Loss (Raw)": 1.9319193363189697, "Pretrain/Step": 2327, "Pretrain/Step Time": 9.257545026019216} +{"Pretrain/Learning Rate": 4.422608906399331e-05, "Pretrain/Loss": 2.048649549484253, "Pretrain/Loss (Raw)": 2.088169574737549, "Pretrain/Step": 2328, "Pretrain/Step Time": 9.248813580721617} +{"Pretrain/Learning Rate": 4.4220661259392146e-05, "Pretrain/Loss": 2.0491561889648438, "Pretrain/Loss (Raw)": 2.1662404537200928, "Pretrain/Step": 2329, "Pretrain/Step Time": 9.266084674745798} +{"Pretrain/Learning Rate": 4.421523123817376e-05, "Pretrain/Loss": 2.0499777793884277, "Pretrain/Loss (Raw)": 2.0337588787078857, "Pretrain/Step": 2330, "Pretrain/Step Time": 9.26887713931501} +{"Pretrain/Learning Rate": 4.420979900096436e-05, "Pretrain/Loss": 2.0496153831481934, "Pretrain/Loss (Raw)": 1.9396578073501587, "Pretrain/Step": 2331, "Pretrain/Step Time": 9.264128571376204} +{"Pretrain/Learning Rate": 4.420436454839041e-05, "Pretrain/Loss": 2.0495553016662598, "Pretrain/Loss (Raw)": 2.0162582397460938, "Pretrain/Step": 2332, "Pretrain/Step Time": 9.275430340319872} +{"Pretrain/Learning Rate": 4.419892788107865e-05, "Pretrain/Loss": 2.0494608879089355, "Pretrain/Loss (Raw)": 1.9664007425308228, "Pretrain/Step": 2333, "Pretrain/Step Time": 9.273309426382184} +{"Pretrain/Learning Rate": 4.419348899965608e-05, "Pretrain/Loss": 2.046989679336548, "Pretrain/Loss (Raw)": 1.5744398832321167, "Pretrain/Step": 2334, "Pretrain/Step Time": 9.279642755165696} +{"Pretrain/Learning Rate": 4.4188047904749894e-05, "Pretrain/Loss": 2.045295238494873, "Pretrain/Loss (Raw)": 2.1159403324127197, "Pretrain/Step": 2335, "Pretrain/Step Time": 9.337576910853386} +{"Pretrain/Learning Rate": 4.418260459698761e-05, "Pretrain/Loss": 2.0457897186279297, "Pretrain/Loss (Raw)": 2.1145219802856445, "Pretrain/Step": 2336, "Pretrain/Step Time": 9.34147135540843} +{"Pretrain/Learning Rate": 4.417715907699698e-05, "Pretrain/Loss": 2.0450096130371094, "Pretrain/Loss (Raw)": 2.0280838012695312, "Pretrain/Step": 2337, "Pretrain/Step Time": 9.345304226502776} +{"Pretrain/Learning Rate": 4.417171134540599e-05, "Pretrain/Loss": 2.0455570220947266, "Pretrain/Loss (Raw)": 2.255777359008789, "Pretrain/Step": 2338, "Pretrain/Step Time": 9.333036912605166} +{"Pretrain/Learning Rate": 4.416626140284291e-05, "Pretrain/Loss": 2.047593593597412, "Pretrain/Loss (Raw)": 2.1521918773651123, "Pretrain/Step": 2339, "Pretrain/Step Time": 9.339023185893893} +{"Pretrain/Learning Rate": 4.416080924993625e-05, "Pretrain/Loss": 2.0478460788726807, "Pretrain/Loss (Raw)": 2.1149024963378906, "Pretrain/Step": 2340, "Pretrain/Step Time": 9.337017668411136} +{"Pretrain/Learning Rate": 4.415535488731478e-05, "Pretrain/Loss": 2.050579309463501, "Pretrain/Loss (Raw)": 2.195755958557129, "Pretrain/Step": 2341, "Pretrain/Step Time": 9.339839747175574} +{"Pretrain/Learning Rate": 4.414989831560753e-05, "Pretrain/Loss": 2.050989866256714, "Pretrain/Loss (Raw)": 2.1922178268432617, "Pretrain/Step": 2342, "Pretrain/Step Time": 9.337537614628673} +{"Pretrain/Learning Rate": 4.4144439535443763e-05, "Pretrain/Loss": 2.0510659217834473, "Pretrain/Loss (Raw)": 2.0281589031219482, "Pretrain/Step": 2343, "Pretrain/Step Time": 9.336278762668371} +{"Pretrain/Learning Rate": 4.413897854745301e-05, "Pretrain/Loss": 2.051741123199463, "Pretrain/Loss (Raw)": 2.0907552242279053, "Pretrain/Step": 2344, "Pretrain/Step Time": 9.345111947506666} +{"Pretrain/Learning Rate": 4.413351535226507e-05, "Pretrain/Loss": 2.0518898963928223, "Pretrain/Loss (Raw)": 2.0659449100494385, "Pretrain/Step": 2345, "Pretrain/Step Time": 9.343864409253001} +{"Pretrain/Learning Rate": 4.4128049950509984e-05, "Pretrain/Loss": 2.0531527996063232, "Pretrain/Loss (Raw)": 2.0996880531311035, "Pretrain/Step": 2346, "Pretrain/Step Time": 9.344477400183678} +{"Pretrain/Learning Rate": 4.412258234281804e-05, "Pretrain/Loss": 2.0543339252471924, "Pretrain/Loss (Raw)": 2.133572816848755, "Pretrain/Step": 2347, "Pretrain/Step Time": 9.345778746530414} +{"Pretrain/Learning Rate": 4.411711252981979e-05, "Pretrain/Loss": 2.0527186393737793, "Pretrain/Loss (Raw)": 1.9058183431625366, "Pretrain/Step": 2348, "Pretrain/Step Time": 9.382624432444572} +{"Pretrain/Learning Rate": 4.411164051214603e-05, "Pretrain/Loss": 2.0519659519195557, "Pretrain/Loss (Raw)": 2.025130271911621, "Pretrain/Step": 2349, "Pretrain/Step Time": 9.384305521845818} +{"Pretrain/Learning Rate": 4.4106166290427846e-05, "Pretrain/Loss": 2.0524063110351562, "Pretrain/Loss (Raw)": 2.1113128662109375, "Pretrain/Step": 2350, "Pretrain/Step Time": 9.378506617620587} +{"Pretrain/Learning Rate": 4.410068986529653e-05, "Pretrain/Loss": 2.0518264770507812, "Pretrain/Loss (Raw)": 2.0060439109802246, "Pretrain/Step": 2351, "Pretrain/Step Time": 9.37994952686131} +{"Pretrain/Learning Rate": 4.409521123738365e-05, "Pretrain/Loss": 2.052420139312744, "Pretrain/Loss (Raw)": 2.062143564224243, "Pretrain/Step": 2352, "Pretrain/Step Time": 9.415971837937832} +{"Pretrain/Learning Rate": 4.4089730407321035e-05, "Pretrain/Loss": 2.053395986557007, "Pretrain/Loss (Raw)": 2.177960157394409, "Pretrain/Step": 2353, "Pretrain/Step Time": 9.417090840637684} +{"Pretrain/Learning Rate": 4.408424737574075e-05, "Pretrain/Loss": 2.0546929836273193, "Pretrain/Loss (Raw)": 2.0497357845306396, "Pretrain/Step": 2354, "Pretrain/Step Time": 9.410547226667404} +{"Pretrain/Learning Rate": 4.407876214327513e-05, "Pretrain/Loss": 2.053333282470703, "Pretrain/Loss (Raw)": 1.9734989404678345, "Pretrain/Step": 2355, "Pretrain/Step Time": 9.416504096239805} +{"Pretrain/Learning Rate": 4.407327471055677e-05, "Pretrain/Loss": 2.052833318710327, "Pretrain/Loss (Raw)": 1.8696726560592651, "Pretrain/Step": 2356, "Pretrain/Step Time": 9.417099334299564} +{"Pretrain/Learning Rate": 4.406778507821848e-05, "Pretrain/Loss": 2.05112886428833, "Pretrain/Loss (Raw)": 1.9143091440200806, "Pretrain/Step": 2357, "Pretrain/Step Time": 9.41896870546043} +{"Pretrain/Learning Rate": 4.4062293246893374e-05, "Pretrain/Loss": 2.050504446029663, "Pretrain/Loss (Raw)": 1.9195282459259033, "Pretrain/Step": 2358, "Pretrain/Step Time": 9.419086156412959} +{"Pretrain/Learning Rate": 4.4056799217214774e-05, "Pretrain/Loss": 2.050889015197754, "Pretrain/Loss (Raw)": 2.047755718231201, "Pretrain/Step": 2359, "Pretrain/Step Time": 9.423725621774793} +{"Pretrain/Learning Rate": 4.4051302989816304e-05, "Pretrain/Loss": 2.05242919921875, "Pretrain/Loss (Raw)": 2.244199275970459, "Pretrain/Step": 2360, "Pretrain/Step Time": 9.420682359486818} +{"Pretrain/Learning Rate": 4.404580456533179e-05, "Pretrain/Loss": 2.0508480072021484, "Pretrain/Loss (Raw)": 2.0564048290252686, "Pretrain/Step": 2361, "Pretrain/Step Time": 9.42351501621306} +{"Pretrain/Learning Rate": 4.404030394439535e-05, "Pretrain/Loss": 2.051271438598633, "Pretrain/Loss (Raw)": 2.107386827468872, "Pretrain/Step": 2362, "Pretrain/Step Time": 9.420622747391462} +{"Pretrain/Learning Rate": 4.4034801127641336e-05, "Pretrain/Loss": 2.0501856803894043, "Pretrain/Loss (Raw)": 1.9971426725387573, "Pretrain/Step": 2363, "Pretrain/Step Time": 9.419195340946317} +{"Pretrain/Learning Rate": 4.4029296115704366e-05, "Pretrain/Loss": 2.049304246902466, "Pretrain/Loss (Raw)": 2.0028491020202637, "Pretrain/Step": 2364, "Pretrain/Step Time": 9.428852932527661} +{"Pretrain/Learning Rate": 4.40237889092193e-05, "Pretrain/Loss": 2.0447793006896973, "Pretrain/Loss (Raw)": 1.7690668106079102, "Pretrain/Step": 2365, "Pretrain/Step Time": 9.435485754162073} +{"Pretrain/Learning Rate": 4.401827950882125e-05, "Pretrain/Loss": 2.0458180904388428, "Pretrain/Loss (Raw)": 2.2622673511505127, "Pretrain/Step": 2366, "Pretrain/Step Time": 9.47009076923132} +{"Pretrain/Learning Rate": 4.4012767915145594e-05, "Pretrain/Loss": 2.044769048690796, "Pretrain/Loss (Raw)": 1.9506926536560059, "Pretrain/Step": 2367, "Pretrain/Step Time": 9.480656722560525} +{"Pretrain/Learning Rate": 4.400725412882794e-05, "Pretrain/Loss": 2.0450711250305176, "Pretrain/Loss (Raw)": 2.1952340602874756, "Pretrain/Step": 2368, "Pretrain/Step Time": 9.460276985540986} +{"Pretrain/Learning Rate": 4.400173815050418e-05, "Pretrain/Loss": 2.0450637340545654, "Pretrain/Loss (Raw)": 2.084146499633789, "Pretrain/Step": 2369, "Pretrain/Step Time": 9.459531912580132} +{"Pretrain/Learning Rate": 4.399621998081045e-05, "Pretrain/Loss": 2.0407187938690186, "Pretrain/Loss (Raw)": 1.4516738653182983, "Pretrain/Step": 2370, "Pretrain/Step Time": 9.485913021489978} +{"Pretrain/Learning Rate": 4.39906996203831e-05, "Pretrain/Loss": 2.0401923656463623, "Pretrain/Loss (Raw)": 2.144041061401367, "Pretrain/Step": 2371, "Pretrain/Step Time": 9.47947234287858} +{"Pretrain/Learning Rate": 4.398517706985879e-05, "Pretrain/Loss": 2.0386343002319336, "Pretrain/Loss (Raw)": 2.065004587173462, "Pretrain/Step": 2372, "Pretrain/Step Time": 9.518298596143723} +{"Pretrain/Learning Rate": 4.39796523298744e-05, "Pretrain/Loss": 2.039522171020508, "Pretrain/Loss (Raw)": 2.282492160797119, "Pretrain/Step": 2373, "Pretrain/Step Time": 9.518606347963214} +{"Pretrain/Learning Rate": 4.397412540106707e-05, "Pretrain/Loss": 2.039905071258545, "Pretrain/Loss (Raw)": 2.1000235080718994, "Pretrain/Step": 2374, "Pretrain/Step Time": 9.521249519661069} +{"Pretrain/Learning Rate": 4.396859628407418e-05, "Pretrain/Loss": 2.038616180419922, "Pretrain/Loss (Raw)": 2.041361093521118, "Pretrain/Step": 2375, "Pretrain/Step Time": 9.516532024368644} +{"Pretrain/Learning Rate": 4.39630649795334e-05, "Pretrain/Loss": 2.0401692390441895, "Pretrain/Loss (Raw)": 2.0792055130004883, "Pretrain/Step": 2376, "Pretrain/Step Time": 9.561295816674829} +{"Pretrain/Learning Rate": 4.3957531488082595e-05, "Pretrain/Loss": 2.040557384490967, "Pretrain/Loss (Raw)": 2.1344263553619385, "Pretrain/Step": 2377, "Pretrain/Step Time": 9.553214741870761} +{"Pretrain/Learning Rate": 4.395199581035994e-05, "Pretrain/Loss": 2.0415596961975098, "Pretrain/Loss (Raw)": 1.9980438947677612, "Pretrain/Step": 2378, "Pretrain/Step Time": 9.551307396963239} +{"Pretrain/Learning Rate": 4.3946457947003813e-05, "Pretrain/Loss": 2.0425682067871094, "Pretrain/Loss (Raw)": 2.0995264053344727, "Pretrain/Step": 2379, "Pretrain/Step Time": 9.549205720424652} +{"Pretrain/Learning Rate": 4.394091789865288e-05, "Pretrain/Loss": 2.0424728393554688, "Pretrain/Loss (Raw)": 2.1380138397216797, "Pretrain/Step": 2380, "Pretrain/Step Time": 9.560507839545608} +{"Pretrain/Learning Rate": 4.393537566594605e-05, "Pretrain/Loss": 2.042515277862549, "Pretrain/Loss (Raw)": 2.0703065395355225, "Pretrain/Step": 2381, "Pretrain/Step Time": 9.559435004368424} +{"Pretrain/Learning Rate": 4.392983124952246e-05, "Pretrain/Loss": 2.045944929122925, "Pretrain/Loss (Raw)": 2.660278081893921, "Pretrain/Step": 2382, "Pretrain/Step Time": 9.561389617621899} +{"Pretrain/Learning Rate": 4.392428465002154e-05, "Pretrain/Loss": 2.0482017993927, "Pretrain/Loss (Raw)": 2.039839267730713, "Pretrain/Step": 2383, "Pretrain/Step Time": 9.569612178951502} +{"Pretrain/Learning Rate": 4.391873586808294e-05, "Pretrain/Loss": 2.0483736991882324, "Pretrain/Loss (Raw)": 2.0938594341278076, "Pretrain/Step": 2384, "Pretrain/Step Time": 9.574933752417564} +{"Pretrain/Learning Rate": 4.391318490434656e-05, "Pretrain/Loss": 2.0463366508483887, "Pretrain/Loss (Raw)": 2.057534694671631, "Pretrain/Step": 2385, "Pretrain/Step Time": 9.584655312821269} +{"Pretrain/Learning Rate": 4.3907631759452584e-05, "Pretrain/Loss": 2.047537326812744, "Pretrain/Loss (Raw)": 2.1188442707061768, "Pretrain/Step": 2386, "Pretrain/Step Time": 9.588026728481054} +{"Pretrain/Learning Rate": 4.3902076434041416e-05, "Pretrain/Loss": 2.0466833114624023, "Pretrain/Loss (Raw)": 2.041491746902466, "Pretrain/Step": 2387, "Pretrain/Step Time": 9.579661585390568} +{"Pretrain/Learning Rate": 4.389651892875373e-05, "Pretrain/Loss": 2.0475010871887207, "Pretrain/Loss (Raw)": 2.099065065383911, "Pretrain/Step": 2388, "Pretrain/Step Time": 9.57168298959732} +{"Pretrain/Learning Rate": 4.389095924423043e-05, "Pretrain/Loss": 2.0494494438171387, "Pretrain/Loss (Raw)": 2.166781425476074, "Pretrain/Step": 2389, "Pretrain/Step Time": 9.566998528316617} +{"Pretrain/Learning Rate": 4.388539738111269e-05, "Pretrain/Loss": 2.045853614807129, "Pretrain/Loss (Raw)": 1.5627994537353516, "Pretrain/Step": 2390, "Pretrain/Step Time": 9.563419042155147} +{"Pretrain/Learning Rate": 4.387983334004194e-05, "Pretrain/Loss": 2.0450925827026367, "Pretrain/Loss (Raw)": 2.0071282386779785, "Pretrain/Step": 2391, "Pretrain/Step Time": 9.567915542051196} +{"Pretrain/Learning Rate": 4.387426712165984e-05, "Pretrain/Loss": 2.046753406524658, "Pretrain/Loss (Raw)": 2.1705398559570312, "Pretrain/Step": 2392, "Pretrain/Step Time": 9.563343351706862} +{"Pretrain/Learning Rate": 4.3868698726608325e-05, "Pretrain/Loss": 2.045957565307617, "Pretrain/Loss (Raw)": 2.1039342880249023, "Pretrain/Step": 2393, "Pretrain/Step Time": 9.578530775383115} +{"Pretrain/Learning Rate": 4.3863128155529554e-05, "Pretrain/Loss": 2.0441410541534424, "Pretrain/Loss (Raw)": 2.024470806121826, "Pretrain/Step": 2394, "Pretrain/Step Time": 9.585107458755374} +{"Pretrain/Learning Rate": 4.385755540906595e-05, "Pretrain/Loss": 2.045787811279297, "Pretrain/Loss (Raw)": 2.1870155334472656, "Pretrain/Step": 2395, "Pretrain/Step Time": 9.580863090232015} +{"Pretrain/Learning Rate": 4.385198048786021e-05, "Pretrain/Loss": 2.0450334548950195, "Pretrain/Loss (Raw)": 2.0854642391204834, "Pretrain/Step": 2396, "Pretrain/Step Time": 9.577656487002969} +{"Pretrain/Learning Rate": 4.384640339255525e-05, "Pretrain/Loss": 2.046651601791382, "Pretrain/Loss (Raw)": 2.0214219093322754, "Pretrain/Step": 2397, "Pretrain/Step Time": 9.60203880444169} +{"Pretrain/Learning Rate": 4.384082412379423e-05, "Pretrain/Loss": 2.0486981868743896, "Pretrain/Loss (Raw)": 2.259218215942383, "Pretrain/Step": 2398, "Pretrain/Step Time": 9.598342064768076} +{"Pretrain/Learning Rate": 4.38352426822206e-05, "Pretrain/Loss": 2.048388957977295, "Pretrain/Loss (Raw)": 2.09694766998291, "Pretrain/Step": 2399, "Pretrain/Step Time": 9.594392318278551} +{"Pretrain/Learning Rate": 4.3829659068478026e-05, "Pretrain/Loss": 2.047856569290161, "Pretrain/Loss (Raw)": 1.9407657384872437, "Pretrain/Step": 2400, "Pretrain/Step Time": 9.59059034846723} +{"Pretrain/Learning Rate": 4.3824073283210445e-05, "Pretrain/Loss": 2.0497219562530518, "Pretrain/Loss (Raw)": 2.134965181350708, "Pretrain/Step": 2401, "Pretrain/Step Time": 9.612545751035213} +{"Pretrain/Learning Rate": 4.381848532706202e-05, "Pretrain/Loss": 2.047635555267334, "Pretrain/Loss (Raw)": 1.8067222833633423, "Pretrain/Step": 2402, "Pretrain/Step Time": 9.57742327824235} +{"Pretrain/Learning Rate": 4.38128952006772e-05, "Pretrain/Loss": 2.048003673553467, "Pretrain/Loss (Raw)": 2.269395351409912, "Pretrain/Step": 2403, "Pretrain/Step Time": 9.565699975937605} +{"Pretrain/Learning Rate": 4.380730290470065e-05, "Pretrain/Loss": 2.0470471382141113, "Pretrain/Loss (Raw)": 2.0833280086517334, "Pretrain/Step": 2404, "Pretrain/Step Time": 9.566322483122349} +{"Pretrain/Learning Rate": 4.380170843977731e-05, "Pretrain/Loss": 2.0486056804656982, "Pretrain/Loss (Raw)": 2.0804450511932373, "Pretrain/Step": 2405, "Pretrain/Step Time": 9.54572462849319} +{"Pretrain/Learning Rate": 4.3796111806552364e-05, "Pretrain/Loss": 2.0492594242095947, "Pretrain/Loss (Raw)": 2.1143500804901123, "Pretrain/Step": 2406, "Pretrain/Step Time": 9.547330284491181} +{"Pretrain/Learning Rate": 4.379051300567123e-05, "Pretrain/Loss": 2.051438808441162, "Pretrain/Loss (Raw)": 1.9600653648376465, "Pretrain/Step": 2407, "Pretrain/Step Time": 9.553370716050267} +{"Pretrain/Learning Rate": 4.378491203777958e-05, "Pretrain/Loss": 2.051725387573242, "Pretrain/Loss (Raw)": 2.138547420501709, "Pretrain/Step": 2408, "Pretrain/Step Time": 9.555008416995406} +{"Pretrain/Learning Rate": 4.377930890352337e-05, "Pretrain/Loss": 2.0549278259277344, "Pretrain/Loss (Raw)": 2.190744161605835, "Pretrain/Step": 2409, "Pretrain/Step Time": 9.496030708774924} +{"Pretrain/Learning Rate": 4.3773703603548765e-05, "Pretrain/Loss": 2.0564076900482178, "Pretrain/Loss (Raw)": 2.1717958450317383, "Pretrain/Step": 2410, "Pretrain/Step Time": 9.492509234696627} +{"Pretrain/Learning Rate": 4.3768096138502194e-05, "Pretrain/Loss": 2.0601296424865723, "Pretrain/Loss (Raw)": 2.0384674072265625, "Pretrain/Step": 2411, "Pretrain/Step Time": 9.479158245027065} +{"Pretrain/Learning Rate": 4.376248650903033e-05, "Pretrain/Loss": 2.060443878173828, "Pretrain/Loss (Raw)": 2.2027928829193115, "Pretrain/Step": 2412, "Pretrain/Step Time": 9.473249839618802} +{"Pretrain/Learning Rate": 4.375687471578011e-05, "Pretrain/Loss": 2.061713218688965, "Pretrain/Loss (Raw)": 2.115854501724243, "Pretrain/Step": 2413, "Pretrain/Step Time": 9.451260266825557} +{"Pretrain/Learning Rate": 4.375126075939873e-05, "Pretrain/Loss": 2.060473918914795, "Pretrain/Loss (Raw)": 2.056797504425049, "Pretrain/Step": 2414, "Pretrain/Step Time": 9.461319221183658} +{"Pretrain/Learning Rate": 4.374564464053359e-05, "Pretrain/Loss": 2.0597705841064453, "Pretrain/Loss (Raw)": 2.1020524501800537, "Pretrain/Step": 2415, "Pretrain/Step Time": 9.458903761580586} +{"Pretrain/Learning Rate": 4.374002635983238e-05, "Pretrain/Loss": 2.059398889541626, "Pretrain/Loss (Raw)": 2.0062882900238037, "Pretrain/Step": 2416, "Pretrain/Step Time": 9.458881733939052} +{"Pretrain/Learning Rate": 4.373440591794301e-05, "Pretrain/Loss": 2.0575406551361084, "Pretrain/Loss (Raw)": 1.9138870239257812, "Pretrain/Step": 2417, "Pretrain/Step Time": 9.45852392166853} +{"Pretrain/Learning Rate": 4.372878331551369e-05, "Pretrain/Loss": 2.05816650390625, "Pretrain/Loss (Raw)": 2.1327338218688965, "Pretrain/Step": 2418, "Pretrain/Step Time": 9.460416441783309} +{"Pretrain/Learning Rate": 4.3723158553192813e-05, "Pretrain/Loss": 2.0590662956237793, "Pretrain/Loss (Raw)": 2.2029454708099365, "Pretrain/Step": 2419, "Pretrain/Step Time": 9.460249479860067} +{"Pretrain/Learning Rate": 4.3717531631629075e-05, "Pretrain/Loss": 2.059290885925293, "Pretrain/Loss (Raw)": 1.9822884798049927, "Pretrain/Step": 2420, "Pretrain/Step Time": 9.510455537587404} +{"Pretrain/Learning Rate": 4.371190255147138e-05, "Pretrain/Loss": 2.0593156814575195, "Pretrain/Loss (Raw)": 1.9338221549987793, "Pretrain/Step": 2421, "Pretrain/Step Time": 9.50933775678277} +{"Pretrain/Learning Rate": 4.370627131336891e-05, "Pretrain/Loss": 2.0621047019958496, "Pretrain/Loss (Raw)": 2.4876344203948975, "Pretrain/Step": 2422, "Pretrain/Step Time": 9.507308267056942} +{"Pretrain/Learning Rate": 4.370063791797109e-05, "Pretrain/Loss": 2.0620737075805664, "Pretrain/Loss (Raw)": 2.0827980041503906, "Pretrain/Step": 2423, "Pretrain/Step Time": 9.53423592634499} +{"Pretrain/Learning Rate": 4.3695002365927584e-05, "Pretrain/Loss": 2.0661673545837402, "Pretrain/Loss (Raw)": 2.2786154747009277, "Pretrain/Step": 2424, "Pretrain/Step Time": 9.527075001969934} +{"Pretrain/Learning Rate": 4.368936465788831e-05, "Pretrain/Loss": 2.066443920135498, "Pretrain/Loss (Raw)": 1.9872435331344604, "Pretrain/Step": 2425, "Pretrain/Step Time": 9.492783449590206} +{"Pretrain/Learning Rate": 4.3683724794503436e-05, "Pretrain/Loss": 2.0640504360198975, "Pretrain/Loss (Raw)": 1.9598575830459595, "Pretrain/Step": 2426, "Pretrain/Step Time": 9.489702723920345} +{"Pretrain/Learning Rate": 4.367808277642338e-05, "Pretrain/Loss": 2.066166400909424, "Pretrain/Loss (Raw)": 2.2658329010009766, "Pretrain/Step": 2427, "Pretrain/Step Time": 9.48659087345004} +{"Pretrain/Learning Rate": 4.3672438604298806e-05, "Pretrain/Loss": 2.066960096359253, "Pretrain/Loss (Raw)": 2.1245272159576416, "Pretrain/Step": 2428, "Pretrain/Step Time": 9.489557823166251} +{"Pretrain/Learning Rate": 4.3666792278780625e-05, "Pretrain/Loss": 2.066453695297241, "Pretrain/Loss (Raw)": 2.071597099304199, "Pretrain/Step": 2429, "Pretrain/Step Time": 9.487141462042928} +{"Pretrain/Learning Rate": 4.366114380051999e-05, "Pretrain/Loss": 2.0646073818206787, "Pretrain/Loss (Raw)": 1.8510396480560303, "Pretrain/Step": 2430, "Pretrain/Step Time": 9.488236878067255} +{"Pretrain/Learning Rate": 4.365549317016832e-05, "Pretrain/Loss": 2.0639092922210693, "Pretrain/Loss (Raw)": 2.1054911613464355, "Pretrain/Step": 2431, "Pretrain/Step Time": 9.483721954748034} +{"Pretrain/Learning Rate": 4.364984038837727e-05, "Pretrain/Loss": 2.0660576820373535, "Pretrain/Loss (Raw)": 2.28487491607666, "Pretrain/Step": 2432, "Pretrain/Step Time": 9.484456479549408} +{"Pretrain/Learning Rate": 4.364418545579875e-05, "Pretrain/Loss": 2.0675055980682373, "Pretrain/Loss (Raw)": 1.890106439590454, "Pretrain/Step": 2433, "Pretrain/Step Time": 9.538222182542086} +{"Pretrain/Learning Rate": 4.363852837308491e-05, "Pretrain/Loss": 2.068105697631836, "Pretrain/Loss (Raw)": 2.2161989212036133, "Pretrain/Step": 2434, "Pretrain/Step Time": 9.537572525441647} +{"Pretrain/Learning Rate": 4.3632869140888144e-05, "Pretrain/Loss": 2.069660186767578, "Pretrain/Loss (Raw)": 2.042886257171631, "Pretrain/Step": 2435, "Pretrain/Step Time": 9.551787707954645} +{"Pretrain/Learning Rate": 4.362720775986111e-05, "Pretrain/Loss": 2.068455696105957, "Pretrain/Loss (Raw)": 2.0362095832824707, "Pretrain/Step": 2436, "Pretrain/Step Time": 9.558431534096599} +{"Pretrain/Learning Rate": 4.362154423065671e-05, "Pretrain/Loss": 2.0674076080322266, "Pretrain/Loss (Raw)": 2.033163547515869, "Pretrain/Step": 2437, "Pretrain/Step Time": 9.559402663260698} +{"Pretrain/Learning Rate": 4.361587855392807e-05, "Pretrain/Loss": 2.0642242431640625, "Pretrain/Loss (Raw)": 1.8360657691955566, "Pretrain/Step": 2438, "Pretrain/Step Time": 9.541357524693012} +{"Pretrain/Learning Rate": 4.3610210730328604e-05, "Pretrain/Loss": 2.06441593170166, "Pretrain/Loss (Raw)": 2.0602428913116455, "Pretrain/Step": 2439, "Pretrain/Step Time": 9.547097770497203} +{"Pretrain/Learning Rate": 4.3604540760511935e-05, "Pretrain/Loss": 2.0623698234558105, "Pretrain/Loss (Raw)": 1.9514261484146118, "Pretrain/Step": 2440, "Pretrain/Step Time": 9.521313447505236} +{"Pretrain/Learning Rate": 4.3598868645131964e-05, "Pretrain/Loss": 2.062256097793579, "Pretrain/Loss (Raw)": 2.0426976680755615, "Pretrain/Step": 2441, "Pretrain/Step Time": 9.530025992542505} +{"Pretrain/Learning Rate": 4.359319438484282e-05, "Pretrain/Loss": 2.0613760948181152, "Pretrain/Loss (Raw)": 1.7895405292510986, "Pretrain/Step": 2442, "Pretrain/Step Time": 9.525187583640218} +{"Pretrain/Learning Rate": 4.358751798029887e-05, "Pretrain/Loss": 2.0614542961120605, "Pretrain/Loss (Raw)": 2.159346103668213, "Pretrain/Step": 2443, "Pretrain/Step Time": 9.525022326037288} +{"Pretrain/Learning Rate": 4.358183943215478e-05, "Pretrain/Loss": 2.0632314682006836, "Pretrain/Loss (Raw)": 2.268312454223633, "Pretrain/Step": 2444, "Pretrain/Step Time": 9.525178527459502} +{"Pretrain/Learning Rate": 4.3576158741065395e-05, "Pretrain/Loss": 2.0631215572357178, "Pretrain/Loss (Raw)": 2.0961239337921143, "Pretrain/Step": 2445, "Pretrain/Step Time": 9.517165888100863} +{"Pretrain/Learning Rate": 4.357047590768586e-05, "Pretrain/Loss": 2.063441514968872, "Pretrain/Loss (Raw)": 2.0882506370544434, "Pretrain/Step": 2446, "Pretrain/Step Time": 9.520804438740015} +{"Pretrain/Learning Rate": 4.356479093267153e-05, "Pretrain/Loss": 2.0681869983673096, "Pretrain/Loss (Raw)": 2.4506044387817383, "Pretrain/Step": 2447, "Pretrain/Step Time": 9.486670717597008} +{"Pretrain/Learning Rate": 4.355910381667803e-05, "Pretrain/Loss": 2.0683727264404297, "Pretrain/Loss (Raw)": 2.067598581314087, "Pretrain/Step": 2448, "Pretrain/Step Time": 9.48187356442213} +{"Pretrain/Learning Rate": 4.355341456036122e-05, "Pretrain/Loss": 2.0682549476623535, "Pretrain/Loss (Raw)": 1.9868416786193848, "Pretrain/Step": 2449, "Pretrain/Step Time": 9.521621160209179} +{"Pretrain/Learning Rate": 4.354772316437722e-05, "Pretrain/Loss": 2.0691399574279785, "Pretrain/Loss (Raw)": 2.1857266426086426, "Pretrain/Step": 2450, "Pretrain/Step Time": 9.525704303756356} +{"Pretrain/Learning Rate": 4.354202962938239e-05, "Pretrain/Loss": 2.068845748901367, "Pretrain/Loss (Raw)": 1.9541125297546387, "Pretrain/Step": 2451, "Pretrain/Step Time": 9.527632139623165} +{"Pretrain/Learning Rate": 4.353633395603332e-05, "Pretrain/Loss": 2.068763256072998, "Pretrain/Loss (Raw)": 2.140960454940796, "Pretrain/Step": 2452, "Pretrain/Step Time": 9.544258445501328} +{"Pretrain/Learning Rate": 4.353063614498688e-05, "Pretrain/Loss": 2.068723201751709, "Pretrain/Loss (Raw)": 2.0686044692993164, "Pretrain/Step": 2453, "Pretrain/Step Time": 9.541985174641013} +{"Pretrain/Learning Rate": 4.352493619690016e-05, "Pretrain/Loss": 2.0709214210510254, "Pretrain/Loss (Raw)": 2.196937084197998, "Pretrain/Step": 2454, "Pretrain/Step Time": 9.588601553812623} +{"Pretrain/Learning Rate": 4.351923411243049e-05, "Pretrain/Loss": 2.0713284015655518, "Pretrain/Loss (Raw)": 1.9840360879898071, "Pretrain/Step": 2455, "Pretrain/Step Time": 9.547302454710007} +{"Pretrain/Learning Rate": 4.35135298922355e-05, "Pretrain/Loss": 2.070215940475464, "Pretrain/Loss (Raw)": 1.9457716941833496, "Pretrain/Step": 2456, "Pretrain/Step Time": 9.547603012993932} +{"Pretrain/Learning Rate": 4.350782353697299e-05, "Pretrain/Loss": 2.0702309608459473, "Pretrain/Loss (Raw)": 2.1681625843048096, "Pretrain/Step": 2457, "Pretrain/Step Time": 9.532207164913416} +{"Pretrain/Learning Rate": 4.350211504730106e-05, "Pretrain/Loss": 2.067959785461426, "Pretrain/Loss (Raw)": 1.7430378198623657, "Pretrain/Step": 2458, "Pretrain/Step Time": 9.53038146533072} +{"Pretrain/Learning Rate": 4.3496404423878045e-05, "Pretrain/Loss": 2.0693907737731934, "Pretrain/Loss (Raw)": 2.1228199005126953, "Pretrain/Step": 2459, "Pretrain/Step Time": 9.565625116229057} +{"Pretrain/Learning Rate": 4.349069166736251e-05, "Pretrain/Loss": 2.0706515312194824, "Pretrain/Loss (Raw)": 2.1776676177978516, "Pretrain/Step": 2460, "Pretrain/Step Time": 9.547832518815994} +{"Pretrain/Learning Rate": 4.348497677841328e-05, "Pretrain/Loss": 2.071256160736084, "Pretrain/Loss (Raw)": 2.0437815189361572, "Pretrain/Step": 2461, "Pretrain/Step Time": 9.551874926313758} +{"Pretrain/Learning Rate": 4.3479259757689427e-05, "Pretrain/Loss": 2.075479507446289, "Pretrain/Loss (Raw)": 2.11501145362854, "Pretrain/Step": 2462, "Pretrain/Step Time": 9.543845979496837} +{"Pretrain/Learning Rate": 4.347354060585026e-05, "Pretrain/Loss": 2.0747175216674805, "Pretrain/Loss (Raw)": 2.0184435844421387, "Pretrain/Step": 2463, "Pretrain/Step Time": 9.492204908281565} +{"Pretrain/Learning Rate": 4.346781932355533e-05, "Pretrain/Loss": 2.0731842517852783, "Pretrain/Loss (Raw)": 1.9182279109954834, "Pretrain/Step": 2464, "Pretrain/Step Time": 9.488502824679017} +{"Pretrain/Learning Rate": 4.3462095911464465e-05, "Pretrain/Loss": 2.0730018615722656, "Pretrain/Loss (Raw)": 2.00476336479187, "Pretrain/Step": 2465, "Pretrain/Step Time": 9.485019588842988} +{"Pretrain/Learning Rate": 4.34563703702377e-05, "Pretrain/Loss": 2.073176383972168, "Pretrain/Loss (Raw)": 2.278125524520874, "Pretrain/Step": 2466, "Pretrain/Step Time": 9.512782158330083} +{"Pretrain/Learning Rate": 4.3450642700535335e-05, "Pretrain/Loss": 2.0734567642211914, "Pretrain/Loss (Raw)": 2.1880593299865723, "Pretrain/Step": 2467, "Pretrain/Step Time": 9.517789877951145} +{"Pretrain/Learning Rate": 4.344491290301791e-05, "Pretrain/Loss": 2.072955369949341, "Pretrain/Loss (Raw)": 2.050706148147583, "Pretrain/Step": 2468, "Pretrain/Step Time": 9.54065783508122} +{"Pretrain/Learning Rate": 4.3439180978346216e-05, "Pretrain/Loss": 2.072805404663086, "Pretrain/Loss (Raw)": 2.176581621170044, "Pretrain/Step": 2469, "Pretrain/Step Time": 9.545597838237882} +{"Pretrain/Learning Rate": 4.3433446927181274e-05, "Pretrain/Loss": 2.073929786682129, "Pretrain/Loss (Raw)": 2.3361191749572754, "Pretrain/Step": 2470, "Pretrain/Step Time": 9.599376302212477} +{"Pretrain/Learning Rate": 4.342771075018438e-05, "Pretrain/Loss": 2.073805093765259, "Pretrain/Loss (Raw)": 2.0122220516204834, "Pretrain/Step": 2471, "Pretrain/Step Time": 9.595092670992017} +{"Pretrain/Learning Rate": 4.342197244801705e-05, "Pretrain/Loss": 2.074253559112549, "Pretrain/Loss (Raw)": 2.148155689239502, "Pretrain/Step": 2472, "Pretrain/Step Time": 9.58459853939712} +{"Pretrain/Learning Rate": 4.341623202134105e-05, "Pretrain/Loss": 2.0729432106018066, "Pretrain/Loss (Raw)": 1.8982192277908325, "Pretrain/Step": 2473, "Pretrain/Step Time": 9.588115449994802} +{"Pretrain/Learning Rate": 4.341048947081839e-05, "Pretrain/Loss": 2.073484420776367, "Pretrain/Loss (Raw)": 2.1689512729644775, "Pretrain/Step": 2474, "Pretrain/Step Time": 9.591631464660168} +{"Pretrain/Learning Rate": 4.340474479711133e-05, "Pretrain/Loss": 2.071730613708496, "Pretrain/Loss (Raw)": 1.909082293510437, "Pretrain/Step": 2475, "Pretrain/Step Time": 9.583419049158692} +{"Pretrain/Learning Rate": 4.3398998000882375e-05, "Pretrain/Loss": 2.0733649730682373, "Pretrain/Loss (Raw)": 2.1150147914886475, "Pretrain/Step": 2476, "Pretrain/Step Time": 9.550130739808083} +{"Pretrain/Learning Rate": 4.339324908279427e-05, "Pretrain/Loss": 2.075584888458252, "Pretrain/Loss (Raw)": 2.3093061447143555, "Pretrain/Step": 2477, "Pretrain/Step Time": 9.547998003661633} +{"Pretrain/Learning Rate": 4.338749804351001e-05, "Pretrain/Loss": 2.0735421180725098, "Pretrain/Loss (Raw)": 1.849833369255066, "Pretrain/Step": 2478, "Pretrain/Step Time": 9.55546447634697} +{"Pretrain/Learning Rate": 4.338174488369283e-05, "Pretrain/Loss": 2.07421875, "Pretrain/Loss (Raw)": 2.092625856399536, "Pretrain/Step": 2479, "Pretrain/Step Time": 9.547327622771263} +{"Pretrain/Learning Rate": 4.337598960400622e-05, "Pretrain/Loss": 2.0746326446533203, "Pretrain/Loss (Raw)": 2.1151223182678223, "Pretrain/Step": 2480, "Pretrain/Step Time": 9.506507748737931} +{"Pretrain/Learning Rate": 4.337023220511389e-05, "Pretrain/Loss": 2.0724260807037354, "Pretrain/Loss (Raw)": 1.8955347537994385, "Pretrain/Step": 2481, "Pretrain/Step Time": 9.507618434727192} +{"Pretrain/Learning Rate": 4.336447268767982e-05, "Pretrain/Loss": 2.0740606784820557, "Pretrain/Loss (Raw)": 2.2589635848999023, "Pretrain/Step": 2482, "Pretrain/Step Time": 9.508992675691843} +{"Pretrain/Learning Rate": 4.3358711052368224e-05, "Pretrain/Loss": 2.0790343284606934, "Pretrain/Loss (Raw)": 2.6101269721984863, "Pretrain/Step": 2483, "Pretrain/Step Time": 9.504973093047738} +{"Pretrain/Learning Rate": 4.335294729984356e-05, "Pretrain/Loss": 2.08164644241333, "Pretrain/Loss (Raw)": 2.203997850418091, "Pretrain/Step": 2484, "Pretrain/Step Time": 9.504170959815383} +{"Pretrain/Learning Rate": 4.334718143077054e-05, "Pretrain/Loss": 2.081760883331299, "Pretrain/Loss (Raw)": 1.92899489402771, "Pretrain/Step": 2485, "Pretrain/Step Time": 9.507074054330587} +{"Pretrain/Learning Rate": 4.334141344581408e-05, "Pretrain/Loss": 2.080643892288208, "Pretrain/Loss (Raw)": 1.7765363454818726, "Pretrain/Step": 2486, "Pretrain/Step Time": 9.506560495123267} +{"Pretrain/Learning Rate": 4.3335643345639414e-05, "Pretrain/Loss": 2.0814414024353027, "Pretrain/Loss (Raw)": 2.1498587131500244, "Pretrain/Step": 2487, "Pretrain/Step Time": 9.507662599906325} +{"Pretrain/Learning Rate": 4.332987113091195e-05, "Pretrain/Loss": 2.0797042846679688, "Pretrain/Loss (Raw)": 2.0218212604522705, "Pretrain/Step": 2488, "Pretrain/Step Time": 9.506278296932578} +{"Pretrain/Learning Rate": 4.332409680229737e-05, "Pretrain/Loss": 2.0802688598632812, "Pretrain/Loss (Raw)": 2.1286728382110596, "Pretrain/Step": 2489, "Pretrain/Step Time": 9.508823854848742} +{"Pretrain/Learning Rate": 4.3318320360461616e-05, "Pretrain/Loss": 2.0807785987854004, "Pretrain/Loss (Raw)": 2.17264986038208, "Pretrain/Step": 2490, "Pretrain/Step Time": 9.506553061306477} +{"Pretrain/Learning Rate": 4.331254180607083e-05, "Pretrain/Loss": 2.081454277038574, "Pretrain/Loss (Raw)": 2.083631992340088, "Pretrain/Step": 2491, "Pretrain/Step Time": 9.50630733370781} +{"Pretrain/Learning Rate": 4.330676113979143e-05, "Pretrain/Loss": 2.0804452896118164, "Pretrain/Loss (Raw)": 1.8736456632614136, "Pretrain/Step": 2492, "Pretrain/Step Time": 9.495244726538658} +{"Pretrain/Learning Rate": 4.330097836229007e-05, "Pretrain/Loss": 2.0828466415405273, "Pretrain/Loss (Raw)": 2.0764689445495605, "Pretrain/Step": 2493, "Pretrain/Step Time": 9.492068365216255} +{"Pretrain/Learning Rate": 4.3295193474233655e-05, "Pretrain/Loss": 2.083116054534912, "Pretrain/Loss (Raw)": 2.2967493534088135, "Pretrain/Step": 2494, "Pretrain/Step Time": 9.449737193062901} +{"Pretrain/Learning Rate": 4.328940647628931e-05, "Pretrain/Loss": 2.083991289138794, "Pretrain/Loss (Raw)": 2.062737464904785, "Pretrain/Step": 2495, "Pretrain/Step Time": 9.448739003390074} +{"Pretrain/Learning Rate": 4.328361736912443e-05, "Pretrain/Loss": 2.0814733505249023, "Pretrain/Loss (Raw)": 1.8729157447814941, "Pretrain/Step": 2496, "Pretrain/Step Time": 9.448224499821663} +{"Pretrain/Learning Rate": 4.3277826153406644e-05, "Pretrain/Loss": 2.081031084060669, "Pretrain/Loss (Raw)": 2.0275657176971436, "Pretrain/Step": 2497, "Pretrain/Step Time": 9.462966626510024} +{"Pretrain/Learning Rate": 4.327203282980382e-05, "Pretrain/Loss": 2.0854570865631104, "Pretrain/Loss (Raw)": 2.0181884765625, "Pretrain/Step": 2498, "Pretrain/Step Time": 9.434695241972804} +{"Pretrain/Learning Rate": 4.326623739898406e-05, "Pretrain/Loss": 2.0852673053741455, "Pretrain/Loss (Raw)": 2.119760513305664, "Pretrain/Step": 2499, "Pretrain/Step Time": 9.451306698843837} +{"Pretrain/Learning Rate": 4.3260439861615734e-05, "Pretrain/Loss": 2.085207939147949, "Pretrain/Loss (Raw)": 2.0574073791503906, "Pretrain/Step": 2500, "Pretrain/Step Time": 9.421339208260179} +{"Pretrain/Learning Rate": 4.325464021836744e-05, "Pretrain/Loss": 2.0838940143585205, "Pretrain/Loss (Raw)": 2.114315986633301, "Pretrain/Step": 2501, "Pretrain/Step Time": 9.424531951546669} +{"Pretrain/Learning Rate": 4.3248838469908016e-05, "Pretrain/Loss": 2.0827479362487793, "Pretrain/Loss (Raw)": 1.9533121585845947, "Pretrain/Step": 2502, "Pretrain/Step Time": 9.424077177420259} +{"Pretrain/Learning Rate": 4.324303461690655e-05, "Pretrain/Loss": 2.0839123725891113, "Pretrain/Loss (Raw)": 2.1904001235961914, "Pretrain/Step": 2503, "Pretrain/Step Time": 9.430337700992823} +{"Pretrain/Learning Rate": 4.3237228660032355e-05, "Pretrain/Loss": 2.082824230194092, "Pretrain/Loss (Raw)": 1.9399248361587524, "Pretrain/Step": 2504, "Pretrain/Step Time": 9.38816856406629} +{"Pretrain/Learning Rate": 4.323142059995503e-05, "Pretrain/Loss": 2.0833187103271484, "Pretrain/Loss (Raw)": 2.197723388671875, "Pretrain/Step": 2505, "Pretrain/Step Time": 9.398999212309718} +{"Pretrain/Learning Rate": 4.3225610437344363e-05, "Pretrain/Loss": 2.084475517272949, "Pretrain/Loss (Raw)": 2.146120548248291, "Pretrain/Step": 2506, "Pretrain/Step Time": 9.40186458453536} +{"Pretrain/Learning Rate": 4.321979817287043e-05, "Pretrain/Loss": 2.082493305206299, "Pretrain/Loss (Raw)": 1.8458150625228882, "Pretrain/Step": 2507, "Pretrain/Step Time": 9.415018578991294} +{"Pretrain/Learning Rate": 4.32139838072035e-05, "Pretrain/Loss": 2.0821566581726074, "Pretrain/Loss (Raw)": 2.0948822498321533, "Pretrain/Step": 2508, "Pretrain/Step Time": 9.4041114654392} +{"Pretrain/Learning Rate": 4.320816734101415e-05, "Pretrain/Loss": 2.082167863845825, "Pretrain/Loss (Raw)": 2.0717718601226807, "Pretrain/Step": 2509, "Pretrain/Step Time": 9.416366811841726} +{"Pretrain/Learning Rate": 4.320234877497313e-05, "Pretrain/Loss": 2.0771827697753906, "Pretrain/Loss (Raw)": 2.022181987762451, "Pretrain/Step": 2510, "Pretrain/Step Time": 9.41600226610899} +{"Pretrain/Learning Rate": 4.319652810975148e-05, "Pretrain/Loss": 2.0778255462646484, "Pretrain/Loss (Raw)": 2.1221351623535156, "Pretrain/Step": 2511, "Pretrain/Step Time": 9.408432938158512} +{"Pretrain/Learning Rate": 4.319070534602047e-05, "Pretrain/Loss": 2.075939416885376, "Pretrain/Loss (Raw)": 1.8524138927459717, "Pretrain/Step": 2512, "Pretrain/Step Time": 9.411875421181321} +{"Pretrain/Learning Rate": 4.318488048445158e-05, "Pretrain/Loss": 2.0768465995788574, "Pretrain/Loss (Raw)": 2.1736466884613037, "Pretrain/Step": 2513, "Pretrain/Step Time": 9.403878457844257} +{"Pretrain/Learning Rate": 4.317905352571661e-05, "Pretrain/Loss": 2.0759592056274414, "Pretrain/Loss (Raw)": 2.0052685737609863, "Pretrain/Step": 2514, "Pretrain/Step Time": 9.398798005655408} +{"Pretrain/Learning Rate": 4.317322447048751e-05, "Pretrain/Loss": 2.079446792602539, "Pretrain/Loss (Raw)": 2.4878814220428467, "Pretrain/Step": 2515, "Pretrain/Step Time": 9.397427408024669} +{"Pretrain/Learning Rate": 4.316739331943653e-05, "Pretrain/Loss": 2.0790984630584717, "Pretrain/Loss (Raw)": 2.054494857788086, "Pretrain/Step": 2516, "Pretrain/Step Time": 9.403537824749947} +{"Pretrain/Learning Rate": 4.316156007323614e-05, "Pretrain/Loss": 2.079223871231079, "Pretrain/Loss (Raw)": 2.1828417778015137, "Pretrain/Step": 2517, "Pretrain/Step Time": 9.40596147812903} +{"Pretrain/Learning Rate": 4.315572473255908e-05, "Pretrain/Loss": 2.080314874649048, "Pretrain/Loss (Raw)": 1.702450156211853, "Pretrain/Step": 2518, "Pretrain/Step Time": 9.426278656348586} +{"Pretrain/Learning Rate": 4.3149887298078276e-05, "Pretrain/Loss": 2.081345558166504, "Pretrain/Loss (Raw)": 2.139031171798706, "Pretrain/Step": 2519, "Pretrain/Step Time": 9.43526334501803} +{"Pretrain/Learning Rate": 4.314404777046694e-05, "Pretrain/Loss": 2.081308603286743, "Pretrain/Loss (Raw)": 2.1658148765563965, "Pretrain/Step": 2520, "Pretrain/Step Time": 9.437977138906717} +{"Pretrain/Learning Rate": 4.313820615039853e-05, "Pretrain/Loss": 2.0816309452056885, "Pretrain/Loss (Raw)": 2.1451973915100098, "Pretrain/Step": 2521, "Pretrain/Step Time": 9.420332489535213} +{"Pretrain/Learning Rate": 4.313236243854671e-05, "Pretrain/Loss": 2.083662748336792, "Pretrain/Loss (Raw)": 2.2845542430877686, "Pretrain/Step": 2522, "Pretrain/Step Time": 9.418736543506384} +{"Pretrain/Learning Rate": 4.3126516635585414e-05, "Pretrain/Loss": 2.0830307006835938, "Pretrain/Loss (Raw)": 2.106106996536255, "Pretrain/Step": 2523, "Pretrain/Step Time": 9.435767682269216} +{"Pretrain/Learning Rate": 4.312066874218881e-05, "Pretrain/Loss": 2.084425210952759, "Pretrain/Loss (Raw)": 2.2639541625976562, "Pretrain/Step": 2524, "Pretrain/Step Time": 9.437231166288257} +{"Pretrain/Learning Rate": 4.3114818759031284e-05, "Pretrain/Loss": 2.0848124027252197, "Pretrain/Loss (Raw)": 2.07098126411438, "Pretrain/Step": 2525, "Pretrain/Step Time": 9.411887995898724} +{"Pretrain/Learning Rate": 4.310896668678751e-05, "Pretrain/Loss": 2.081261157989502, "Pretrain/Loss (Raw)": 1.8046623468399048, "Pretrain/Step": 2526, "Pretrain/Step Time": 9.417730797082186} +{"Pretrain/Learning Rate": 4.3103112526132364e-05, "Pretrain/Loss": 2.0814385414123535, "Pretrain/Loss (Raw)": 2.119656801223755, "Pretrain/Step": 2527, "Pretrain/Step Time": 9.446010971441865} +{"Pretrain/Learning Rate": 4.3097256277740976e-05, "Pretrain/Loss": 2.0823843479156494, "Pretrain/Loss (Raw)": 2.061821222305298, "Pretrain/Step": 2528, "Pretrain/Step Time": 9.434019941836596} +{"Pretrain/Learning Rate": 4.309139794228871e-05, "Pretrain/Loss": 2.0834805965423584, "Pretrain/Loss (Raw)": 2.2752888202667236, "Pretrain/Step": 2529, "Pretrain/Step Time": 9.403497133404016} +{"Pretrain/Learning Rate": 4.3085537520451196e-05, "Pretrain/Loss": 2.0855603218078613, "Pretrain/Loss (Raw)": 2.07291579246521, "Pretrain/Step": 2530, "Pretrain/Step Time": 9.40628937445581} +{"Pretrain/Learning Rate": 4.307967501290427e-05, "Pretrain/Loss": 2.0818843841552734, "Pretrain/Loss (Raw)": 1.7988942861557007, "Pretrain/Step": 2531, "Pretrain/Step Time": 9.406864976510406} +{"Pretrain/Learning Rate": 4.307381042032402e-05, "Pretrain/Loss": 2.0825858116149902, "Pretrain/Loss (Raw)": 2.1730854511260986, "Pretrain/Step": 2532, "Pretrain/Step Time": 9.41244469769299} +{"Pretrain/Learning Rate": 4.3067943743386796e-05, "Pretrain/Loss": 2.0806057453155518, "Pretrain/Loss (Raw)": 1.8270167112350464, "Pretrain/Step": 2533, "Pretrain/Step Time": 9.414760863408446} +{"Pretrain/Learning Rate": 4.3062074982769155e-05, "Pretrain/Loss": 2.0800695419311523, "Pretrain/Loss (Raw)": 2.0457279682159424, "Pretrain/Step": 2534, "Pretrain/Step Time": 9.414128405973315} +{"Pretrain/Learning Rate": 4.305620413914792e-05, "Pretrain/Loss": 2.0820021629333496, "Pretrain/Loss (Raw)": 2.207404613494873, "Pretrain/Step": 2535, "Pretrain/Step Time": 9.407745843753219} +{"Pretrain/Learning Rate": 4.305033121320013e-05, "Pretrain/Loss": 2.080846071243286, "Pretrain/Loss (Raw)": 1.9905834197998047, "Pretrain/Step": 2536, "Pretrain/Step Time": 9.39895142056048} +{"Pretrain/Learning Rate": 4.30444562056031e-05, "Pretrain/Loss": 2.0794644355773926, "Pretrain/Loss (Raw)": 2.0138909816741943, "Pretrain/Step": 2537, "Pretrain/Step Time": 9.40309183113277} +{"Pretrain/Learning Rate": 4.3038579117034347e-05, "Pretrain/Loss": 2.079123020172119, "Pretrain/Loss (Raw)": 2.1280925273895264, "Pretrain/Step": 2538, "Pretrain/Step Time": 9.397419264540076} +{"Pretrain/Learning Rate": 4.303269994817165e-05, "Pretrain/Loss": 2.0790319442749023, "Pretrain/Loss (Raw)": 2.0268163681030273, "Pretrain/Step": 2539, "Pretrain/Step Time": 9.389771213755012} +{"Pretrain/Learning Rate": 4.302681869969302e-05, "Pretrain/Loss": 2.078138589859009, "Pretrain/Loss (Raw)": 2.0884358882904053, "Pretrain/Step": 2540, "Pretrain/Step Time": 9.397055979818106} +{"Pretrain/Learning Rate": 4.3020935372276716e-05, "Pretrain/Loss": 2.0759897232055664, "Pretrain/Loss (Raw)": 1.8408243656158447, "Pretrain/Step": 2541, "Pretrain/Step Time": 9.396017465740442} +{"Pretrain/Learning Rate": 4.3015049966601224e-05, "Pretrain/Loss": 2.0759928226470947, "Pretrain/Loss (Raw)": 2.057170867919922, "Pretrain/Step": 2542, "Pretrain/Step Time": 9.394175400957465} +{"Pretrain/Learning Rate": 4.3009162483345275e-05, "Pretrain/Loss": 2.0755176544189453, "Pretrain/Loss (Raw)": 2.0412373542785645, "Pretrain/Step": 2543, "Pretrain/Step Time": 9.389304982498288} +{"Pretrain/Learning Rate": 4.300327292318786e-05, "Pretrain/Loss": 2.0758280754089355, "Pretrain/Loss (Raw)": 2.046027898788452, "Pretrain/Step": 2544, "Pretrain/Step Time": 9.394251719117165} +{"Pretrain/Learning Rate": 4.299738128680817e-05, "Pretrain/Loss": 2.074965715408325, "Pretrain/Loss (Raw)": 1.803491234779358, "Pretrain/Step": 2545, "Pretrain/Step Time": 9.392244007438421} +{"Pretrain/Learning Rate": 4.299148757488567e-05, "Pretrain/Loss": 2.0746593475341797, "Pretrain/Loss (Raw)": 2.093498468399048, "Pretrain/Step": 2546, "Pretrain/Step Time": 9.393654011189938} +{"Pretrain/Learning Rate": 4.298559178810003e-05, "Pretrain/Loss": 2.073634147644043, "Pretrain/Loss (Raw)": 2.0717575550079346, "Pretrain/Step": 2547, "Pretrain/Step Time": 9.399572754278779} +{"Pretrain/Learning Rate": 4.297969392713121e-05, "Pretrain/Loss": 2.073335647583008, "Pretrain/Loss (Raw)": 1.9440388679504395, "Pretrain/Step": 2548, "Pretrain/Step Time": 9.35025362111628} +{"Pretrain/Learning Rate": 4.297379399265935e-05, "Pretrain/Loss": 2.0720276832580566, "Pretrain/Loss (Raw)": 1.7664471864700317, "Pretrain/Step": 2549, "Pretrain/Step Time": 9.352879391983151} +{"Pretrain/Learning Rate": 4.296789198536488e-05, "Pretrain/Loss": 2.068881034851074, "Pretrain/Loss (Raw)": 2.0848278999328613, "Pretrain/Step": 2550, "Pretrain/Step Time": 9.35315633751452} +{"Pretrain/Learning Rate": 4.296198790592843e-05, "Pretrain/Loss": 2.0677876472473145, "Pretrain/Loss (Raw)": 1.942878007888794, "Pretrain/Step": 2551, "Pretrain/Step Time": 9.36398564092815} +{"Pretrain/Learning Rate": 4.295608175503091e-05, "Pretrain/Loss": 2.0672502517700195, "Pretrain/Loss (Raw)": 2.209813356399536, "Pretrain/Step": 2552, "Pretrain/Step Time": 9.366602841764688} +{"Pretrain/Learning Rate": 4.295017353335342e-05, "Pretrain/Loss": 2.06843638420105, "Pretrain/Loss (Raw)": 2.139072895050049, "Pretrain/Step": 2553, "Pretrain/Step Time": 9.369818657636642} +{"Pretrain/Learning Rate": 4.2944263241577334e-05, "Pretrain/Loss": 2.0700201988220215, "Pretrain/Loss (Raw)": 2.1625916957855225, "Pretrain/Step": 2554, "Pretrain/Step Time": 9.371903834864497} +{"Pretrain/Learning Rate": 4.293835088038425e-05, "Pretrain/Loss": 2.0689878463745117, "Pretrain/Loss (Raw)": 2.133713722229004, "Pretrain/Step": 2555, "Pretrain/Step Time": 9.37527153454721} +{"Pretrain/Learning Rate": 4.2932436450456025e-05, "Pretrain/Loss": 2.068085193634033, "Pretrain/Loss (Raw)": 2.0089571475982666, "Pretrain/Step": 2556, "Pretrain/Step Time": 9.370583867654204} +{"Pretrain/Learning Rate": 4.292651995247472e-05, "Pretrain/Loss": 2.067897081375122, "Pretrain/Loss (Raw)": 2.0475149154663086, "Pretrain/Step": 2557, "Pretrain/Step Time": 9.378249429166317} +{"Pretrain/Learning Rate": 4.292060138712266e-05, "Pretrain/Loss": 2.0698366165161133, "Pretrain/Loss (Raw)": 2.099287271499634, "Pretrain/Step": 2558, "Pretrain/Step Time": 9.375465145334601} +{"Pretrain/Learning Rate": 4.2914680755082414e-05, "Pretrain/Loss": 2.068896770477295, "Pretrain/Loss (Raw)": 1.9852354526519775, "Pretrain/Step": 2559, "Pretrain/Step Time": 9.382867557927966} +{"Pretrain/Learning Rate": 4.2908758057036756e-05, "Pretrain/Loss": 2.0675129890441895, "Pretrain/Loss (Raw)": 2.1077022552490234, "Pretrain/Step": 2560, "Pretrain/Step Time": 9.38119306601584} +{"Pretrain/Learning Rate": 4.2902833293668744e-05, "Pretrain/Loss": 2.0686326026916504, "Pretrain/Loss (Raw)": 2.0334362983703613, "Pretrain/Step": 2561, "Pretrain/Step Time": 9.316736478358507} +{"Pretrain/Learning Rate": 4.2896906465661623e-05, "Pretrain/Loss": 2.0668210983276367, "Pretrain/Loss (Raw)": 1.9843096733093262, "Pretrain/Step": 2562, "Pretrain/Step Time": 9.318532401695848} +{"Pretrain/Learning Rate": 4.289097757369892e-05, "Pretrain/Loss": 2.0670015811920166, "Pretrain/Loss (Raw)": 2.0660133361816406, "Pretrain/Step": 2563, "Pretrain/Step Time": 9.30340170301497} +{"Pretrain/Learning Rate": 4.288504661846437e-05, "Pretrain/Loss": 2.0678000450134277, "Pretrain/Loss (Raw)": 2.1384308338165283, "Pretrain/Step": 2564, "Pretrain/Step Time": 9.296325525268912} +{"Pretrain/Learning Rate": 4.2879113600641976e-05, "Pretrain/Loss": 2.068920612335205, "Pretrain/Loss (Raw)": 2.1765685081481934, "Pretrain/Step": 2565, "Pretrain/Step Time": 9.305970344692469} +{"Pretrain/Learning Rate": 4.287317852091595e-05, "Pretrain/Loss": 2.070466995239258, "Pretrain/Loss (Raw)": 2.034008741378784, "Pretrain/Step": 2566, "Pretrain/Step Time": 9.306963037699461} +{"Pretrain/Learning Rate": 4.2867241379970754e-05, "Pretrain/Loss": 2.07167911529541, "Pretrain/Loss (Raw)": 2.2153892517089844, "Pretrain/Step": 2567, "Pretrain/Step Time": 9.304338973015547} +{"Pretrain/Learning Rate": 4.2861302178491094e-05, "Pretrain/Loss": 2.072709560394287, "Pretrain/Loss (Raw)": 2.0833282470703125, "Pretrain/Step": 2568, "Pretrain/Step Time": 9.303075037896633} +{"Pretrain/Learning Rate": 4.28553609171619e-05, "Pretrain/Loss": 2.073770523071289, "Pretrain/Loss (Raw)": 2.1785173416137695, "Pretrain/Step": 2569, "Pretrain/Step Time": 9.288400223478675} +{"Pretrain/Learning Rate": 4.284941759666835e-05, "Pretrain/Loss": 2.0753095149993896, "Pretrain/Loss (Raw)": 1.9865206480026245, "Pretrain/Step": 2570, "Pretrain/Step Time": 9.304119618609548} +{"Pretrain/Learning Rate": 4.2843472217695844e-05, "Pretrain/Loss": 2.0739974975585938, "Pretrain/Loss (Raw)": 1.991400122642517, "Pretrain/Step": 2571, "Pretrain/Step Time": 9.302776101976633} +{"Pretrain/Learning Rate": 4.283752478093005e-05, "Pretrain/Loss": 2.069729804992676, "Pretrain/Loss (Raw)": 1.7220696210861206, "Pretrain/Step": 2572, "Pretrain/Step Time": 9.303773609921336} +{"Pretrain/Learning Rate": 4.283157528705683e-05, "Pretrain/Loss": 2.072293281555176, "Pretrain/Loss (Raw)": 2.4242429733276367, "Pretrain/Step": 2573, "Pretrain/Step Time": 9.296141156926751} +{"Pretrain/Learning Rate": 4.2825623736762344e-05, "Pretrain/Loss": 2.071902275085449, "Pretrain/Loss (Raw)": 2.038187265396118, "Pretrain/Step": 2574, "Pretrain/Step Time": 9.30164859071374} +{"Pretrain/Learning Rate": 4.2819670130732926e-05, "Pretrain/Loss": 2.0693466663360596, "Pretrain/Loss (Raw)": 2.1234805583953857, "Pretrain/Step": 2575, "Pretrain/Step Time": 9.297894759103656} +{"Pretrain/Learning Rate": 4.2813714469655176e-05, "Pretrain/Loss": 2.068563938140869, "Pretrain/Loss (Raw)": 1.96742582321167, "Pretrain/Step": 2576, "Pretrain/Step Time": 9.302577966824174} +{"Pretrain/Learning Rate": 4.280775675421593e-05, "Pretrain/Loss": 2.0683887004852295, "Pretrain/Loss (Raw)": 1.9644044637680054, "Pretrain/Step": 2577, "Pretrain/Step Time": 9.26405007019639} +{"Pretrain/Learning Rate": 4.280179698510226e-05, "Pretrain/Loss": 2.0669801235198975, "Pretrain/Loss (Raw)": 2.0054099559783936, "Pretrain/Step": 2578, "Pretrain/Step Time": 9.259603938087821} +{"Pretrain/Learning Rate": 4.279583516300148e-05, "Pretrain/Loss": 2.066479206085205, "Pretrain/Loss (Raw)": 1.8899959325790405, "Pretrain/Step": 2579, "Pretrain/Step Time": 9.253720130771399} +{"Pretrain/Learning Rate": 4.2789871288601136e-05, "Pretrain/Loss": 2.0635266304016113, "Pretrain/Loss (Raw)": 1.763041377067566, "Pretrain/Step": 2580, "Pretrain/Step Time": 9.238099845126271} +{"Pretrain/Learning Rate": 4.2783905362589e-05, "Pretrain/Loss": 2.063382148742676, "Pretrain/Loss (Raw)": 2.0500991344451904, "Pretrain/Step": 2581, "Pretrain/Step Time": 9.242838624864817} +{"Pretrain/Learning Rate": 4.27779373856531e-05, "Pretrain/Loss": 2.0632829666137695, "Pretrain/Loss (Raw)": 2.184291124343872, "Pretrain/Step": 2582, "Pretrain/Step Time": 9.197291772812605} +{"Pretrain/Learning Rate": 4.277196735848169e-05, "Pretrain/Loss": 2.064197063446045, "Pretrain/Loss (Raw)": 2.101011276245117, "Pretrain/Step": 2583, "Pretrain/Step Time": 9.194623973220587} +{"Pretrain/Learning Rate": 4.2765995281763263e-05, "Pretrain/Loss": 2.063424587249756, "Pretrain/Loss (Raw)": 1.8468924760818481, "Pretrain/Step": 2584, "Pretrain/Step Time": 9.195125197991729} +{"Pretrain/Learning Rate": 4.2760021156186534e-05, "Pretrain/Loss": 2.062689781188965, "Pretrain/Loss (Raw)": 2.074134349822998, "Pretrain/Step": 2585, "Pretrain/Step Time": 9.192706003785133} +{"Pretrain/Learning Rate": 4.2754044982440486e-05, "Pretrain/Loss": 2.0643177032470703, "Pretrain/Loss (Raw)": 1.9513882398605347, "Pretrain/Step": 2586, "Pretrain/Step Time": 9.188920700922608} +{"Pretrain/Learning Rate": 4.2748066761214305e-05, "Pretrain/Loss": 2.062390089035034, "Pretrain/Loss (Raw)": 1.8760980367660522, "Pretrain/Step": 2587, "Pretrain/Step Time": 9.165146976709366} +{"Pretrain/Learning Rate": 4.274208649319744e-05, "Pretrain/Loss": 2.0594019889831543, "Pretrain/Loss (Raw)": 1.7951643466949463, "Pretrain/Step": 2588, "Pretrain/Step Time": 9.165369292721152} +{"Pretrain/Learning Rate": 4.273610417907955e-05, "Pretrain/Loss": 2.059495449066162, "Pretrain/Loss (Raw)": 2.0557475090026855, "Pretrain/Step": 2589, "Pretrain/Step Time": 9.1672940030694} +{"Pretrain/Learning Rate": 4.2730119819550555e-05, "Pretrain/Loss": 2.0592703819274902, "Pretrain/Loss (Raw)": 2.0862016677856445, "Pretrain/Step": 2590, "Pretrain/Step Time": 9.176131814718246} +{"Pretrain/Learning Rate": 4.2724133415300596e-05, "Pretrain/Loss": 2.0604662895202637, "Pretrain/Loss (Raw)": 2.171520471572876, "Pretrain/Step": 2591, "Pretrain/Step Time": 9.169031901285052} +{"Pretrain/Learning Rate": 4.271814496702005e-05, "Pretrain/Loss": 2.0621020793914795, "Pretrain/Loss (Raw)": 2.1276302337646484, "Pretrain/Step": 2592, "Pretrain/Step Time": 9.177006386220455} +{"Pretrain/Learning Rate": 4.2712154475399534e-05, "Pretrain/Loss": 2.061708450317383, "Pretrain/Loss (Raw)": 1.9543594121932983, "Pretrain/Step": 2593, "Pretrain/Step Time": 9.173107147216797} +{"Pretrain/Learning Rate": 4.2706161941129906e-05, "Pretrain/Loss": 2.061042308807373, "Pretrain/Loss (Raw)": 2.192840814590454, "Pretrain/Step": 2594, "Pretrain/Step Time": 9.148010190576315} +{"Pretrain/Learning Rate": 4.270016736490225e-05, "Pretrain/Loss": 2.059602737426758, "Pretrain/Loss (Raw)": 2.0038223266601562, "Pretrain/Step": 2595, "Pretrain/Step Time": 9.139017563313246} +{"Pretrain/Learning Rate": 4.2694170747407886e-05, "Pretrain/Loss": 2.0607147216796875, "Pretrain/Loss (Raw)": 2.1930551528930664, "Pretrain/Step": 2596, "Pretrain/Step Time": 9.116345575079322} +{"Pretrain/Learning Rate": 4.268817208933837e-05, "Pretrain/Loss": 2.0597012042999268, "Pretrain/Loss (Raw)": 2.046841621398926, "Pretrain/Step": 2597, "Pretrain/Step Time": 9.116204906255007} +{"Pretrain/Learning Rate": 4.268217139138551e-05, "Pretrain/Loss": 2.0586655139923096, "Pretrain/Loss (Raw)": 2.20353627204895, "Pretrain/Step": 2598, "Pretrain/Step Time": 9.065669978037477} +{"Pretrain/Learning Rate": 4.267616865424131e-05, "Pretrain/Loss": 2.059518575668335, "Pretrain/Loss (Raw)": 2.1214284896850586, "Pretrain/Step": 2599, "Pretrain/Step Time": 9.06626296043396} +{"Pretrain/Learning Rate": 4.267016387859806e-05, "Pretrain/Loss": 2.057284355163574, "Pretrain/Loss (Raw)": 1.8621622323989868, "Pretrain/Step": 2600, "Pretrain/Step Time": 9.071807896718383} +{"Pretrain/Learning Rate": 4.266415706514824e-05, "Pretrain/Loss": 2.058821201324463, "Pretrain/Loss (Raw)": 2.094958543777466, "Pretrain/Step": 2601, "Pretrain/Step Time": 9.073160177096725} +{"Pretrain/Learning Rate": 4.2658148214584585e-05, "Pretrain/Loss": 2.059094190597534, "Pretrain/Loss (Raw)": 2.20388126373291, "Pretrain/Step": 2602, "Pretrain/Step Time": 9.068705404177308} +{"Pretrain/Learning Rate": 4.265213732760008e-05, "Pretrain/Loss": 2.0608842372894287, "Pretrain/Loss (Raw)": 2.1382172107696533, "Pretrain/Step": 2603, "Pretrain/Step Time": 9.074326317757368} +{"Pretrain/Learning Rate": 4.264612440488791e-05, "Pretrain/Loss": 2.0610275268554688, "Pretrain/Loss (Raw)": 2.1333377361297607, "Pretrain/Step": 2604, "Pretrain/Step Time": 9.071829933673143} +{"Pretrain/Learning Rate": 4.264010944714153e-05, "Pretrain/Loss": 2.0597386360168457, "Pretrain/Loss (Raw)": 2.1443591117858887, "Pretrain/Step": 2605, "Pretrain/Step Time": 9.098904222249985} +{"Pretrain/Learning Rate": 4.263409245505461e-05, "Pretrain/Loss": 2.06058931350708, "Pretrain/Loss (Raw)": 1.958680272102356, "Pretrain/Step": 2606, "Pretrain/Step Time": 9.101134240627289} +{"Pretrain/Learning Rate": 4.262807342932105e-05, "Pretrain/Loss": 2.0605266094207764, "Pretrain/Loss (Raw)": 2.0846309661865234, "Pretrain/Step": 2607, "Pretrain/Step Time": 9.115570191293955} +{"Pretrain/Learning Rate": 4.262205237063499e-05, "Pretrain/Loss": 2.059537887573242, "Pretrain/Loss (Raw)": 1.9885337352752686, "Pretrain/Step": 2608, "Pretrain/Step Time": 9.115181852132082} +{"Pretrain/Learning Rate": 4.2616029279690814e-05, "Pretrain/Loss": 2.059860944747925, "Pretrain/Loss (Raw)": 1.9368911981582642, "Pretrain/Step": 2609, "Pretrain/Step Time": 9.11454513669014} +{"Pretrain/Learning Rate": 4.261000415718312e-05, "Pretrain/Loss": 2.0578994750976562, "Pretrain/Loss (Raw)": 2.0078818798065186, "Pretrain/Step": 2610, "Pretrain/Step Time": 9.118931462988257} +{"Pretrain/Learning Rate": 4.260397700380679e-05, "Pretrain/Loss": 2.0542378425598145, "Pretrain/Loss (Raw)": 2.1414709091186523, "Pretrain/Step": 2611, "Pretrain/Step Time": 9.118270922452211} +{"Pretrain/Learning Rate": 4.259794782025687e-05, "Pretrain/Loss": 2.051548957824707, "Pretrain/Loss (Raw)": 1.8598216772079468, "Pretrain/Step": 2612, "Pretrain/Step Time": 9.117425942793489} +{"Pretrain/Learning Rate": 4.2591916607228675e-05, "Pretrain/Loss": 2.0511155128479004, "Pretrain/Loss (Raw)": 1.8735235929489136, "Pretrain/Step": 2613, "Pretrain/Step Time": 9.116928562521935} +{"Pretrain/Learning Rate": 4.2585883365417774e-05, "Pretrain/Loss": 2.0528438091278076, "Pretrain/Loss (Raw)": 1.997718334197998, "Pretrain/Step": 2614, "Pretrain/Step Time": 9.116784879937768} +{"Pretrain/Learning Rate": 4.2579848095519926e-05, "Pretrain/Loss": 2.0515780448913574, "Pretrain/Loss (Raw)": 1.9878631830215454, "Pretrain/Step": 2615, "Pretrain/Step Time": 9.117174532264471} +{"Pretrain/Learning Rate": 4.257381079823116e-05, "Pretrain/Loss": 2.050832748413086, "Pretrain/Loss (Raw)": 1.9264415502548218, "Pretrain/Step": 2616, "Pretrain/Step Time": 9.117476604878902} +{"Pretrain/Learning Rate": 4.2567771474247726e-05, "Pretrain/Loss": 2.0522265434265137, "Pretrain/Loss (Raw)": 2.3070473670959473, "Pretrain/Step": 2617, "Pretrain/Step Time": 9.119552459567785} +{"Pretrain/Learning Rate": 4.2561730124266094e-05, "Pretrain/Loss": 2.051828622817993, "Pretrain/Loss (Raw)": 2.1217305660247803, "Pretrain/Step": 2618, "Pretrain/Step Time": 9.11616832204163} +{"Pretrain/Learning Rate": 4.255568674898301e-05, "Pretrain/Loss": 2.0513596534729004, "Pretrain/Loss (Raw)": 2.0236129760742188, "Pretrain/Step": 2619, "Pretrain/Step Time": 9.138413649052382} +{"Pretrain/Learning Rate": 4.254964134909538e-05, "Pretrain/Loss": 2.0494306087493896, "Pretrain/Loss (Raw)": 1.6267204284667969, "Pretrain/Step": 2620, "Pretrain/Step Time": 9.143195191398263} +{"Pretrain/Learning Rate": 4.254359392530043e-05, "Pretrain/Loss": 2.048854351043701, "Pretrain/Loss (Raw)": 2.0027174949645996, "Pretrain/Step": 2621, "Pretrain/Step Time": 9.153114695101976} +{"Pretrain/Learning Rate": 4.2537544478295556e-05, "Pretrain/Loss": 2.0469512939453125, "Pretrain/Loss (Raw)": 2.053119659423828, "Pretrain/Step": 2622, "Pretrain/Step Time": 9.15439604781568} +{"Pretrain/Learning Rate": 4.253149300877841e-05, "Pretrain/Loss": 2.046656370162964, "Pretrain/Loss (Raw)": 2.025026559829712, "Pretrain/Step": 2623, "Pretrain/Step Time": 9.162319358438253} +{"Pretrain/Learning Rate": 4.252543951744688e-05, "Pretrain/Loss": 2.0493905544281006, "Pretrain/Loss (Raw)": 2.222870111465454, "Pretrain/Step": 2624, "Pretrain/Step Time": 9.163390839472413} +{"Pretrain/Learning Rate": 4.251938400499909e-05, "Pretrain/Loss": 2.0494492053985596, "Pretrain/Loss (Raw)": 2.035067081451416, "Pretrain/Step": 2625, "Pretrain/Step Time": 9.146913012489676} +{"Pretrain/Learning Rate": 4.251332647213337e-05, "Pretrain/Loss": 2.0503621101379395, "Pretrain/Loss (Raw)": 2.1350300312042236, "Pretrain/Step": 2626, "Pretrain/Step Time": 9.146142141893506} +{"Pretrain/Learning Rate": 4.250726691954832e-05, "Pretrain/Loss": 2.050215244293213, "Pretrain/Loss (Raw)": 2.100980520248413, "Pretrain/Step": 2627, "Pretrain/Step Time": 9.13512129895389} +{"Pretrain/Learning Rate": 4.250120534794275e-05, "Pretrain/Loss": 2.0510599613189697, "Pretrain/Loss (Raw)": 2.165544033050537, "Pretrain/Step": 2628, "Pretrain/Step Time": 9.126221768558025} +{"Pretrain/Learning Rate": 4.249514175801572e-05, "Pretrain/Loss": 2.051109790802002, "Pretrain/Loss (Raw)": 2.1206843852996826, "Pretrain/Step": 2629, "Pretrain/Step Time": 9.121291115880013} +{"Pretrain/Learning Rate": 4.248907615046649e-05, "Pretrain/Loss": 2.0519826412200928, "Pretrain/Loss (Raw)": 2.0650229454040527, "Pretrain/Step": 2630, "Pretrain/Step Time": 9.127081830054522} +{"Pretrain/Learning Rate": 4.24830085259946e-05, "Pretrain/Loss": 2.0503950119018555, "Pretrain/Loss (Raw)": 1.9871906042099, "Pretrain/Step": 2631, "Pretrain/Step Time": 9.124782986938953} +{"Pretrain/Learning Rate": 4.247693888529978e-05, "Pretrain/Loss": 2.051983594894409, "Pretrain/Loss (Raw)": 2.1432645320892334, "Pretrain/Step": 2632, "Pretrain/Step Time": 9.120620641857386} +{"Pretrain/Learning Rate": 4.247086722908201e-05, "Pretrain/Loss": 2.050233840942383, "Pretrain/Loss (Raw)": 1.9737435579299927, "Pretrain/Step": 2633, "Pretrain/Step Time": 9.110099008306861} +{"Pretrain/Learning Rate": 4.24647935580415e-05, "Pretrain/Loss": 2.0499582290649414, "Pretrain/Loss (Raw)": 2.110872983932495, "Pretrain/Step": 2634, "Pretrain/Step Time": 9.11317246966064} +{"Pretrain/Learning Rate": 4.2458717872878715e-05, "Pretrain/Loss": 2.052424907684326, "Pretrain/Loss (Raw)": 2.1615540981292725, "Pretrain/Step": 2635, "Pretrain/Step Time": 9.108361752703786} +{"Pretrain/Learning Rate": 4.245264017429431e-05, "Pretrain/Loss": 2.0519261360168457, "Pretrain/Loss (Raw)": 2.031015396118164, "Pretrain/Step": 2636, "Pretrain/Step Time": 9.107172133401036} +{"Pretrain/Learning Rate": 4.2446560462989203e-05, "Pretrain/Loss": 2.051725149154663, "Pretrain/Loss (Raw)": 2.046069860458374, "Pretrain/Step": 2637, "Pretrain/Step Time": 9.09349755384028} +{"Pretrain/Learning Rate": 4.244047873966452e-05, "Pretrain/Loss": 2.0498180389404297, "Pretrain/Loss (Raw)": 1.7780681848526, "Pretrain/Step": 2638, "Pretrain/Step Time": 9.09795268625021} +{"Pretrain/Learning Rate": 4.2434395005021666e-05, "Pretrain/Loss": 2.049232006072998, "Pretrain/Loss (Raw)": 2.0471298694610596, "Pretrain/Step": 2639, "Pretrain/Step Time": 9.096255209296942} +{"Pretrain/Learning Rate": 4.242830925976221e-05, "Pretrain/Loss": 2.0500030517578125, "Pretrain/Loss (Raw)": 1.9510917663574219, "Pretrain/Step": 2640, "Pretrain/Step Time": 9.094906436279416} +{"Pretrain/Learning Rate": 4.2422221504588016e-05, "Pretrain/Loss": 2.0493898391723633, "Pretrain/Loss (Raw)": 2.0951578617095947, "Pretrain/Step": 2641, "Pretrain/Step Time": 9.094358917325735} +{"Pretrain/Learning Rate": 4.2416131740201134e-05, "Pretrain/Loss": 2.049185276031494, "Pretrain/Loss (Raw)": 1.9790619611740112, "Pretrain/Step": 2642, "Pretrain/Step Time": 9.11484632268548} +{"Pretrain/Learning Rate": 4.241003996730388e-05, "Pretrain/Loss": 2.0443379878997803, "Pretrain/Loss (Raw)": 1.8674463033676147, "Pretrain/Step": 2643, "Pretrain/Step Time": 9.113525742664933} +{"Pretrain/Learning Rate": 4.240394618659878e-05, "Pretrain/Loss": 2.0423052310943604, "Pretrain/Loss (Raw)": 1.7943114042282104, "Pretrain/Step": 2644, "Pretrain/Step Time": 9.118387788534164} +{"Pretrain/Learning Rate": 4.2397850398788586e-05, "Pretrain/Loss": 2.0433831214904785, "Pretrain/Loss (Raw)": 2.3208045959472656, "Pretrain/Step": 2645, "Pretrain/Step Time": 9.116040667518973} +{"Pretrain/Learning Rate": 4.239175260457631e-05, "Pretrain/Loss": 2.047036647796631, "Pretrain/Loss (Raw)": 2.170083522796631, "Pretrain/Step": 2646, "Pretrain/Step Time": 9.100501146167517} +{"Pretrain/Learning Rate": 4.2385652804665164e-05, "Pretrain/Loss": 2.0453805923461914, "Pretrain/Loss (Raw)": 1.9270732402801514, "Pretrain/Step": 2647, "Pretrain/Step Time": 9.070540888234973} +{"Pretrain/Learning Rate": 4.237955099975862e-05, "Pretrain/Loss": 2.043299674987793, "Pretrain/Loss (Raw)": 1.8994327783584595, "Pretrain/Step": 2648, "Pretrain/Step Time": 9.071315394714475} +{"Pretrain/Learning Rate": 4.237344719056035e-05, "Pretrain/Loss": 2.040628433227539, "Pretrain/Loss (Raw)": 1.803287148475647, "Pretrain/Step": 2649, "Pretrain/Step Time": 9.077241770923138} +{"Pretrain/Learning Rate": 4.236734137777429e-05, "Pretrain/Loss": 2.0384888648986816, "Pretrain/Loss (Raw)": 2.0107035636901855, "Pretrain/Step": 2650, "Pretrain/Step Time": 9.072264464572072} +{"Pretrain/Learning Rate": 4.236123356210458e-05, "Pretrain/Loss": 2.0378940105438232, "Pretrain/Loss (Raw)": 2.0299723148345947, "Pretrain/Step": 2651, "Pretrain/Step Time": 9.057526776567101} +{"Pretrain/Learning Rate": 4.235512374425561e-05, "Pretrain/Loss": 2.036547899246216, "Pretrain/Loss (Raw)": 2.0916435718536377, "Pretrain/Step": 2652, "Pretrain/Step Time": 9.072536423802376} +{"Pretrain/Learning Rate": 4.234901192493199e-05, "Pretrain/Loss": 2.0372283458709717, "Pretrain/Loss (Raw)": 2.1580817699432373, "Pretrain/Step": 2653, "Pretrain/Step Time": 9.070510305464268} +{"Pretrain/Learning Rate": 4.234289810483857e-05, "Pretrain/Loss": 2.039801597595215, "Pretrain/Loss (Raw)": 2.1340413093566895, "Pretrain/Step": 2654, "Pretrain/Step Time": 9.079804887995124} +{"Pretrain/Learning Rate": 4.233678228468041e-05, "Pretrain/Loss": 2.038316488265991, "Pretrain/Loss (Raw)": 1.9295654296875, "Pretrain/Step": 2655, "Pretrain/Step Time": 9.047771386802197} +{"Pretrain/Learning Rate": 4.2330664465162826e-05, "Pretrain/Loss": 2.038487434387207, "Pretrain/Loss (Raw)": 2.083672523498535, "Pretrain/Step": 2656, "Pretrain/Step Time": 9.053070276975632} +{"Pretrain/Learning Rate": 4.232454464699135e-05, "Pretrain/Loss": 2.0333003997802734, "Pretrain/Loss (Raw)": 1.6113823652267456, "Pretrain/Step": 2657, "Pretrain/Step Time": 9.054485449567437} +{"Pretrain/Learning Rate": 4.231842283087175e-05, "Pretrain/Loss": 2.0327184200286865, "Pretrain/Loss (Raw)": 1.9983974695205688, "Pretrain/Step": 2658, "Pretrain/Step Time": 9.056436955928802} +{"Pretrain/Learning Rate": 4.231229901751002e-05, "Pretrain/Loss": 2.035332441329956, "Pretrain/Loss (Raw)": 2.1335017681121826, "Pretrain/Step": 2659, "Pretrain/Step Time": 9.055810108780861} +{"Pretrain/Learning Rate": 4.2306173207612394e-05, "Pretrain/Loss": 2.0359244346618652, "Pretrain/Loss (Raw)": 2.248878002166748, "Pretrain/Step": 2660, "Pretrain/Step Time": 9.045746149495244} +{"Pretrain/Learning Rate": 4.230004540188533e-05, "Pretrain/Loss": 2.0399441719055176, "Pretrain/Loss (Raw)": 2.341508150100708, "Pretrain/Step": 2661, "Pretrain/Step Time": 9.073973765596747} +{"Pretrain/Learning Rate": 4.22939156010355e-05, "Pretrain/Loss": 2.039743423461914, "Pretrain/Loss (Raw)": 2.0200304985046387, "Pretrain/Step": 2662, "Pretrain/Step Time": 9.07551572099328} +{"Pretrain/Learning Rate": 4.2287783805769824e-05, "Pretrain/Loss": 2.037504196166992, "Pretrain/Loss (Raw)": 1.920822024345398, "Pretrain/Step": 2663, "Pretrain/Step Time": 9.076516687870026} +{"Pretrain/Learning Rate": 4.2281650016795466e-05, "Pretrain/Loss": 2.0378379821777344, "Pretrain/Loss (Raw)": 2.033269166946411, "Pretrain/Step": 2664, "Pretrain/Step Time": 9.077885752543807} +{"Pretrain/Learning Rate": 4.227551423481979e-05, "Pretrain/Loss": 2.038364887237549, "Pretrain/Loss (Raw)": 2.081333637237549, "Pretrain/Step": 2665, "Pretrain/Step Time": 9.07721883803606} +{"Pretrain/Learning Rate": 4.2269376460550414e-05, "Pretrain/Loss": 2.037308692932129, "Pretrain/Loss (Raw)": 1.9929414987564087, "Pretrain/Step": 2666, "Pretrain/Step Time": 9.08128421753645} +{"Pretrain/Learning Rate": 4.226323669469516e-05, "Pretrain/Loss": 2.036409378051758, "Pretrain/Loss (Raw)": 1.9116734266281128, "Pretrain/Step": 2667, "Pretrain/Step Time": 9.089329374954104} +{"Pretrain/Learning Rate": 4.225709493796211e-05, "Pretrain/Loss": 2.0362038612365723, "Pretrain/Loss (Raw)": 2.0621161460876465, "Pretrain/Step": 2668, "Pretrain/Step Time": 9.101405404508114} +{"Pretrain/Learning Rate": 4.225095119105956e-05, "Pretrain/Loss": 2.038306474685669, "Pretrain/Loss (Raw)": 2.10996150970459, "Pretrain/Step": 2669, "Pretrain/Step Time": 9.100151969119906} +{"Pretrain/Learning Rate": 4.224480545469603e-05, "Pretrain/Loss": 2.0376672744750977, "Pretrain/Loss (Raw)": 1.9753652811050415, "Pretrain/Step": 2670, "Pretrain/Step Time": 9.097608041018248} +{"Pretrain/Learning Rate": 4.223865772958026e-05, "Pretrain/Loss": 2.0391006469726562, "Pretrain/Loss (Raw)": 2.224720001220703, "Pretrain/Step": 2671, "Pretrain/Step Time": 9.097444290295243} +{"Pretrain/Learning Rate": 4.223250801642126e-05, "Pretrain/Loss": 2.038079261779785, "Pretrain/Loss (Raw)": 1.915268063545227, "Pretrain/Step": 2672, "Pretrain/Step Time": 9.102501425892115} +{"Pretrain/Learning Rate": 4.222635631592823e-05, "Pretrain/Loss": 2.040858507156372, "Pretrain/Loss (Raw)": 2.1592347621917725, "Pretrain/Step": 2673, "Pretrain/Step Time": 9.109213959425688} +{"Pretrain/Learning Rate": 4.2220202628810614e-05, "Pretrain/Loss": 2.0384366512298584, "Pretrain/Loss (Raw)": 1.7835142612457275, "Pretrain/Step": 2674, "Pretrain/Step Time": 9.109399193897843} +{"Pretrain/Learning Rate": 4.2214046955778085e-05, "Pretrain/Loss": 2.0388078689575195, "Pretrain/Loss (Raw)": 2.119248867034912, "Pretrain/Step": 2675, "Pretrain/Step Time": 9.10334101319313} +{"Pretrain/Learning Rate": 4.2207889297540546e-05, "Pretrain/Loss": 2.0394344329833984, "Pretrain/Loss (Raw)": 2.0242602825164795, "Pretrain/Step": 2676, "Pretrain/Step Time": 9.10459048859775} +{"Pretrain/Learning Rate": 4.2201729654808136e-05, "Pretrain/Loss": 2.0412821769714355, "Pretrain/Loss (Raw)": 2.002960205078125, "Pretrain/Step": 2677, "Pretrain/Step Time": 9.101196639239788} +{"Pretrain/Learning Rate": 4.21955680282912e-05, "Pretrain/Loss": 2.0416932106018066, "Pretrain/Loss (Raw)": 2.137422800064087, "Pretrain/Step": 2678, "Pretrain/Step Time": 9.103538637980819} +{"Pretrain/Learning Rate": 4.218940441870033e-05, "Pretrain/Loss": 2.0432653427124023, "Pretrain/Loss (Raw)": 2.1441099643707275, "Pretrain/Step": 2679, "Pretrain/Step Time": 9.073118591681123} +{"Pretrain/Learning Rate": 4.218323882674634e-05, "Pretrain/Loss": 2.04359769821167, "Pretrain/Loss (Raw)": 2.252366065979004, "Pretrain/Step": 2680, "Pretrain/Step Time": 9.069213937968016} +{"Pretrain/Learning Rate": 4.217707125314029e-05, "Pretrain/Loss": 2.044463634490967, "Pretrain/Loss (Raw)": 2.249908208847046, "Pretrain/Step": 2681, "Pretrain/Step Time": 9.067211106419563} +{"Pretrain/Learning Rate": 4.217090169859343e-05, "Pretrain/Loss": 2.044557571411133, "Pretrain/Loss (Raw)": 2.1746532917022705, "Pretrain/Step": 2682, "Pretrain/Step Time": 9.097865967079997} +{"Pretrain/Learning Rate": 4.216473016381728e-05, "Pretrain/Loss": 2.041159152984619, "Pretrain/Loss (Raw)": 1.6986794471740723, "Pretrain/Step": 2683, "Pretrain/Step Time": 9.097502961754799} +{"Pretrain/Learning Rate": 4.215855664952356e-05, "Pretrain/Loss": 2.0425620079040527, "Pretrain/Loss (Raw)": 2.1885178089141846, "Pretrain/Step": 2684, "Pretrain/Step Time": 9.100557412952185} +{"Pretrain/Learning Rate": 4.215238115642424e-05, "Pretrain/Loss": 2.0426652431488037, "Pretrain/Loss (Raw)": 2.060727119445801, "Pretrain/Step": 2685, "Pretrain/Step Time": 9.104387862607837} +{"Pretrain/Learning Rate": 4.2146203685231495e-05, "Pretrain/Loss": 2.0430941581726074, "Pretrain/Loss (Raw)": 2.15417218208313, "Pretrain/Step": 2686, "Pretrain/Step Time": 9.102741630747914} +{"Pretrain/Learning Rate": 4.214002423665775e-05, "Pretrain/Loss": 2.0422635078430176, "Pretrain/Loss (Raw)": 1.8789737224578857, "Pretrain/Step": 2687, "Pretrain/Step Time": 9.12559006176889} +{"Pretrain/Learning Rate": 4.213384281141563e-05, "Pretrain/Loss": 2.0390625, "Pretrain/Loss (Raw)": 1.6979323625564575, "Pretrain/Step": 2688, "Pretrain/Step Time": 9.127936456352472} +{"Pretrain/Learning Rate": 4.212765941021804e-05, "Pretrain/Loss": 2.0404491424560547, "Pretrain/Loss (Raw)": 2.210935592651367, "Pretrain/Step": 2689, "Pretrain/Step Time": 9.132382256910205} +{"Pretrain/Learning Rate": 4.212147403377805e-05, "Pretrain/Loss": 2.039714813232422, "Pretrain/Loss (Raw)": 1.8903310298919678, "Pretrain/Step": 2690, "Pretrain/Step Time": 9.12817969545722} +{"Pretrain/Learning Rate": 4.2115286682808995e-05, "Pretrain/Loss": 2.0362777709960938, "Pretrain/Loss (Raw)": 1.6260558366775513, "Pretrain/Step": 2691, "Pretrain/Step Time": 9.147199351340532} +{"Pretrain/Learning Rate": 4.210909735802442e-05, "Pretrain/Loss": 2.035291910171509, "Pretrain/Loss (Raw)": 2.0122580528259277, "Pretrain/Step": 2692, "Pretrain/Step Time": 9.1549774967134} +{"Pretrain/Learning Rate": 4.210290606013812e-05, "Pretrain/Loss": 2.034425735473633, "Pretrain/Loss (Raw)": 2.0656752586364746, "Pretrain/Step": 2693, "Pretrain/Step Time": 9.146472338587046} +{"Pretrain/Learning Rate": 4.209671278986412e-05, "Pretrain/Loss": 2.0359575748443604, "Pretrain/Loss (Raw)": 2.23008394241333, "Pretrain/Step": 2694, "Pretrain/Step Time": 9.142667427659035} +{"Pretrain/Learning Rate": 4.209051754791662e-05, "Pretrain/Loss": 2.0344414710998535, "Pretrain/Loss (Raw)": 2.021317720413208, "Pretrain/Step": 2695, "Pretrain/Step Time": 9.146318377926946} +{"Pretrain/Learning Rate": 4.208432033501011e-05, "Pretrain/Loss": 2.035310745239258, "Pretrain/Loss (Raw)": 2.1946046352386475, "Pretrain/Step": 2696, "Pretrain/Step Time": 9.15073880366981} +{"Pretrain/Learning Rate": 4.2078121151859276e-05, "Pretrain/Loss": 2.034841537475586, "Pretrain/Loss (Raw)": 2.1184425354003906, "Pretrain/Step": 2697, "Pretrain/Step Time": 9.153083387762308} +{"Pretrain/Learning Rate": 4.2071919999179036e-05, "Pretrain/Loss": 2.0344319343566895, "Pretrain/Loss (Raw)": 1.934102177619934, "Pretrain/Step": 2698, "Pretrain/Step Time": 9.13682833313942} +{"Pretrain/Learning Rate": 4.206571687768454e-05, "Pretrain/Loss": 2.0338759422302246, "Pretrain/Loss (Raw)": 1.9202316999435425, "Pretrain/Step": 2699, "Pretrain/Step Time": 9.136324524879456} +{"Pretrain/Learning Rate": 4.2059511788091146e-05, "Pretrain/Loss": 2.036314010620117, "Pretrain/Loss (Raw)": 2.034146308898926, "Pretrain/Step": 2700, "Pretrain/Step Time": 9.13897212408483} +{"Pretrain/Learning Rate": 4.205330473111447e-05, "Pretrain/Loss": 2.03385329246521, "Pretrain/Loss (Raw)": 2.109273672103882, "Pretrain/Step": 2701, "Pretrain/Step Time": 9.14566395431757} +{"Pretrain/Learning Rate": 4.204709570747034e-05, "Pretrain/Loss": 2.0324831008911133, "Pretrain/Loss (Raw)": 1.8628240823745728, "Pretrain/Step": 2702, "Pretrain/Step Time": 9.145463103428483} +{"Pretrain/Learning Rate": 4.2040884717874804e-05, "Pretrain/Loss": 2.030752658843994, "Pretrain/Loss (Raw)": 1.90199613571167, "Pretrain/Step": 2703, "Pretrain/Step Time": 9.15106494538486} +{"Pretrain/Learning Rate": 4.203467176304414e-05, "Pretrain/Loss": 2.0319128036499023, "Pretrain/Loss (Raw)": 2.1158885955810547, "Pretrain/Step": 2704, "Pretrain/Step Time": 9.15700476616621} +{"Pretrain/Learning Rate": 4.202845684369486e-05, "Pretrain/Loss": 2.034302234649658, "Pretrain/Loss (Raw)": 2.2702829837799072, "Pretrain/Step": 2705, "Pretrain/Step Time": 9.16088543459773} +{"Pretrain/Learning Rate": 4.202223996054369e-05, "Pretrain/Loss": 2.035033702850342, "Pretrain/Loss (Raw)": 2.099053144454956, "Pretrain/Step": 2706, "Pretrain/Step Time": 9.176746858283877} +{"Pretrain/Learning Rate": 4.20160211143076e-05, "Pretrain/Loss": 2.0348849296569824, "Pretrain/Loss (Raw)": 1.8709136247634888, "Pretrain/Step": 2707, "Pretrain/Step Time": 9.206611327826977} +{"Pretrain/Learning Rate": 4.200980030570377e-05, "Pretrain/Loss": 2.0371592044830322, "Pretrain/Loss (Raw)": 2.054155111312866, "Pretrain/Step": 2708, "Pretrain/Step Time": 9.203599236905575} +{"Pretrain/Learning Rate": 4.2003577535449624e-05, "Pretrain/Loss": 2.03664231300354, "Pretrain/Loss (Raw)": 1.983920931816101, "Pretrain/Step": 2709, "Pretrain/Step Time": 9.20215155556798} +{"Pretrain/Learning Rate": 4.199735280426279e-05, "Pretrain/Loss": 2.039393901824951, "Pretrain/Loss (Raw)": 2.5365121364593506, "Pretrain/Step": 2710, "Pretrain/Step Time": 9.201395345851779} +{"Pretrain/Learning Rate": 4.199112611286113e-05, "Pretrain/Loss": 2.0401182174682617, "Pretrain/Loss (Raw)": 2.1937096118927, "Pretrain/Step": 2711, "Pretrain/Step Time": 9.204287841916084} +{"Pretrain/Learning Rate": 4.1984897461962754e-05, "Pretrain/Loss": 2.0419769287109375, "Pretrain/Loss (Raw)": 2.0848476886749268, "Pretrain/Step": 2712, "Pretrain/Step Time": 9.203110596165061} +{"Pretrain/Learning Rate": 4.197866685228596e-05, "Pretrain/Loss": 2.0397744178771973, "Pretrain/Loss (Raw)": 1.7921885251998901, "Pretrain/Step": 2713, "Pretrain/Step Time": 9.19740411825478} +{"Pretrain/Learning Rate": 4.19724342845493e-05, "Pretrain/Loss": 2.041414737701416, "Pretrain/Loss (Raw)": 2.1613380908966064, "Pretrain/Step": 2714, "Pretrain/Step Time": 9.202307203784585} +{"Pretrain/Learning Rate": 4.1966199759471535e-05, "Pretrain/Loss": 2.0438003540039062, "Pretrain/Loss (Raw)": 2.1814370155334473, "Pretrain/Step": 2715, "Pretrain/Step Time": 9.191224308684468} +{"Pretrain/Learning Rate": 4.195996327777167e-05, "Pretrain/Loss": 2.0458991527557373, "Pretrain/Loss (Raw)": 2.0638253688812256, "Pretrain/Step": 2716, "Pretrain/Step Time": 9.20903635583818} +{"Pretrain/Learning Rate": 4.195372484016893e-05, "Pretrain/Loss": 2.04567289352417, "Pretrain/Loss (Raw)": 2.0268054008483887, "Pretrain/Step": 2717, "Pretrain/Step Time": 9.194424023851752} +{"Pretrain/Learning Rate": 4.1947484447382746e-05, "Pretrain/Loss": 2.0459649562835693, "Pretrain/Loss (Raw)": 2.1235761642456055, "Pretrain/Step": 2718, "Pretrain/Step Time": 9.190692737698555} +{"Pretrain/Learning Rate": 4.194124210013279e-05, "Pretrain/Loss": 2.0445783138275146, "Pretrain/Loss (Raw)": 1.994035243988037, "Pretrain/Step": 2719, "Pretrain/Step Time": 9.187930537387729} +{"Pretrain/Learning Rate": 4.1934997799138976e-05, "Pretrain/Loss": 2.045466423034668, "Pretrain/Loss (Raw)": 2.241297483444214, "Pretrain/Step": 2720, "Pretrain/Step Time": 9.186720820143819} +{"Pretrain/Learning Rate": 4.192875154512141e-05, "Pretrain/Loss": 2.046420097351074, "Pretrain/Loss (Raw)": 2.0764448642730713, "Pretrain/Step": 2721, "Pretrain/Step Time": 9.189579777419567} +{"Pretrain/Learning Rate": 4.192250333880045e-05, "Pretrain/Loss": 2.046938180923462, "Pretrain/Loss (Raw)": 2.2591657638549805, "Pretrain/Step": 2722, "Pretrain/Step Time": 9.186748564243317} +{"Pretrain/Learning Rate": 4.191625318089666e-05, "Pretrain/Loss": 2.050832748413086, "Pretrain/Loss (Raw)": 2.5022850036621094, "Pretrain/Step": 2723, "Pretrain/Step Time": 9.18643394112587} +{"Pretrain/Learning Rate": 4.191000107213084e-05, "Pretrain/Loss": 2.0488624572753906, "Pretrain/Loss (Raw)": 1.940891146659851, "Pretrain/Step": 2724, "Pretrain/Step Time": 9.187512550503016} +{"Pretrain/Learning Rate": 4.190374701322401e-05, "Pretrain/Loss": 2.0493874549865723, "Pretrain/Loss (Raw)": 2.1140358448028564, "Pretrain/Step": 2725, "Pretrain/Step Time": 9.180574122816324} +{"Pretrain/Learning Rate": 4.1897491004897435e-05, "Pretrain/Loss": 2.0494725704193115, "Pretrain/Loss (Raw)": 2.2144267559051514, "Pretrain/Step": 2726, "Pretrain/Step Time": 9.174998769536614} +{"Pretrain/Learning Rate": 4.189123304787256e-05, "Pretrain/Loss": 2.048022985458374, "Pretrain/Loss (Raw)": 1.9358781576156616, "Pretrain/Step": 2727, "Pretrain/Step Time": 9.178834779188037} +{"Pretrain/Learning Rate": 4.1884973142871096e-05, "Pretrain/Loss": 2.051668882369995, "Pretrain/Loss (Raw)": 2.328848361968994, "Pretrain/Step": 2728, "Pretrain/Step Time": 9.181151643395424} +{"Pretrain/Learning Rate": 4.187871129061498e-05, "Pretrain/Loss": 2.0510904788970947, "Pretrain/Loss (Raw)": 2.0209157466888428, "Pretrain/Step": 2729, "Pretrain/Step Time": 9.18625353090465} +{"Pretrain/Learning Rate": 4.187244749182633e-05, "Pretrain/Loss": 2.0493907928466797, "Pretrain/Loss (Raw)": 1.9863243103027344, "Pretrain/Step": 2730, "Pretrain/Step Time": 9.19205716624856} +{"Pretrain/Learning Rate": 4.1866181747227526e-05, "Pretrain/Loss": 2.049834728240967, "Pretrain/Loss (Raw)": 2.1950159072875977, "Pretrain/Step": 2731, "Pretrain/Step Time": 9.197369271889329} +{"Pretrain/Learning Rate": 4.185991405754118e-05, "Pretrain/Loss": 2.049525260925293, "Pretrain/Loss (Raw)": 2.0937516689300537, "Pretrain/Step": 2732, "Pretrain/Step Time": 9.207561507821083} +{"Pretrain/Learning Rate": 4.185364442349008e-05, "Pretrain/Loss": 2.0482022762298584, "Pretrain/Loss (Raw)": 1.9750347137451172, "Pretrain/Step": 2733, "Pretrain/Step Time": 9.183526230975986} +{"Pretrain/Learning Rate": 4.184737284579731e-05, "Pretrain/Loss": 2.04819393157959, "Pretrain/Loss (Raw)": 1.9575848579406738, "Pretrain/Step": 2734, "Pretrain/Step Time": 9.17937234416604} +{"Pretrain/Learning Rate": 4.18410993251861e-05, "Pretrain/Loss": 2.0478429794311523, "Pretrain/Loss (Raw)": 2.0397047996520996, "Pretrain/Step": 2735, "Pretrain/Step Time": 9.171064442023635} +{"Pretrain/Learning Rate": 4.183482386237996e-05, "Pretrain/Loss": 2.0496363639831543, "Pretrain/Loss (Raw)": 2.2181081771850586, "Pretrain/Step": 2736, "Pretrain/Step Time": 9.170522863045335} +{"Pretrain/Learning Rate": 4.182854645810261e-05, "Pretrain/Loss": 2.0491976737976074, "Pretrain/Loss (Raw)": 1.8807412385940552, "Pretrain/Step": 2737, "Pretrain/Step Time": 9.166585771366954} +{"Pretrain/Learning Rate": 4.182226711307798e-05, "Pretrain/Loss": 2.0480613708496094, "Pretrain/Loss (Raw)": 1.8624430894851685, "Pretrain/Step": 2738, "Pretrain/Step Time": 9.164331564679742} +{"Pretrain/Learning Rate": 4.181598582803024e-05, "Pretrain/Loss": 2.0484209060668945, "Pretrain/Loss (Raw)": 2.1874799728393555, "Pretrain/Step": 2739, "Pretrain/Step Time": 9.16186187416315} +{"Pretrain/Learning Rate": 4.1809702603683776e-05, "Pretrain/Loss": 2.0490505695343018, "Pretrain/Loss (Raw)": 1.9404135942459106, "Pretrain/Step": 2740, "Pretrain/Step Time": 9.165234677493572} +{"Pretrain/Learning Rate": 4.1803417440763196e-05, "Pretrain/Loss": 2.0509421825408936, "Pretrain/Loss (Raw)": 2.1156699657440186, "Pretrain/Step": 2741, "Pretrain/Step Time": 9.15979128330946} +{"Pretrain/Learning Rate": 4.179713033999333e-05, "Pretrain/Loss": 2.052332639694214, "Pretrain/Loss (Raw)": 2.1756858825683594, "Pretrain/Step": 2742, "Pretrain/Step Time": 9.175533846020699} +{"Pretrain/Learning Rate": 4.1790841302099246e-05, "Pretrain/Loss": 2.0522830486297607, "Pretrain/Loss (Raw)": 1.9814995527267456, "Pretrain/Step": 2743, "Pretrain/Step Time": 9.197827350348234} +{"Pretrain/Learning Rate": 4.1784550327806226e-05, "Pretrain/Loss": 2.0526034832000732, "Pretrain/Loss (Raw)": 1.9674690961837769, "Pretrain/Step": 2744, "Pretrain/Step Time": 9.202684899792075} +{"Pretrain/Learning Rate": 4.177825741783977e-05, "Pretrain/Loss": 2.050776958465576, "Pretrain/Loss (Raw)": 2.0732831954956055, "Pretrain/Step": 2745, "Pretrain/Step Time": 9.252343760803342} +{"Pretrain/Learning Rate": 4.1771962572925606e-05, "Pretrain/Loss": 2.050949811935425, "Pretrain/Loss (Raw)": 2.143817663192749, "Pretrain/Step": 2746, "Pretrain/Step Time": 9.25454174913466} +{"Pretrain/Learning Rate": 4.176566579378968e-05, "Pretrain/Loss": 2.0509262084960938, "Pretrain/Loss (Raw)": 2.0205893516540527, "Pretrain/Step": 2747, "Pretrain/Step Time": 9.239097438752651} +{"Pretrain/Learning Rate": 4.175936708115818e-05, "Pretrain/Loss": 2.048736572265625, "Pretrain/Loss (Raw)": 1.3464432954788208, "Pretrain/Step": 2748, "Pretrain/Step Time": 9.236652217805386} +{"Pretrain/Learning Rate": 4.1753066435757494e-05, "Pretrain/Loss": 2.049875259399414, "Pretrain/Loss (Raw)": 2.1484992504119873, "Pretrain/Step": 2749, "Pretrain/Step Time": 9.224338449537754} +{"Pretrain/Learning Rate": 4.1746763858314244e-05, "Pretrain/Loss": 2.04902982711792, "Pretrain/Loss (Raw)": 1.944884181022644, "Pretrain/Step": 2750, "Pretrain/Step Time": 9.222221542149782} +{"Pretrain/Learning Rate": 4.174045934955527e-05, "Pretrain/Loss": 2.049705982208252, "Pretrain/Loss (Raw)": 2.1115634441375732, "Pretrain/Step": 2751, "Pretrain/Step Time": 9.212182121351361} +{"Pretrain/Learning Rate": 4.173415291020764e-05, "Pretrain/Loss": 2.0488739013671875, "Pretrain/Loss (Raw)": 2.1163506507873535, "Pretrain/Step": 2752, "Pretrain/Step Time": 9.209354236721992} +{"Pretrain/Learning Rate": 4.172784454099865e-05, "Pretrain/Loss": 2.0485072135925293, "Pretrain/Loss (Raw)": 1.988154649734497, "Pretrain/Step": 2753, "Pretrain/Step Time": 9.205754160881042} +{"Pretrain/Learning Rate": 4.172153424265579e-05, "Pretrain/Loss": 2.0473856925964355, "Pretrain/Loss (Raw)": 1.9914613962173462, "Pretrain/Step": 2754, "Pretrain/Step Time": 9.206513928249478} +{"Pretrain/Learning Rate": 4.171522201590682e-05, "Pretrain/Loss": 2.047394037246704, "Pretrain/Loss (Raw)": 2.1020750999450684, "Pretrain/Step": 2755, "Pretrain/Step Time": 9.20618431828916} +{"Pretrain/Learning Rate": 4.170890786147967e-05, "Pretrain/Loss": 2.0453314781188965, "Pretrain/Loss (Raw)": 1.9015133380889893, "Pretrain/Step": 2756, "Pretrain/Step Time": 9.201914137229323} +{"Pretrain/Learning Rate": 4.170259178010254e-05, "Pretrain/Loss": 2.043773651123047, "Pretrain/Loss (Raw)": 1.9213180541992188, "Pretrain/Step": 2757, "Pretrain/Step Time": 9.235907576978207} +{"Pretrain/Learning Rate": 4.169627377250382e-05, "Pretrain/Loss": 2.044248342514038, "Pretrain/Loss (Raw)": 2.1257681846618652, "Pretrain/Step": 2758, "Pretrain/Step Time": 9.233286889269948} +{"Pretrain/Learning Rate": 4.1689953839412124e-05, "Pretrain/Loss": 2.042288064956665, "Pretrain/Loss (Raw)": 1.7362608909606934, "Pretrain/Step": 2759, "Pretrain/Step Time": 9.231282103806734} +{"Pretrain/Learning Rate": 4.1683631981556314e-05, "Pretrain/Loss": 2.043292999267578, "Pretrain/Loss (Raw)": 2.271904230117798, "Pretrain/Step": 2760, "Pretrain/Step Time": 9.236854227259755} +{"Pretrain/Learning Rate": 4.167730819966545e-05, "Pretrain/Loss": 2.044140338897705, "Pretrain/Loss (Raw)": 2.0822277069091797, "Pretrain/Step": 2761, "Pretrain/Step Time": 9.237197471782565} +{"Pretrain/Learning Rate": 4.167098249446881e-05, "Pretrain/Loss": 2.0445001125335693, "Pretrain/Loss (Raw)": 2.156886339187622, "Pretrain/Step": 2762, "Pretrain/Step Time": 9.229760298505425} +{"Pretrain/Learning Rate": 4.166465486669592e-05, "Pretrain/Loss": 2.043208599090576, "Pretrain/Loss (Raw)": 1.9962471723556519, "Pretrain/Step": 2763, "Pretrain/Step Time": 9.22603976354003} +{"Pretrain/Learning Rate": 4.16583253170765e-05, "Pretrain/Loss": 2.0445733070373535, "Pretrain/Loss (Raw)": 2.2057008743286133, "Pretrain/Step": 2764, "Pretrain/Step Time": 9.22780585475266} +{"Pretrain/Learning Rate": 4.165199384634051e-05, "Pretrain/Loss": 2.0446152687072754, "Pretrain/Loss (Raw)": 2.051467180252075, "Pretrain/Step": 2765, "Pretrain/Step Time": 9.228725228458643} +{"Pretrain/Learning Rate": 4.164566045521812e-05, "Pretrain/Loss": 2.046675682067871, "Pretrain/Loss (Raw)": 2.041769027709961, "Pretrain/Step": 2766, "Pretrain/Step Time": 9.224999470636249} +{"Pretrain/Learning Rate": 4.163932514443973e-05, "Pretrain/Loss": 2.0473110675811768, "Pretrain/Loss (Raw)": 2.1284711360931396, "Pretrain/Step": 2767, "Pretrain/Step Time": 9.234479736536741} +{"Pretrain/Learning Rate": 4.163298791473596e-05, "Pretrain/Loss": 2.048553943634033, "Pretrain/Loss (Raw)": 2.1101760864257812, "Pretrain/Step": 2768, "Pretrain/Step Time": 9.235940435901284} +{"Pretrain/Learning Rate": 4.1626648766837654e-05, "Pretrain/Loss": 2.046811580657959, "Pretrain/Loss (Raw)": 1.8721323013305664, "Pretrain/Step": 2769, "Pretrain/Step Time": 9.247984224930406} +{"Pretrain/Learning Rate": 4.162030770147585e-05, "Pretrain/Loss": 2.0466976165771484, "Pretrain/Loss (Raw)": 1.9644861221313477, "Pretrain/Step": 2770, "Pretrain/Step Time": 9.227086614817381} +{"Pretrain/Learning Rate": 4.161396471938185e-05, "Pretrain/Loss": 2.046525001525879, "Pretrain/Loss (Raw)": 1.8453471660614014, "Pretrain/Step": 2771, "Pretrain/Step Time": 9.255908012390137} +{"Pretrain/Learning Rate": 4.1607619821287154e-05, "Pretrain/Loss": 2.0493903160095215, "Pretrain/Loss (Raw)": 2.1610469818115234, "Pretrain/Step": 2772, "Pretrain/Step Time": 9.24874715693295} +{"Pretrain/Learning Rate": 4.160127300792348e-05, "Pretrain/Loss": 2.049107074737549, "Pretrain/Loss (Raw)": 2.2845733165740967, "Pretrain/Step": 2773, "Pretrain/Step Time": 9.243363974615932} +{"Pretrain/Learning Rate": 4.159492428002277e-05, "Pretrain/Loss": 2.0448827743530273, "Pretrain/Loss (Raw)": 1.6293514966964722, "Pretrain/Step": 2774, "Pretrain/Step Time": 9.239011710509658} +{"Pretrain/Learning Rate": 4.1588573638317195e-05, "Pretrain/Loss": 2.045891523361206, "Pretrain/Loss (Raw)": 2.056204080581665, "Pretrain/Step": 2775, "Pretrain/Step Time": 9.240502057597041} +{"Pretrain/Learning Rate": 4.158222108353915e-05, "Pretrain/Loss": 2.0466954708099365, "Pretrain/Loss (Raw)": 2.0023534297943115, "Pretrain/Step": 2776, "Pretrain/Step Time": 9.23973759636283} +{"Pretrain/Learning Rate": 4.1575866616421224e-05, "Pretrain/Loss": 2.048210620880127, "Pretrain/Loss (Raw)": 1.997229814529419, "Pretrain/Step": 2777, "Pretrain/Step Time": 9.236896084621549} +{"Pretrain/Learning Rate": 4.156951023769625e-05, "Pretrain/Loss": 2.048595905303955, "Pretrain/Loss (Raw)": 2.0599911212921143, "Pretrain/Step": 2778, "Pretrain/Step Time": 9.235775124281645} +{"Pretrain/Learning Rate": 4.156315194809728e-05, "Pretrain/Loss": 2.0494794845581055, "Pretrain/Loss (Raw)": 2.1430959701538086, "Pretrain/Step": 2779, "Pretrain/Step Time": 9.24052057042718} +{"Pretrain/Learning Rate": 4.1556791748357584e-05, "Pretrain/Loss": 2.0477867126464844, "Pretrain/Loss (Raw)": 1.874977469444275, "Pretrain/Step": 2780, "Pretrain/Step Time": 9.243858110159636} +{"Pretrain/Learning Rate": 4.155042963921064e-05, "Pretrain/Loss": 2.0474324226379395, "Pretrain/Loss (Raw)": 2.1127288341522217, "Pretrain/Step": 2781, "Pretrain/Step Time": 9.257008086889982} +{"Pretrain/Learning Rate": 4.1544065621390165e-05, "Pretrain/Loss": 2.0468780994415283, "Pretrain/Loss (Raw)": 2.0630698204040527, "Pretrain/Step": 2782, "Pretrain/Step Time": 9.280233783647418} +{"Pretrain/Learning Rate": 4.153769969563008e-05, "Pretrain/Loss": 2.0479846000671387, "Pretrain/Loss (Raw)": 2.07118558883667, "Pretrain/Step": 2783, "Pretrain/Step Time": 9.277964828535914} +{"Pretrain/Learning Rate": 4.1531331862664545e-05, "Pretrain/Loss": 2.048022985458374, "Pretrain/Loss (Raw)": 2.0886194705963135, "Pretrain/Step": 2784, "Pretrain/Step Time": 9.27274958230555} +{"Pretrain/Learning Rate": 4.1524962123227914e-05, "Pretrain/Loss": 2.052041530609131, "Pretrain/Loss (Raw)": 2.1257505416870117, "Pretrain/Step": 2785, "Pretrain/Step Time": 9.271179802715778} +{"Pretrain/Learning Rate": 4.151859047805479e-05, "Pretrain/Loss": 2.0502467155456543, "Pretrain/Loss (Raw)": 1.7686316967010498, "Pretrain/Step": 2786, "Pretrain/Step Time": 9.269196603447199} +{"Pretrain/Learning Rate": 4.151221692787997e-05, "Pretrain/Loss": 2.049760580062866, "Pretrain/Loss (Raw)": 2.071302652359009, "Pretrain/Step": 2787, "Pretrain/Step Time": 9.274912770837545} +{"Pretrain/Learning Rate": 4.1505841473438485e-05, "Pretrain/Loss": 2.0485198497772217, "Pretrain/Loss (Raw)": 2.090069532394409, "Pretrain/Step": 2788, "Pretrain/Step Time": 9.282566038891673} +{"Pretrain/Learning Rate": 4.149946411546558e-05, "Pretrain/Loss": 2.047426700592041, "Pretrain/Loss (Raw)": 2.2015748023986816, "Pretrain/Step": 2789, "Pretrain/Step Time": 9.250964960083365} +{"Pretrain/Learning Rate": 4.1493084854696726e-05, "Pretrain/Loss": 2.0478403568267822, "Pretrain/Loss (Raw)": 2.072976589202881, "Pretrain/Step": 2790, "Pretrain/Step Time": 9.258815750479698} +{"Pretrain/Learning Rate": 4.1486703691867616e-05, "Pretrain/Loss": 2.0495615005493164, "Pretrain/Loss (Raw)": 2.1411428451538086, "Pretrain/Step": 2791, "Pretrain/Step Time": 9.266548171639442} +{"Pretrain/Learning Rate": 4.148032062771414e-05, "Pretrain/Loss": 2.0481553077697754, "Pretrain/Loss (Raw)": 1.8532781600952148, "Pretrain/Step": 2792, "Pretrain/Step Time": 9.272510239854455} +{"Pretrain/Learning Rate": 4.147393566297244e-05, "Pretrain/Loss": 2.0473227500915527, "Pretrain/Loss (Raw)": 1.9747599363327026, "Pretrain/Step": 2793, "Pretrain/Step Time": 9.266592970117927} +{"Pretrain/Learning Rate": 4.1467548798378847e-05, "Pretrain/Loss": 2.04738187789917, "Pretrain/Loss (Raw)": 2.000483751296997, "Pretrain/Step": 2794, "Pretrain/Step Time": 9.307112403213978} +{"Pretrain/Learning Rate": 4.1461160034669925e-05, "Pretrain/Loss": 2.0493240356445312, "Pretrain/Loss (Raw)": 2.160285234451294, "Pretrain/Step": 2795, "Pretrain/Step Time": 9.300911026075482} +{"Pretrain/Learning Rate": 4.145476937258247e-05, "Pretrain/Loss": 2.0494704246520996, "Pretrain/Loss (Raw)": 2.0808701515197754, "Pretrain/Step": 2796, "Pretrain/Step Time": 9.32693943940103} +{"Pretrain/Learning Rate": 4.144837681285346e-05, "Pretrain/Loss": 2.050199031829834, "Pretrain/Loss (Raw)": 2.20318865776062, "Pretrain/Step": 2797, "Pretrain/Step Time": 9.335734704509377} +{"Pretrain/Learning Rate": 4.1441982356220144e-05, "Pretrain/Loss": 2.0500025749206543, "Pretrain/Loss (Raw)": 1.9502592086791992, "Pretrain/Step": 2798, "Pretrain/Step Time": 9.337015165016055} +{"Pretrain/Learning Rate": 4.1435586003419935e-05, "Pretrain/Loss": 2.0494468212127686, "Pretrain/Loss (Raw)": 2.1535587310791016, "Pretrain/Step": 2799, "Pretrain/Step Time": 9.339187264442444} +{"Pretrain/Learning Rate": 4.1429187755190504e-05, "Pretrain/Loss": 2.0497891902923584, "Pretrain/Loss (Raw)": 1.9591014385223389, "Pretrain/Step": 2800, "Pretrain/Step Time": 9.328249417245388} +{"Pretrain/Learning Rate": 4.1422787612269726e-05, "Pretrain/Loss": 2.0502450466156006, "Pretrain/Loss (Raw)": 2.2175791263580322, "Pretrain/Step": 2801, "Pretrain/Step Time": 9.322693347930908} +{"Pretrain/Learning Rate": 4.1416385575395686e-05, "Pretrain/Loss": 2.0519211292266846, "Pretrain/Loss (Raw)": 1.998043417930603, "Pretrain/Step": 2802, "Pretrain/Step Time": 9.32128619030118} +{"Pretrain/Learning Rate": 4.140998164530672e-05, "Pretrain/Loss": 2.053811550140381, "Pretrain/Loss (Raw)": 2.3612117767333984, "Pretrain/Step": 2803, "Pretrain/Step Time": 9.32196949981153} +{"Pretrain/Learning Rate": 4.140357582274133e-05, "Pretrain/Loss": 2.0553970336914062, "Pretrain/Loss (Raw)": 2.227212429046631, "Pretrain/Step": 2804, "Pretrain/Step Time": 9.317979585379362} +{"Pretrain/Learning Rate": 4.1397168108438286e-05, "Pretrain/Loss": 2.0557730197906494, "Pretrain/Loss (Raw)": 2.051112174987793, "Pretrain/Step": 2805, "Pretrain/Step Time": 9.311417987570167} +{"Pretrain/Learning Rate": 4.139075850313655e-05, "Pretrain/Loss": 2.0534729957580566, "Pretrain/Loss (Raw)": 1.842976689338684, "Pretrain/Step": 2806, "Pretrain/Step Time": 9.31916793063283} +{"Pretrain/Learning Rate": 4.1384347007575305e-05, "Pretrain/Loss": 2.051809310913086, "Pretrain/Loss (Raw)": 1.9311788082122803, "Pretrain/Step": 2807, "Pretrain/Step Time": 9.313798166811466} +{"Pretrain/Learning Rate": 4.137793362249396e-05, "Pretrain/Loss": 2.052001953125, "Pretrain/Loss (Raw)": 2.2770278453826904, "Pretrain/Step": 2808, "Pretrain/Step Time": 9.31648469530046} +{"Pretrain/Learning Rate": 4.137151834863213e-05, "Pretrain/Loss": 2.05037260055542, "Pretrain/Loss (Raw)": 2.0413661003112793, "Pretrain/Step": 2809, "Pretrain/Step Time": 9.319725571200252} +{"Pretrain/Learning Rate": 4.136510118672966e-05, "Pretrain/Loss": 2.0495247840881348, "Pretrain/Loss (Raw)": 2.0661253929138184, "Pretrain/Step": 2810, "Pretrain/Step Time": 9.296428276225924} +{"Pretrain/Learning Rate": 4.135868213752661e-05, "Pretrain/Loss": 2.05246639251709, "Pretrain/Loss (Raw)": 2.075183629989624, "Pretrain/Step": 2811, "Pretrain/Step Time": 9.28747426904738} +{"Pretrain/Learning Rate": 4.135226120176325e-05, "Pretrain/Loss": 2.050546169281006, "Pretrain/Loss (Raw)": 1.942751169204712, "Pretrain/Step": 2812, "Pretrain/Step Time": 9.288424169644713} +{"Pretrain/Learning Rate": 4.134583838018007e-05, "Pretrain/Loss": 2.049595355987549, "Pretrain/Loss (Raw)": 1.9390289783477783, "Pretrain/Step": 2813, "Pretrain/Step Time": 9.279798623174429} +{"Pretrain/Learning Rate": 4.133941367351779e-05, "Pretrain/Loss": 2.0501136779785156, "Pretrain/Loss (Raw)": 2.2205159664154053, "Pretrain/Step": 2814, "Pretrain/Step Time": 9.281205389648676} +{"Pretrain/Learning Rate": 4.133298708251733e-05, "Pretrain/Loss": 2.0509557723999023, "Pretrain/Loss (Raw)": 1.9867674112319946, "Pretrain/Step": 2815, "Pretrain/Step Time": 9.250921364873648} +{"Pretrain/Learning Rate": 4.132655860791983e-05, "Pretrain/Loss": 2.052666187286377, "Pretrain/Loss (Raw)": 1.9168466329574585, "Pretrain/Step": 2816, "Pretrain/Step Time": 9.251597914844751} +{"Pretrain/Learning Rate": 4.132012825046666e-05, "Pretrain/Loss": 2.050680160522461, "Pretrain/Loss (Raw)": 1.9567289352416992, "Pretrain/Step": 2817, "Pretrain/Step Time": 9.256031822413206} +{"Pretrain/Learning Rate": 4.13136960108994e-05, "Pretrain/Loss": 2.049933910369873, "Pretrain/Loss (Raw)": 1.7948261499404907, "Pretrain/Step": 2818, "Pretrain/Step Time": 9.255671000108123} +{"Pretrain/Learning Rate": 4.130726188995985e-05, "Pretrain/Loss": 2.0538721084594727, "Pretrain/Loss (Raw)": 2.1301324367523193, "Pretrain/Step": 2819, "Pretrain/Step Time": 9.240870589390397} +{"Pretrain/Learning Rate": 4.1300825888390006e-05, "Pretrain/Loss": 2.054255723953247, "Pretrain/Loss (Raw)": 2.061356544494629, "Pretrain/Step": 2820, "Pretrain/Step Time": 9.236778421327472} +{"Pretrain/Learning Rate": 4.1294388006932114e-05, "Pretrain/Loss": 2.0544400215148926, "Pretrain/Loss (Raw)": 2.0892748832702637, "Pretrain/Step": 2821, "Pretrain/Step Time": 9.237951224669814} +{"Pretrain/Learning Rate": 4.128794824632861e-05, "Pretrain/Loss": 2.05462646484375, "Pretrain/Loss (Raw)": 2.253952980041504, "Pretrain/Step": 2822, "Pretrain/Step Time": 9.256884509697556} +{"Pretrain/Learning Rate": 4.1281506607322167e-05, "Pretrain/Loss": 2.053645610809326, "Pretrain/Loss (Raw)": 1.8957456350326538, "Pretrain/Step": 2823, "Pretrain/Step Time": 9.247054992243648} +{"Pretrain/Learning Rate": 4.1275063090655666e-05, "Pretrain/Loss": 2.0530073642730713, "Pretrain/Loss (Raw)": 2.112905502319336, "Pretrain/Step": 2824, "Pretrain/Step Time": 9.250343011692166} +{"Pretrain/Learning Rate": 4.126861769707219e-05, "Pretrain/Loss": 2.0504355430603027, "Pretrain/Loss (Raw)": 1.7892450094223022, "Pretrain/Step": 2825, "Pretrain/Step Time": 9.252929922193289} +{"Pretrain/Learning Rate": 4.126217042731507e-05, "Pretrain/Loss": 2.0512256622314453, "Pretrain/Loss (Raw)": 2.035264015197754, "Pretrain/Step": 2826, "Pretrain/Step Time": 9.251517187803984} +{"Pretrain/Learning Rate": 4.125572128212781e-05, "Pretrain/Loss": 2.0509839057922363, "Pretrain/Loss (Raw)": 1.8892627954483032, "Pretrain/Step": 2827, "Pretrain/Step Time": 9.249060466885567} +{"Pretrain/Learning Rate": 4.124927026225419e-05, "Pretrain/Loss": 2.050945281982422, "Pretrain/Loss (Raw)": 2.029221773147583, "Pretrain/Step": 2828, "Pretrain/Step Time": 9.248702581971884} +{"Pretrain/Learning Rate": 4.124281736843815e-05, "Pretrain/Loss": 2.0499634742736816, "Pretrain/Loss (Raw)": 1.983605146408081, "Pretrain/Step": 2829, "Pretrain/Step Time": 9.247896358370781} +{"Pretrain/Learning Rate": 4.1236362601423865e-05, "Pretrain/Loss": 2.0515365600585938, "Pretrain/Loss (Raw)": 2.064182996749878, "Pretrain/Step": 2830, "Pretrain/Step Time": 9.247035559266806} +{"Pretrain/Learning Rate": 4.122990596195574e-05, "Pretrain/Loss": 2.051884412765503, "Pretrain/Loss (Raw)": 1.9465038776397705, "Pretrain/Step": 2831, "Pretrain/Step Time": 9.24254542030394} +{"Pretrain/Learning Rate": 4.122344745077838e-05, "Pretrain/Loss": 2.0518386363983154, "Pretrain/Loss (Raw)": 2.110025405883789, "Pretrain/Step": 2832, "Pretrain/Step Time": 9.233143247663975} +{"Pretrain/Learning Rate": 4.121698706863662e-05, "Pretrain/Loss": 2.049997091293335, "Pretrain/Loss (Raw)": 2.03456449508667, "Pretrain/Step": 2833, "Pretrain/Step Time": 9.233261736109853} +{"Pretrain/Learning Rate": 4.121052481627549e-05, "Pretrain/Loss": 2.0494775772094727, "Pretrain/Loss (Raw)": 2.0325419902801514, "Pretrain/Step": 2834, "Pretrain/Step Time": 9.219461245462298} +{"Pretrain/Learning Rate": 4.120406069444025e-05, "Pretrain/Loss": 2.051337718963623, "Pretrain/Loss (Raw)": 2.1090235710144043, "Pretrain/Step": 2835, "Pretrain/Step Time": 9.190024165436625} +{"Pretrain/Learning Rate": 4.119759470387637e-05, "Pretrain/Loss": 2.0498785972595215, "Pretrain/Loss (Raw)": 1.867390751838684, "Pretrain/Step": 2836, "Pretrain/Step Time": 9.192176533862948} +{"Pretrain/Learning Rate": 4.1191126845329554e-05, "Pretrain/Loss": 2.0523762702941895, "Pretrain/Loss (Raw)": 2.303637981414795, "Pretrain/Step": 2837, "Pretrain/Step Time": 9.1928405854851} +{"Pretrain/Learning Rate": 4.118465711954569e-05, "Pretrain/Loss": 2.0488317012786865, "Pretrain/Loss (Raw)": 2.082803249359131, "Pretrain/Step": 2838, "Pretrain/Step Time": 9.193421004340053} +{"Pretrain/Learning Rate": 4.1178185527270905e-05, "Pretrain/Loss": 2.0456418991088867, "Pretrain/Loss (Raw)": 1.7854293584823608, "Pretrain/Step": 2839, "Pretrain/Step Time": 9.19264305010438} +{"Pretrain/Learning Rate": 4.1171712069251534e-05, "Pretrain/Loss": 2.045546054840088, "Pretrain/Loss (Raw)": 2.072547435760498, "Pretrain/Step": 2840, "Pretrain/Step Time": 9.208646973595023} +{"Pretrain/Learning Rate": 4.116523674623412e-05, "Pretrain/Loss": 2.04789137840271, "Pretrain/Loss (Raw)": 2.0924031734466553, "Pretrain/Step": 2841, "Pretrain/Step Time": 9.212249837815762} +{"Pretrain/Learning Rate": 4.115875955896543e-05, "Pretrain/Loss": 2.0478973388671875, "Pretrain/Loss (Raw)": 2.1620981693267822, "Pretrain/Step": 2842, "Pretrain/Step Time": 9.206033255904913} +{"Pretrain/Learning Rate": 4.115228050819244e-05, "Pretrain/Loss": 2.046700954437256, "Pretrain/Loss (Raw)": 2.0283164978027344, "Pretrain/Step": 2843, "Pretrain/Step Time": 9.204092361032963} +{"Pretrain/Learning Rate": 4.114579959466235e-05, "Pretrain/Loss": 2.046788454055786, "Pretrain/Loss (Raw)": 2.0750105381011963, "Pretrain/Step": 2844, "Pretrain/Step Time": 9.19630534760654} +{"Pretrain/Learning Rate": 4.113931681912257e-05, "Pretrain/Loss": 2.0480589866638184, "Pretrain/Loss (Raw)": 2.189450979232788, "Pretrain/Step": 2845, "Pretrain/Step Time": 9.207311382517219} +{"Pretrain/Learning Rate": 4.113283218232073e-05, "Pretrain/Loss": 2.045374870300293, "Pretrain/Loss (Raw)": 1.7800074815750122, "Pretrain/Step": 2846, "Pretrain/Step Time": 9.203488850966096} +{"Pretrain/Learning Rate": 4.112634568500466e-05, "Pretrain/Loss": 2.0463953018188477, "Pretrain/Loss (Raw)": 2.124638319015503, "Pretrain/Step": 2847, "Pretrain/Step Time": 9.206106211990118} +{"Pretrain/Learning Rate": 4.111985732792242e-05, "Pretrain/Loss": 2.046750068664551, "Pretrain/Loss (Raw)": 2.286686420440674, "Pretrain/Step": 2848, "Pretrain/Step Time": 9.213707892224193} +{"Pretrain/Learning Rate": 4.111336711182226e-05, "Pretrain/Loss": 2.0471551418304443, "Pretrain/Loss (Raw)": 2.1283154487609863, "Pretrain/Step": 2849, "Pretrain/Step Time": 9.208862351253629} +{"Pretrain/Learning Rate": 4.110687503745269e-05, "Pretrain/Loss": 2.045177459716797, "Pretrain/Loss (Raw)": 2.005997657775879, "Pretrain/Step": 2850, "Pretrain/Step Time": 9.211459396407008} +{"Pretrain/Learning Rate": 4.1100381105562394e-05, "Pretrain/Loss": 2.042048454284668, "Pretrain/Loss (Raw)": 2.10178804397583, "Pretrain/Step": 2851, "Pretrain/Step Time": 9.215549491345882} +{"Pretrain/Learning Rate": 4.109388531690027e-05, "Pretrain/Loss": 2.039875030517578, "Pretrain/Loss (Raw)": 1.6627061367034912, "Pretrain/Step": 2852, "Pretrain/Step Time": 9.21019752882421} +{"Pretrain/Learning Rate": 4.108738767221546e-05, "Pretrain/Loss": 2.039017677307129, "Pretrain/Loss (Raw)": 2.00429630279541, "Pretrain/Step": 2853, "Pretrain/Step Time": 9.21688031218946} +{"Pretrain/Learning Rate": 4.108088817225729e-05, "Pretrain/Loss": 2.037144660949707, "Pretrain/Loss (Raw)": 1.9746581315994263, "Pretrain/Step": 2854, "Pretrain/Step Time": 9.217791147530079} +{"Pretrain/Learning Rate": 4.1074386817775334e-05, "Pretrain/Loss": 2.037355899810791, "Pretrain/Loss (Raw)": 1.9629361629486084, "Pretrain/Step": 2855, "Pretrain/Step Time": 9.21773492358625} +{"Pretrain/Learning Rate": 4.106788360951934e-05, "Pretrain/Loss": 2.0341427326202393, "Pretrain/Loss (Raw)": 1.917545199394226, "Pretrain/Step": 2856, "Pretrain/Step Time": 9.229100732132792} +{"Pretrain/Learning Rate": 4.106137854823929e-05, "Pretrain/Loss": 2.034147024154663, "Pretrain/Loss (Raw)": 2.021486759185791, "Pretrain/Step": 2857, "Pretrain/Step Time": 9.218199465423822} +{"Pretrain/Learning Rate": 4.1054871634685385e-05, "Pretrain/Loss": 2.03291916847229, "Pretrain/Loss (Raw)": 1.8291321992874146, "Pretrain/Step": 2858, "Pretrain/Step Time": 9.21252472139895} +{"Pretrain/Learning Rate": 4.104836286960802e-05, "Pretrain/Loss": 2.032212018966675, "Pretrain/Loss (Raw)": 2.1045126914978027, "Pretrain/Step": 2859, "Pretrain/Step Time": 9.20231269672513} +{"Pretrain/Learning Rate": 4.1041852253757836e-05, "Pretrain/Loss": 2.032683849334717, "Pretrain/Loss (Raw)": 2.1541645526885986, "Pretrain/Step": 2860, "Pretrain/Step Time": 9.205665942281485} +{"Pretrain/Learning Rate": 4.103533978788566e-05, "Pretrain/Loss": 2.034299373626709, "Pretrain/Loss (Raw)": 2.1817924976348877, "Pretrain/Step": 2861, "Pretrain/Step Time": 9.202029002830386} +{"Pretrain/Learning Rate": 4.1028825472742536e-05, "Pretrain/Loss": 2.03627872467041, "Pretrain/Loss (Raw)": 2.210970640182495, "Pretrain/Step": 2862, "Pretrain/Step Time": 9.207925794646144} +{"Pretrain/Learning Rate": 4.1022309309079734e-05, "Pretrain/Loss": 2.0383496284484863, "Pretrain/Loss (Raw)": 2.304779052734375, "Pretrain/Step": 2863, "Pretrain/Step Time": 9.209013490006328} +{"Pretrain/Learning Rate": 4.1015791297648716e-05, "Pretrain/Loss": 2.03753662109375, "Pretrain/Loss (Raw)": 2.1140196323394775, "Pretrain/Step": 2864, "Pretrain/Step Time": 9.20902307331562} +{"Pretrain/Learning Rate": 4.100927143920118e-05, "Pretrain/Loss": 2.039479970932007, "Pretrain/Loss (Raw)": 2.1295156478881836, "Pretrain/Step": 2865, "Pretrain/Step Time": 9.212386805564165} +{"Pretrain/Learning Rate": 4.100274973448902e-05, "Pretrain/Loss": 2.039987087249756, "Pretrain/Loss (Raw)": 1.9273377656936646, "Pretrain/Step": 2866, "Pretrain/Step Time": 9.213268741965294} +{"Pretrain/Learning Rate": 4.099622618426436e-05, "Pretrain/Loss": 2.0381669998168945, "Pretrain/Loss (Raw)": 1.9545072317123413, "Pretrain/Step": 2867, "Pretrain/Step Time": 9.215175490826368} +{"Pretrain/Learning Rate": 4.098970078927951e-05, "Pretrain/Loss": 2.041501522064209, "Pretrain/Loss (Raw)": 2.3672499656677246, "Pretrain/Step": 2868, "Pretrain/Step Time": 9.214299911633134} +{"Pretrain/Learning Rate": 4.0983173550287026e-05, "Pretrain/Loss": 2.0412092208862305, "Pretrain/Loss (Raw)": 2.078244209289551, "Pretrain/Step": 2869, "Pretrain/Step Time": 9.211583316326141} +{"Pretrain/Learning Rate": 4.0976644468039646e-05, "Pretrain/Loss": 2.0403554439544678, "Pretrain/Loss (Raw)": 2.066405773162842, "Pretrain/Step": 2870, "Pretrain/Step Time": 9.20401014201343} +{"Pretrain/Learning Rate": 4.097011354329035e-05, "Pretrain/Loss": 2.041419267654419, "Pretrain/Loss (Raw)": 2.1176705360412598, "Pretrain/Step": 2871, "Pretrain/Step Time": 9.176508465781808} +{"Pretrain/Learning Rate": 4.096358077679231e-05, "Pretrain/Loss": 2.045461416244507, "Pretrain/Loss (Raw)": 2.484853982925415, "Pretrain/Step": 2872, "Pretrain/Step Time": 9.17310611717403} +{"Pretrain/Learning Rate": 4.0957046169298895e-05, "Pretrain/Loss": 2.0455379486083984, "Pretrain/Loss (Raw)": 2.083096742630005, "Pretrain/Step": 2873, "Pretrain/Step Time": 9.117992881685495} +{"Pretrain/Learning Rate": 4.095050972156374e-05, "Pretrain/Loss": 2.043699264526367, "Pretrain/Loss (Raw)": 1.9084354639053345, "Pretrain/Step": 2874, "Pretrain/Step Time": 9.11585534363985} +{"Pretrain/Learning Rate": 4.0943971434340633e-05, "Pretrain/Loss": 2.043238878250122, "Pretrain/Loss (Raw)": 1.9616763591766357, "Pretrain/Step": 2875, "Pretrain/Step Time": 9.108198437839746} +{"Pretrain/Learning Rate": 4.093743130838361e-05, "Pretrain/Loss": 2.044914722442627, "Pretrain/Loss (Raw)": 1.560966968536377, "Pretrain/Step": 2876, "Pretrain/Step Time": 9.107409475371242} +{"Pretrain/Learning Rate": 4.093088934444692e-05, "Pretrain/Loss": 2.043757915496826, "Pretrain/Loss (Raw)": 2.000427007675171, "Pretrain/Step": 2877, "Pretrain/Step Time": 9.11023772135377} +{"Pretrain/Learning Rate": 4.092434554328499e-05, "Pretrain/Loss": 2.0443315505981445, "Pretrain/Loss (Raw)": 2.0182676315307617, "Pretrain/Step": 2878, "Pretrain/Step Time": 9.115558939054608} +{"Pretrain/Learning Rate": 4.09177999056525e-05, "Pretrain/Loss": 2.04242205619812, "Pretrain/Loss (Raw)": 1.8671692609786987, "Pretrain/Step": 2879, "Pretrain/Step Time": 9.125118354335427} +{"Pretrain/Learning Rate": 4.0911252432304316e-05, "Pretrain/Loss": 2.042938709259033, "Pretrain/Loss (Raw)": 2.182471513748169, "Pretrain/Step": 2880, "Pretrain/Step Time": 9.125759650021791} +{"Pretrain/Learning Rate": 4.0904703123995516e-05, "Pretrain/Loss": 2.0430822372436523, "Pretrain/Loss (Raw)": 2.006558418273926, "Pretrain/Step": 2881, "Pretrain/Step Time": 9.135952519252896} +{"Pretrain/Learning Rate": 4.0898151981481416e-05, "Pretrain/Loss": 2.043179512023926, "Pretrain/Loss (Raw)": 2.0039193630218506, "Pretrain/Step": 2882, "Pretrain/Step Time": 9.148595256730914} +{"Pretrain/Learning Rate": 4.089159900551752e-05, "Pretrain/Loss": 2.040881633758545, "Pretrain/Loss (Raw)": 1.807936429977417, "Pretrain/Step": 2883, "Pretrain/Step Time": 9.186308333650231} +{"Pretrain/Learning Rate": 4.0885044196859537e-05, "Pretrain/Loss": 2.0421459674835205, "Pretrain/Loss (Raw)": 2.0633232593536377, "Pretrain/Step": 2884, "Pretrain/Step Time": 9.186239380389452} +{"Pretrain/Learning Rate": 4.08784875562634e-05, "Pretrain/Loss": 2.042140245437622, "Pretrain/Loss (Raw)": 1.9205882549285889, "Pretrain/Step": 2885, "Pretrain/Step Time": 9.159301238134503} +{"Pretrain/Learning Rate": 4.087192908448526e-05, "Pretrain/Loss": 2.041552782058716, "Pretrain/Loss (Raw)": 2.0505847930908203, "Pretrain/Step": 2886, "Pretrain/Step Time": 9.155872248113155} +{"Pretrain/Learning Rate": 4.086536878228147e-05, "Pretrain/Loss": 2.0449585914611816, "Pretrain/Loss (Raw)": 2.1722123622894287, "Pretrain/Step": 2887, "Pretrain/Step Time": 9.159469179809093} +{"Pretrain/Learning Rate": 4.0858806650408586e-05, "Pretrain/Loss": 2.0436289310455322, "Pretrain/Loss (Raw)": 2.101698398590088, "Pretrain/Step": 2888, "Pretrain/Step Time": 9.152494981884956} +{"Pretrain/Learning Rate": 4.08522426896234e-05, "Pretrain/Loss": 2.0428245067596436, "Pretrain/Loss (Raw)": 1.9792550802230835, "Pretrain/Step": 2889, "Pretrain/Step Time": 9.149087239056826} +{"Pretrain/Learning Rate": 4.0845676900682884e-05, "Pretrain/Loss": 2.0425243377685547, "Pretrain/Loss (Raw)": 2.1184723377227783, "Pretrain/Step": 2890, "Pretrain/Step Time": 9.198236851021647} +{"Pretrain/Learning Rate": 4.0839109284344235e-05, "Pretrain/Loss": 2.0434446334838867, "Pretrain/Loss (Raw)": 2.114035129547119, "Pretrain/Step": 2891, "Pretrain/Step Time": 9.19420069642365} +{"Pretrain/Learning Rate": 4.083253984136487e-05, "Pretrain/Loss": 2.0417704582214355, "Pretrain/Loss (Raw)": 1.991391897201538, "Pretrain/Step": 2892, "Pretrain/Step Time": 9.198188474401832} +{"Pretrain/Learning Rate": 4.0825968572502404e-05, "Pretrain/Loss": 2.040163516998291, "Pretrain/Loss (Raw)": 1.8457996845245361, "Pretrain/Step": 2893, "Pretrain/Step Time": 9.199921166524291} +{"Pretrain/Learning Rate": 4.081939547851467e-05, "Pretrain/Loss": 2.0390548706054688, "Pretrain/Loss (Raw)": 1.8998702764511108, "Pretrain/Step": 2894, "Pretrain/Step Time": 9.20250940695405} +{"Pretrain/Learning Rate": 4.0812820560159705e-05, "Pretrain/Loss": 2.037964344024658, "Pretrain/Loss (Raw)": 1.9888476133346558, "Pretrain/Step": 2895, "Pretrain/Step Time": 9.196726404130459} +{"Pretrain/Learning Rate": 4.0806243818195765e-05, "Pretrain/Loss": 2.0362563133239746, "Pretrain/Loss (Raw)": 1.891593337059021, "Pretrain/Step": 2896, "Pretrain/Step Time": 9.187521621584892} +{"Pretrain/Learning Rate": 4.07996652533813e-05, "Pretrain/Loss": 2.0376484394073486, "Pretrain/Loss (Raw)": 2.0503129959106445, "Pretrain/Step": 2897, "Pretrain/Step Time": 9.177854089066386} +{"Pretrain/Learning Rate": 4.0793084866474986e-05, "Pretrain/Loss": 2.0389530658721924, "Pretrain/Loss (Raw)": 2.131495952606201, "Pretrain/Step": 2898, "Pretrain/Step Time": 9.183037200942636} +{"Pretrain/Learning Rate": 4.078650265823571e-05, "Pretrain/Loss": 2.0418238639831543, "Pretrain/Loss (Raw)": 2.2127878665924072, "Pretrain/Step": 2899, "Pretrain/Step Time": 9.162398027256131} +{"Pretrain/Learning Rate": 4.077991862942256e-05, "Pretrain/Loss": 2.0401368141174316, "Pretrain/Loss (Raw)": 1.9450981616973877, "Pretrain/Step": 2900, "Pretrain/Step Time": 9.161960547789931} +{"Pretrain/Learning Rate": 4.0773332780794834e-05, "Pretrain/Loss": 2.0377156734466553, "Pretrain/Loss (Raw)": 1.9746640920639038, "Pretrain/Step": 2901, "Pretrain/Step Time": 9.15980365499854} +{"Pretrain/Learning Rate": 4.076674511311205e-05, "Pretrain/Loss": 2.0399863719940186, "Pretrain/Loss (Raw)": 1.9200167655944824, "Pretrain/Step": 2902, "Pretrain/Step Time": 9.172205964103341} +{"Pretrain/Learning Rate": 4.0760155627133924e-05, "Pretrain/Loss": 2.0370116233825684, "Pretrain/Loss (Raw)": 1.6754353046417236, "Pretrain/Step": 2903, "Pretrain/Step Time": 9.17747782357037} +{"Pretrain/Learning Rate": 4.075356432362037e-05, "Pretrain/Loss": 2.0378947257995605, "Pretrain/Loss (Raw)": 2.115391731262207, "Pretrain/Step": 2904, "Pretrain/Step Time": 9.17568033002317} +{"Pretrain/Learning Rate": 4.074697120333156e-05, "Pretrain/Loss": 2.038102149963379, "Pretrain/Loss (Raw)": 2.0237858295440674, "Pretrain/Step": 2905, "Pretrain/Step Time": 9.174655565991998} +{"Pretrain/Learning Rate": 4.0740376267027836e-05, "Pretrain/Loss": 2.0383901596069336, "Pretrain/Loss (Raw)": 2.0968406200408936, "Pretrain/Step": 2906, "Pretrain/Step Time": 9.182596167549491} +{"Pretrain/Learning Rate": 4.0733779515469736e-05, "Pretrain/Loss": 2.0383224487304688, "Pretrain/Loss (Raw)": 2.1344494819641113, "Pretrain/Step": 2907, "Pretrain/Step Time": 9.176256909966469} +{"Pretrain/Learning Rate": 4.072718094941805e-05, "Pretrain/Loss": 2.036625623703003, "Pretrain/Loss (Raw)": 1.6577563285827637, "Pretrain/Step": 2908, "Pretrain/Step Time": 9.158541409298778} +{"Pretrain/Learning Rate": 4.0720580569633746e-05, "Pretrain/Loss": 2.0354807376861572, "Pretrain/Loss (Raw)": 1.9661757946014404, "Pretrain/Step": 2909, "Pretrain/Step Time": 9.14629695750773} +{"Pretrain/Learning Rate": 4.0713978376878016e-05, "Pretrain/Loss": 2.0368003845214844, "Pretrain/Loss (Raw)": 2.23201847076416, "Pretrain/Step": 2910, "Pretrain/Step Time": 9.112590176984668} +{"Pretrain/Learning Rate": 4.070737437191224e-05, "Pretrain/Loss": 2.0373573303222656, "Pretrain/Loss (Raw)": 2.142487049102783, "Pretrain/Step": 2911, "Pretrain/Step Time": 9.110712444409728} +{"Pretrain/Learning Rate": 4.0700768555498045e-05, "Pretrain/Loss": 2.037733554840088, "Pretrain/Loss (Raw)": 2.1367480754852295, "Pretrain/Step": 2912, "Pretrain/Step Time": 9.108647340908647} +{"Pretrain/Learning Rate": 4.069416092839724e-05, "Pretrain/Loss": 2.0372142791748047, "Pretrain/Loss (Raw)": 2.059296131134033, "Pretrain/Step": 2913, "Pretrain/Step Time": 9.11324923671782} +{"Pretrain/Learning Rate": 4.068755149137184e-05, "Pretrain/Loss": 2.03871488571167, "Pretrain/Loss (Raw)": 1.9607032537460327, "Pretrain/Step": 2914, "Pretrain/Step Time": 9.115534042939544} +{"Pretrain/Learning Rate": 4.0680940245184076e-05, "Pretrain/Loss": 2.0380923748016357, "Pretrain/Loss (Raw)": 1.9916117191314697, "Pretrain/Step": 2915, "Pretrain/Step Time": 9.111288696527481} +{"Pretrain/Learning Rate": 4.06743271905964e-05, "Pretrain/Loss": 2.0395736694335938, "Pretrain/Loss (Raw)": 2.2796802520751953, "Pretrain/Step": 2916, "Pretrain/Step Time": 9.103631801903248} +{"Pretrain/Learning Rate": 4.066771232837144e-05, "Pretrain/Loss": 2.035663604736328, "Pretrain/Loss (Raw)": 1.7010704278945923, "Pretrain/Step": 2917, "Pretrain/Step Time": 9.114098822697997} +{"Pretrain/Learning Rate": 4.066109565927208e-05, "Pretrain/Loss": 2.0342676639556885, "Pretrain/Loss (Raw)": 1.894315242767334, "Pretrain/Step": 2918, "Pretrain/Step Time": 9.106598876416683} +{"Pretrain/Learning Rate": 4.0654477184061356e-05, "Pretrain/Loss": 2.0324532985687256, "Pretrain/Loss (Raw)": 1.9089139699935913, "Pretrain/Step": 2919, "Pretrain/Step Time": 9.113972356542945} +{"Pretrain/Learning Rate": 4.064785690350257e-05, "Pretrain/Loss": 2.0337886810302734, "Pretrain/Loss (Raw)": 2.0242104530334473, "Pretrain/Step": 2920, "Pretrain/Step Time": 9.106188045814633} +{"Pretrain/Learning Rate": 4.064123481835919e-05, "Pretrain/Loss": 2.035212278366089, "Pretrain/Loss (Raw)": 2.156965732574463, "Pretrain/Step": 2921, "Pretrain/Step Time": 9.108656058087945} +{"Pretrain/Learning Rate": 4.0634610929394893e-05, "Pretrain/Loss": 2.035346508026123, "Pretrain/Loss (Raw)": 2.0176775455474854, "Pretrain/Step": 2922, "Pretrain/Step Time": 9.065845508128405} +{"Pretrain/Learning Rate": 4.06279852373736e-05, "Pretrain/Loss": 2.035691261291504, "Pretrain/Loss (Raw)": 2.20439076423645, "Pretrain/Step": 2923, "Pretrain/Step Time": 9.065152496099472} +{"Pretrain/Learning Rate": 4.0621357743059415e-05, "Pretrain/Loss": 2.03231143951416, "Pretrain/Loss (Raw)": 1.6482555866241455, "Pretrain/Step": 2924, "Pretrain/Step Time": 9.026354476809502} +{"Pretrain/Learning Rate": 4.061472844721664e-05, "Pretrain/Loss": 2.030561923980713, "Pretrain/Loss (Raw)": 1.9792554378509521, "Pretrain/Step": 2925, "Pretrain/Step Time": 9.021314725279808} +{"Pretrain/Learning Rate": 4.06080973506098e-05, "Pretrain/Loss": 2.0316243171691895, "Pretrain/Loss (Raw)": 2.0862560272216797, "Pretrain/Step": 2926, "Pretrain/Step Time": 9.018004070967436} +{"Pretrain/Learning Rate": 4.0601464454003624e-05, "Pretrain/Loss": 2.027876377105713, "Pretrain/Loss (Raw)": 1.6738287210464478, "Pretrain/Step": 2927, "Pretrain/Step Time": 9.013361586257815} +{"Pretrain/Learning Rate": 4.059482975816305e-05, "Pretrain/Loss": 2.028806209564209, "Pretrain/Loss (Raw)": 2.078094005584717, "Pretrain/Step": 2928, "Pretrain/Step Time": 9.0210203807801} +{"Pretrain/Learning Rate": 4.058819326385322e-05, "Pretrain/Loss": 2.027341365814209, "Pretrain/Loss (Raw)": 2.0300819873809814, "Pretrain/Step": 2929, "Pretrain/Step Time": 9.023377479985356} +{"Pretrain/Learning Rate": 4.05815549718395e-05, "Pretrain/Loss": 2.0280418395996094, "Pretrain/Loss (Raw)": 2.0877182483673096, "Pretrain/Step": 2930, "Pretrain/Step Time": 9.0222237855196} +{"Pretrain/Learning Rate": 4.057491488288743e-05, "Pretrain/Loss": 2.025275707244873, "Pretrain/Loss (Raw)": 2.0071380138397217, "Pretrain/Step": 2931, "Pretrain/Step Time": 9.0199437122792} +{"Pretrain/Learning Rate": 4.0568272997762785e-05, "Pretrain/Loss": 2.022651195526123, "Pretrain/Loss (Raw)": 1.8912937641143799, "Pretrain/Step": 2932, "Pretrain/Step Time": 9.020418889820576} +{"Pretrain/Learning Rate": 4.056162931723154e-05, "Pretrain/Loss": 2.0229434967041016, "Pretrain/Loss (Raw)": 2.0884976387023926, "Pretrain/Step": 2933, "Pretrain/Step Time": 9.034242337569594} +{"Pretrain/Learning Rate": 4.055498384205987e-05, "Pretrain/Loss": 2.0254063606262207, "Pretrain/Loss (Raw)": 2.1582443714141846, "Pretrain/Step": 2934, "Pretrain/Step Time": 9.034159876406193} +{"Pretrain/Learning Rate": 4.054833657301417e-05, "Pretrain/Loss": 2.026505470275879, "Pretrain/Loss (Raw)": 2.071866989135742, "Pretrain/Step": 2935, "Pretrain/Step Time": 9.034710939973593} +{"Pretrain/Learning Rate": 4.054168751086102e-05, "Pretrain/Loss": 2.0214953422546387, "Pretrain/Loss (Raw)": 1.6357027292251587, "Pretrain/Step": 2936, "Pretrain/Step Time": 9.032752158120275} +{"Pretrain/Learning Rate": 4.053503665636724e-05, "Pretrain/Loss": 2.0217151641845703, "Pretrain/Loss (Raw)": 2.069532632827759, "Pretrain/Step": 2937, "Pretrain/Step Time": 9.030134478583932} +{"Pretrain/Learning Rate": 4.052838401029984e-05, "Pretrain/Loss": 2.02158260345459, "Pretrain/Loss (Raw)": 2.0491268634796143, "Pretrain/Step": 2938, "Pretrain/Step Time": 9.02142259851098} +{"Pretrain/Learning Rate": 4.0521729573426006e-05, "Pretrain/Loss": 2.0221686363220215, "Pretrain/Loss (Raw)": 2.150205373764038, "Pretrain/Step": 2939, "Pretrain/Step Time": 9.021472707390785} +{"Pretrain/Learning Rate": 4.051507334651318e-05, "Pretrain/Loss": 2.02329683303833, "Pretrain/Loss (Raw)": 2.087158441543579, "Pretrain/Step": 2940, "Pretrain/Step Time": 9.020620552822948} +{"Pretrain/Learning Rate": 4.050841533032899e-05, "Pretrain/Loss": 2.024169921875, "Pretrain/Loss (Raw)": 2.0507781505584717, "Pretrain/Step": 2941, "Pretrain/Step Time": 9.0210299231112} +{"Pretrain/Learning Rate": 4.050175552564127e-05, "Pretrain/Loss": 2.022991180419922, "Pretrain/Loss (Raw)": 2.069678544998169, "Pretrain/Step": 2942, "Pretrain/Step Time": 9.020043106749654} +{"Pretrain/Learning Rate": 4.049509393321805e-05, "Pretrain/Loss": 2.0223331451416016, "Pretrain/Loss (Raw)": 1.902526617050171, "Pretrain/Step": 2943, "Pretrain/Step Time": 9.025868710130453} +{"Pretrain/Learning Rate": 4.0488430553827585e-05, "Pretrain/Loss": 2.022822618484497, "Pretrain/Loss (Raw)": 1.979493260383606, "Pretrain/Step": 2944, "Pretrain/Step Time": 9.024195598438382} +{"Pretrain/Learning Rate": 4.0481765388238324e-05, "Pretrain/Loss": 2.0249836444854736, "Pretrain/Loss (Raw)": 2.2333269119262695, "Pretrain/Step": 2945, "Pretrain/Step Time": 9.01790495403111} +{"Pretrain/Learning Rate": 4.047509843721893e-05, "Pretrain/Loss": 2.029169797897339, "Pretrain/Loss (Raw)": 2.330655813217163, "Pretrain/Step": 2946, "Pretrain/Step Time": 9.019269060343504} +{"Pretrain/Learning Rate": 4.0468429701538253e-05, "Pretrain/Loss": 2.028916835784912, "Pretrain/Loss (Raw)": 2.0977602005004883, "Pretrain/Step": 2947, "Pretrain/Step Time": 9.021287649869919} +{"Pretrain/Learning Rate": 4.046175918196538e-05, "Pretrain/Loss": 2.03056001663208, "Pretrain/Loss (Raw)": 2.271693706512451, "Pretrain/Step": 2948, "Pretrain/Step Time": 9.01542104035616} +{"Pretrain/Learning Rate": 4.045508687926958e-05, "Pretrain/Loss": 2.031334161758423, "Pretrain/Loss (Raw)": 2.188354730606079, "Pretrain/Step": 2949, "Pretrain/Step Time": 9.016025757417083} +{"Pretrain/Learning Rate": 4.044841279422034e-05, "Pretrain/Loss": 2.030156373977661, "Pretrain/Loss (Raw)": 2.1032023429870605, "Pretrain/Step": 2950, "Pretrain/Step Time": 8.999381691217422} +{"Pretrain/Learning Rate": 4.044173692758733e-05, "Pretrain/Loss": 2.031263589859009, "Pretrain/Loss (Raw)": 2.0374464988708496, "Pretrain/Step": 2951, "Pretrain/Step Time": 9.006999338045716} +{"Pretrain/Learning Rate": 4.043505928014045e-05, "Pretrain/Loss": 2.0307183265686035, "Pretrain/Loss (Raw)": 2.0431265830993652, "Pretrain/Step": 2952, "Pretrain/Step Time": 9.002462856471539} +{"Pretrain/Learning Rate": 4.0428379852649816e-05, "Pretrain/Loss": 2.0313761234283447, "Pretrain/Loss (Raw)": 1.8734406232833862, "Pretrain/Step": 2953, "Pretrain/Step Time": 9.001615488901734} +{"Pretrain/Learning Rate": 4.042169864588571e-05, "Pretrain/Loss": 2.0305728912353516, "Pretrain/Loss (Raw)": 1.9324634075164795, "Pretrain/Step": 2954, "Pretrain/Step Time": 9.004091301932931} +{"Pretrain/Learning Rate": 4.041501566061865e-05, "Pretrain/Loss": 2.031233310699463, "Pretrain/Loss (Raw)": 1.9737941026687622, "Pretrain/Step": 2955, "Pretrain/Step Time": 9.005059722810984} +{"Pretrain/Learning Rate": 4.040833089761934e-05, "Pretrain/Loss": 2.0313167572021484, "Pretrain/Loss (Raw)": 2.0398826599121094, "Pretrain/Step": 2956, "Pretrain/Step Time": 9.002222206443548} +{"Pretrain/Learning Rate": 4.040164435765871e-05, "Pretrain/Loss": 2.0315778255462646, "Pretrain/Loss (Raw)": 2.0170247554779053, "Pretrain/Step": 2957, "Pretrain/Step Time": 9.00004299916327} +{"Pretrain/Learning Rate": 4.039495604150787e-05, "Pretrain/Loss": 2.03043794631958, "Pretrain/Loss (Raw)": 1.9182626008987427, "Pretrain/Step": 2958, "Pretrain/Step Time": 8.994671983644366} +{"Pretrain/Learning Rate": 4.0388265949938165e-05, "Pretrain/Loss": 2.030353546142578, "Pretrain/Loss (Raw)": 1.935717225074768, "Pretrain/Step": 2959, "Pretrain/Step Time": 8.995821837335825} +{"Pretrain/Learning Rate": 4.038157408372111e-05, "Pretrain/Loss": 2.03115177154541, "Pretrain/Loss (Raw)": 2.2122349739074707, "Pretrain/Step": 2960, "Pretrain/Step Time": 9.001049719750881} +{"Pretrain/Learning Rate": 4.037488044362846e-05, "Pretrain/Loss": 2.030308723449707, "Pretrain/Loss (Raw)": 1.9266244173049927, "Pretrain/Step": 2961, "Pretrain/Step Time": 9.002752864733338} +{"Pretrain/Learning Rate": 4.036818503043214e-05, "Pretrain/Loss": 2.0302343368530273, "Pretrain/Loss (Raw)": 2.023031234741211, "Pretrain/Step": 2962, "Pretrain/Step Time": 9.003534501418471} +{"Pretrain/Learning Rate": 4.0361487844904314e-05, "Pretrain/Loss": 2.030550956726074, "Pretrain/Loss (Raw)": 2.1495308876037598, "Pretrain/Step": 2963, "Pretrain/Step Time": 9.006696939468384} +{"Pretrain/Learning Rate": 4.035478888781732e-05, "Pretrain/Loss": 2.0335845947265625, "Pretrain/Loss (Raw)": 2.2556920051574707, "Pretrain/Step": 2964, "Pretrain/Step Time": 9.012030957266688} +{"Pretrain/Learning Rate": 4.034808815994372e-05, "Pretrain/Loss": 2.0320091247558594, "Pretrain/Loss (Raw)": 2.1019983291625977, "Pretrain/Step": 2965, "Pretrain/Step Time": 9.010489091277122} +{"Pretrain/Learning Rate": 4.0341385662056265e-05, "Pretrain/Loss": 2.0314178466796875, "Pretrain/Loss (Raw)": 2.007120370864868, "Pretrain/Step": 2966, "Pretrain/Step Time": 9.008600613102317} +{"Pretrain/Learning Rate": 4.033468139492793e-05, "Pretrain/Loss": 2.0333080291748047, "Pretrain/Loss (Raw)": 2.027355194091797, "Pretrain/Step": 2967, "Pretrain/Step Time": 9.007591040804982} +{"Pretrain/Learning Rate": 4.032797535933187e-05, "Pretrain/Loss": 2.0350472927093506, "Pretrain/Loss (Raw)": 2.295177936553955, "Pretrain/Step": 2968, "Pretrain/Step Time": 9.010618347674608} +{"Pretrain/Learning Rate": 4.032126755604147e-05, "Pretrain/Loss": 2.0336804389953613, "Pretrain/Loss (Raw)": 1.9174528121948242, "Pretrain/Step": 2969, "Pretrain/Step Time": 9.012151286005974} +{"Pretrain/Learning Rate": 4.03145579858303e-05, "Pretrain/Loss": 2.0328097343444824, "Pretrain/Loss (Raw)": 2.050645589828491, "Pretrain/Step": 2970, "Pretrain/Step Time": 9.017170265316963} +{"Pretrain/Learning Rate": 4.0307846649472134e-05, "Pretrain/Loss": 2.030754566192627, "Pretrain/Loss (Raw)": 1.765272855758667, "Pretrain/Step": 2971, "Pretrain/Step Time": 9.02126793935895} +{"Pretrain/Learning Rate": 4.030113354774096e-05, "Pretrain/Loss": 2.0318665504455566, "Pretrain/Loss (Raw)": 2.2173149585723877, "Pretrain/Step": 2972, "Pretrain/Step Time": 9.030420234426856} +{"Pretrain/Learning Rate": 4.029441868141096e-05, "Pretrain/Loss": 2.0305817127227783, "Pretrain/Loss (Raw)": 2.0249836444854736, "Pretrain/Step": 2973, "Pretrain/Step Time": 9.019958570599556} +{"Pretrain/Learning Rate": 4.0287702051256535e-05, "Pretrain/Loss": 2.0332260131835938, "Pretrain/Loss (Raw)": 2.118485450744629, "Pretrain/Step": 2974, "Pretrain/Step Time": 9.032838704064488} +{"Pretrain/Learning Rate": 4.0280983658052276e-05, "Pretrain/Loss": 2.0331454277038574, "Pretrain/Loss (Raw)": 2.1143102645874023, "Pretrain/Step": 2975, "Pretrain/Step Time": 9.034747956320643} +{"Pretrain/Learning Rate": 4.0274263502572966e-05, "Pretrain/Loss": 2.0306079387664795, "Pretrain/Loss (Raw)": 1.961925745010376, "Pretrain/Step": 2976, "Pretrain/Step Time": 9.025731857866049} +{"Pretrain/Learning Rate": 4.026754158559362e-05, "Pretrain/Loss": 2.0309500694274902, "Pretrain/Loss (Raw)": 2.1720705032348633, "Pretrain/Step": 2977, "Pretrain/Step Time": 9.028046898543835} +{"Pretrain/Learning Rate": 4.026081790788943e-05, "Pretrain/Loss": 2.031932830810547, "Pretrain/Loss (Raw)": 2.1318297386169434, "Pretrain/Step": 2978, "Pretrain/Step Time": 9.026867186650634} +{"Pretrain/Learning Rate": 4.025409247023581e-05, "Pretrain/Loss": 2.0320544242858887, "Pretrain/Loss (Raw)": 2.11734676361084, "Pretrain/Step": 2979, "Pretrain/Step Time": 9.024420976638794} +{"Pretrain/Learning Rate": 4.0247365273408366e-05, "Pretrain/Loss": 2.035867214202881, "Pretrain/Loss (Raw)": 2.1507513523101807, "Pretrain/Step": 2980, "Pretrain/Step Time": 9.028798583894968} +{"Pretrain/Learning Rate": 4.024063631818291e-05, "Pretrain/Loss": 2.0357072353363037, "Pretrain/Loss (Raw)": 1.9837943315505981, "Pretrain/Step": 2981, "Pretrain/Step Time": 9.027695601806045} +{"Pretrain/Learning Rate": 4.023390560533546e-05, "Pretrain/Loss": 2.036283493041992, "Pretrain/Loss (Raw)": 2.0484213829040527, "Pretrain/Step": 2982, "Pretrain/Step Time": 9.03268957696855} +{"Pretrain/Learning Rate": 4.022717313564223e-05, "Pretrain/Loss": 2.0365793704986572, "Pretrain/Loss (Raw)": 2.000828981399536, "Pretrain/Step": 2983, "Pretrain/Step Time": 9.035423127934337} +{"Pretrain/Learning Rate": 4.0220438909879644e-05, "Pretrain/Loss": 2.039632797241211, "Pretrain/Loss (Raw)": 2.3083744049072266, "Pretrain/Step": 2984, "Pretrain/Step Time": 9.020305903628469} +{"Pretrain/Learning Rate": 4.0213702928824315e-05, "Pretrain/Loss": 2.0393106937408447, "Pretrain/Loss (Raw)": 1.9802404642105103, "Pretrain/Step": 2985, "Pretrain/Step Time": 9.022305682301521} +{"Pretrain/Learning Rate": 4.0206965193253075e-05, "Pretrain/Loss": 2.041304588317871, "Pretrain/Loss (Raw)": 2.0843558311462402, "Pretrain/Step": 2986, "Pretrain/Step Time": 9.017643785104156} +{"Pretrain/Learning Rate": 4.0200225703942964e-05, "Pretrain/Loss": 2.0399434566497803, "Pretrain/Loss (Raw)": 1.9303010702133179, "Pretrain/Step": 2987, "Pretrain/Step Time": 9.02514816634357} +{"Pretrain/Learning Rate": 4.0193484461671185e-05, "Pretrain/Loss": 2.039700508117676, "Pretrain/Loss (Raw)": 2.1230669021606445, "Pretrain/Step": 2988, "Pretrain/Step Time": 9.016876097768545} +{"Pretrain/Learning Rate": 4.0186741467215186e-05, "Pretrain/Loss": 2.0383594036102295, "Pretrain/Loss (Raw)": 2.0101096630096436, "Pretrain/Step": 2989, "Pretrain/Step Time": 9.01288248039782} +{"Pretrain/Learning Rate": 4.017999672135261e-05, "Pretrain/Loss": 2.036879301071167, "Pretrain/Loss (Raw)": 2.0215165615081787, "Pretrain/Step": 2990, "Pretrain/Step Time": 9.004547221586108} +{"Pretrain/Learning Rate": 4.017325022486127e-05, "Pretrain/Loss": 2.0358059406280518, "Pretrain/Loss (Raw)": 2.1674013137817383, "Pretrain/Step": 2991, "Pretrain/Step Time": 9.00327656045556} +{"Pretrain/Learning Rate": 4.0166501978519225e-05, "Pretrain/Loss": 2.0339620113372803, "Pretrain/Loss (Raw)": 1.877989649772644, "Pretrain/Step": 2992, "Pretrain/Step Time": 9.003454152494669} +{"Pretrain/Learning Rate": 4.015975198310469e-05, "Pretrain/Loss": 2.034773349761963, "Pretrain/Loss (Raw)": 2.2333621978759766, "Pretrain/Step": 2993, "Pretrain/Step Time": 9.007228821516037} +{"Pretrain/Learning Rate": 4.0153000239396136e-05, "Pretrain/Loss": 2.037177085876465, "Pretrain/Loss (Raw)": 2.2350399494171143, "Pretrain/Step": 2994, "Pretrain/Step Time": 9.003190523013473} +{"Pretrain/Learning Rate": 4.014624674817218e-05, "Pretrain/Loss": 2.0379457473754883, "Pretrain/Loss (Raw)": 2.0528817176818848, "Pretrain/Step": 2995, "Pretrain/Step Time": 9.006662322208285} +{"Pretrain/Learning Rate": 4.0139491510211684e-05, "Pretrain/Loss": 2.037412643432617, "Pretrain/Loss (Raw)": 2.299006700515747, "Pretrain/Step": 2996, "Pretrain/Step Time": 9.005703331902623} +{"Pretrain/Learning Rate": 4.0132734526293685e-05, "Pretrain/Loss": 2.0369582176208496, "Pretrain/Loss (Raw)": 2.0200674533843994, "Pretrain/Step": 2997, "Pretrain/Step Time": 9.004661809653044} +{"Pretrain/Learning Rate": 4.012597579719743e-05, "Pretrain/Loss": 2.0357232093811035, "Pretrain/Loss (Raw)": 1.9083526134490967, "Pretrain/Step": 2998, "Pretrain/Step Time": 9.00102262571454} +{"Pretrain/Learning Rate": 4.011921532370238e-05, "Pretrain/Loss": 2.0350329875946045, "Pretrain/Loss (Raw)": 2.0293118953704834, "Pretrain/Step": 2999, "Pretrain/Step Time": 8.998576492071152} +{"Pretrain/Learning Rate": 4.0112453106588164e-05, "Pretrain/Loss": 2.0296661853790283, "Pretrain/Loss (Raw)": 1.7979167699813843, "Pretrain/Step": 3000, "Pretrain/Step Time": 8.999680390581489} +{"Pretrain/Learning Rate": 4.010568914663465e-05, "Pretrain/Loss": 2.0271925926208496, "Pretrain/Loss (Raw)": 1.766445517539978, "Pretrain/Step": 3001, "Pretrain/Step Time": 8.9981520883739} +{"Pretrain/Learning Rate": 4.0098923444621885e-05, "Pretrain/Loss": 2.0286169052124023, "Pretrain/Loss (Raw)": 2.0907387733459473, "Pretrain/Step": 3002, "Pretrain/Step Time": 9.000120228156447} +{"Pretrain/Learning Rate": 4.0092156001330115e-05, "Pretrain/Loss": 2.030278205871582, "Pretrain/Loss (Raw)": 2.174346923828125, "Pretrain/Step": 3003, "Pretrain/Step Time": 9.004497427493334} +{"Pretrain/Learning Rate": 4.00853868175398e-05, "Pretrain/Loss": 2.0312981605529785, "Pretrain/Loss (Raw)": 1.6915063858032227, "Pretrain/Step": 3004, "Pretrain/Step Time": 9.00117065757513} +{"Pretrain/Learning Rate": 4.007861589403159e-05, "Pretrain/Loss": 2.032783269882202, "Pretrain/Loss (Raw)": 2.1905272006988525, "Pretrain/Step": 3005, "Pretrain/Step Time": 9.003928534686565} +{"Pretrain/Learning Rate": 4.0071843231586345e-05, "Pretrain/Loss": 2.0323538780212402, "Pretrain/Loss (Raw)": 1.9633303880691528, "Pretrain/Step": 3006, "Pretrain/Step Time": 9.002047721296549} +{"Pretrain/Learning Rate": 4.006506883098512e-05, "Pretrain/Loss": 2.033190965652466, "Pretrain/Loss (Raw)": 1.9742995500564575, "Pretrain/Step": 3007, "Pretrain/Step Time": 8.988770933821797} +{"Pretrain/Learning Rate": 4.005829269300917e-05, "Pretrain/Loss": 2.030217170715332, "Pretrain/Loss (Raw)": 1.8018198013305664, "Pretrain/Step": 3008, "Pretrain/Step Time": 8.991345254704356} +{"Pretrain/Learning Rate": 4.005151481843994e-05, "Pretrain/Loss": 2.033815860748291, "Pretrain/Loss (Raw)": 2.4671976566314697, "Pretrain/Step": 3009, "Pretrain/Step Time": 8.985652135685086} +{"Pretrain/Learning Rate": 4.0044735208059104e-05, "Pretrain/Loss": 2.0337324142456055, "Pretrain/Loss (Raw)": 1.9932496547698975, "Pretrain/Step": 3010, "Pretrain/Step Time": 8.972384672611952} +{"Pretrain/Learning Rate": 4.0037953862648504e-05, "Pretrain/Loss": 2.0352580547332764, "Pretrain/Loss (Raw)": 2.0031979084014893, "Pretrain/Step": 3011, "Pretrain/Step Time": 8.93544813990593} +{"Pretrain/Learning Rate": 4.003117078299021e-05, "Pretrain/Loss": 2.035159111022949, "Pretrain/Loss (Raw)": 2.050673007965088, "Pretrain/Step": 3012, "Pretrain/Step Time": 8.936443326994777} +{"Pretrain/Learning Rate": 4.002438596986647e-05, "Pretrain/Loss": 2.037855386734009, "Pretrain/Loss (Raw)": 2.2657053470611572, "Pretrain/Step": 3013, "Pretrain/Step Time": 8.92817822098732} +{"Pretrain/Learning Rate": 4.001759942405974e-05, "Pretrain/Loss": 2.037277936935425, "Pretrain/Loss (Raw)": 1.9766650199890137, "Pretrain/Step": 3014, "Pretrain/Step Time": 8.932949237525463} +{"Pretrain/Learning Rate": 4.001081114635268e-05, "Pretrain/Loss": 2.0378596782684326, "Pretrain/Loss (Raw)": 2.2466814517974854, "Pretrain/Step": 3015, "Pretrain/Step Time": 8.926788872107863} +{"Pretrain/Learning Rate": 4.000402113752815e-05, "Pretrain/Loss": 2.0355000495910645, "Pretrain/Loss (Raw)": 1.7996712923049927, "Pretrain/Step": 3016, "Pretrain/Step Time": 8.931718794628978} +{"Pretrain/Learning Rate": 3.9997229398369194e-05, "Pretrain/Loss": 2.036670207977295, "Pretrain/Loss (Raw)": 2.12902569770813, "Pretrain/Step": 3017, "Pretrain/Step Time": 8.94101420789957} +{"Pretrain/Learning Rate": 3.999043592965908e-05, "Pretrain/Loss": 2.0373635292053223, "Pretrain/Loss (Raw)": 2.2072136402130127, "Pretrain/Step": 3018, "Pretrain/Step Time": 8.888118978589773} +{"Pretrain/Learning Rate": 3.998364073218126e-05, "Pretrain/Loss": 2.0369226932525635, "Pretrain/Loss (Raw)": 2.0576155185699463, "Pretrain/Step": 3019, "Pretrain/Step Time": 8.889542382210493} +{"Pretrain/Learning Rate": 3.997684380671938e-05, "Pretrain/Loss": 2.037997245788574, "Pretrain/Loss (Raw)": 2.128943681716919, "Pretrain/Step": 3020, "Pretrain/Step Time": 8.88954684138298} +{"Pretrain/Learning Rate": 3.9970045154057304e-05, "Pretrain/Loss": 2.0384483337402344, "Pretrain/Loss (Raw)": 1.90354323387146, "Pretrain/Step": 3021, "Pretrain/Step Time": 8.90076477266848} +{"Pretrain/Learning Rate": 3.996324477497907e-05, "Pretrain/Loss": 2.041175365447998, "Pretrain/Loss (Raw)": 2.2489259243011475, "Pretrain/Step": 3022, "Pretrain/Step Time": 8.902379242703319} +{"Pretrain/Learning Rate": 3.9956442670268946e-05, "Pretrain/Loss": 2.0382933616638184, "Pretrain/Loss (Raw)": 1.6199326515197754, "Pretrain/Step": 3023, "Pretrain/Step Time": 8.906019058078527} +{"Pretrain/Learning Rate": 3.9949638840711376e-05, "Pretrain/Loss": 2.0414180755615234, "Pretrain/Loss (Raw)": 2.2915775775909424, "Pretrain/Step": 3024, "Pretrain/Step Time": 8.912706281989813} +{"Pretrain/Learning Rate": 3.9942833287091006e-05, "Pretrain/Loss": 2.040330410003662, "Pretrain/Loss (Raw)": 1.9111030101776123, "Pretrain/Step": 3025, "Pretrain/Step Time": 8.912901598960161} +{"Pretrain/Learning Rate": 3.9936026010192696e-05, "Pretrain/Loss": 2.0392985343933105, "Pretrain/Loss (Raw)": 1.999380111694336, "Pretrain/Step": 3026, "Pretrain/Step Time": 8.909288991242647} +{"Pretrain/Learning Rate": 3.9929217010801476e-05, "Pretrain/Loss": 2.0382678508758545, "Pretrain/Loss (Raw)": 2.080878496170044, "Pretrain/Step": 3027, "Pretrain/Step Time": 8.906087100505829} +{"Pretrain/Learning Rate": 3.992240628970261e-05, "Pretrain/Loss": 2.0391345024108887, "Pretrain/Loss (Raw)": 2.0560524463653564, "Pretrain/Step": 3028, "Pretrain/Step Time": 8.901524469256401} +{"Pretrain/Learning Rate": 3.991559384768153e-05, "Pretrain/Loss": 2.0394279956817627, "Pretrain/Loss (Raw)": 2.012216567993164, "Pretrain/Step": 3029, "Pretrain/Step Time": 8.90377076342702} +{"Pretrain/Learning Rate": 3.9908779685523885e-05, "Pretrain/Loss": 2.038640022277832, "Pretrain/Loss (Raw)": 1.8191499710083008, "Pretrain/Step": 3030, "Pretrain/Step Time": 8.890424441546202} +{"Pretrain/Learning Rate": 3.9901963804015516e-05, "Pretrain/Loss": 2.042670726776123, "Pretrain/Loss (Raw)": 2.191387891769409, "Pretrain/Step": 3031, "Pretrain/Step Time": 8.883603984490037} +{"Pretrain/Learning Rate": 3.9895146203942457e-05, "Pretrain/Loss": 2.042198896408081, "Pretrain/Loss (Raw)": 2.0549709796905518, "Pretrain/Step": 3032, "Pretrain/Step Time": 8.887163400650024} +{"Pretrain/Learning Rate": 3.988832688609095e-05, "Pretrain/Loss": 2.0421528816223145, "Pretrain/Loss (Raw)": 2.0179336071014404, "Pretrain/Step": 3033, "Pretrain/Step Time": 8.890262262895703} +{"Pretrain/Learning Rate": 3.988150585124743e-05, "Pretrain/Loss": 2.0432276725769043, "Pretrain/Loss (Raw)": 2.23439884185791, "Pretrain/Step": 3034, "Pretrain/Step Time": 8.88739320449531} +{"Pretrain/Learning Rate": 3.987468310019853e-05, "Pretrain/Loss": 2.0427374839782715, "Pretrain/Loss (Raw)": 2.071713447570801, "Pretrain/Step": 3035, "Pretrain/Step Time": 8.888980589807034} +{"Pretrain/Learning Rate": 3.986785863373109e-05, "Pretrain/Loss": 2.046266555786133, "Pretrain/Loss (Raw)": 2.1094653606414795, "Pretrain/Step": 3036, "Pretrain/Step Time": 8.888815408572555} +{"Pretrain/Learning Rate": 3.9861032452632124e-05, "Pretrain/Loss": 2.046311855316162, "Pretrain/Loss (Raw)": 1.971945881843567, "Pretrain/Step": 3037, "Pretrain/Step Time": 8.894384974613786} +{"Pretrain/Learning Rate": 3.985420455768887e-05, "Pretrain/Loss": 2.0453643798828125, "Pretrain/Loss (Raw)": 2.110790491104126, "Pretrain/Step": 3038, "Pretrain/Step Time": 8.887806927785277} +{"Pretrain/Learning Rate": 3.9847374949688756e-05, "Pretrain/Loss": 2.044121503829956, "Pretrain/Loss (Raw)": 1.9833608865737915, "Pretrain/Step": 3039, "Pretrain/Step Time": 8.899508474394679} +{"Pretrain/Learning Rate": 3.98405436294194e-05, "Pretrain/Loss": 2.0426321029663086, "Pretrain/Loss (Raw)": 1.9461160898208618, "Pretrain/Step": 3040, "Pretrain/Step Time": 8.908083613961935} +{"Pretrain/Learning Rate": 3.9833710597668614e-05, "Pretrain/Loss": 2.042379379272461, "Pretrain/Loss (Raw)": 2.0269343852996826, "Pretrain/Step": 3041, "Pretrain/Step Time": 8.906492808833718} +{"Pretrain/Learning Rate": 3.9826875855224435e-05, "Pretrain/Loss": 2.0436577796936035, "Pretrain/Loss (Raw)": 2.124356269836426, "Pretrain/Step": 3042, "Pretrain/Step Time": 8.901744669303298} +{"Pretrain/Learning Rate": 3.9820039402875055e-05, "Pretrain/Loss": 2.04526424407959, "Pretrain/Loss (Raw)": 2.1972241401672363, "Pretrain/Step": 3043, "Pretrain/Step Time": 8.910270545631647} +{"Pretrain/Learning Rate": 3.98132012414089e-05, "Pretrain/Loss": 2.0440049171447754, "Pretrain/Loss (Raw)": 2.1185078620910645, "Pretrain/Step": 3044, "Pretrain/Step Time": 8.909184604883194} +{"Pretrain/Learning Rate": 3.9806361371614576e-05, "Pretrain/Loss": 2.0474367141723633, "Pretrain/Loss (Raw)": 2.140336751937866, "Pretrain/Step": 3045, "Pretrain/Step Time": 8.899125147610903} +{"Pretrain/Learning Rate": 3.979951979428089e-05, "Pretrain/Loss": 2.0480313301086426, "Pretrain/Loss (Raw)": 1.9704194068908691, "Pretrain/Step": 3046, "Pretrain/Step Time": 8.896811680868268} +{"Pretrain/Learning Rate": 3.9792676510196835e-05, "Pretrain/Loss": 2.049680709838867, "Pretrain/Loss (Raw)": 2.1200098991394043, "Pretrain/Step": 3047, "Pretrain/Step Time": 8.88542591407895} +{"Pretrain/Learning Rate": 3.978583152015163e-05, "Pretrain/Loss": 2.049445152282715, "Pretrain/Loss (Raw)": 1.9940814971923828, "Pretrain/Step": 3048, "Pretrain/Step Time": 8.888295505195856} +{"Pretrain/Learning Rate": 3.977898482493466e-05, "Pretrain/Loss": 2.0497851371765137, "Pretrain/Loss (Raw)": 2.2004928588867188, "Pretrain/Step": 3049, "Pretrain/Step Time": 8.88866944052279} +{"Pretrain/Learning Rate": 3.977213642533552e-05, "Pretrain/Loss": 2.04984188079834, "Pretrain/Loss (Raw)": 2.024948835372925, "Pretrain/Step": 3050, "Pretrain/Step Time": 8.887515060603619} +{"Pretrain/Learning Rate": 3.976528632214399e-05, "Pretrain/Loss": 2.049344539642334, "Pretrain/Loss (Raw)": 2.1407294273376465, "Pretrain/Step": 3051, "Pretrain/Step Time": 8.886578431352973} +{"Pretrain/Learning Rate": 3.975843451615007e-05, "Pretrain/Loss": 2.0516257286071777, "Pretrain/Loss (Raw)": 1.9402271509170532, "Pretrain/Step": 3052, "Pretrain/Step Time": 8.889256523922086} +{"Pretrain/Learning Rate": 3.9751581008143946e-05, "Pretrain/Loss": 2.053007125854492, "Pretrain/Loss (Raw)": 2.156092882156372, "Pretrain/Step": 3053, "Pretrain/Step Time": 8.887029694393277} +{"Pretrain/Learning Rate": 3.9744725798915974e-05, "Pretrain/Loss": 2.053452968597412, "Pretrain/Loss (Raw)": 2.143293857574463, "Pretrain/Step": 3054, "Pretrain/Step Time": 8.889870325103402} +{"Pretrain/Learning Rate": 3.973786888925675e-05, "Pretrain/Loss": 2.0577011108398438, "Pretrain/Loss (Raw)": 2.217602014541626, "Pretrain/Step": 3055, "Pretrain/Step Time": 8.890637809410691} +{"Pretrain/Learning Rate": 3.973101027995704e-05, "Pretrain/Loss": 2.0580010414123535, "Pretrain/Loss (Raw)": 2.116488456726074, "Pretrain/Step": 3056, "Pretrain/Step Time": 8.881988700479269} +{"Pretrain/Learning Rate": 3.9724149971807814e-05, "Pretrain/Loss": 2.0582103729248047, "Pretrain/Loss (Raw)": 2.0568625926971436, "Pretrain/Step": 3057, "Pretrain/Step Time": 8.885717349126935} +{"Pretrain/Learning Rate": 3.9717287965600224e-05, "Pretrain/Loss": 2.057136297225952, "Pretrain/Loss (Raw)": 1.950250506401062, "Pretrain/Step": 3058, "Pretrain/Step Time": 8.890652921050787} +{"Pretrain/Learning Rate": 3.971042426212563e-05, "Pretrain/Loss": 2.058004856109619, "Pretrain/Loss (Raw)": 2.1182992458343506, "Pretrain/Step": 3059, "Pretrain/Step Time": 8.890960413962603} +{"Pretrain/Learning Rate": 3.970355886217561e-05, "Pretrain/Loss": 2.0580344200134277, "Pretrain/Loss (Raw)": 1.895102620124817, "Pretrain/Step": 3060, "Pretrain/Step Time": 8.889744229614735} +{"Pretrain/Learning Rate": 3.9696691766541884e-05, "Pretrain/Loss": 2.05918550491333, "Pretrain/Loss (Raw)": 2.235837459564209, "Pretrain/Step": 3061, "Pretrain/Step Time": 8.879438746720552} +{"Pretrain/Learning Rate": 3.968982297601641e-05, "Pretrain/Loss": 2.058804750442505, "Pretrain/Loss (Raw)": 2.109508991241455, "Pretrain/Step": 3062, "Pretrain/Step Time": 8.909790612757206} +{"Pretrain/Learning Rate": 3.9682952491391326e-05, "Pretrain/Loss": 2.0581371784210205, "Pretrain/Loss (Raw)": 1.9863966703414917, "Pretrain/Step": 3063, "Pretrain/Step Time": 8.911938849836588} +{"Pretrain/Learning Rate": 3.967608031345898e-05, "Pretrain/Loss": 2.062498092651367, "Pretrain/Loss (Raw)": 2.1939055919647217, "Pretrain/Step": 3064, "Pretrain/Step Time": 8.91418188624084} +{"Pretrain/Learning Rate": 3.96692064430119e-05, "Pretrain/Loss": 2.0642266273498535, "Pretrain/Loss (Raw)": 2.2907631397247314, "Pretrain/Step": 3065, "Pretrain/Step Time": 8.913634097203612} +{"Pretrain/Learning Rate": 3.96623308808428e-05, "Pretrain/Loss": 2.0649495124816895, "Pretrain/Loss (Raw)": 2.1416807174682617, "Pretrain/Step": 3066, "Pretrain/Step Time": 8.912542751058936} +{"Pretrain/Learning Rate": 3.965545362774461e-05, "Pretrain/Loss": 2.0643410682678223, "Pretrain/Loss (Raw)": 2.0723419189453125, "Pretrain/Step": 3067, "Pretrain/Step Time": 8.91568898782134} +{"Pretrain/Learning Rate": 3.964857468451045e-05, "Pretrain/Loss": 2.0602784156799316, "Pretrain/Loss (Raw)": 1.567084789276123, "Pretrain/Step": 3068, "Pretrain/Step Time": 8.919388823211193} +{"Pretrain/Learning Rate": 3.9641694051933644e-05, "Pretrain/Loss": 2.0617966651916504, "Pretrain/Loss (Raw)": 2.2451603412628174, "Pretrain/Step": 3069, "Pretrain/Step Time": 8.921286823228002} +{"Pretrain/Learning Rate": 3.963481173080767e-05, "Pretrain/Loss": 2.061734676361084, "Pretrain/Loss (Raw)": 2.061727523803711, "Pretrain/Step": 3070, "Pretrain/Step Time": 8.923855336382985} +{"Pretrain/Learning Rate": 3.962792772192626e-05, "Pretrain/Loss": 2.062378406524658, "Pretrain/Loss (Raw)": 1.984929084777832, "Pretrain/Step": 3071, "Pretrain/Step Time": 8.92458288744092} +{"Pretrain/Learning Rate": 3.962104202608329e-05, "Pretrain/Loss": 2.063424587249756, "Pretrain/Loss (Raw)": 2.1134183406829834, "Pretrain/Step": 3072, "Pretrain/Step Time": 8.925996383652091} +{"Pretrain/Learning Rate": 3.9614154644072854e-05, "Pretrain/Loss": 2.0624613761901855, "Pretrain/Loss (Raw)": 2.110018491744995, "Pretrain/Step": 3073, "Pretrain/Step Time": 8.92418023943901} +{"Pretrain/Learning Rate": 3.960726557668924e-05, "Pretrain/Loss": 2.0596323013305664, "Pretrain/Loss (Raw)": 1.9685444831848145, "Pretrain/Step": 3074, "Pretrain/Step Time": 8.970765145495534} +{"Pretrain/Learning Rate": 3.960037482472694e-05, "Pretrain/Loss": 2.059805393218994, "Pretrain/Loss (Raw)": 2.119894027709961, "Pretrain/Step": 3075, "Pretrain/Step Time": 8.96558521874249} +{"Pretrain/Learning Rate": 3.95934823889806e-05, "Pretrain/Loss": 2.056828498840332, "Pretrain/Loss (Raw)": 1.8906829357147217, "Pretrain/Step": 3076, "Pretrain/Step Time": 8.967794449999928} +{"Pretrain/Learning Rate": 3.9586588270245115e-05, "Pretrain/Loss": 2.0592246055603027, "Pretrain/Loss (Raw)": 2.4950509071350098, "Pretrain/Step": 3077, "Pretrain/Step Time": 8.96645800769329} +{"Pretrain/Learning Rate": 3.957969246931553e-05, "Pretrain/Loss": 2.0594100952148438, "Pretrain/Loss (Raw)": 2.1269307136535645, "Pretrain/Step": 3078, "Pretrain/Step Time": 8.963057167828083} +{"Pretrain/Learning Rate": 3.95727949869871e-05, "Pretrain/Loss": 2.0595474243164062, "Pretrain/Loss (Raw)": 2.0550034046173096, "Pretrain/Step": 3079, "Pretrain/Step Time": 8.958588361740112} +{"Pretrain/Learning Rate": 3.95658958240553e-05, "Pretrain/Loss": 2.0593836307525635, "Pretrain/Loss (Raw)": 2.022172689437866, "Pretrain/Step": 3080, "Pretrain/Step Time": 8.953338319435716} +{"Pretrain/Learning Rate": 3.955899498131575e-05, "Pretrain/Loss": 2.0592257976531982, "Pretrain/Loss (Raw)": 1.8532646894454956, "Pretrain/Step": 3081, "Pretrain/Step Time": 8.950753811746836} +{"Pretrain/Learning Rate": 3.9552092459564294e-05, "Pretrain/Loss": 2.061368942260742, "Pretrain/Loss (Raw)": 2.206773042678833, "Pretrain/Step": 3082, "Pretrain/Step Time": 8.953279457986355} +{"Pretrain/Learning Rate": 3.9545188259596966e-05, "Pretrain/Loss": 2.0605320930480957, "Pretrain/Loss (Raw)": 1.866661548614502, "Pretrain/Step": 3083, "Pretrain/Step Time": 8.952798556536436} +{"Pretrain/Learning Rate": 3.953828238220998e-05, "Pretrain/Loss": 2.0608363151550293, "Pretrain/Loss (Raw)": 2.0788121223449707, "Pretrain/Step": 3084, "Pretrain/Step Time": 8.96317769214511} +{"Pretrain/Learning Rate": 3.9531374828199774e-05, "Pretrain/Loss": 2.061335325241089, "Pretrain/Loss (Raw)": 2.0809333324432373, "Pretrain/Step": 3085, "Pretrain/Step Time": 8.960968429222703} +{"Pretrain/Learning Rate": 3.952446559836295e-05, "Pretrain/Loss": 2.062911033630371, "Pretrain/Loss (Raw)": 2.1199262142181396, "Pretrain/Step": 3086, "Pretrain/Step Time": 8.969306819140911} +{"Pretrain/Learning Rate": 3.95175546934963e-05, "Pretrain/Loss": 2.0647077560424805, "Pretrain/Loss (Raw)": 2.165696620941162, "Pretrain/Step": 3087, "Pretrain/Step Time": 8.972884951159358} +{"Pretrain/Learning Rate": 3.951064211439684e-05, "Pretrain/Loss": 2.0627782344818115, "Pretrain/Loss (Raw)": 1.9652801752090454, "Pretrain/Step": 3088, "Pretrain/Step Time": 8.976821644231677} +{"Pretrain/Learning Rate": 3.9503727861861756e-05, "Pretrain/Loss": 2.0656347274780273, "Pretrain/Loss (Raw)": 2.292238712310791, "Pretrain/Step": 3089, "Pretrain/Step Time": 8.971857437863946} +{"Pretrain/Learning Rate": 3.9496811936688425e-05, "Pretrain/Loss": 2.065511703491211, "Pretrain/Loss (Raw)": 2.007324457168579, "Pretrain/Step": 3090, "Pretrain/Step Time": 8.970301048830152} +{"Pretrain/Learning Rate": 3.9489894339674435e-05, "Pretrain/Loss": 2.0638375282287598, "Pretrain/Loss (Raw)": 1.9352281093597412, "Pretrain/Step": 3091, "Pretrain/Step Time": 8.969162276014686} +{"Pretrain/Learning Rate": 3.948297507161756e-05, "Pretrain/Loss": 2.062443733215332, "Pretrain/Loss (Raw)": 2.0772688388824463, "Pretrain/Step": 3092, "Pretrain/Step Time": 8.964045321568847} +{"Pretrain/Learning Rate": 3.947605413331574e-05, "Pretrain/Loss": 2.06058406829834, "Pretrain/Loss (Raw)": 1.8639765977859497, "Pretrain/Step": 3093, "Pretrain/Step Time": 8.960464026778936} +{"Pretrain/Learning Rate": 3.946913152556715e-05, "Pretrain/Loss": 2.0617778301239014, "Pretrain/Loss (Raw)": 2.1599135398864746, "Pretrain/Step": 3094, "Pretrain/Step Time": 8.963130239397287} +{"Pretrain/Learning Rate": 3.946220724917013e-05, "Pretrain/Loss": 2.060749053955078, "Pretrain/Loss (Raw)": 1.8956297636032104, "Pretrain/Step": 3095, "Pretrain/Step Time": 8.965287867933512} +{"Pretrain/Learning Rate": 3.945528130492322e-05, "Pretrain/Loss": 2.058664321899414, "Pretrain/Loss (Raw)": 2.0283634662628174, "Pretrain/Step": 3096, "Pretrain/Step Time": 8.944972679018974} +{"Pretrain/Learning Rate": 3.944835369362516e-05, "Pretrain/Loss": 2.059812068939209, "Pretrain/Loss (Raw)": 2.0643601417541504, "Pretrain/Step": 3097, "Pretrain/Step Time": 8.943849658593535} +{"Pretrain/Learning Rate": 3.9441424416074866e-05, "Pretrain/Loss": 2.060610771179199, "Pretrain/Loss (Raw)": 2.1529040336608887, "Pretrain/Step": 3098, "Pretrain/Step Time": 8.941944926977158} +{"Pretrain/Learning Rate": 3.9434493473071456e-05, "Pretrain/Loss": 2.0630202293395996, "Pretrain/Loss (Raw)": 2.073664426803589, "Pretrain/Step": 3099, "Pretrain/Step Time": 8.939250376075506} +{"Pretrain/Learning Rate": 3.9427560865414246e-05, "Pretrain/Loss": 2.0623087882995605, "Pretrain/Loss (Raw)": 2.126251697540283, "Pretrain/Step": 3100, "Pretrain/Step Time": 8.92745864763856} +{"Pretrain/Learning Rate": 3.942062659390273e-05, "Pretrain/Loss": 2.063539981842041, "Pretrain/Loss (Raw)": 2.182589292526245, "Pretrain/Step": 3101, "Pretrain/Step Time": 8.930222731083632} +{"Pretrain/Learning Rate": 3.94136906593366e-05, "Pretrain/Loss": 2.064023017883301, "Pretrain/Loss (Raw)": 2.1802825927734375, "Pretrain/Step": 3102, "Pretrain/Step Time": 8.919605506584048} +{"Pretrain/Learning Rate": 3.940675306251574e-05, "Pretrain/Loss": 2.064122200012207, "Pretrain/Loss (Raw)": 2.127027750015259, "Pretrain/Step": 3103, "Pretrain/Step Time": 8.919699307531118} +{"Pretrain/Learning Rate": 3.939981380424024e-05, "Pretrain/Loss": 2.0630292892456055, "Pretrain/Loss (Raw)": 1.8220188617706299, "Pretrain/Step": 3104, "Pretrain/Step Time": 8.915536306798458} +{"Pretrain/Learning Rate": 3.939287288531035e-05, "Pretrain/Loss": 2.0622429847717285, "Pretrain/Loss (Raw)": 2.0714175701141357, "Pretrain/Step": 3105, "Pretrain/Step Time": 8.913908127695322} +{"Pretrain/Learning Rate": 3.938593030652654e-05, "Pretrain/Loss": 2.060946226119995, "Pretrain/Loss (Raw)": 1.9658716917037964, "Pretrain/Step": 3106, "Pretrain/Step Time": 8.917410327121615} +{"Pretrain/Learning Rate": 3.937898606868946e-05, "Pretrain/Loss": 2.0606462955474854, "Pretrain/Loss (Raw)": 2.078939914703369, "Pretrain/Step": 3107, "Pretrain/Step Time": 8.920853711664677} +{"Pretrain/Learning Rate": 3.9372040172599956e-05, "Pretrain/Loss": 2.0584897994995117, "Pretrain/Loss (Raw)": 1.874725341796875, "Pretrain/Step": 3108, "Pretrain/Step Time": 8.915413534268737} +{"Pretrain/Learning Rate": 3.936509261905905e-05, "Pretrain/Loss": 2.058807849884033, "Pretrain/Loss (Raw)": 2.02451753616333, "Pretrain/Step": 3109, "Pretrain/Step Time": 8.918658962473273} +{"Pretrain/Learning Rate": 3.935814340886797e-05, "Pretrain/Loss": 2.0593466758728027, "Pretrain/Loss (Raw)": 2.117375135421753, "Pretrain/Step": 3110, "Pretrain/Step Time": 8.915586614981294} +{"Pretrain/Learning Rate": 3.935119254282814e-05, "Pretrain/Loss": 2.0600686073303223, "Pretrain/Loss (Raw)": 2.093254327774048, "Pretrain/Step": 3111, "Pretrain/Step Time": 8.909527454525232} +{"Pretrain/Learning Rate": 3.934424002174115e-05, "Pretrain/Loss": 2.059535026550293, "Pretrain/Loss (Raw)": 2.240083694458008, "Pretrain/Step": 3112, "Pretrain/Step Time": 8.911858413368464} +{"Pretrain/Learning Rate": 3.9337285846408826e-05, "Pretrain/Loss": 2.060497760772705, "Pretrain/Loss (Raw)": 2.1034650802612305, "Pretrain/Step": 3113, "Pretrain/Step Time": 8.913806151598692} +{"Pretrain/Learning Rate": 3.9330330017633126e-05, "Pretrain/Loss": 2.060145378112793, "Pretrain/Loss (Raw)": 2.0392284393310547, "Pretrain/Step": 3114, "Pretrain/Step Time": 8.920526515692472} +{"Pretrain/Learning Rate": 3.932337253621624e-05, "Pretrain/Loss": 2.060206174850464, "Pretrain/Loss (Raw)": 1.9380911588668823, "Pretrain/Step": 3115, "Pretrain/Step Time": 8.915025066584349} +{"Pretrain/Learning Rate": 3.9316413402960553e-05, "Pretrain/Loss": 2.0591073036193848, "Pretrain/Loss (Raw)": 1.9824142456054688, "Pretrain/Step": 3116, "Pretrain/Step Time": 8.91386454552412} +{"Pretrain/Learning Rate": 3.93094526186686e-05, "Pretrain/Loss": 2.058612585067749, "Pretrain/Loss (Raw)": 1.9467777013778687, "Pretrain/Step": 3117, "Pretrain/Step Time": 8.918853743001819} +{"Pretrain/Learning Rate": 3.930249018414315e-05, "Pretrain/Loss": 2.0583267211914062, "Pretrain/Loss (Raw)": 1.9849077463150024, "Pretrain/Step": 3118, "Pretrain/Step Time": 8.92108355090022} +{"Pretrain/Learning Rate": 3.9295526100187126e-05, "Pretrain/Loss": 2.0567240715026855, "Pretrain/Loss (Raw)": 1.9622918367385864, "Pretrain/Step": 3119, "Pretrain/Step Time": 8.929902946576476} +{"Pretrain/Learning Rate": 3.928856036760368e-05, "Pretrain/Loss": 2.0581812858581543, "Pretrain/Loss (Raw)": 2.064513683319092, "Pretrain/Step": 3120, "Pretrain/Step Time": 8.936656713485718} +{"Pretrain/Learning Rate": 3.9281592987196115e-05, "Pretrain/Loss": 2.0571513175964355, "Pretrain/Loss (Raw)": 2.101494789123535, "Pretrain/Step": 3121, "Pretrain/Step Time": 8.932227754965425} +{"Pretrain/Learning Rate": 3.9274623959767945e-05, "Pretrain/Loss": 2.0548477172851562, "Pretrain/Loss (Raw)": 1.9402074813842773, "Pretrain/Step": 3122, "Pretrain/Step Time": 8.933890972286463} +{"Pretrain/Learning Rate": 3.9267653286122886e-05, "Pretrain/Loss": 2.0545144081115723, "Pretrain/Loss (Raw)": 2.010206699371338, "Pretrain/Step": 3123, "Pretrain/Step Time": 8.932133058086038} +{"Pretrain/Learning Rate": 3.9260680967064814e-05, "Pretrain/Loss": 2.0518767833709717, "Pretrain/Loss (Raw)": 1.9614009857177734, "Pretrain/Step": 3124, "Pretrain/Step Time": 8.934944618493319} +{"Pretrain/Learning Rate": 3.9253707003397814e-05, "Pretrain/Loss": 2.051915407180786, "Pretrain/Loss (Raw)": 2.0249979496002197, "Pretrain/Step": 3125, "Pretrain/Step Time": 8.936819514259696} +{"Pretrain/Learning Rate": 3.924673139592616e-05, "Pretrain/Loss": 2.0531668663024902, "Pretrain/Loss (Raw)": 2.0685322284698486, "Pretrain/Step": 3126, "Pretrain/Step Time": 8.934486934915185} +{"Pretrain/Learning Rate": 3.9239754145454304e-05, "Pretrain/Loss": 2.0535764694213867, "Pretrain/Loss (Raw)": 2.0817511081695557, "Pretrain/Step": 3127, "Pretrain/Step Time": 8.938577761873603} +{"Pretrain/Learning Rate": 3.92327752527869e-05, "Pretrain/Loss": 2.055713653564453, "Pretrain/Loss (Raw)": 2.071470022201538, "Pretrain/Step": 3128, "Pretrain/Step Time": 8.940059415996075} +{"Pretrain/Learning Rate": 3.922579471872879e-05, "Pretrain/Loss": 2.057769536972046, "Pretrain/Loss (Raw)": 2.02962327003479, "Pretrain/Step": 3129, "Pretrain/Step Time": 8.939676871523261} +{"Pretrain/Learning Rate": 3.9218812544085004e-05, "Pretrain/Loss": 2.058086395263672, "Pretrain/Loss (Raw)": 2.1313014030456543, "Pretrain/Step": 3130, "Pretrain/Step Time": 8.938466837629676} +{"Pretrain/Learning Rate": 3.921182872966075e-05, "Pretrain/Loss": 2.0558693408966064, "Pretrain/Loss (Raw)": 1.8905376195907593, "Pretrain/Step": 3131, "Pretrain/Step Time": 8.93553925678134} +{"Pretrain/Learning Rate": 3.920484327626144e-05, "Pretrain/Loss": 2.0555593967437744, "Pretrain/Loss (Raw)": 1.6518359184265137, "Pretrain/Step": 3132, "Pretrain/Step Time": 8.939921973273158} +{"Pretrain/Learning Rate": 3.919785618469266e-05, "Pretrain/Loss": 2.0547759532928467, "Pretrain/Loss (Raw)": 2.0902485847473145, "Pretrain/Step": 3133, "Pretrain/Step Time": 8.940719632431865} +{"Pretrain/Learning Rate": 3.9190867455760213e-05, "Pretrain/Loss": 2.054795265197754, "Pretrain/Loss (Raw)": 1.9657739400863647, "Pretrain/Step": 3134, "Pretrain/Step Time": 8.939883494749665} +{"Pretrain/Learning Rate": 3.918387709027005e-05, "Pretrain/Loss": 2.0544705390930176, "Pretrain/Loss (Raw)": 1.9327750205993652, "Pretrain/Step": 3135, "Pretrain/Step Time": 8.941303070634604} +{"Pretrain/Learning Rate": 3.917688508902835e-05, "Pretrain/Loss": 2.0568227767944336, "Pretrain/Loss (Raw)": 2.1028835773468018, "Pretrain/Step": 3136, "Pretrain/Step Time": 8.943489534780383} +{"Pretrain/Learning Rate": 3.916989145284146e-05, "Pretrain/Loss": 2.05486798286438, "Pretrain/Loss (Raw)": 2.2169833183288574, "Pretrain/Step": 3137, "Pretrain/Step Time": 8.951162599027157} +{"Pretrain/Learning Rate": 3.9162896182515915e-05, "Pretrain/Loss": 2.055788040161133, "Pretrain/Loss (Raw)": 2.1110429763793945, "Pretrain/Step": 3138, "Pretrain/Step Time": 8.953513728454709} +{"Pretrain/Learning Rate": 3.9155899278858445e-05, "Pretrain/Loss": 2.0576746463775635, "Pretrain/Loss (Raw)": 2.244663715362549, "Pretrain/Step": 3139, "Pretrain/Step Time": 8.947551935911179} +{"Pretrain/Learning Rate": 3.914890074267597e-05, "Pretrain/Loss": 2.0566577911376953, "Pretrain/Loss (Raw)": 1.9205125570297241, "Pretrain/Step": 3140, "Pretrain/Step Time": 8.94504644535482} +{"Pretrain/Learning Rate": 3.914190057477558e-05, "Pretrain/Loss": 2.052321434020996, "Pretrain/Loss (Raw)": 1.7106372117996216, "Pretrain/Step": 3141, "Pretrain/Step Time": 8.946482930332422} +{"Pretrain/Learning Rate": 3.913489877596458e-05, "Pretrain/Loss": 2.05478572845459, "Pretrain/Loss (Raw)": 2.2920894622802734, "Pretrain/Step": 3142, "Pretrain/Step Time": 8.93955003656447} +{"Pretrain/Learning Rate": 3.912789534705045e-05, "Pretrain/Loss": 2.0538687705993652, "Pretrain/Loss (Raw)": 2.1293463706970215, "Pretrain/Step": 3143, "Pretrain/Step Time": 8.940847713500261} +{"Pretrain/Learning Rate": 3.912089028884085e-05, "Pretrain/Loss": 2.0558838844299316, "Pretrain/Loss (Raw)": 2.0575904846191406, "Pretrain/Step": 3144, "Pretrain/Step Time": 8.94114707224071} +{"Pretrain/Learning Rate": 3.9113883602143645e-05, "Pretrain/Loss": 2.054107189178467, "Pretrain/Loss (Raw)": 1.9016221761703491, "Pretrain/Step": 3145, "Pretrain/Step Time": 8.932675417512655} +{"Pretrain/Learning Rate": 3.910687528776688e-05, "Pretrain/Loss": 2.0539519786834717, "Pretrain/Loss (Raw)": 2.187335968017578, "Pretrain/Step": 3146, "Pretrain/Step Time": 8.93227693066001} +{"Pretrain/Learning Rate": 3.9099865346518786e-05, "Pretrain/Loss": 2.0533924102783203, "Pretrain/Loss (Raw)": 1.9859994649887085, "Pretrain/Step": 3147, "Pretrain/Step Time": 8.93538692779839} +{"Pretrain/Learning Rate": 3.909285377920777e-05, "Pretrain/Loss": 2.0512948036193848, "Pretrain/Loss (Raw)": 1.8604192733764648, "Pretrain/Step": 3148, "Pretrain/Step Time": 8.938554715365171} +{"Pretrain/Learning Rate": 3.908584058664245e-05, "Pretrain/Loss": 2.052382707595825, "Pretrain/Loss (Raw)": 2.04282546043396, "Pretrain/Step": 3149, "Pretrain/Step Time": 8.928158847615123} +{"Pretrain/Learning Rate": 3.907882576963162e-05, "Pretrain/Loss": 2.0507168769836426, "Pretrain/Loss (Raw)": 2.0356645584106445, "Pretrain/Step": 3150, "Pretrain/Step Time": 8.924793971702456} +{"Pretrain/Learning Rate": 3.907180932898427e-05, "Pretrain/Loss": 2.0521504878997803, "Pretrain/Loss (Raw)": 1.8034613132476807, "Pretrain/Step": 3151, "Pretrain/Step Time": 8.92041066288948} +{"Pretrain/Learning Rate": 3.9064791265509546e-05, "Pretrain/Loss": 2.0511136054992676, "Pretrain/Loss (Raw)": 2.1588473320007324, "Pretrain/Step": 3152, "Pretrain/Step Time": 8.913404336199164} +{"Pretrain/Learning Rate": 3.905777158001682e-05, "Pretrain/Loss": 2.0524535179138184, "Pretrain/Loss (Raw)": 2.0826408863067627, "Pretrain/Step": 3153, "Pretrain/Step Time": 8.915515471249819} +{"Pretrain/Learning Rate": 3.905075027331564e-05, "Pretrain/Loss": 2.0523605346679688, "Pretrain/Loss (Raw)": 1.9874731302261353, "Pretrain/Step": 3154, "Pretrain/Step Time": 8.91328527405858} +{"Pretrain/Learning Rate": 3.9043727346215726e-05, "Pretrain/Loss": 2.05139422416687, "Pretrain/Loss (Raw)": 1.9571706056594849, "Pretrain/Step": 3155, "Pretrain/Step Time": 8.910037264227867} +{"Pretrain/Learning Rate": 3.9036702799527e-05, "Pretrain/Loss": 2.0505261421203613, "Pretrain/Loss (Raw)": 1.94492769241333, "Pretrain/Step": 3156, "Pretrain/Step Time": 8.914122212678194} +{"Pretrain/Learning Rate": 3.902967663405956e-05, "Pretrain/Loss": 2.0527281761169434, "Pretrain/Loss (Raw)": 2.2940900325775146, "Pretrain/Step": 3157, "Pretrain/Step Time": 8.916909981518984} +{"Pretrain/Learning Rate": 3.90226488506237e-05, "Pretrain/Loss": 2.0534236431121826, "Pretrain/Loss (Raw)": 1.9081707000732422, "Pretrain/Step": 3158, "Pretrain/Step Time": 8.918337250128388} +{"Pretrain/Learning Rate": 3.9015619450029904e-05, "Pretrain/Loss": 2.051849126815796, "Pretrain/Loss (Raw)": 1.9898463487625122, "Pretrain/Step": 3159, "Pretrain/Step Time": 8.91686431504786} +{"Pretrain/Learning Rate": 3.9008588433088825e-05, "Pretrain/Loss": 2.052290916442871, "Pretrain/Loss (Raw)": 2.1115176677703857, "Pretrain/Step": 3160, "Pretrain/Step Time": 8.915849963203073} +{"Pretrain/Learning Rate": 3.900155580061132e-05, "Pretrain/Loss": 2.049839973449707, "Pretrain/Loss (Raw)": 1.704206943511963, "Pretrain/Step": 3161, "Pretrain/Step Time": 8.911983646452427} +{"Pretrain/Learning Rate": 3.899452155340842e-05, "Pretrain/Loss": 2.0495822429656982, "Pretrain/Loss (Raw)": 2.201413869857788, "Pretrain/Step": 3162, "Pretrain/Step Time": 8.913143713027239} +{"Pretrain/Learning Rate": 3.898748569229135e-05, "Pretrain/Loss": 2.048295259475708, "Pretrain/Loss (Raw)": 1.906986951828003, "Pretrain/Step": 3163, "Pretrain/Step Time": 8.917511250823736} +{"Pretrain/Learning Rate": 3.898044821807152e-05, "Pretrain/Loss": 2.045450210571289, "Pretrain/Loss (Raw)": 1.7452845573425293, "Pretrain/Step": 3164, "Pretrain/Step Time": 8.9227642621845} +{"Pretrain/Learning Rate": 3.897340913156052e-05, "Pretrain/Loss": 2.046246290206909, "Pretrain/Loss (Raw)": 2.0738632678985596, "Pretrain/Step": 3165, "Pretrain/Step Time": 8.91848785057664} +{"Pretrain/Learning Rate": 3.896636843357014e-05, "Pretrain/Loss": 2.044006109237671, "Pretrain/Loss (Raw)": 1.824052333831787, "Pretrain/Step": 3166, "Pretrain/Step Time": 8.919265057891607} +{"Pretrain/Learning Rate": 3.895932612491233e-05, "Pretrain/Loss": 2.0429744720458984, "Pretrain/Loss (Raw)": 1.8513201475143433, "Pretrain/Step": 3167, "Pretrain/Step Time": 8.907964788377285} +{"Pretrain/Learning Rate": 3.895228220639926e-05, "Pretrain/Loss": 2.0453081130981445, "Pretrain/Loss (Raw)": 2.244797706604004, "Pretrain/Step": 3168, "Pretrain/Step Time": 8.906393513083458} +{"Pretrain/Learning Rate": 3.8945236678843266e-05, "Pretrain/Loss": 2.0466866493225098, "Pretrain/Loss (Raw)": 2.203418731689453, "Pretrain/Step": 3169, "Pretrain/Step Time": 8.913116529583931} +{"Pretrain/Learning Rate": 3.893818954305686e-05, "Pretrain/Loss": 2.0463991165161133, "Pretrain/Loss (Raw)": 2.087512731552124, "Pretrain/Step": 3170, "Pretrain/Step Time": 8.913759080693126} +{"Pretrain/Learning Rate": 3.893114079985276e-05, "Pretrain/Loss": 2.0444393157958984, "Pretrain/Loss (Raw)": 1.9464001655578613, "Pretrain/Step": 3171, "Pretrain/Step Time": 8.90918399952352} +{"Pretrain/Learning Rate": 3.892409045004385e-05, "Pretrain/Loss": 2.0419416427612305, "Pretrain/Loss (Raw)": 1.7987810373306274, "Pretrain/Step": 3172, "Pretrain/Step Time": 8.914276540279388} +{"Pretrain/Learning Rate": 3.891703849444322e-05, "Pretrain/Loss": 2.040247917175293, "Pretrain/Loss (Raw)": 1.9235323667526245, "Pretrain/Step": 3173, "Pretrain/Step Time": 8.924117533490062} +{"Pretrain/Learning Rate": 3.890998493386414e-05, "Pretrain/Loss": 2.0385961532592773, "Pretrain/Loss (Raw)": 1.7590140104293823, "Pretrain/Step": 3174, "Pretrain/Step Time": 8.922401400282979} +{"Pretrain/Learning Rate": 3.890292976912005e-05, "Pretrain/Loss": 2.0382840633392334, "Pretrain/Loss (Raw)": 2.0800583362579346, "Pretrain/Step": 3175, "Pretrain/Step Time": 8.928408535197377} +{"Pretrain/Learning Rate": 3.889587300102457e-05, "Pretrain/Loss": 2.036614179611206, "Pretrain/Loss (Raw)": 1.7803431749343872, "Pretrain/Step": 3176, "Pretrain/Step Time": 8.927510544657707} +{"Pretrain/Learning Rate": 3.8888814630391556e-05, "Pretrain/Loss": 2.036304473876953, "Pretrain/Loss (Raw)": 2.1608712673187256, "Pretrain/Step": 3177, "Pretrain/Step Time": 8.925679799169302} +{"Pretrain/Learning Rate": 3.8881754658034986e-05, "Pretrain/Loss": 2.0369033813476562, "Pretrain/Loss (Raw)": 2.101581573486328, "Pretrain/Step": 3178, "Pretrain/Step Time": 8.928430713713169} +{"Pretrain/Learning Rate": 3.8874693084769055e-05, "Pretrain/Loss": 2.0361781120300293, "Pretrain/Loss (Raw)": 2.0478718280792236, "Pretrain/Step": 3179, "Pretrain/Step Time": 8.930287120863795} +{"Pretrain/Learning Rate": 3.8867629911408135e-05, "Pretrain/Loss": 2.0356040000915527, "Pretrain/Loss (Raw)": 1.8667879104614258, "Pretrain/Step": 3180, "Pretrain/Step Time": 8.92730538547039} +{"Pretrain/Learning Rate": 3.886056513876679e-05, "Pretrain/Loss": 2.033562660217285, "Pretrain/Loss (Raw)": 1.8947782516479492, "Pretrain/Step": 3181, "Pretrain/Step Time": 8.930967465043068} +{"Pretrain/Learning Rate": 3.885349876765976e-05, "Pretrain/Loss": 2.0341153144836426, "Pretrain/Loss (Raw)": 2.21405291557312, "Pretrain/Step": 3182, "Pretrain/Step Time": 8.929612509906292} +{"Pretrain/Learning Rate": 3.884643079890197e-05, "Pretrain/Loss": 2.0326881408691406, "Pretrain/Loss (Raw)": 2.034911632537842, "Pretrain/Step": 3183, "Pretrain/Step Time": 8.938006235286593} +{"Pretrain/Learning Rate": 3.883936123330853e-05, "Pretrain/Loss": 2.0326499938964844, "Pretrain/Loss (Raw)": 2.11161732673645, "Pretrain/Step": 3184, "Pretrain/Step Time": 8.940230507403612} +{"Pretrain/Learning Rate": 3.883229007169474e-05, "Pretrain/Loss": 2.0330231189727783, "Pretrain/Loss (Raw)": 2.1046290397644043, "Pretrain/Step": 3185, "Pretrain/Step Time": 8.931443065404892} +{"Pretrain/Learning Rate": 3.8825217314876084e-05, "Pretrain/Loss": 2.032230854034424, "Pretrain/Loss (Raw)": 1.8488000631332397, "Pretrain/Step": 3186, "Pretrain/Step Time": 8.930538523942232} +{"Pretrain/Learning Rate": 3.881814296366822e-05, "Pretrain/Loss": 2.0331320762634277, "Pretrain/Loss (Raw)": 2.233660936355591, "Pretrain/Step": 3187, "Pretrain/Step Time": 8.934254366904497} +{"Pretrain/Learning Rate": 3.881106701888699e-05, "Pretrain/Loss": 2.033611536026001, "Pretrain/Loss (Raw)": 1.9564969539642334, "Pretrain/Step": 3188, "Pretrain/Step Time": 8.93321829289198} +{"Pretrain/Learning Rate": 3.880398948134845e-05, "Pretrain/Loss": 2.0312583446502686, "Pretrain/Loss (Raw)": 1.9346370697021484, "Pretrain/Step": 3189, "Pretrain/Step Time": 8.934559283778071} +{"Pretrain/Learning Rate": 3.879691035186878e-05, "Pretrain/Loss": 2.0306472778320312, "Pretrain/Loss (Raw)": 2.0312862396240234, "Pretrain/Step": 3190, "Pretrain/Step Time": 8.893774749711156} +{"Pretrain/Learning Rate": 3.8789829631264394e-05, "Pretrain/Loss": 2.0307059288024902, "Pretrain/Loss (Raw)": 1.99386727809906, "Pretrain/Step": 3191, "Pretrain/Step Time": 8.895076168701053} +{"Pretrain/Learning Rate": 3.878274732035188e-05, "Pretrain/Loss": 2.0298891067504883, "Pretrain/Loss (Raw)": 2.089399814605713, "Pretrain/Step": 3192, "Pretrain/Step Time": 8.893183793872595} +{"Pretrain/Learning Rate": 3.8775663419948e-05, "Pretrain/Loss": 2.027820110321045, "Pretrain/Loss (Raw)": 2.025937557220459, "Pretrain/Step": 3193, "Pretrain/Step Time": 8.995704097673297} +{"Pretrain/Learning Rate": 3.87685779308697e-05, "Pretrain/Loss": 2.0245964527130127, "Pretrain/Loss (Raw)": 1.7290161848068237, "Pretrain/Step": 3194, "Pretrain/Step Time": 8.998875429853797} +{"Pretrain/Learning Rate": 3.8761490853934115e-05, "Pretrain/Loss": 2.025700569152832, "Pretrain/Loss (Raw)": 2.213667869567871, "Pretrain/Step": 3195, "Pretrain/Step Time": 8.996451534330845} +{"Pretrain/Learning Rate": 3.875440218995856e-05, "Pretrain/Loss": 2.0286617279052734, "Pretrain/Loss (Raw)": 1.9461394548416138, "Pretrain/Step": 3196, "Pretrain/Step Time": 8.991553489118814} +{"Pretrain/Learning Rate": 3.874731193976052e-05, "Pretrain/Loss": 2.027549982070923, "Pretrain/Loss (Raw)": 2.102848768234253, "Pretrain/Step": 3197, "Pretrain/Step Time": 8.994479853659868} +{"Pretrain/Learning Rate": 3.87402201041577e-05, "Pretrain/Loss": 2.02506685256958, "Pretrain/Loss (Raw)": 1.7438857555389404, "Pretrain/Step": 3198, "Pretrain/Step Time": 8.99278799816966} +{"Pretrain/Learning Rate": 3.8733126683967946e-05, "Pretrain/Loss": 2.025844097137451, "Pretrain/Loss (Raw)": 2.0844039916992188, "Pretrain/Step": 3199, "Pretrain/Step Time": 8.99255264364183} +{"Pretrain/Learning Rate": 3.872603168000931e-05, "Pretrain/Loss": 2.0261495113372803, "Pretrain/Loss (Raw)": 2.1525204181671143, "Pretrain/Step": 3200, "Pretrain/Step Time": 8.99509003199637} +{"Pretrain/Learning Rate": 3.871893509310003e-05, "Pretrain/Loss": 2.024277687072754, "Pretrain/Loss (Raw)": 1.8704373836517334, "Pretrain/Step": 3201, "Pretrain/Step Time": 8.993087287992239} +{"Pretrain/Learning Rate": 3.87118369240585e-05, "Pretrain/Loss": 2.025919198989868, "Pretrain/Loss (Raw)": 2.1786434650421143, "Pretrain/Step": 3202, "Pretrain/Step Time": 8.94549310579896} +{"Pretrain/Learning Rate": 3.870473717370333e-05, "Pretrain/Loss": 2.025430202484131, "Pretrain/Loss (Raw)": 2.057332754135132, "Pretrain/Step": 3203, "Pretrain/Step Time": 8.947720160707831} +{"Pretrain/Learning Rate": 3.869763584285328e-05, "Pretrain/Loss": 2.0238966941833496, "Pretrain/Loss (Raw)": 1.6943767070770264, "Pretrain/Step": 3204, "Pretrain/Step Time": 8.94317795149982} +{"Pretrain/Learning Rate": 3.869053293232733e-05, "Pretrain/Loss": 2.019848346710205, "Pretrain/Loss (Raw)": 1.9768869876861572, "Pretrain/Step": 3205, "Pretrain/Step Time": 8.947887098416686} +{"Pretrain/Learning Rate": 3.8683428442944604e-05, "Pretrain/Loss": 2.018298625946045, "Pretrain/Loss (Raw)": 1.928547739982605, "Pretrain/Step": 3206, "Pretrain/Step Time": 8.950161447748542} +{"Pretrain/Learning Rate": 3.8676322375524435e-05, "Pretrain/Loss": 2.0176539421081543, "Pretrain/Loss (Raw)": 1.9724624156951904, "Pretrain/Step": 3207, "Pretrain/Step Time": 8.949811032041907} +{"Pretrain/Learning Rate": 3.866921473088632e-05, "Pretrain/Loss": 2.018380641937256, "Pretrain/Loss (Raw)": 2.115220069885254, "Pretrain/Step": 3208, "Pretrain/Step Time": 9.151734640821815} +{"Pretrain/Learning Rate": 3.866210550984996e-05, "Pretrain/Loss": 2.019869327545166, "Pretrain/Loss (Raw)": 2.0438225269317627, "Pretrain/Step": 3209, "Pretrain/Step Time": 9.154782097786665} +{"Pretrain/Learning Rate": 3.86549947132352e-05, "Pretrain/Loss": 2.0159034729003906, "Pretrain/Loss (Raw)": 1.6990798711776733, "Pretrain/Step": 3210, "Pretrain/Step Time": 9.15231236629188} +{"Pretrain/Learning Rate": 3.8647882341862115e-05, "Pretrain/Loss": 2.018632411956787, "Pretrain/Loss (Raw)": 2.2160110473632812, "Pretrain/Step": 3211, "Pretrain/Step Time": 9.152858396992087} +{"Pretrain/Learning Rate": 3.864076839655093e-05, "Pretrain/Loss": 2.018624782562256, "Pretrain/Loss (Raw)": 2.077826738357544, "Pretrain/Step": 3212, "Pretrain/Step Time": 9.14475285448134} +{"Pretrain/Learning Rate": 3.863365287812205e-05, "Pretrain/Loss": 2.0186080932617188, "Pretrain/Loss (Raw)": 2.078794240951538, "Pretrain/Step": 3213, "Pretrain/Step Time": 9.149844715371728} +{"Pretrain/Learning Rate": 3.862653578739608e-05, "Pretrain/Loss": 2.0194716453552246, "Pretrain/Loss (Raw)": 2.230433225631714, "Pretrain/Step": 3214, "Pretrain/Step Time": 9.144671654328704} +{"Pretrain/Learning Rate": 3.861941712519379e-05, "Pretrain/Loss": 2.017810106277466, "Pretrain/Loss (Raw)": 1.9530444145202637, "Pretrain/Step": 3215, "Pretrain/Step Time": 9.13947469741106} +{"Pretrain/Learning Rate": 3.8612296892336144e-05, "Pretrain/Loss": 2.0174524784088135, "Pretrain/Loss (Raw)": 1.9194972515106201, "Pretrain/Step": 3216, "Pretrain/Step Time": 9.131676016375422} +{"Pretrain/Learning Rate": 3.8605175089644274e-05, "Pretrain/Loss": 2.0150742530822754, "Pretrain/Loss (Raw)": 1.9878309965133667, "Pretrain/Step": 3217, "Pretrain/Step Time": 9.128891568630934} +{"Pretrain/Learning Rate": 3.859805171793951e-05, "Pretrain/Loss": 2.0146350860595703, "Pretrain/Loss (Raw)": 1.95109224319458, "Pretrain/Step": 3218, "Pretrain/Step Time": 9.12884009629488} +{"Pretrain/Learning Rate": 3.8590926778043335e-05, "Pretrain/Loss": 2.0158443450927734, "Pretrain/Loss (Raw)": 2.090069532394409, "Pretrain/Step": 3219, "Pretrain/Step Time": 9.13158787600696} +{"Pretrain/Learning Rate": 3.858380027077745e-05, "Pretrain/Loss": 2.0159590244293213, "Pretrain/Loss (Raw)": 2.0919084548950195, "Pretrain/Step": 3220, "Pretrain/Step Time": 9.133624667301774} +{"Pretrain/Learning Rate": 3.8576672196963705e-05, "Pretrain/Loss": 2.015392303466797, "Pretrain/Loss (Raw)": 1.7914551496505737, "Pretrain/Step": 3221, "Pretrain/Step Time": 9.13760693743825} +{"Pretrain/Learning Rate": 3.856954255742414e-05, "Pretrain/Loss": 2.0137782096862793, "Pretrain/Loss (Raw)": 1.9533101320266724, "Pretrain/Step": 3222, "Pretrain/Step Time": 9.134662851691246} +{"Pretrain/Learning Rate": 3.8562411352980996e-05, "Pretrain/Loss": 2.013371229171753, "Pretrain/Loss (Raw)": 1.8435189723968506, "Pretrain/Step": 3223, "Pretrain/Step Time": 9.137895427644253} +{"Pretrain/Learning Rate": 3.8555278584456664e-05, "Pretrain/Loss": 2.013824701309204, "Pretrain/Loss (Raw)": 2.0864224433898926, "Pretrain/Step": 3224, "Pretrain/Step Time": 9.139281691983342} +{"Pretrain/Learning Rate": 3.854814425267373e-05, "Pretrain/Loss": 2.0124974250793457, "Pretrain/Loss (Raw)": 1.894481897354126, "Pretrain/Step": 3225, "Pretrain/Step Time": 9.14144790917635} +{"Pretrain/Learning Rate": 3.8541008358454956e-05, "Pretrain/Loss": 2.01171875, "Pretrain/Loss (Raw)": 2.0532031059265137, "Pretrain/Step": 3226, "Pretrain/Step Time": 9.137489164248109} +{"Pretrain/Learning Rate": 3.853387090262329e-05, "Pretrain/Loss": 2.0088517665863037, "Pretrain/Loss (Raw)": 1.706709623336792, "Pretrain/Step": 3227, "Pretrain/Step Time": 9.143492233008146} +{"Pretrain/Learning Rate": 3.852673188600187e-05, "Pretrain/Loss": 2.009489059448242, "Pretrain/Loss (Raw)": 2.2078044414520264, "Pretrain/Step": 3228, "Pretrain/Step Time": 9.140022652223706} +{"Pretrain/Learning Rate": 3.851959130941398e-05, "Pretrain/Loss": 2.0092599391937256, "Pretrain/Loss (Raw)": 2.1532630920410156, "Pretrain/Step": 3229, "Pretrain/Step Time": 9.138706307858229} +{"Pretrain/Learning Rate": 3.851244917368311e-05, "Pretrain/Loss": 2.0082292556762695, "Pretrain/Loss (Raw)": 2.0483644008636475, "Pretrain/Step": 3230, "Pretrain/Step Time": 9.13834816403687} +{"Pretrain/Learning Rate": 3.8505305479632934e-05, "Pretrain/Loss": 2.0072293281555176, "Pretrain/Loss (Raw)": 1.9990293979644775, "Pretrain/Step": 3231, "Pretrain/Step Time": 9.14486800134182} +{"Pretrain/Learning Rate": 3.8498160228087284e-05, "Pretrain/Loss": 2.00504207611084, "Pretrain/Loss (Raw)": 1.5420355796813965, "Pretrain/Step": 3232, "Pretrain/Step Time": 9.148559667170048} +{"Pretrain/Learning Rate": 3.8491013419870204e-05, "Pretrain/Loss": 2.005056381225586, "Pretrain/Loss (Raw)": 2.0732803344726562, "Pretrain/Step": 3233, "Pretrain/Step Time": 9.148790637031198} +{"Pretrain/Learning Rate": 3.848386505580588e-05, "Pretrain/Loss": 2.0069007873535156, "Pretrain/Loss (Raw)": 2.2019402980804443, "Pretrain/Step": 3234, "Pretrain/Step Time": 9.151215309277177} +{"Pretrain/Learning Rate": 3.84767151367187e-05, "Pretrain/Loss": 2.006436347961426, "Pretrain/Loss (Raw)": 2.0195086002349854, "Pretrain/Step": 3235, "Pretrain/Step Time": 9.149144880473614} +{"Pretrain/Learning Rate": 3.846956366343322e-05, "Pretrain/Loss": 2.0062220096588135, "Pretrain/Loss (Raw)": 1.8472751379013062, "Pretrain/Step": 3236, "Pretrain/Step Time": 9.150157183408737} +{"Pretrain/Learning Rate": 3.8462410636774196e-05, "Pretrain/Loss": 2.007359743118286, "Pretrain/Loss (Raw)": 2.170130491256714, "Pretrain/Step": 3237, "Pretrain/Step Time": 9.143564401194453} +{"Pretrain/Learning Rate": 3.845525605756653e-05, "Pretrain/Loss": 2.0070712566375732, "Pretrain/Loss (Raw)": 2.0804741382598877, "Pretrain/Step": 3238, "Pretrain/Step Time": 9.151716211810708} +{"Pretrain/Learning Rate": 3.844809992663534e-05, "Pretrain/Loss": 2.0077733993530273, "Pretrain/Loss (Raw)": 2.183131694793701, "Pretrain/Step": 3239, "Pretrain/Step Time": 9.157577097415924} +{"Pretrain/Learning Rate": 3.844094224480589e-05, "Pretrain/Loss": 2.0018582344055176, "Pretrain/Loss (Raw)": 1.4829442501068115, "Pretrain/Step": 3240, "Pretrain/Step Time": 9.156131932511926} +{"Pretrain/Learning Rate": 3.843378301290366e-05, "Pretrain/Loss": 2.0024819374084473, "Pretrain/Loss (Raw)": 2.1832971572875977, "Pretrain/Step": 3241, "Pretrain/Step Time": 9.157248491421342} +{"Pretrain/Learning Rate": 3.8426622231754255e-05, "Pretrain/Loss": 2.0028576850891113, "Pretrain/Loss (Raw)": 2.0872879028320312, "Pretrain/Step": 3242, "Pretrain/Step Time": 9.152797089889646} +{"Pretrain/Learning Rate": 3.8419459902183515e-05, "Pretrain/Loss": 2.0033326148986816, "Pretrain/Loss (Raw)": 1.9989064931869507, "Pretrain/Step": 3243, "Pretrain/Step Time": 9.153213633224368} +{"Pretrain/Learning Rate": 3.841229602501742e-05, "Pretrain/Loss": 2.003690719604492, "Pretrain/Loss (Raw)": 2.0282516479492188, "Pretrain/Step": 3244, "Pretrain/Step Time": 9.15366773121059} +{"Pretrain/Learning Rate": 3.840513060108214e-05, "Pretrain/Loss": 2.0037882328033447, "Pretrain/Loss (Raw)": 1.9592630863189697, "Pretrain/Step": 3245, "Pretrain/Step Time": 9.147913543507457} +{"Pretrain/Learning Rate": 3.8397963631204046e-05, "Pretrain/Loss": 2.004718780517578, "Pretrain/Loss (Raw)": 2.1040151119232178, "Pretrain/Step": 3246, "Pretrain/Step Time": 9.145590042695403} +{"Pretrain/Learning Rate": 3.8390795116209645e-05, "Pretrain/Loss": 2.0084285736083984, "Pretrain/Loss (Raw)": 2.4371488094329834, "Pretrain/Step": 3247, "Pretrain/Step Time": 9.131957232952118} +{"Pretrain/Learning Rate": 3.8383625056925654e-05, "Pretrain/Loss": 2.006959915161133, "Pretrain/Loss (Raw)": 1.8765166997909546, "Pretrain/Step": 3248, "Pretrain/Step Time": 9.124003924429417} +{"Pretrain/Learning Rate": 3.837645345417895e-05, "Pretrain/Loss": 2.007767677307129, "Pretrain/Loss (Raw)": 2.2048768997192383, "Pretrain/Step": 3249, "Pretrain/Step Time": 9.129649735987186} +{"Pretrain/Learning Rate": 3.836928030879661e-05, "Pretrain/Loss": 2.009457588195801, "Pretrain/Loss (Raw)": 2.156511068344116, "Pretrain/Step": 3250, "Pretrain/Step Time": 9.754765972495079} +{"Pretrain/Learning Rate": 3.8362105621605866e-05, "Pretrain/Loss": 2.0101733207702637, "Pretrain/Loss (Raw)": 2.101832866668701, "Pretrain/Step": 3251, "Pretrain/Step Time": 9.751588050276041} +{"Pretrain/Learning Rate": 3.835492939343413e-05, "Pretrain/Loss": 2.0073089599609375, "Pretrain/Loss (Raw)": 1.5947625637054443, "Pretrain/Step": 3252, "Pretrain/Step Time": 9.745995927602053} +{"Pretrain/Learning Rate": 3.834775162510901e-05, "Pretrain/Loss": 2.005854845046997, "Pretrain/Loss (Raw)": 1.8388780355453491, "Pretrain/Step": 3253, "Pretrain/Step Time": 9.747805412858725} +{"Pretrain/Learning Rate": 3.834057231745828e-05, "Pretrain/Loss": 2.0044748783111572, "Pretrain/Loss (Raw)": 1.8919107913970947, "Pretrain/Step": 3254, "Pretrain/Step Time": 9.746049832552671} +{"Pretrain/Learning Rate": 3.8333391471309884e-05, "Pretrain/Loss": 2.004401683807373, "Pretrain/Loss (Raw)": 2.072387456893921, "Pretrain/Step": 3255, "Pretrain/Step Time": 9.742096358910203} +{"Pretrain/Learning Rate": 3.8326209087491955e-05, "Pretrain/Loss": 2.001620292663574, "Pretrain/Loss (Raw)": 1.7154542207717896, "Pretrain/Step": 3256, "Pretrain/Step Time": 9.739142190665007} +{"Pretrain/Learning Rate": 3.8319025166832794e-05, "Pretrain/Loss": 2.0018322467803955, "Pretrain/Loss (Raw)": 2.0567238330841064, "Pretrain/Step": 3257, "Pretrain/Step Time": 9.741328109055758} +{"Pretrain/Learning Rate": 3.83118397101609e-05, "Pretrain/Loss": 2.001436233520508, "Pretrain/Loss (Raw)": 2.0806243419647217, "Pretrain/Step": 3258, "Pretrain/Step Time": 9.74293803051114} +{"Pretrain/Learning Rate": 3.830465271830491e-05, "Pretrain/Loss": 2.00273060798645, "Pretrain/Loss (Raw)": 2.056198835372925, "Pretrain/Step": 3259, "Pretrain/Step Time": 9.745985757559538} +{"Pretrain/Learning Rate": 3.829746419209369e-05, "Pretrain/Loss": 2.0063424110412598, "Pretrain/Loss (Raw)": 2.114147186279297, "Pretrain/Step": 3260, "Pretrain/Step Time": 9.750267373397946} +{"Pretrain/Learning Rate": 3.829027413235623e-05, "Pretrain/Loss": 2.0054640769958496, "Pretrain/Loss (Raw)": 1.977851152420044, "Pretrain/Step": 3261, "Pretrain/Step Time": 9.744144214317203} +{"Pretrain/Learning Rate": 3.8283082539921735e-05, "Pretrain/Loss": 2.0058436393737793, "Pretrain/Loss (Raw)": 2.014364242553711, "Pretrain/Step": 3262, "Pretrain/Step Time": 9.742907939478755} +{"Pretrain/Learning Rate": 3.827588941561956e-05, "Pretrain/Loss": 2.006732940673828, "Pretrain/Loss (Raw)": 2.046572685241699, "Pretrain/Step": 3263, "Pretrain/Step Time": 9.740753443911672} +{"Pretrain/Learning Rate": 3.826869476027927e-05, "Pretrain/Loss": 2.0055618286132812, "Pretrain/Loss (Raw)": 1.9530006647109985, "Pretrain/Step": 3264, "Pretrain/Step Time": 9.737108051776886} +{"Pretrain/Learning Rate": 3.826149857473057e-05, "Pretrain/Loss": 2.004335641860962, "Pretrain/Loss (Raw)": 2.0600202083587646, "Pretrain/Step": 3265, "Pretrain/Step Time": 9.72277907654643} +{"Pretrain/Learning Rate": 3.825430085980337e-05, "Pretrain/Loss": 2.003065347671509, "Pretrain/Loss (Raw)": 1.9484542608261108, "Pretrain/Step": 3266, "Pretrain/Step Time": 9.72739190608263} +{"Pretrain/Learning Rate": 3.8247101616327726e-05, "Pretrain/Loss": 2.0007057189941406, "Pretrain/Loss (Raw)": 1.9426339864730835, "Pretrain/Step": 3267, "Pretrain/Step Time": 9.727715054526925} +{"Pretrain/Learning Rate": 3.823990084513391e-05, "Pretrain/Loss": 1.998805284500122, "Pretrain/Loss (Raw)": 1.6772607564926147, "Pretrain/Step": 3268, "Pretrain/Step Time": 9.727804958820343} +{"Pretrain/Learning Rate": 3.8232698547052345e-05, "Pretrain/Loss": 1.9979474544525146, "Pretrain/Loss (Raw)": 1.6008191108703613, "Pretrain/Step": 3269, "Pretrain/Step Time": 9.727494116872549} +{"Pretrain/Learning Rate": 3.8225494722913624e-05, "Pretrain/Loss": 1.9961282014846802, "Pretrain/Loss (Raw)": 2.0592429637908936, "Pretrain/Step": 3270, "Pretrain/Step Time": 9.73120217397809} +{"Pretrain/Learning Rate": 3.821828937354853e-05, "Pretrain/Loss": 1.9957300424575806, "Pretrain/Loss (Raw)": 2.0783674716949463, "Pretrain/Step": 3271, "Pretrain/Step Time": 9.733280539512634} +{"Pretrain/Learning Rate": 3.821108249978802e-05, "Pretrain/Loss": 1.9962509870529175, "Pretrain/Loss (Raw)": 2.1242809295654297, "Pretrain/Step": 3272, "Pretrain/Step Time": 9.731978129595518} +{"Pretrain/Learning Rate": 3.8203874102463235e-05, "Pretrain/Loss": 1.9965496063232422, "Pretrain/Loss (Raw)": 1.939827799797058, "Pretrain/Step": 3273, "Pretrain/Step Time": 9.7319729719311} +{"Pretrain/Learning Rate": 3.819666418240545e-05, "Pretrain/Loss": 1.9948773384094238, "Pretrain/Loss (Raw)": 1.9733108282089233, "Pretrain/Step": 3274, "Pretrain/Step Time": 9.732797410339117} +{"Pretrain/Learning Rate": 3.818945274044618e-05, "Pretrain/Loss": 1.9955451488494873, "Pretrain/Loss (Raw)": 2.071457862854004, "Pretrain/Step": 3275, "Pretrain/Step Time": 9.734548166394234} +{"Pretrain/Learning Rate": 3.8182239777417066e-05, "Pretrain/Loss": 1.9951213598251343, "Pretrain/Loss (Raw)": 1.8061764240264893, "Pretrain/Step": 3276, "Pretrain/Step Time": 9.733142441138625} +{"Pretrain/Learning Rate": 3.817502529414994e-05, "Pretrain/Loss": 1.9960346221923828, "Pretrain/Loss (Raw)": 2.1597084999084473, "Pretrain/Step": 3277, "Pretrain/Step Time": 9.730466570705175} +{"Pretrain/Learning Rate": 3.816780929147682e-05, "Pretrain/Loss": 1.9958908557891846, "Pretrain/Loss (Raw)": 2.017289638519287, "Pretrain/Step": 3278, "Pretrain/Step Time": 9.73192679695785} +{"Pretrain/Learning Rate": 3.816059177022988e-05, "Pretrain/Loss": 1.9994851350784302, "Pretrain/Loss (Raw)": 2.263522148132324, "Pretrain/Step": 3279, "Pretrain/Step Time": 9.729550644755363} +{"Pretrain/Learning Rate": 3.8153372731241486e-05, "Pretrain/Loss": 1.9995410442352295, "Pretrain/Loss (Raw)": 2.1660003662109375, "Pretrain/Step": 3280, "Pretrain/Step Time": 9.731992552056909} +{"Pretrain/Learning Rate": 3.814615217534416e-05, "Pretrain/Loss": 1.9977588653564453, "Pretrain/Loss (Raw)": 1.8545215129852295, "Pretrain/Step": 3281, "Pretrain/Step Time": 9.726010860875249} +{"Pretrain/Learning Rate": 3.813893010337063e-05, "Pretrain/Loss": 1.9990520477294922, "Pretrain/Loss (Raw)": 2.1530165672302246, "Pretrain/Step": 3282, "Pretrain/Step Time": 9.729537861421704} +{"Pretrain/Learning Rate": 3.813170651615376e-05, "Pretrain/Loss": 1.9994337558746338, "Pretrain/Loss (Raw)": 2.006026029586792, "Pretrain/Step": 3283, "Pretrain/Step Time": 9.73076100461185} +{"Pretrain/Learning Rate": 3.8124481414526613e-05, "Pretrain/Loss": 2.000889778137207, "Pretrain/Loss (Raw)": 2.1312997341156006, "Pretrain/Step": 3284, "Pretrain/Step Time": 9.730078544467688} +{"Pretrain/Learning Rate": 3.811725479932243e-05, "Pretrain/Loss": 2.000548839569092, "Pretrain/Loss (Raw)": 2.250427484512329, "Pretrain/Step": 3285, "Pretrain/Step Time": 9.729787401854992} +{"Pretrain/Learning Rate": 3.8110026671374615e-05, "Pretrain/Loss": 2.0025038719177246, "Pretrain/Loss (Raw)": 2.1584110260009766, "Pretrain/Step": 3286, "Pretrain/Step Time": 9.739945350214839} +{"Pretrain/Learning Rate": 3.810279703151674e-05, "Pretrain/Loss": 2.002509832382202, "Pretrain/Loss (Raw)": 1.9906262159347534, "Pretrain/Step": 3287, "Pretrain/Step Time": 9.741021167486906} +{"Pretrain/Learning Rate": 3.809556588058258e-05, "Pretrain/Loss": 2.002401828765869, "Pretrain/Loss (Raw)": 2.0977039337158203, "Pretrain/Step": 3288, "Pretrain/Step Time": 9.73765347711742} +{"Pretrain/Learning Rate": 3.8088333219406046e-05, "Pretrain/Loss": 2.0056045055389404, "Pretrain/Loss (Raw)": 2.1141409873962402, "Pretrain/Step": 3289, "Pretrain/Step Time": 9.75000069476664} +{"Pretrain/Learning Rate": 3.808109904882126e-05, "Pretrain/Loss": 2.004347562789917, "Pretrain/Loss (Raw)": 2.040532350540161, "Pretrain/Step": 3290, "Pretrain/Step Time": 9.750559598207474} +{"Pretrain/Learning Rate": 3.807386336966248e-05, "Pretrain/Loss": 2.0059361457824707, "Pretrain/Loss (Raw)": 2.110311269760132, "Pretrain/Step": 3291, "Pretrain/Step Time": 9.741849340498447} +{"Pretrain/Learning Rate": 3.8066626182764174e-05, "Pretrain/Loss": 2.00783371925354, "Pretrain/Loss (Raw)": 1.9881787300109863, "Pretrain/Step": 3292, "Pretrain/Step Time": 9.741202069446445} +{"Pretrain/Learning Rate": 3.805938748896097e-05, "Pretrain/Loss": 2.006442070007324, "Pretrain/Loss (Raw)": 1.895731806755066, "Pretrain/Step": 3293, "Pretrain/Step Time": 9.740938059985638} +{"Pretrain/Learning Rate": 3.805214728908765e-05, "Pretrain/Loss": 2.0074081420898438, "Pretrain/Loss (Raw)": 1.9476945400238037, "Pretrain/Step": 3294, "Pretrain/Step Time": 9.739783063530922} +{"Pretrain/Learning Rate": 3.804490558397922e-05, "Pretrain/Loss": 2.008066177368164, "Pretrain/Loss (Raw)": 1.9355812072753906, "Pretrain/Step": 3295, "Pretrain/Step Time": 9.74601656012237} +{"Pretrain/Learning Rate": 3.803766237447079e-05, "Pretrain/Loss": 2.0055112838745117, "Pretrain/Loss (Raw)": 1.9177474975585938, "Pretrain/Step": 3296, "Pretrain/Step Time": 9.741087792441249} +{"Pretrain/Learning Rate": 3.803041766139771e-05, "Pretrain/Loss": 2.003910541534424, "Pretrain/Loss (Raw)": 1.9985250234603882, "Pretrain/Step": 3297, "Pretrain/Step Time": 9.735346354544163} +{"Pretrain/Learning Rate": 3.8023171445595464e-05, "Pretrain/Loss": 2.0034425258636475, "Pretrain/Loss (Raw)": 2.027611017227173, "Pretrain/Step": 3298, "Pretrain/Step Time": 9.737044539302588} +{"Pretrain/Learning Rate": 3.8015923727899714e-05, "Pretrain/Loss": 2.003730535507202, "Pretrain/Loss (Raw)": 1.9832580089569092, "Pretrain/Step": 3299, "Pretrain/Step Time": 9.732972756028175} +{"Pretrain/Learning Rate": 3.8008674509146304e-05, "Pretrain/Loss": 2.0077292919158936, "Pretrain/Loss (Raw)": 2.310624122619629, "Pretrain/Step": 3300, "Pretrain/Step Time": 9.73461365327239} +{"Pretrain/Learning Rate": 3.800142379017127e-05, "Pretrain/Loss": 2.009612798690796, "Pretrain/Loss (Raw)": 2.1646223068237305, "Pretrain/Step": 3301, "Pretrain/Step Time": 9.72155768238008} +{"Pretrain/Learning Rate": 3.799417157181076e-05, "Pretrain/Loss": 2.0118417739868164, "Pretrain/Loss (Raw)": 2.044337034225464, "Pretrain/Step": 3302, "Pretrain/Step Time": 9.727146334946156} +{"Pretrain/Learning Rate": 3.798691785490115e-05, "Pretrain/Loss": 2.0075724124908447, "Pretrain/Loss (Raw)": 1.5335685014724731, "Pretrain/Step": 3303, "Pretrain/Step Time": 9.721452306956053} +{"Pretrain/Learning Rate": 3.797966264027899e-05, "Pretrain/Loss": 2.0093586444854736, "Pretrain/Loss (Raw)": 2.00897479057312, "Pretrain/Step": 3304, "Pretrain/Step Time": 9.720137571915984} +{"Pretrain/Learning Rate": 3.7972405928780974e-05, "Pretrain/Loss": 2.0090742111206055, "Pretrain/Loss (Raw)": 2.1244699954986572, "Pretrain/Step": 3305, "Pretrain/Step Time": 9.723296757787466} +{"Pretrain/Learning Rate": 3.796514772124396e-05, "Pretrain/Loss": 2.0096874237060547, "Pretrain/Loss (Raw)": 2.1800923347473145, "Pretrain/Step": 3306, "Pretrain/Step Time": 9.724127020686865} +{"Pretrain/Learning Rate": 3.795788801850504e-05, "Pretrain/Loss": 2.0087974071502686, "Pretrain/Loss (Raw)": 1.9339218139648438, "Pretrain/Step": 3307, "Pretrain/Step Time": 9.725273186340928} +{"Pretrain/Learning Rate": 3.7950626821401405e-05, "Pretrain/Loss": 2.009700298309326, "Pretrain/Loss (Raw)": 1.982345461845398, "Pretrain/Step": 3308, "Pretrain/Step Time": 9.725046461448073} +{"Pretrain/Learning Rate": 3.794336413077045e-05, "Pretrain/Loss": 2.011664390563965, "Pretrain/Loss (Raw)": 2.1461920738220215, "Pretrain/Step": 3309, "Pretrain/Step Time": 9.721348704770207} +{"Pretrain/Learning Rate": 3.793609994744977e-05, "Pretrain/Loss": 2.0113372802734375, "Pretrain/Loss (Raw)": 2.172212600708008, "Pretrain/Step": 3310, "Pretrain/Step Time": 9.717068567872047} +{"Pretrain/Learning Rate": 3.792883427227707e-05, "Pretrain/Loss": 2.012824058532715, "Pretrain/Loss (Raw)": 2.2251944541931152, "Pretrain/Step": 3311, "Pretrain/Step Time": 9.706604866310954} +{"Pretrain/Learning Rate": 3.7921567106090297e-05, "Pretrain/Loss": 2.0134339332580566, "Pretrain/Loss (Raw)": 2.1896555423736572, "Pretrain/Step": 3312, "Pretrain/Step Time": 9.704999458044767} +{"Pretrain/Learning Rate": 3.79142984497275e-05, "Pretrain/Loss": 2.012153148651123, "Pretrain/Loss (Raw)": 1.9407360553741455, "Pretrain/Step": 3313, "Pretrain/Step Time": 9.70950180105865} +{"Pretrain/Learning Rate": 3.790702830402696e-05, "Pretrain/Loss": 2.013113021850586, "Pretrain/Loss (Raw)": 1.971632957458496, "Pretrain/Step": 3314, "Pretrain/Step Time": 9.71056367084384} +{"Pretrain/Learning Rate": 3.7899756669827094e-05, "Pretrain/Loss": 2.0101892948150635, "Pretrain/Loss (Raw)": 1.859453558921814, "Pretrain/Step": 3315, "Pretrain/Step Time": 9.708832915872335} +{"Pretrain/Learning Rate": 3.789248354796651e-05, "Pretrain/Loss": 2.0115864276885986, "Pretrain/Loss (Raw)": 2.135300397872925, "Pretrain/Step": 3316, "Pretrain/Step Time": 9.71114325337112} +{"Pretrain/Learning Rate": 3.788520893928396e-05, "Pretrain/Loss": 2.0108656883239746, "Pretrain/Loss (Raw)": 1.842376708984375, "Pretrain/Step": 3317, "Pretrain/Step Time": 9.70784275047481} +{"Pretrain/Learning Rate": 3.78779328446184e-05, "Pretrain/Loss": 2.0096096992492676, "Pretrain/Loss (Raw)": 1.870545506477356, "Pretrain/Step": 3318, "Pretrain/Step Time": 9.705479556694627} +{"Pretrain/Learning Rate": 3.7870655264808954e-05, "Pretrain/Loss": 2.0100314617156982, "Pretrain/Loss (Raw)": 2.0478439331054688, "Pretrain/Step": 3319, "Pretrain/Step Time": 9.711168888956308} +{"Pretrain/Learning Rate": 3.786337620069488e-05, "Pretrain/Loss": 2.0095019340515137, "Pretrain/Loss (Raw)": 2.021596908569336, "Pretrain/Step": 3320, "Pretrain/Step Time": 9.711059959605336} +{"Pretrain/Learning Rate": 3.7856095653115655e-05, "Pretrain/Loss": 2.0096073150634766, "Pretrain/Loss (Raw)": 2.0394346714019775, "Pretrain/Step": 3321, "Pretrain/Step Time": 9.607522964477539} +{"Pretrain/Learning Rate": 3.7848813622910894e-05, "Pretrain/Loss": 2.0127174854278564, "Pretrain/Loss (Raw)": 2.127133369445801, "Pretrain/Step": 3322, "Pretrain/Step Time": 9.610122306272388} +{"Pretrain/Learning Rate": 3.784153011092041e-05, "Pretrain/Loss": 2.0108985900878906, "Pretrain/Loss (Raw)": 1.9808604717254639, "Pretrain/Step": 3323, "Pretrain/Step Time": 9.615357959643006} +{"Pretrain/Learning Rate": 3.7834245117984155e-05, "Pretrain/Loss": 2.011655807495117, "Pretrain/Loss (Raw)": 2.0430328845977783, "Pretrain/Step": 3324, "Pretrain/Step Time": 9.614199148491025} +{"Pretrain/Learning Rate": 3.782695864494228e-05, "Pretrain/Loss": 2.0110373497009277, "Pretrain/Loss (Raw)": 2.023697853088379, "Pretrain/Step": 3325, "Pretrain/Step Time": 9.610534930601716} +{"Pretrain/Learning Rate": 3.781967069263509e-05, "Pretrain/Loss": 2.0137739181518555, "Pretrain/Loss (Raw)": 2.0941617488861084, "Pretrain/Step": 3326, "Pretrain/Step Time": 9.614843674004078} +{"Pretrain/Learning Rate": 3.781238126190306e-05, "Pretrain/Loss": 2.0135531425476074, "Pretrain/Loss (Raw)": 2.056148052215576, "Pretrain/Step": 3327, "Pretrain/Step Time": 9.60821644589305} +{"Pretrain/Learning Rate": 3.780509035358686e-05, "Pretrain/Loss": 2.01303768157959, "Pretrain/Loss (Raw)": 2.0865395069122314, "Pretrain/Step": 3328, "Pretrain/Step Time": 9.609958985820413} +{"Pretrain/Learning Rate": 3.77977979685273e-05, "Pretrain/Loss": 2.015244483947754, "Pretrain/Loss (Raw)": 2.1529123783111572, "Pretrain/Step": 3329, "Pretrain/Step Time": 9.610057448968291} +{"Pretrain/Learning Rate": 3.7790504107565366e-05, "Pretrain/Loss": 2.0141396522521973, "Pretrain/Loss (Raw)": 2.0372140407562256, "Pretrain/Step": 3330, "Pretrain/Step Time": 9.610211098566651} +{"Pretrain/Learning Rate": 3.7783208771542237e-05, "Pretrain/Loss": 2.0139660835266113, "Pretrain/Loss (Raw)": 2.0351624488830566, "Pretrain/Step": 3331, "Pretrain/Step Time": 9.609475193545222} +{"Pretrain/Learning Rate": 3.7775911961299225e-05, "Pretrain/Loss": 2.0151171684265137, "Pretrain/Loss (Raw)": 1.8416727781295776, "Pretrain/Step": 3332, "Pretrain/Step Time": 9.61803931929171} +{"Pretrain/Learning Rate": 3.776861367767785e-05, "Pretrain/Loss": 2.015686511993408, "Pretrain/Loss (Raw)": 2.0497725009918213, "Pretrain/Step": 3333, "Pretrain/Step Time": 9.6129339504987} +{"Pretrain/Learning Rate": 3.776131392151978e-05, "Pretrain/Loss": 2.015357255935669, "Pretrain/Loss (Raw)": 1.886397123336792, "Pretrain/Step": 3334, "Pretrain/Step Time": 9.610680283978581} +{"Pretrain/Learning Rate": 3.775401269366685e-05, "Pretrain/Loss": 2.013303756713867, "Pretrain/Loss (Raw)": 1.7096328735351562, "Pretrain/Step": 3335, "Pretrain/Step Time": 9.616114918142557} +{"Pretrain/Learning Rate": 3.7746709994961085e-05, "Pretrain/Loss": 2.0126218795776367, "Pretrain/Loss (Raw)": 2.02793025970459, "Pretrain/Step": 3336, "Pretrain/Step Time": 9.415284791961312} +{"Pretrain/Learning Rate": 3.7739405826244645e-05, "Pretrain/Loss": 2.012573480606079, "Pretrain/Loss (Raw)": 2.037616491317749, "Pretrain/Step": 3337, "Pretrain/Step Time": 9.412589957937598} +{"Pretrain/Learning Rate": 3.773210018835991e-05, "Pretrain/Loss": 2.0160024166107178, "Pretrain/Loss (Raw)": 2.1379847526550293, "Pretrain/Step": 3338, "Pretrain/Step Time": 9.412126284092665} +{"Pretrain/Learning Rate": 3.772479308214937e-05, "Pretrain/Loss": 2.013573408126831, "Pretrain/Loss (Raw)": 1.9051017761230469, "Pretrain/Step": 3339, "Pretrain/Step Time": 9.414620446041226} +{"Pretrain/Learning Rate": 3.771748450845575e-05, "Pretrain/Loss": 2.0136351585388184, "Pretrain/Loss (Raw)": 2.085707187652588, "Pretrain/Step": 3340, "Pretrain/Step Time": 9.407395517453551} +{"Pretrain/Learning Rate": 3.771017446812187e-05, "Pretrain/Loss": 2.0112295150756836, "Pretrain/Loss (Raw)": 1.7709214687347412, "Pretrain/Step": 3341, "Pretrain/Step Time": 9.406795244663954} +{"Pretrain/Learning Rate": 3.770286296199079e-05, "Pretrain/Loss": 2.0096898078918457, "Pretrain/Loss (Raw)": 2.033334255218506, "Pretrain/Step": 3342, "Pretrain/Step Time": 9.404632918536663} +{"Pretrain/Learning Rate": 3.7695549990905694e-05, "Pretrain/Loss": 2.00970458984375, "Pretrain/Loss (Raw)": 1.9549247026443481, "Pretrain/Step": 3343, "Pretrain/Step Time": 9.408086854964495} +{"Pretrain/Learning Rate": 3.768823555570995e-05, "Pretrain/Loss": 2.0079431533813477, "Pretrain/Loss (Raw)": 1.6940586566925049, "Pretrain/Step": 3344, "Pretrain/Step Time": 9.4108801856637} +{"Pretrain/Learning Rate": 3.768091965724709e-05, "Pretrain/Loss": 2.0094079971313477, "Pretrain/Loss (Raw)": 2.1753029823303223, "Pretrain/Step": 3345, "Pretrain/Step Time": 9.41209663823247} +{"Pretrain/Learning Rate": 3.767360229636082e-05, "Pretrain/Loss": 2.011075496673584, "Pretrain/Loss (Raw)": 2.1645243167877197, "Pretrain/Step": 3346, "Pretrain/Step Time": 9.413337640464306} +{"Pretrain/Learning Rate": 3.7666283473895014e-05, "Pretrain/Loss": 2.0102038383483887, "Pretrain/Loss (Raw)": 1.978495478630066, "Pretrain/Step": 3347, "Pretrain/Step Time": 9.410648940131068} +{"Pretrain/Learning Rate": 3.765896319069372e-05, "Pretrain/Loss": 2.0096325874328613, "Pretrain/Loss (Raw)": 2.0188305377960205, "Pretrain/Step": 3348, "Pretrain/Step Time": 9.406461168080568} +{"Pretrain/Learning Rate": 3.7651641447601126e-05, "Pretrain/Loss": 2.010650634765625, "Pretrain/Loss (Raw)": 1.921755313873291, "Pretrain/Step": 3349, "Pretrain/Step Time": 9.405221534892917} +{"Pretrain/Learning Rate": 3.764431824546163e-05, "Pretrain/Loss": 2.0109703540802, "Pretrain/Loss (Raw)": 1.9942152500152588, "Pretrain/Step": 3350, "Pretrain/Step Time": 9.409770110622048} +{"Pretrain/Learning Rate": 3.7636993585119775e-05, "Pretrain/Loss": 2.0132646560668945, "Pretrain/Loss (Raw)": 2.137181520462036, "Pretrain/Step": 3351, "Pretrain/Step Time": 9.407742017880082} +{"Pretrain/Learning Rate": 3.762966746742027e-05, "Pretrain/Loss": 2.008113384246826, "Pretrain/Loss (Raw)": 1.4270615577697754, "Pretrain/Step": 3352, "Pretrain/Step Time": 9.412804620340466} +{"Pretrain/Learning Rate": 3.7622339893208e-05, "Pretrain/Loss": 2.0105998516082764, "Pretrain/Loss (Raw)": 2.212768316268921, "Pretrain/Step": 3353, "Pretrain/Step Time": 9.411099186167121} +{"Pretrain/Learning Rate": 3.761501086332802e-05, "Pretrain/Loss": 2.0092885494232178, "Pretrain/Loss (Raw)": 1.885349154472351, "Pretrain/Step": 3354, "Pretrain/Step Time": 9.411645140498877} +{"Pretrain/Learning Rate": 3.760768037862553e-05, "Pretrain/Loss": 2.012803077697754, "Pretrain/Loss (Raw)": 2.1565403938293457, "Pretrain/Step": 3355, "Pretrain/Step Time": 9.41090975701809} +{"Pretrain/Learning Rate": 3.760034843994594e-05, "Pretrain/Loss": 2.013080596923828, "Pretrain/Loss (Raw)": 2.2433671951293945, "Pretrain/Step": 3356, "Pretrain/Step Time": 9.408191511407495} +{"Pretrain/Learning Rate": 3.7593015048134794e-05, "Pretrain/Loss": 2.012826442718506, "Pretrain/Loss (Raw)": 2.120715618133545, "Pretrain/Step": 3357, "Pretrain/Step Time": 9.411910325288773} +{"Pretrain/Learning Rate": 3.758568020403781e-05, "Pretrain/Loss": 2.013497829437256, "Pretrain/Loss (Raw)": 2.1343178749084473, "Pretrain/Step": 3358, "Pretrain/Step Time": 9.4113310277462} +{"Pretrain/Learning Rate": 3.757834390850088e-05, "Pretrain/Loss": 2.0143070220947266, "Pretrain/Loss (Raw)": 2.1026220321655273, "Pretrain/Step": 3359, "Pretrain/Step Time": 9.400908179581165} +{"Pretrain/Learning Rate": 3.7571006162370056e-05, "Pretrain/Loss": 2.0179927349090576, "Pretrain/Loss (Raw)": 2.0137760639190674, "Pretrain/Step": 3360, "Pretrain/Step Time": 9.405865259468555} +{"Pretrain/Learning Rate": 3.7563666966491564e-05, "Pretrain/Loss": 2.0166399478912354, "Pretrain/Loss (Raw)": 1.9001444578170776, "Pretrain/Step": 3361, "Pretrain/Step Time": 9.405023779720068} +{"Pretrain/Learning Rate": 3.7556326321711796e-05, "Pretrain/Loss": 2.0161495208740234, "Pretrain/Loss (Raw)": 2.139155149459839, "Pretrain/Step": 3362, "Pretrain/Step Time": 9.412957698106766} +{"Pretrain/Learning Rate": 3.7548984228877313e-05, "Pretrain/Loss": 2.014305830001831, "Pretrain/Loss (Raw)": 1.7835066318511963, "Pretrain/Step": 3363, "Pretrain/Step Time": 9.410688361153007} +{"Pretrain/Learning Rate": 3.754164068883484e-05, "Pretrain/Loss": 2.0149757862091064, "Pretrain/Loss (Raw)": 1.9330558776855469, "Pretrain/Step": 3364, "Pretrain/Step Time": 9.416997803375125} +{"Pretrain/Learning Rate": 3.7534295702431254e-05, "Pretrain/Loss": 2.0136280059814453, "Pretrain/Loss (Raw)": 1.9975831508636475, "Pretrain/Step": 3365, "Pretrain/Step Time": 9.416234835982323} +{"Pretrain/Learning Rate": 3.7526949270513635e-05, "Pretrain/Loss": 2.011887550354004, "Pretrain/Loss (Raw)": 1.8577286005020142, "Pretrain/Step": 3366, "Pretrain/Step Time": 9.407864121720195} +{"Pretrain/Learning Rate": 3.751960139392919e-05, "Pretrain/Loss": 2.0104641914367676, "Pretrain/Loss (Raw)": 2.0009121894836426, "Pretrain/Step": 3367, "Pretrain/Step Time": 9.404550883919} +{"Pretrain/Learning Rate": 3.7512252073525325e-05, "Pretrain/Loss": 2.013930559158325, "Pretrain/Loss (Raw)": 1.9266362190246582, "Pretrain/Step": 3368, "Pretrain/Step Time": 9.40946001559496} +{"Pretrain/Learning Rate": 3.7504901310149574e-05, "Pretrain/Loss": 2.012791395187378, "Pretrain/Loss (Raw)": 2.0375149250030518, "Pretrain/Step": 3369, "Pretrain/Step Time": 9.404372638091445} +{"Pretrain/Learning Rate": 3.74975491046497e-05, "Pretrain/Loss": 2.012040376663208, "Pretrain/Loss (Raw)": 1.9911481142044067, "Pretrain/Step": 3370, "Pretrain/Step Time": 9.40989007987082} +{"Pretrain/Learning Rate": 3.7490195457873555e-05, "Pretrain/Loss": 2.011983871459961, "Pretrain/Loss (Raw)": 1.9916465282440186, "Pretrain/Step": 3371, "Pretrain/Step Time": 9.4057462438941} +{"Pretrain/Learning Rate": 3.748284037066922e-05, "Pretrain/Loss": 2.0086047649383545, "Pretrain/Loss (Raw)": 1.5957434177398682, "Pretrain/Step": 3372, "Pretrain/Step Time": 9.40297157689929} +{"Pretrain/Learning Rate": 3.7475483843884916e-05, "Pretrain/Loss": 2.0086822509765625, "Pretrain/Loss (Raw)": 1.9692068099975586, "Pretrain/Step": 3373, "Pretrain/Step Time": 9.40264692902565} +{"Pretrain/Learning Rate": 3.746812587836903e-05, "Pretrain/Loss": 2.00830078125, "Pretrain/Loss (Raw)": 2.055161952972412, "Pretrain/Step": 3374, "Pretrain/Step Time": 9.405721774324775} +{"Pretrain/Learning Rate": 3.746076647497011e-05, "Pretrain/Loss": 2.0067713260650635, "Pretrain/Loss (Raw)": 2.241384506225586, "Pretrain/Step": 3375, "Pretrain/Step Time": 9.410385124385357} +{"Pretrain/Learning Rate": 3.7453405634536894e-05, "Pretrain/Loss": 2.009047031402588, "Pretrain/Loss (Raw)": 2.1677932739257812, "Pretrain/Step": 3376, "Pretrain/Step Time": 9.40958889760077} +{"Pretrain/Learning Rate": 3.744604335791825e-05, "Pretrain/Loss": 2.006606101989746, "Pretrain/Loss (Raw)": 1.8924391269683838, "Pretrain/Step": 3377, "Pretrain/Step Time": 9.404636634513736} +{"Pretrain/Learning Rate": 3.743867964596324e-05, "Pretrain/Loss": 2.006617546081543, "Pretrain/Loss (Raw)": 2.1579973697662354, "Pretrain/Step": 3378, "Pretrain/Step Time": 8.782925324514508} +{"Pretrain/Learning Rate": 3.743131449952107e-05, "Pretrain/Loss": 2.006380319595337, "Pretrain/Loss (Raw)": 2.0714573860168457, "Pretrain/Step": 3379, "Pretrain/Step Time": 8.78326778113842} +{"Pretrain/Learning Rate": 3.7423947919441147e-05, "Pretrain/Loss": 2.011087417602539, "Pretrain/Loss (Raw)": 2.1972618103027344, "Pretrain/Step": 3380, "Pretrain/Step Time": 8.78713827393949} +{"Pretrain/Learning Rate": 3.7416579906573e-05, "Pretrain/Loss": 2.0114998817443848, "Pretrain/Loss (Raw)": 1.8916727304458618, "Pretrain/Step": 3381, "Pretrain/Step Time": 8.786864414811134} +{"Pretrain/Learning Rate": 3.7409210461766355e-05, "Pretrain/Loss": 2.012047290802002, "Pretrain/Loss (Raw)": 1.9619803428649902, "Pretrain/Step": 3382, "Pretrain/Step Time": 8.787303943186998} +{"Pretrain/Learning Rate": 3.740183958587108e-05, "Pretrain/Loss": 2.010866641998291, "Pretrain/Loss (Raw)": 1.9212639331817627, "Pretrain/Step": 3383, "Pretrain/Step Time": 8.792816113680601} +{"Pretrain/Learning Rate": 3.7394467279737224e-05, "Pretrain/Loss": 2.0130109786987305, "Pretrain/Loss (Raw)": 1.989933967590332, "Pretrain/Step": 3384, "Pretrain/Step Time": 8.79280849173665} +{"Pretrain/Learning Rate": 3.7387093544215003e-05, "Pretrain/Loss": 2.011842966079712, "Pretrain/Loss (Raw)": 1.907228708267212, "Pretrain/Step": 3385, "Pretrain/Step Time": 8.795847829431295} +{"Pretrain/Learning Rate": 3.7379718380154777e-05, "Pretrain/Loss": 2.0134637355804443, "Pretrain/Loss (Raw)": 2.2880728244781494, "Pretrain/Step": 3386, "Pretrain/Step Time": 8.793316880241036} +{"Pretrain/Learning Rate": 3.737234178840709e-05, "Pretrain/Loss": 2.0136561393737793, "Pretrain/Loss (Raw)": 2.0808162689208984, "Pretrain/Step": 3387, "Pretrain/Step Time": 8.792302435263991} +{"Pretrain/Learning Rate": 3.736496376982266e-05, "Pretrain/Loss": 2.0132358074188232, "Pretrain/Loss (Raw)": 2.060349941253662, "Pretrain/Step": 3388, "Pretrain/Step Time": 8.78611165098846} +{"Pretrain/Learning Rate": 3.7357584325252336e-05, "Pretrain/Loss": 2.0128116607666016, "Pretrain/Loss (Raw)": 1.9235955476760864, "Pretrain/Step": 3389, "Pretrain/Step Time": 8.788258420303464} +{"Pretrain/Learning Rate": 3.7350203455547155e-05, "Pretrain/Loss": 2.012923240661621, "Pretrain/Loss (Raw)": 2.0286221504211426, "Pretrain/Step": 3390, "Pretrain/Step Time": 8.786627693101764} +{"Pretrain/Learning Rate": 3.7342821161558316e-05, "Pretrain/Loss": 2.012754440307617, "Pretrain/Loss (Raw)": 2.0249502658843994, "Pretrain/Step": 3391, "Pretrain/Step Time": 8.783825824037194} +{"Pretrain/Learning Rate": 3.7335437444137175e-05, "Pretrain/Loss": 2.013547897338867, "Pretrain/Loss (Raw)": 2.0545711517333984, "Pretrain/Step": 3392, "Pretrain/Step Time": 8.783961525186896} +{"Pretrain/Learning Rate": 3.732805230413527e-05, "Pretrain/Loss": 2.0133132934570312, "Pretrain/Loss (Raw)": 2.0300018787384033, "Pretrain/Step": 3393, "Pretrain/Step Time": 8.783871551975608} +{"Pretrain/Learning Rate": 3.732066574240428e-05, "Pretrain/Loss": 2.014045000076294, "Pretrain/Loss (Raw)": 2.042095184326172, "Pretrain/Step": 3394, "Pretrain/Step Time": 8.780496979132295} +{"Pretrain/Learning Rate": 3.731327775979605e-05, "Pretrain/Loss": 2.014862298965454, "Pretrain/Loss (Raw)": 2.047269821166992, "Pretrain/Step": 3395, "Pretrain/Step Time": 8.78163057565689} +{"Pretrain/Learning Rate": 3.730588835716262e-05, "Pretrain/Loss": 2.0165281295776367, "Pretrain/Loss (Raw)": 1.8904775381088257, "Pretrain/Step": 3396, "Pretrain/Step Time": 8.785806452855468} +{"Pretrain/Learning Rate": 3.729849753535615e-05, "Pretrain/Loss": 2.0195984840393066, "Pretrain/Loss (Raw)": 1.9938212633132935, "Pretrain/Step": 3397, "Pretrain/Step Time": 8.788201455026865} +{"Pretrain/Learning Rate": 3.7291105295229004e-05, "Pretrain/Loss": 2.0194928646087646, "Pretrain/Loss (Raw)": 2.045720100402832, "Pretrain/Step": 3398, "Pretrain/Step Time": 8.788343161344528} +{"Pretrain/Learning Rate": 3.728371163763366e-05, "Pretrain/Loss": 2.0189852714538574, "Pretrain/Loss (Raw)": 2.0134103298187256, "Pretrain/Step": 3399, "Pretrain/Step Time": 8.785836331546307} +{"Pretrain/Learning Rate": 3.727631656342282e-05, "Pretrain/Loss": 2.0196075439453125, "Pretrain/Loss (Raw)": 2.2039144039154053, "Pretrain/Step": 3400, "Pretrain/Step Time": 8.785750234499574} +{"Pretrain/Learning Rate": 3.7268920073449296e-05, "Pretrain/Loss": 2.019192695617676, "Pretrain/Loss (Raw)": 1.8867498636245728, "Pretrain/Step": 3401, "Pretrain/Step Time": 8.78580086864531} +{"Pretrain/Learning Rate": 3.72615221685661e-05, "Pretrain/Loss": 2.0220508575439453, "Pretrain/Loss (Raw)": 2.339128017425537, "Pretrain/Step": 3402, "Pretrain/Step Time": 8.794389046728611} +{"Pretrain/Learning Rate": 3.725412284962639e-05, "Pretrain/Loss": 2.0208189487457275, "Pretrain/Loss (Raw)": 1.9137935638427734, "Pretrain/Step": 3403, "Pretrain/Step Time": 8.78872543759644} +{"Pretrain/Learning Rate": 3.724672211748349e-05, "Pretrain/Loss": 2.021679401397705, "Pretrain/Loss (Raw)": 1.9162938594818115, "Pretrain/Step": 3404, "Pretrain/Step Time": 8.780499819666147} +{"Pretrain/Learning Rate": 3.723931997299089e-05, "Pretrain/Loss": 2.020493507385254, "Pretrain/Loss (Raw)": 2.007950782775879, "Pretrain/Step": 3405, "Pretrain/Step Time": 8.784122159704566} +{"Pretrain/Learning Rate": 3.723191641700223e-05, "Pretrain/Loss": 2.0208821296691895, "Pretrain/Loss (Raw)": 2.0670273303985596, "Pretrain/Step": 3406, "Pretrain/Step Time": 8.780676720663905} +{"Pretrain/Learning Rate": 3.7224511450371334e-05, "Pretrain/Loss": 2.0184485912323, "Pretrain/Loss (Raw)": 1.9520142078399658, "Pretrain/Step": 3407, "Pretrain/Step Time": 8.781594678759575} +{"Pretrain/Learning Rate": 3.721710507395218e-05, "Pretrain/Loss": 2.0166921615600586, "Pretrain/Loss (Raw)": 1.9411559104919434, "Pretrain/Step": 3408, "Pretrain/Step Time": 8.784126346930861} +{"Pretrain/Learning Rate": 3.720969728859889e-05, "Pretrain/Loss": 2.017544746398926, "Pretrain/Loss (Raw)": 1.963667631149292, "Pretrain/Step": 3409, "Pretrain/Step Time": 8.792718291282654} +{"Pretrain/Learning Rate": 3.720228809516578e-05, "Pretrain/Loss": 2.015486717224121, "Pretrain/Loss (Raw)": 1.8895851373672485, "Pretrain/Step": 3410, "Pretrain/Step Time": 8.79067638143897} +{"Pretrain/Learning Rate": 3.719487749450731e-05, "Pretrain/Loss": 2.0158278942108154, "Pretrain/Loss (Raw)": 2.049712657928467, "Pretrain/Step": 3411, "Pretrain/Step Time": 8.788509862497449} +{"Pretrain/Learning Rate": 3.718746548747809e-05, "Pretrain/Loss": 2.0158636569976807, "Pretrain/Loss (Raw)": 2.1358642578125, "Pretrain/Step": 3412, "Pretrain/Step Time": 8.792898416519165} +{"Pretrain/Learning Rate": 3.7180052074932934e-05, "Pretrain/Loss": 2.0142431259155273, "Pretrain/Loss (Raw)": 2.0429906845092773, "Pretrain/Step": 3413, "Pretrain/Step Time": 8.792597761377692} +{"Pretrain/Learning Rate": 3.7172637257726774e-05, "Pretrain/Loss": 2.012322187423706, "Pretrain/Loss (Raw)": 1.9125312566757202, "Pretrain/Step": 3414, "Pretrain/Step Time": 8.782479677349329} +{"Pretrain/Learning Rate": 3.716522103671473e-05, "Pretrain/Loss": 2.0126147270202637, "Pretrain/Loss (Raw)": 2.028069257736206, "Pretrain/Step": 3415, "Pretrain/Step Time": 8.784606404602528} +{"Pretrain/Learning Rate": 3.715780341275207e-05, "Pretrain/Loss": 2.0123913288116455, "Pretrain/Loss (Raw)": 2.069122076034546, "Pretrain/Step": 3416, "Pretrain/Step Time": 8.791303941980004} +{"Pretrain/Learning Rate": 3.715038438669423e-05, "Pretrain/Loss": 2.0126733779907227, "Pretrain/Loss (Raw)": 2.1502532958984375, "Pretrain/Step": 3417, "Pretrain/Step Time": 8.779418962076306} +{"Pretrain/Learning Rate": 3.7142963959396806e-05, "Pretrain/Loss": 2.0126755237579346, "Pretrain/Loss (Raw)": 2.0408105850219727, "Pretrain/Step": 3418, "Pretrain/Step Time": 8.785738840699196} +{"Pretrain/Learning Rate": 3.713554213171556e-05, "Pretrain/Loss": 2.01194167137146, "Pretrain/Loss (Raw)": 2.0163848400115967, "Pretrain/Step": 3419, "Pretrain/Step Time": 8.785936441272497} +{"Pretrain/Learning Rate": 3.712811890450641e-05, "Pretrain/Loss": 2.0121710300445557, "Pretrain/Loss (Raw)": 2.0175023078918457, "Pretrain/Step": 3420, "Pretrain/Step Time": 8.78275378793478} +{"Pretrain/Learning Rate": 3.712069427862544e-05, "Pretrain/Loss": 2.0133676528930664, "Pretrain/Loss (Raw)": 2.0489253997802734, "Pretrain/Step": 3421, "Pretrain/Step Time": 8.778843307867646} +{"Pretrain/Learning Rate": 3.711326825492889e-05, "Pretrain/Loss": 2.0127694606781006, "Pretrain/Loss (Raw)": 1.8711224794387817, "Pretrain/Step": 3422, "Pretrain/Step Time": 8.779206870123744} +{"Pretrain/Learning Rate": 3.7105840834273164e-05, "Pretrain/Loss": 2.0120441913604736, "Pretrain/Loss (Raw)": 1.8427515029907227, "Pretrain/Step": 3423, "Pretrain/Step Time": 8.77873114682734} +{"Pretrain/Learning Rate": 3.7098412017514835e-05, "Pretrain/Loss": 2.012702465057373, "Pretrain/Loss (Raw)": 2.0019960403442383, "Pretrain/Step": 3424, "Pretrain/Step Time": 8.780366530641913} +{"Pretrain/Learning Rate": 3.7090981805510615e-05, "Pretrain/Loss": 2.01326322555542, "Pretrain/Loss (Raw)": 2.070319175720215, "Pretrain/Step": 3425, "Pretrain/Step Time": 8.778919147327542} +{"Pretrain/Learning Rate": 3.7083550199117403e-05, "Pretrain/Loss": 2.0139098167419434, "Pretrain/Loss (Raw)": 2.1103615760803223, "Pretrain/Step": 3426, "Pretrain/Step Time": 8.784266280010343} +{"Pretrain/Learning Rate": 3.707611719919224e-05, "Pretrain/Loss": 2.0147249698638916, "Pretrain/Loss (Raw)": 2.0875911712646484, "Pretrain/Step": 3427, "Pretrain/Step Time": 8.780942445620894} +{"Pretrain/Learning Rate": 3.706868280659234e-05, "Pretrain/Loss": 2.012922763824463, "Pretrain/Loss (Raw)": 2.0799524784088135, "Pretrain/Step": 3428, "Pretrain/Step Time": 8.776908064261079} +{"Pretrain/Learning Rate": 3.7061247022175064e-05, "Pretrain/Loss": 2.0124287605285645, "Pretrain/Loss (Raw)": 2.1013741493225098, "Pretrain/Step": 3429, "Pretrain/Step Time": 8.780698496848345} +{"Pretrain/Learning Rate": 3.705380984679795e-05, "Pretrain/Loss": 2.0107834339141846, "Pretrain/Loss (Raw)": 1.8337393999099731, "Pretrain/Step": 3430, "Pretrain/Step Time": 8.780104016885161} +{"Pretrain/Learning Rate": 3.704637128131868e-05, "Pretrain/Loss": 2.014116048812866, "Pretrain/Loss (Raw)": 1.9601337909698486, "Pretrain/Step": 3431, "Pretrain/Step Time": 8.77857413701713} +{"Pretrain/Learning Rate": 3.7038931326595115e-05, "Pretrain/Loss": 2.0137853622436523, "Pretrain/Loss (Raw)": 1.9666748046875, "Pretrain/Step": 3432, "Pretrain/Step Time": 8.780282597988844} +{"Pretrain/Learning Rate": 3.703148998348526e-05, "Pretrain/Loss": 2.013545036315918, "Pretrain/Loss (Raw)": 2.0936837196350098, "Pretrain/Step": 3433, "Pretrain/Step Time": 8.78192838653922} +{"Pretrain/Learning Rate": 3.702404725284728e-05, "Pretrain/Loss": 2.0140433311462402, "Pretrain/Loss (Raw)": 2.2438864707946777, "Pretrain/Step": 3434, "Pretrain/Step Time": 8.779909746721387} +{"Pretrain/Learning Rate": 3.7016603135539524e-05, "Pretrain/Loss": 2.0146560668945312, "Pretrain/Loss (Raw)": 2.012366533279419, "Pretrain/Step": 3435, "Pretrain/Step Time": 8.779506044462323} +{"Pretrain/Learning Rate": 3.700915763242046e-05, "Pretrain/Loss": 2.015821695327759, "Pretrain/Loss (Raw)": 2.1315207481384277, "Pretrain/Step": 3436, "Pretrain/Step Time": 8.777028324082494} +{"Pretrain/Learning Rate": 3.700171074434876e-05, "Pretrain/Loss": 2.0153331756591797, "Pretrain/Loss (Raw)": 2.083677291870117, "Pretrain/Step": 3437, "Pretrain/Step Time": 8.79338201135397} +{"Pretrain/Learning Rate": 3.699426247218321e-05, "Pretrain/Loss": 2.0146496295928955, "Pretrain/Loss (Raw)": 2.0847179889678955, "Pretrain/Step": 3438, "Pretrain/Step Time": 8.79449736699462} +{"Pretrain/Learning Rate": 3.69868128167828e-05, "Pretrain/Loss": 2.0151329040527344, "Pretrain/Loss (Raw)": 2.2870497703552246, "Pretrain/Step": 3439, "Pretrain/Step Time": 8.800961751490831} +{"Pretrain/Learning Rate": 3.697936177900665e-05, "Pretrain/Loss": 2.014030933380127, "Pretrain/Loss (Raw)": 2.0485801696777344, "Pretrain/Step": 3440, "Pretrain/Step Time": 8.802494786679745} +{"Pretrain/Learning Rate": 3.697190935971405e-05, "Pretrain/Loss": 2.013453722000122, "Pretrain/Loss (Raw)": 1.8668638467788696, "Pretrain/Step": 3441, "Pretrain/Step Time": 8.799122858792543} +{"Pretrain/Learning Rate": 3.696445555976445e-05, "Pretrain/Loss": 2.0145978927612305, "Pretrain/Loss (Raw)": 2.1181082725524902, "Pretrain/Step": 3442, "Pretrain/Step Time": 8.795497860759497} +{"Pretrain/Learning Rate": 3.695700038001746e-05, "Pretrain/Loss": 2.0151987075805664, "Pretrain/Loss (Raw)": 1.9363652467727661, "Pretrain/Step": 3443, "Pretrain/Step Time": 8.800821242854} +{"Pretrain/Learning Rate": 3.694954382133284e-05, "Pretrain/Loss": 2.0146446228027344, "Pretrain/Loss (Raw)": 2.064363479614258, "Pretrain/Step": 3444, "Pretrain/Step Time": 8.799515118822455} +{"Pretrain/Learning Rate": 3.694208588457051e-05, "Pretrain/Loss": 2.0166397094726562, "Pretrain/Loss (Raw)": 2.0977370738983154, "Pretrain/Step": 3445, "Pretrain/Step Time": 8.807692876085639} +{"Pretrain/Learning Rate": 3.693462657059058e-05, "Pretrain/Loss": 2.0176491737365723, "Pretrain/Loss (Raw)": 1.9997565746307373, "Pretrain/Step": 3446, "Pretrain/Step Time": 8.809077193960547} +{"Pretrain/Learning Rate": 3.6927165880253266e-05, "Pretrain/Loss": 2.0181164741516113, "Pretrain/Loss (Raw)": 2.107645034790039, "Pretrain/Step": 3447, "Pretrain/Step Time": 8.799644324928522} +{"Pretrain/Learning Rate": 3.691970381441898e-05, "Pretrain/Loss": 2.0184037685394287, "Pretrain/Loss (Raw)": 2.0583817958831787, "Pretrain/Step": 3448, "Pretrain/Step Time": 8.79890539124608} +{"Pretrain/Learning Rate": 3.691224037394828e-05, "Pretrain/Loss": 2.018862247467041, "Pretrain/Loss (Raw)": 2.0981287956237793, "Pretrain/Step": 3449, "Pretrain/Step Time": 8.8060437515378} +{"Pretrain/Learning Rate": 3.69047755597019e-05, "Pretrain/Loss": 2.0178442001342773, "Pretrain/Loss (Raw)": 1.996813416481018, "Pretrain/Step": 3450, "Pretrain/Step Time": 8.799821119755507} +{"Pretrain/Learning Rate": 3.68973093725407e-05, "Pretrain/Loss": 2.0193352699279785, "Pretrain/Loss (Raw)": 2.1716928482055664, "Pretrain/Step": 3451, "Pretrain/Step Time": 8.79529444500804} +{"Pretrain/Learning Rate": 3.688984181332572e-05, "Pretrain/Loss": 2.019749641418457, "Pretrain/Loss (Raw)": 2.0961289405822754, "Pretrain/Step": 3452, "Pretrain/Step Time": 8.799138437956572} +{"Pretrain/Learning Rate": 3.688237288291815e-05, "Pretrain/Loss": 2.019061326980591, "Pretrain/Loss (Raw)": 1.9355583190917969, "Pretrain/Step": 3453, "Pretrain/Step Time": 8.797183772549033} +{"Pretrain/Learning Rate": 3.687490258217935e-05, "Pretrain/Loss": 2.0191211700439453, "Pretrain/Loss (Raw)": 2.101832866668701, "Pretrain/Step": 3454, "Pretrain/Step Time": 8.794907934963703} +{"Pretrain/Learning Rate": 3.6867430911970824e-05, "Pretrain/Loss": 2.019030809402466, "Pretrain/Loss (Raw)": 2.044585704803467, "Pretrain/Step": 3455, "Pretrain/Step Time": 8.79801375977695} +{"Pretrain/Learning Rate": 3.6859957873154256e-05, "Pretrain/Loss": 2.0213723182678223, "Pretrain/Loss (Raw)": 2.3862528800964355, "Pretrain/Step": 3456, "Pretrain/Step Time": 8.807847710326314} +{"Pretrain/Learning Rate": 3.6852483466591447e-05, "Pretrain/Loss": 2.020235776901245, "Pretrain/Loss (Raw)": 2.007417917251587, "Pretrain/Step": 3457, "Pretrain/Step Time": 8.809693640097976} +{"Pretrain/Learning Rate": 3.6845007693144404e-05, "Pretrain/Loss": 2.0200929641723633, "Pretrain/Loss (Raw)": 2.018954038619995, "Pretrain/Step": 3458, "Pretrain/Step Time": 8.817482421174645} +{"Pretrain/Learning Rate": 3.683753055367526e-05, "Pretrain/Loss": 2.02004337310791, "Pretrain/Loss (Raw)": 2.0288262367248535, "Pretrain/Step": 3459, "Pretrain/Step Time": 8.816123094409704} +{"Pretrain/Learning Rate": 3.68300520490463e-05, "Pretrain/Loss": 2.0202653408050537, "Pretrain/Loss (Raw)": 1.8700761795043945, "Pretrain/Step": 3460, "Pretrain/Step Time": 8.813511604443192} +{"Pretrain/Learning Rate": 3.682257218012e-05, "Pretrain/Loss": 2.020970344543457, "Pretrain/Loss (Raw)": 2.13999605178833, "Pretrain/Step": 3461, "Pretrain/Step Time": 8.823657255619764} +{"Pretrain/Learning Rate": 3.6815090947758966e-05, "Pretrain/Loss": 2.0216078758239746, "Pretrain/Loss (Raw)": 1.9679960012435913, "Pretrain/Step": 3462, "Pretrain/Step Time": 8.960324831306934} +{"Pretrain/Learning Rate": 3.6807608352825975e-05, "Pretrain/Loss": 2.0237298011779785, "Pretrain/Loss (Raw)": 1.98125159740448, "Pretrain/Step": 3463, "Pretrain/Step Time": 8.95169679261744} +{"Pretrain/Learning Rate": 3.680012439618394e-05, "Pretrain/Loss": 2.0236878395080566, "Pretrain/Loss (Raw)": 2.0225629806518555, "Pretrain/Step": 3464, "Pretrain/Step Time": 8.95129805803299} +{"Pretrain/Learning Rate": 3.679263907869596e-05, "Pretrain/Loss": 2.0233922004699707, "Pretrain/Loss (Raw)": 1.999761700630188, "Pretrain/Step": 3465, "Pretrain/Step Time": 8.956971433013678} +{"Pretrain/Learning Rate": 3.678515240122527e-05, "Pretrain/Loss": 2.0214076042175293, "Pretrain/Loss (Raw)": 1.883959174156189, "Pretrain/Step": 3466, "Pretrain/Step Time": 8.9543795324862} +{"Pretrain/Learning Rate": 3.677766436463527e-05, "Pretrain/Loss": 2.022987127304077, "Pretrain/Loss (Raw)": 2.107267379760742, "Pretrain/Step": 3467, "Pretrain/Step Time": 8.952371748164296} +{"Pretrain/Learning Rate": 3.677017496978952e-05, "Pretrain/Loss": 2.0202791690826416, "Pretrain/Loss (Raw)": 1.7391084432601929, "Pretrain/Step": 3468, "Pretrain/Step Time": 8.956792211160064} +{"Pretrain/Learning Rate": 3.6762684217551735e-05, "Pretrain/Loss": 2.0225586891174316, "Pretrain/Loss (Raw)": 2.062668561935425, "Pretrain/Step": 3469, "Pretrain/Step Time": 8.95478581264615} +{"Pretrain/Learning Rate": 3.675519210878577e-05, "Pretrain/Loss": 2.0225398540496826, "Pretrain/Loss (Raw)": 2.0309596061706543, "Pretrain/Step": 3470, "Pretrain/Step Time": 9.010321363806725} +{"Pretrain/Learning Rate": 3.6747698644355664e-05, "Pretrain/Loss": 2.0240936279296875, "Pretrain/Loss (Raw)": 2.1538116931915283, "Pretrain/Step": 3471, "Pretrain/Step Time": 9.00525394640863} +{"Pretrain/Learning Rate": 3.674020382512559e-05, "Pretrain/Loss": 2.0241408348083496, "Pretrain/Loss (Raw)": 1.7000584602355957, "Pretrain/Step": 3472, "Pretrain/Step Time": 9.031873542815447} +{"Pretrain/Learning Rate": 3.673270765195989e-05, "Pretrain/Loss": 2.022280693054199, "Pretrain/Loss (Raw)": 1.9372221231460571, "Pretrain/Step": 3473, "Pretrain/Step Time": 9.036718105897307} +{"Pretrain/Learning Rate": 3.672521012572307e-05, "Pretrain/Loss": 2.0221409797668457, "Pretrain/Loss (Raw)": 2.1466400623321533, "Pretrain/Step": 3474, "Pretrain/Step Time": 9.03218556754291} +{"Pretrain/Learning Rate": 3.671771124727975e-05, "Pretrain/Loss": 2.022463798522949, "Pretrain/Loss (Raw)": 2.019821882247925, "Pretrain/Step": 3475, "Pretrain/Step Time": 9.0385597422719} +{"Pretrain/Learning Rate": 3.671021101749476e-05, "Pretrain/Loss": 2.0193395614624023, "Pretrain/Loss (Raw)": 1.6189340353012085, "Pretrain/Step": 3476, "Pretrain/Step Time": 9.042009456083179} +{"Pretrain/Learning Rate": 3.670270943723305e-05, "Pretrain/Loss": 2.0202736854553223, "Pretrain/Loss (Raw)": 2.0413360595703125, "Pretrain/Step": 3477, "Pretrain/Step Time": 9.040857449173927} +{"Pretrain/Learning Rate": 3.669520650735975e-05, "Pretrain/Loss": 2.019155979156494, "Pretrain/Loss (Raw)": 1.851149082183838, "Pretrain/Step": 3478, "Pretrain/Step Time": 9.041905496269464} +{"Pretrain/Learning Rate": 3.668770222874012e-05, "Pretrain/Loss": 2.0182464122772217, "Pretrain/Loss (Raw)": 2.020763397216797, "Pretrain/Step": 3479, "Pretrain/Step Time": 9.039763120934367} +{"Pretrain/Learning Rate": 3.6680196602239596e-05, "Pretrain/Loss": 2.0214133262634277, "Pretrain/Loss (Raw)": 1.8324054479599, "Pretrain/Step": 3480, "Pretrain/Step Time": 9.03967484459281} +{"Pretrain/Learning Rate": 3.667268962872376e-05, "Pretrain/Loss": 2.0181195735931396, "Pretrain/Loss (Raw)": 1.7911816835403442, "Pretrain/Step": 3481, "Pretrain/Step Time": 9.036928717046976} +{"Pretrain/Learning Rate": 3.666518130905836e-05, "Pretrain/Loss": 2.0172157287597656, "Pretrain/Loss (Raw)": 1.769668459892273, "Pretrain/Step": 3482, "Pretrain/Step Time": 9.040628651157022} +{"Pretrain/Learning Rate": 3.665767164410928e-05, "Pretrain/Loss": 2.0157017707824707, "Pretrain/Loss (Raw)": 1.9627463817596436, "Pretrain/Step": 3483, "Pretrain/Step Time": 9.03424571827054} +{"Pretrain/Learning Rate": 3.665016063474257e-05, "Pretrain/Loss": 2.014258861541748, "Pretrain/Loss (Raw)": 2.058671236038208, "Pretrain/Step": 3484, "Pretrain/Step Time": 9.036788465455174} +{"Pretrain/Learning Rate": 3.664264828182444e-05, "Pretrain/Loss": 2.0130677223205566, "Pretrain/Loss (Raw)": 1.9682297706604004, "Pretrain/Step": 3485, "Pretrain/Step Time": 9.035619320347905} +{"Pretrain/Learning Rate": 3.663513458622124e-05, "Pretrain/Loss": 2.0114824771881104, "Pretrain/Loss (Raw)": 1.9314368963241577, "Pretrain/Step": 3486, "Pretrain/Step Time": 9.047271218150854} +{"Pretrain/Learning Rate": 3.662761954879951e-05, "Pretrain/Loss": 2.011137008666992, "Pretrain/Loss (Raw)": 2.0584089756011963, "Pretrain/Step": 3487, "Pretrain/Step Time": 9.045498423278332} +{"Pretrain/Learning Rate": 3.662010317042589e-05, "Pretrain/Loss": 2.010108232498169, "Pretrain/Loss (Raw)": 1.8820512294769287, "Pretrain/Step": 3488, "Pretrain/Step Time": 9.045074295252562} +{"Pretrain/Learning Rate": 3.661258545196722e-05, "Pretrain/Loss": 2.011294364929199, "Pretrain/Loss (Raw)": 2.0519893169403076, "Pretrain/Step": 3489, "Pretrain/Step Time": 9.047355618327856} +{"Pretrain/Learning Rate": 3.6605066394290476e-05, "Pretrain/Loss": 2.0098235607147217, "Pretrain/Loss (Raw)": 1.9508923292160034, "Pretrain/Step": 3490, "Pretrain/Step Time": 9.034846439957619} +{"Pretrain/Learning Rate": 3.659754599826279e-05, "Pretrain/Loss": 2.011960506439209, "Pretrain/Loss (Raw)": 2.0570273399353027, "Pretrain/Step": 3491, "Pretrain/Step Time": 9.040217757225037} +{"Pretrain/Learning Rate": 3.659002426475145e-05, "Pretrain/Loss": 2.0127196311950684, "Pretrain/Loss (Raw)": 2.0302369594573975, "Pretrain/Step": 3492, "Pretrain/Step Time": 9.036304352805018} +{"Pretrain/Learning Rate": 3.65825011946239e-05, "Pretrain/Loss": 2.013593912124634, "Pretrain/Loss (Raw)": 2.109490156173706, "Pretrain/Step": 3493, "Pretrain/Step Time": 9.035262070596218} +{"Pretrain/Learning Rate": 3.6574976788747725e-05, "Pretrain/Loss": 2.0130672454833984, "Pretrain/Loss (Raw)": 1.790318489074707, "Pretrain/Step": 3494, "Pretrain/Step Time": 9.033282598480582} +{"Pretrain/Learning Rate": 3.6567451047990696e-05, "Pretrain/Loss": 2.013624668121338, "Pretrain/Loss (Raw)": 2.072277307510376, "Pretrain/Step": 3495, "Pretrain/Step Time": 9.03341175802052} +{"Pretrain/Learning Rate": 3.6559923973220695e-05, "Pretrain/Loss": 2.012730121612549, "Pretrain/Loss (Raw)": 1.8121215105056763, "Pretrain/Step": 3496, "Pretrain/Step Time": 9.028784485533834} +{"Pretrain/Learning Rate": 3.65523955653058e-05, "Pretrain/Loss": 2.0133543014526367, "Pretrain/Loss (Raw)": 2.117391347885132, "Pretrain/Step": 3497, "Pretrain/Step Time": 9.028132194653153} +{"Pretrain/Learning Rate": 3.65448658251142e-05, "Pretrain/Loss": 2.010399341583252, "Pretrain/Loss (Raw)": 1.6129502058029175, "Pretrain/Step": 3498, "Pretrain/Step Time": 9.021370336413383} +{"Pretrain/Learning Rate": 3.653733475351428e-05, "Pretrain/Loss": 2.0141775608062744, "Pretrain/Loss (Raw)": 2.4752368927001953, "Pretrain/Step": 3499, "Pretrain/Step Time": 9.02468060143292} +{"Pretrain/Learning Rate": 3.6529802351374545e-05, "Pretrain/Loss": 2.0150814056396484, "Pretrain/Loss (Raw)": 1.7114109992980957, "Pretrain/Step": 3500, "Pretrain/Step Time": 9.026330566033721} +{"Pretrain/Learning Rate": 3.652226861956368e-05, "Pretrain/Loss": 2.014096736907959, "Pretrain/Loss (Raw)": 1.843189001083374, "Pretrain/Step": 3501, "Pretrain/Step Time": 9.028524965047836} +{"Pretrain/Learning Rate": 3.65147335589505e-05, "Pretrain/Loss": 2.0143933296203613, "Pretrain/Loss (Raw)": 2.093141794204712, "Pretrain/Step": 3502, "Pretrain/Step Time": 9.02744485810399} +{"Pretrain/Learning Rate": 3.650719717040398e-05, "Pretrain/Loss": 2.0120534896850586, "Pretrain/Loss (Raw)": 1.9418818950653076, "Pretrain/Step": 3503, "Pretrain/Step Time": 9.025556672364473} +{"Pretrain/Learning Rate": 3.649965945479326e-05, "Pretrain/Loss": 2.0101637840270996, "Pretrain/Loss (Raw)": 1.9259024858474731, "Pretrain/Step": 3504, "Pretrain/Step Time": 9.025526076555252} +{"Pretrain/Learning Rate": 3.649212041298763e-05, "Pretrain/Loss": 2.0111465454101562, "Pretrain/Loss (Raw)": 2.018224000930786, "Pretrain/Step": 3505, "Pretrain/Step Time": 9.027794571593404} +{"Pretrain/Learning Rate": 3.648458004585652e-05, "Pretrain/Loss": 2.0094332695007324, "Pretrain/Loss (Raw)": 1.9386953115463257, "Pretrain/Step": 3506, "Pretrain/Step Time": 9.021042365580797} +{"Pretrain/Learning Rate": 3.647703835426952e-05, "Pretrain/Loss": 2.008639335632324, "Pretrain/Loss (Raw)": 1.9698671102523804, "Pretrain/Step": 3507, "Pretrain/Step Time": 9.029913820326328} +{"Pretrain/Learning Rate": 3.646949533909637e-05, "Pretrain/Loss": 2.0073704719543457, "Pretrain/Loss (Raw)": 2.0348281860351562, "Pretrain/Step": 3508, "Pretrain/Step Time": 9.032666575163603} +{"Pretrain/Learning Rate": 3.646195100120698e-05, "Pretrain/Loss": 2.010824203491211, "Pretrain/Loss (Raw)": 2.3337554931640625, "Pretrain/Step": 3509, "Pretrain/Step Time": 9.031678151339293} +{"Pretrain/Learning Rate": 3.645440534147139e-05, "Pretrain/Loss": 2.0102384090423584, "Pretrain/Loss (Raw)": 1.8869829177856445, "Pretrain/Step": 3510, "Pretrain/Step Time": 9.03232898004353} +{"Pretrain/Learning Rate": 3.644685836075979e-05, "Pretrain/Loss": 2.0102505683898926, "Pretrain/Loss (Raw)": 1.9228508472442627, "Pretrain/Step": 3511, "Pretrain/Step Time": 9.040581349283457} +{"Pretrain/Learning Rate": 3.643931005994255e-05, "Pretrain/Loss": 2.013676643371582, "Pretrain/Loss (Raw)": 2.4284451007843018, "Pretrain/Step": 3512, "Pretrain/Step Time": 9.038976769894361} +{"Pretrain/Learning Rate": 3.643176043989018e-05, "Pretrain/Loss": 2.0151472091674805, "Pretrain/Loss (Raw)": 2.09548020362854, "Pretrain/Step": 3513, "Pretrain/Step Time": 9.037991356104612} +{"Pretrain/Learning Rate": 3.6424209501473314e-05, "Pretrain/Loss": 2.0124869346618652, "Pretrain/Loss (Raw)": 1.9475566148757935, "Pretrain/Step": 3514, "Pretrain/Step Time": 9.038861159235239} +{"Pretrain/Learning Rate": 3.641665724556278e-05, "Pretrain/Loss": 2.0109755992889404, "Pretrain/Loss (Raw)": 1.8873555660247803, "Pretrain/Step": 3515, "Pretrain/Step Time": 9.037207920104265} +{"Pretrain/Learning Rate": 3.6409103673029535e-05, "Pretrain/Loss": 2.0119128227233887, "Pretrain/Loss (Raw)": 2.180330276489258, "Pretrain/Step": 3516, "Pretrain/Step Time": 9.033918879926205} +{"Pretrain/Learning Rate": 3.64015487847447e-05, "Pretrain/Loss": 2.011443614959717, "Pretrain/Loss (Raw)": 1.8635276556015015, "Pretrain/Step": 3517, "Pretrain/Step Time": 9.04730854742229} +{"Pretrain/Learning Rate": 3.6393992581579526e-05, "Pretrain/Loss": 2.0121045112609863, "Pretrain/Loss (Raw)": 2.1131882667541504, "Pretrain/Step": 3518, "Pretrain/Step Time": 9.049207216128707} +{"Pretrain/Learning Rate": 3.638643506440544e-05, "Pretrain/Loss": 2.012761116027832, "Pretrain/Loss (Raw)": 2.1090023517608643, "Pretrain/Step": 3519, "Pretrain/Step Time": 9.051356680691242} +{"Pretrain/Learning Rate": 3.6378876234094014e-05, "Pretrain/Loss": 2.0137243270874023, "Pretrain/Loss (Raw)": 2.177889108657837, "Pretrain/Step": 3520, "Pretrain/Step Time": 9.048118779435754} +{"Pretrain/Learning Rate": 3.6371316091516955e-05, "Pretrain/Loss": 2.0098700523376465, "Pretrain/Loss (Raw)": 1.5366359949111938, "Pretrain/Step": 3521, "Pretrain/Step Time": 9.05300309509039} +{"Pretrain/Learning Rate": 3.636375463754614e-05, "Pretrain/Loss": 2.0111849308013916, "Pretrain/Loss (Raw)": 2.210395336151123, "Pretrain/Step": 3522, "Pretrain/Step Time": 9.055777754634619} +{"Pretrain/Learning Rate": 3.6356191873053594e-05, "Pretrain/Loss": 2.0120315551757812, "Pretrain/Loss (Raw)": 2.1556286811828613, "Pretrain/Step": 3523, "Pretrain/Step Time": 9.054517328739166} +{"Pretrain/Learning Rate": 3.634862779891148e-05, "Pretrain/Loss": 2.012892246246338, "Pretrain/Loss (Raw)": 2.0006303787231445, "Pretrain/Step": 3524, "Pretrain/Step Time": 9.056911865249276} +{"Pretrain/Learning Rate": 3.634106241599215e-05, "Pretrain/Loss": 2.0147671699523926, "Pretrain/Loss (Raw)": 2.233825445175171, "Pretrain/Step": 3525, "Pretrain/Step Time": 9.055973680689931} +{"Pretrain/Learning Rate": 3.633349572516805e-05, "Pretrain/Loss": 2.0144810676574707, "Pretrain/Loss (Raw)": 2.0091092586517334, "Pretrain/Step": 3526, "Pretrain/Step Time": 9.056675348430872} +{"Pretrain/Learning Rate": 3.632592772731182e-05, "Pretrain/Loss": 2.0139822959899902, "Pretrain/Loss (Raw)": 1.9495831727981567, "Pretrain/Step": 3527, "Pretrain/Step Time": 9.058090817183256} +{"Pretrain/Learning Rate": 3.631835842329624e-05, "Pretrain/Loss": 2.0118162631988525, "Pretrain/Loss (Raw)": 1.9266612529754639, "Pretrain/Step": 3528, "Pretrain/Step Time": 9.052186140790582} +{"Pretrain/Learning Rate": 3.6310787813994226e-05, "Pretrain/Loss": 2.0138425827026367, "Pretrain/Loss (Raw)": 2.1461057662963867, "Pretrain/Step": 3529, "Pretrain/Step Time": 9.052941270172596} +{"Pretrain/Learning Rate": 3.6303215900278864e-05, "Pretrain/Loss": 2.011167526245117, "Pretrain/Loss (Raw)": 1.9967113733291626, "Pretrain/Step": 3530, "Pretrain/Step Time": 9.04619794152677} +{"Pretrain/Learning Rate": 3.629564268302338e-05, "Pretrain/Loss": 2.011932373046875, "Pretrain/Loss (Raw)": 2.0117287635803223, "Pretrain/Step": 3531, "Pretrain/Step Time": 9.047154134139419} +{"Pretrain/Learning Rate": 3.6288068163101156e-05, "Pretrain/Loss": 2.012277126312256, "Pretrain/Loss (Raw)": 1.960410714149475, "Pretrain/Step": 3532, "Pretrain/Step Time": 9.049808559939265} +{"Pretrain/Learning Rate": 3.628049234138572e-05, "Pretrain/Loss": 2.0113110542297363, "Pretrain/Loss (Raw)": 1.8843013048171997, "Pretrain/Step": 3533, "Pretrain/Step Time": 9.047368511557579} +{"Pretrain/Learning Rate": 3.6272915218750755e-05, "Pretrain/Loss": 2.0108392238616943, "Pretrain/Loss (Raw)": 2.006605386734009, "Pretrain/Step": 3534, "Pretrain/Step Time": 9.055240403860807} +{"Pretrain/Learning Rate": 3.6265336796070083e-05, "Pretrain/Loss": 2.011354923248291, "Pretrain/Loss (Raw)": 2.018038034439087, "Pretrain/Step": 3535, "Pretrain/Step Time": 9.055555116385221} +{"Pretrain/Learning Rate": 3.62577570742177e-05, "Pretrain/Loss": 2.0104074478149414, "Pretrain/Loss (Raw)": 1.8198879957199097, "Pretrain/Step": 3536, "Pretrain/Step Time": 9.052672946825624} +{"Pretrain/Learning Rate": 3.625017605406771e-05, "Pretrain/Loss": 2.0125083923339844, "Pretrain/Loss (Raw)": 2.2325682640075684, "Pretrain/Step": 3537, "Pretrain/Step Time": 9.046236608177423} +{"Pretrain/Learning Rate": 3.624259373649441e-05, "Pretrain/Loss": 2.0138754844665527, "Pretrain/Loss (Raw)": 2.0645792484283447, "Pretrain/Step": 3538, "Pretrain/Step Time": 9.056073119863868} +{"Pretrain/Learning Rate": 3.6235010122372214e-05, "Pretrain/Loss": 2.0122547149658203, "Pretrain/Loss (Raw)": 1.8422411680221558, "Pretrain/Step": 3539, "Pretrain/Step Time": 9.05461029522121} +{"Pretrain/Learning Rate": 3.6227425212575725e-05, "Pretrain/Loss": 2.0113086700439453, "Pretrain/Loss (Raw)": 2.014774799346924, "Pretrain/Step": 3540, "Pretrain/Step Time": 9.046339312568307} +{"Pretrain/Learning Rate": 3.621983900797964e-05, "Pretrain/Loss": 2.0109267234802246, "Pretrain/Loss (Raw)": 1.9940879344940186, "Pretrain/Step": 3541, "Pretrain/Step Time": 9.052221776917577} +{"Pretrain/Learning Rate": 3.621225150945886e-05, "Pretrain/Loss": 2.013094186782837, "Pretrain/Loss (Raw)": 2.1899893283843994, "Pretrain/Step": 3542, "Pretrain/Step Time": 9.050144702196121} +{"Pretrain/Learning Rate": 3.620466271788841e-05, "Pretrain/Loss": 2.0121474266052246, "Pretrain/Loss (Raw)": 1.906866431236267, "Pretrain/Step": 3543, "Pretrain/Step Time": 9.052178092300892} +{"Pretrain/Learning Rate": 3.6197072634143436e-05, "Pretrain/Loss": 2.0113306045532227, "Pretrain/Loss (Raw)": 1.9645991325378418, "Pretrain/Step": 3544, "Pretrain/Step Time": 9.0532451197505} +{"Pretrain/Learning Rate": 3.61894812590993e-05, "Pretrain/Loss": 2.011627674102783, "Pretrain/Loss (Raw)": 2.1882379055023193, "Pretrain/Step": 3545, "Pretrain/Step Time": 9.055135138332844} +{"Pretrain/Learning Rate": 3.6181888593631454e-05, "Pretrain/Loss": 2.0128583908081055, "Pretrain/Loss (Raw)": 2.1983816623687744, "Pretrain/Step": 3546, "Pretrain/Step Time": 9.04221767745912} +{"Pretrain/Learning Rate": 3.6174294638615524e-05, "Pretrain/Loss": 2.0109596252441406, "Pretrain/Loss (Raw)": 1.7733370065689087, "Pretrain/Step": 3547, "Pretrain/Step Time": 9.044060068204999} +{"Pretrain/Learning Rate": 3.616669939492728e-05, "Pretrain/Loss": 2.0113353729248047, "Pretrain/Loss (Raw)": 2.065598487854004, "Pretrain/Step": 3548, "Pretrain/Step Time": 9.047735761851072} +{"Pretrain/Learning Rate": 3.615910286344265e-05, "Pretrain/Loss": 2.0115959644317627, "Pretrain/Loss (Raw)": 2.0822651386260986, "Pretrain/Step": 3549, "Pretrain/Step Time": 9.047993630170822} +{"Pretrain/Learning Rate": 3.615150504503768e-05, "Pretrain/Loss": 2.0099825859069824, "Pretrain/Loss (Raw)": 1.6646121740341187, "Pretrain/Step": 3550, "Pretrain/Step Time": 9.049805607646704} +{"Pretrain/Learning Rate": 3.6143905940588616e-05, "Pretrain/Loss": 2.0090837478637695, "Pretrain/Loss (Raw)": 1.7277129888534546, "Pretrain/Step": 3551, "Pretrain/Step Time": 9.047376122325659} +{"Pretrain/Learning Rate": 3.613630555097179e-05, "Pretrain/Loss": 2.0100600719451904, "Pretrain/Loss (Raw)": 2.126950740814209, "Pretrain/Step": 3552, "Pretrain/Step Time": 9.04701648838818} +{"Pretrain/Learning Rate": 3.6128703877063755e-05, "Pretrain/Loss": 2.009218215942383, "Pretrain/Loss (Raw)": 1.9625872373580933, "Pretrain/Step": 3553, "Pretrain/Step Time": 9.045260926708579} +{"Pretrain/Learning Rate": 3.6121100919741126e-05, "Pretrain/Loss": 2.0078649520874023, "Pretrain/Loss (Raw)": 1.9371318817138672, "Pretrain/Step": 3554, "Pretrain/Step Time": 9.043410576879978} +{"Pretrain/Learning Rate": 3.611349667988074e-05, "Pretrain/Loss": 2.0075125694274902, "Pretrain/Loss (Raw)": 2.042466640472412, "Pretrain/Step": 3555, "Pretrain/Step Time": 9.045648952946067} +{"Pretrain/Learning Rate": 3.6105891158359563e-05, "Pretrain/Loss": 2.006692886352539, "Pretrain/Loss (Raw)": 1.9750381708145142, "Pretrain/Step": 3556, "Pretrain/Step Time": 9.04284536652267} +{"Pretrain/Learning Rate": 3.6098284356054666e-05, "Pretrain/Loss": 2.0071747303009033, "Pretrain/Loss (Raw)": 2.1630537509918213, "Pretrain/Step": 3557, "Pretrain/Step Time": 9.041654899716377} +{"Pretrain/Learning Rate": 3.609067627384333e-05, "Pretrain/Loss": 2.008495330810547, "Pretrain/Loss (Raw)": 2.0027916431427, "Pretrain/Step": 3558, "Pretrain/Step Time": 9.061642415821552} +{"Pretrain/Learning Rate": 3.608306691260295e-05, "Pretrain/Loss": 2.009591579437256, "Pretrain/Loss (Raw)": 2.100464344024658, "Pretrain/Step": 3559, "Pretrain/Step Time": 9.05639804713428} +{"Pretrain/Learning Rate": 3.607545627321106e-05, "Pretrain/Loss": 2.0098371505737305, "Pretrain/Loss (Raw)": 1.998103141784668, "Pretrain/Step": 3560, "Pretrain/Step Time": 9.05531338788569} +{"Pretrain/Learning Rate": 3.606784435654536e-05, "Pretrain/Loss": 2.008815288543701, "Pretrain/Loss (Raw)": 1.9628750085830688, "Pretrain/Step": 3561, "Pretrain/Step Time": 9.050450513139367} +{"Pretrain/Learning Rate": 3.6060231163483704e-05, "Pretrain/Loss": 2.0058748722076416, "Pretrain/Loss (Raw)": 1.8675092458724976, "Pretrain/Step": 3562, "Pretrain/Step Time": 9.048605214804411} +{"Pretrain/Learning Rate": 3.6052616694904066e-05, "Pretrain/Loss": 2.007591724395752, "Pretrain/Loss (Raw)": 2.232119560241699, "Pretrain/Step": 3563, "Pretrain/Step Time": 9.048281457275152} +{"Pretrain/Learning Rate": 3.60450009516846e-05, "Pretrain/Loss": 2.0070853233337402, "Pretrain/Loss (Raw)": 2.066690683364868, "Pretrain/Step": 3564, "Pretrain/Step Time": 9.048095166683197} +{"Pretrain/Learning Rate": 3.603738393470357e-05, "Pretrain/Loss": 2.006842613220215, "Pretrain/Loss (Raw)": 2.052617073059082, "Pretrain/Step": 3565, "Pretrain/Step Time": 9.034595172852278} +{"Pretrain/Learning Rate": 3.6029765644839416e-05, "Pretrain/Loss": 2.006261110305786, "Pretrain/Loss (Raw)": 2.0102944374084473, "Pretrain/Step": 3566, "Pretrain/Step Time": 9.039996076375246} +{"Pretrain/Learning Rate": 3.602214608297071e-05, "Pretrain/Loss": 2.003429412841797, "Pretrain/Loss (Raw)": 1.9245749711990356, "Pretrain/Step": 3567, "Pretrain/Step Time": 9.039361242204905} +{"Pretrain/Learning Rate": 3.601452524997619e-05, "Pretrain/Loss": 2.0015716552734375, "Pretrain/Loss (Raw)": 1.810809850692749, "Pretrain/Step": 3568, "Pretrain/Step Time": 9.1084038708359} +{"Pretrain/Learning Rate": 3.600690314673471e-05, "Pretrain/Loss": 2.002288341522217, "Pretrain/Loss (Raw)": 1.9585893154144287, "Pretrain/Step": 3569, "Pretrain/Step Time": 9.106522465124726} +{"Pretrain/Learning Rate": 3.599927977412529e-05, "Pretrain/Loss": 2.0019736289978027, "Pretrain/Loss (Raw)": 2.0778093338012695, "Pretrain/Step": 3570, "Pretrain/Step Time": 9.10631744377315} +{"Pretrain/Learning Rate": 3.59916551330271e-05, "Pretrain/Loss": 2.002110004425049, "Pretrain/Loss (Raw)": 1.9538421630859375, "Pretrain/Step": 3571, "Pretrain/Step Time": 9.106908740475774} +{"Pretrain/Learning Rate": 3.598402922431944e-05, "Pretrain/Loss": 2.001162528991699, "Pretrain/Loss (Raw)": 1.9430782794952393, "Pretrain/Step": 3572, "Pretrain/Step Time": 9.113751366734505} +{"Pretrain/Learning Rate": 3.5976402048881786e-05, "Pretrain/Loss": 2.001904010772705, "Pretrain/Loss (Raw)": 2.1926515102386475, "Pretrain/Step": 3573, "Pretrain/Step Time": 9.107250100001693} +{"Pretrain/Learning Rate": 3.596877360759371e-05, "Pretrain/Loss": 2.001861095428467, "Pretrain/Loss (Raw)": 1.994249701499939, "Pretrain/Step": 3574, "Pretrain/Step Time": 9.10955110564828} +{"Pretrain/Learning Rate": 3.5961143901334984e-05, "Pretrain/Loss": 2.0000643730163574, "Pretrain/Loss (Raw)": 1.8776791095733643, "Pretrain/Step": 3575, "Pretrain/Step Time": 9.11055645160377} +{"Pretrain/Learning Rate": 3.5953512930985486e-05, "Pretrain/Loss": 2.0018603801727295, "Pretrain/Loss (Raw)": 2.2882614135742188, "Pretrain/Step": 3576, "Pretrain/Step Time": 9.117223866283894} +{"Pretrain/Learning Rate": 3.594588069742527e-05, "Pretrain/Loss": 2.0000412464141846, "Pretrain/Loss (Raw)": 1.8652830123901367, "Pretrain/Step": 3577, "Pretrain/Step Time": 9.115668440237641} +{"Pretrain/Learning Rate": 3.5938247201534505e-05, "Pretrain/Loss": 1.9999058246612549, "Pretrain/Loss (Raw)": 1.9794769287109375, "Pretrain/Step": 3578, "Pretrain/Step Time": 9.118156092241406} +{"Pretrain/Learning Rate": 3.5930612444193535e-05, "Pretrain/Loss": 1.9985417127609253, "Pretrain/Loss (Raw)": 1.9970840215682983, "Pretrain/Step": 3579, "Pretrain/Step Time": 9.11496538668871} +{"Pretrain/Learning Rate": 3.592297642628283e-05, "Pretrain/Loss": 1.9978193044662476, "Pretrain/Loss (Raw)": 2.0036473274230957, "Pretrain/Step": 3580, "Pretrain/Step Time": 9.11426393315196} +{"Pretrain/Learning Rate": 3.5915339148683005e-05, "Pretrain/Loss": 1.9997066259384155, "Pretrain/Loss (Raw)": 2.177157402038574, "Pretrain/Step": 3581, "Pretrain/Step Time": 9.114786896854639} +{"Pretrain/Learning Rate": 3.590770061227484e-05, "Pretrain/Loss": 1.9997079372406006, "Pretrain/Loss (Raw)": 2.1019985675811768, "Pretrain/Step": 3582, "Pretrain/Step Time": 9.112538633868098} +{"Pretrain/Learning Rate": 3.590006081793925e-05, "Pretrain/Loss": 1.9989326000213623, "Pretrain/Loss (Raw)": 1.9453397989273071, "Pretrain/Step": 3583, "Pretrain/Step Time": 9.115310441702604} +{"Pretrain/Learning Rate": 3.589241976655727e-05, "Pretrain/Loss": 1.9963293075561523, "Pretrain/Loss (Raw)": 2.0530307292938232, "Pretrain/Step": 3584, "Pretrain/Step Time": 9.09702805802226} +{"Pretrain/Learning Rate": 3.588477745901013e-05, "Pretrain/Loss": 1.9973456859588623, "Pretrain/Loss (Raw)": 2.1375210285186768, "Pretrain/Step": 3585, "Pretrain/Step Time": 9.09652559272945} +{"Pretrain/Learning Rate": 3.587713389617916e-05, "Pretrain/Loss": 1.9972925186157227, "Pretrain/Loss (Raw)": 2.0121512413024902, "Pretrain/Step": 3586, "Pretrain/Step Time": 9.09239218197763} +{"Pretrain/Learning Rate": 3.5869489078945845e-05, "Pretrain/Loss": 1.9974677562713623, "Pretrain/Loss (Raw)": 2.0512516498565674, "Pretrain/Step": 3587, "Pretrain/Step Time": 9.090846901759505} +{"Pretrain/Learning Rate": 3.586184300819184e-05, "Pretrain/Loss": 1.9988601207733154, "Pretrain/Loss (Raw)": 2.0482804775238037, "Pretrain/Step": 3588, "Pretrain/Step Time": 9.087756974622607} +{"Pretrain/Learning Rate": 3.585419568479891e-05, "Pretrain/Loss": 1.9974794387817383, "Pretrain/Loss (Raw)": 1.9632809162139893, "Pretrain/Step": 3589, "Pretrain/Step Time": 9.07739139534533} +{"Pretrain/Learning Rate": 3.584654710964899e-05, "Pretrain/Loss": 1.9983502626419067, "Pretrain/Loss (Raw)": 2.079458475112915, "Pretrain/Step": 3590, "Pretrain/Step Time": 8.945214098319411} +{"Pretrain/Learning Rate": 3.583889728362414e-05, "Pretrain/Loss": 1.9980127811431885, "Pretrain/Loss (Raw)": 1.9380476474761963, "Pretrain/Step": 3591, "Pretrain/Step Time": 8.949322370812297} +{"Pretrain/Learning Rate": 3.583124620760659e-05, "Pretrain/Loss": 1.9945974349975586, "Pretrain/Loss (Raw)": 1.5854076147079468, "Pretrain/Step": 3592, "Pretrain/Step Time": 8.95212502963841} +{"Pretrain/Learning Rate": 3.582359388247869e-05, "Pretrain/Loss": 1.9960993528366089, "Pretrain/Loss (Raw)": 2.1920101642608643, "Pretrain/Step": 3593, "Pretrain/Step Time": 8.951534409075975} +{"Pretrain/Learning Rate": 3.581594030912294e-05, "Pretrain/Loss": 1.9978018999099731, "Pretrain/Loss (Raw)": 2.101881980895996, "Pretrain/Step": 3594, "Pretrain/Step Time": 8.951546741649508} +{"Pretrain/Learning Rate": 3.580828548842198e-05, "Pretrain/Loss": 1.9983646869659424, "Pretrain/Loss (Raw)": 2.1793041229248047, "Pretrain/Step": 3595, "Pretrain/Step Time": 8.950952729210258} +{"Pretrain/Learning Rate": 3.5800629421258606e-05, "Pretrain/Loss": 1.9980272054672241, "Pretrain/Loss (Raw)": 1.6958997249603271, "Pretrain/Step": 3596, "Pretrain/Step Time": 8.955172777175903} +{"Pretrain/Learning Rate": 3.579297210851576e-05, "Pretrain/Loss": 1.9974497556686401, "Pretrain/Loss (Raw)": 1.9887782335281372, "Pretrain/Step": 3597, "Pretrain/Step Time": 8.952277347445488} +{"Pretrain/Learning Rate": 3.5785313551076505e-05, "Pretrain/Loss": 1.998488187789917, "Pretrain/Loss (Raw)": 2.1638615131378174, "Pretrain/Step": 3598, "Pretrain/Step Time": 8.89553226903081} +{"Pretrain/Learning Rate": 3.577765374982408e-05, "Pretrain/Loss": 1.9970648288726807, "Pretrain/Loss (Raw)": 1.9716248512268066, "Pretrain/Step": 3599, "Pretrain/Step Time": 8.900333473458886} +{"Pretrain/Learning Rate": 3.576999270564183e-05, "Pretrain/Loss": 2.000155448913574, "Pretrain/Loss (Raw)": 2.0956475734710693, "Pretrain/Step": 3600, "Pretrain/Step Time": 8.875564334914088} +{"Pretrain/Learning Rate": 3.5762330419413273e-05, "Pretrain/Loss": 2.0018744468688965, "Pretrain/Loss (Raw)": 2.1572577953338623, "Pretrain/Step": 3601, "Pretrain/Step Time": 8.871022842824459} +{"Pretrain/Learning Rate": 3.575466689202206e-05, "Pretrain/Loss": 2.0007333755493164, "Pretrain/Loss (Raw)": 2.0005946159362793, "Pretrain/Step": 3602, "Pretrain/Step Time": 8.873374696820974} +{"Pretrain/Learning Rate": 3.5747002124351986e-05, "Pretrain/Loss": 2.001955509185791, "Pretrain/Loss (Raw)": 2.176234722137451, "Pretrain/Step": 3603, "Pretrain/Step Time": 8.864855846390128} +{"Pretrain/Learning Rate": 3.573933611728698e-05, "Pretrain/Loss": 2.004606246948242, "Pretrain/Loss (Raw)": 1.9582500457763672, "Pretrain/Step": 3604, "Pretrain/Step Time": 8.964601393789053} +{"Pretrain/Learning Rate": 3.573166887171113e-05, "Pretrain/Loss": 2.0047249794006348, "Pretrain/Loss (Raw)": 2.056534767150879, "Pretrain/Step": 3605, "Pretrain/Step Time": 8.968410938978195} +{"Pretrain/Learning Rate": 3.5724000388508655e-05, "Pretrain/Loss": 2.0062456130981445, "Pretrain/Loss (Raw)": 2.0457828044891357, "Pretrain/Step": 3606, "Pretrain/Step Time": 8.965953029692173} +{"Pretrain/Learning Rate": 3.571633066856392e-05, "Pretrain/Loss": 2.006042957305908, "Pretrain/Loss (Raw)": 1.9948208332061768, "Pretrain/Step": 3607, "Pretrain/Step Time": 8.972780875861645} +{"Pretrain/Learning Rate": 3.570865971276144e-05, "Pretrain/Loss": 2.007523536682129, "Pretrain/Loss (Raw)": 2.0219290256500244, "Pretrain/Step": 3608, "Pretrain/Step Time": 8.97000383399427} +{"Pretrain/Learning Rate": 3.570098752198586e-05, "Pretrain/Loss": 2.009730339050293, "Pretrain/Loss (Raw)": 2.073664665222168, "Pretrain/Step": 3609, "Pretrain/Step Time": 8.98131806589663} +{"Pretrain/Learning Rate": 3.569331409712198e-05, "Pretrain/Loss": 2.0111703872680664, "Pretrain/Loss (Raw)": 1.9539954662322998, "Pretrain/Step": 3610, "Pretrain/Step Time": 8.978205990046263} +{"Pretrain/Learning Rate": 3.568563943905472e-05, "Pretrain/Loss": 2.011049270629883, "Pretrain/Loss (Raw)": 1.9472241401672363, "Pretrain/Step": 3611, "Pretrain/Step Time": 8.981239341199398} +{"Pretrain/Learning Rate": 3.5677963548669175e-05, "Pretrain/Loss": 2.0099563598632812, "Pretrain/Loss (Raw)": 1.9187554121017456, "Pretrain/Step": 3612, "Pretrain/Step Time": 8.978535065427423} +{"Pretrain/Learning Rate": 3.567028642685055e-05, "Pretrain/Loss": 2.0101218223571777, "Pretrain/Loss (Raw)": 1.9894630908966064, "Pretrain/Step": 3613, "Pretrain/Step Time": 8.975799573585391} +{"Pretrain/Learning Rate": 3.566260807448422e-05, "Pretrain/Loss": 2.011085033416748, "Pretrain/Loss (Raw)": 2.0547096729278564, "Pretrain/Step": 3614, "Pretrain/Step Time": 8.965249568223953} +{"Pretrain/Learning Rate": 3.565492849245568e-05, "Pretrain/Loss": 2.0108861923217773, "Pretrain/Loss (Raw)": 2.0329527854919434, "Pretrain/Step": 3615, "Pretrain/Step Time": 8.971762303262949} +{"Pretrain/Learning Rate": 3.564724768165058e-05, "Pretrain/Loss": 2.0120770931243896, "Pretrain/Loss (Raw)": 2.034486770629883, "Pretrain/Step": 3616, "Pretrain/Step Time": 8.963617807254195} +{"Pretrain/Learning Rate": 3.5639565642954705e-05, "Pretrain/Loss": 2.012044668197632, "Pretrain/Loss (Raw)": 2.0478427410125732, "Pretrain/Step": 3617, "Pretrain/Step Time": 8.964592916890979} +{"Pretrain/Learning Rate": 3.563188237725399e-05, "Pretrain/Loss": 2.013309955596924, "Pretrain/Loss (Raw)": 2.1128482818603516, "Pretrain/Step": 3618, "Pretrain/Step Time": 8.962983587756753} +{"Pretrain/Learning Rate": 3.562419788543449e-05, "Pretrain/Loss": 2.0124459266662598, "Pretrain/Loss (Raw)": 1.9464576244354248, "Pretrain/Step": 3619, "Pretrain/Step Time": 8.959622910246253} +{"Pretrain/Learning Rate": 3.561651216838243e-05, "Pretrain/Loss": 2.012991428375244, "Pretrain/Loss (Raw)": 2.100022077560425, "Pretrain/Step": 3620, "Pretrain/Step Time": 8.963794628158212} +{"Pretrain/Learning Rate": 3.560882522698417e-05, "Pretrain/Loss": 2.0131211280822754, "Pretrain/Loss (Raw)": 2.1260719299316406, "Pretrain/Step": 3621, "Pretrain/Step Time": 8.963433150202036} +{"Pretrain/Learning Rate": 3.560113706212618e-05, "Pretrain/Loss": 2.012449264526367, "Pretrain/Loss (Raw)": 1.7043581008911133, "Pretrain/Step": 3622, "Pretrain/Step Time": 8.965027904137969} +{"Pretrain/Learning Rate": 3.559344767469512e-05, "Pretrain/Loss": 2.0109777450561523, "Pretrain/Loss (Raw)": 1.883908987045288, "Pretrain/Step": 3623, "Pretrain/Step Time": 8.965522360056639} +{"Pretrain/Learning Rate": 3.5585757065577755e-05, "Pretrain/Loss": 2.0137686729431152, "Pretrain/Loss (Raw)": 2.169386863708496, "Pretrain/Step": 3624, "Pretrain/Step Time": 8.967234762385488} +{"Pretrain/Learning Rate": 3.557806523566099e-05, "Pretrain/Loss": 2.012112617492676, "Pretrain/Loss (Raw)": 1.9054101705551147, "Pretrain/Step": 3625, "Pretrain/Step Time": 8.968924162909389} +{"Pretrain/Learning Rate": 3.557037218583191e-05, "Pretrain/Loss": 2.017456531524658, "Pretrain/Loss (Raw)": 2.2969627380371094, "Pretrain/Step": 3626, "Pretrain/Step Time": 8.975348357111216} +{"Pretrain/Learning Rate": 3.5562677916977704e-05, "Pretrain/Loss": 2.015340805053711, "Pretrain/Loss (Raw)": 2.204430341720581, "Pretrain/Step": 3627, "Pretrain/Step Time": 8.972257673740387} +{"Pretrain/Learning Rate": 3.55549824299857e-05, "Pretrain/Loss": 2.0186104774475098, "Pretrain/Loss (Raw)": 2.1299352645874023, "Pretrain/Step": 3628, "Pretrain/Step Time": 8.974188717082143} +{"Pretrain/Learning Rate": 3.554728572574339e-05, "Pretrain/Loss": 2.0202507972717285, "Pretrain/Loss (Raw)": 2.0531177520751953, "Pretrain/Step": 3629, "Pretrain/Step Time": 8.977265127003193} +{"Pretrain/Learning Rate": 3.5539587805138385e-05, "Pretrain/Loss": 2.0192482471466064, "Pretrain/Loss (Raw)": 1.964816927909851, "Pretrain/Step": 3630, "Pretrain/Step Time": 8.984422504901886} +{"Pretrain/Learning Rate": 3.5531888669058455e-05, "Pretrain/Loss": 2.019648790359497, "Pretrain/Loss (Raw)": 1.9931604862213135, "Pretrain/Step": 3631, "Pretrain/Step Time": 8.981635749340057} +{"Pretrain/Learning Rate": 3.552418831839149e-05, "Pretrain/Loss": 2.021759033203125, "Pretrain/Loss (Raw)": 2.196023464202881, "Pretrain/Step": 3632, "Pretrain/Step Time": 8.986113350838423} +{"Pretrain/Learning Rate": 3.551648675402554e-05, "Pretrain/Loss": 2.0223798751831055, "Pretrain/Loss (Raw)": 2.09770131111145, "Pretrain/Step": 3633, "Pretrain/Step Time": 8.984692119061947} +{"Pretrain/Learning Rate": 3.550878397684878e-05, "Pretrain/Loss": 2.024085760116577, "Pretrain/Loss (Raw)": 2.157028913497925, "Pretrain/Step": 3634, "Pretrain/Step Time": 8.985779717564583} +{"Pretrain/Learning Rate": 3.5501079987749535e-05, "Pretrain/Loss": 2.021775245666504, "Pretrain/Loss (Raw)": 1.6741324663162231, "Pretrain/Step": 3635, "Pretrain/Step Time": 8.97742953337729} +{"Pretrain/Learning Rate": 3.549337478761626e-05, "Pretrain/Loss": 2.0203490257263184, "Pretrain/Loss (Raw)": 1.852280616760254, "Pretrain/Step": 3636, "Pretrain/Step Time": 8.971211198717356} +{"Pretrain/Learning Rate": 3.548566837733756e-05, "Pretrain/Loss": 2.0185933113098145, "Pretrain/Loss (Raw)": 2.1090211868286133, "Pretrain/Step": 3637, "Pretrain/Step Time": 8.968660734593868} +{"Pretrain/Learning Rate": 3.547796075780218e-05, "Pretrain/Loss": 2.020592212677002, "Pretrain/Loss (Raw)": 2.1428351402282715, "Pretrain/Step": 3638, "Pretrain/Step Time": 8.974152874201536} +{"Pretrain/Learning Rate": 3.547025192989898e-05, "Pretrain/Loss": 2.020146369934082, "Pretrain/Loss (Raw)": 1.8657902479171753, "Pretrain/Step": 3639, "Pretrain/Step Time": 8.9634500592947} +{"Pretrain/Learning Rate": 3.546254189451699e-05, "Pretrain/Loss": 2.0164103507995605, "Pretrain/Loss (Raw)": 1.9502360820770264, "Pretrain/Step": 3640, "Pretrain/Step Time": 8.964207885786891} +{"Pretrain/Learning Rate": 3.5454830652545374e-05, "Pretrain/Loss": 2.0170140266418457, "Pretrain/Loss (Raw)": 2.172741651535034, "Pretrain/Step": 3641, "Pretrain/Step Time": 8.969515772536397} +{"Pretrain/Learning Rate": 3.544711820487343e-05, "Pretrain/Loss": 2.0171852111816406, "Pretrain/Loss (Raw)": 1.9694485664367676, "Pretrain/Step": 3642, "Pretrain/Step Time": 8.970309058204293} +{"Pretrain/Learning Rate": 3.543940455239057e-05, "Pretrain/Loss": 2.019259452819824, "Pretrain/Loss (Raw)": 2.1528878211975098, "Pretrain/Step": 3643, "Pretrain/Step Time": 8.968124927952886} +{"Pretrain/Learning Rate": 3.543168969598639e-05, "Pretrain/Loss": 2.018620729446411, "Pretrain/Loss (Raw)": 2.0985515117645264, "Pretrain/Step": 3644, "Pretrain/Step Time": 9.123604437336326} +{"Pretrain/Learning Rate": 3.54239736365506e-05, "Pretrain/Loss": 2.0154519081115723, "Pretrain/Loss (Raw)": 1.4579110145568848, "Pretrain/Step": 3645, "Pretrain/Step Time": 9.107796300202608} +{"Pretrain/Learning Rate": 3.541625637497306e-05, "Pretrain/Loss": 2.0149598121643066, "Pretrain/Loss (Raw)": 2.050215005874634, "Pretrain/Step": 3646, "Pretrain/Step Time": 9.108298918232322} +{"Pretrain/Learning Rate": 3.540853791214373e-05, "Pretrain/Loss": 2.0157179832458496, "Pretrain/Loss (Raw)": 2.2060630321502686, "Pretrain/Step": 3647, "Pretrain/Step Time": 9.111536072567105} +{"Pretrain/Learning Rate": 3.5400818248952786e-05, "Pretrain/Loss": 2.0156848430633545, "Pretrain/Loss (Raw)": 2.1736338138580322, "Pretrain/Step": 3648, "Pretrain/Step Time": 9.114232467487454} +{"Pretrain/Learning Rate": 3.539309738629045e-05, "Pretrain/Loss": 2.017413854598999, "Pretrain/Loss (Raw)": 1.7579495906829834, "Pretrain/Step": 3649, "Pretrain/Step Time": 9.109924187883735} +{"Pretrain/Learning Rate": 3.5385375325047166e-05, "Pretrain/Loss": 2.0134174823760986, "Pretrain/Loss (Raw)": 1.6988599300384521, "Pretrain/Step": 3650, "Pretrain/Step Time": 9.103388464078307} +{"Pretrain/Learning Rate": 3.537765206611345e-05, "Pretrain/Loss": 2.011220932006836, "Pretrain/Loss (Raw)": 1.8744536638259888, "Pretrain/Step": 3651, "Pretrain/Step Time": 9.105795677751303} +{"Pretrain/Learning Rate": 3.536992761038001e-05, "Pretrain/Loss": 2.0109848976135254, "Pretrain/Loss (Raw)": 1.970420002937317, "Pretrain/Step": 3652, "Pretrain/Step Time": 9.100959597155452} +{"Pretrain/Learning Rate": 3.536220195873764e-05, "Pretrain/Loss": 2.0108284950256348, "Pretrain/Loss (Raw)": 2.213826894760132, "Pretrain/Step": 3653, "Pretrain/Step Time": 9.104211661964655} +{"Pretrain/Learning Rate": 3.535447511207731e-05, "Pretrain/Loss": 2.0087215900421143, "Pretrain/Loss (Raw)": 1.7394078969955444, "Pretrain/Step": 3654, "Pretrain/Step Time": 9.316856745630503} +{"Pretrain/Learning Rate": 3.534674707129013e-05, "Pretrain/Loss": 2.0094408988952637, "Pretrain/Loss (Raw)": 2.0416812896728516, "Pretrain/Step": 3655, "Pretrain/Step Time": 9.315315695479512} +{"Pretrain/Learning Rate": 3.5339017837267316e-05, "Pretrain/Loss": 2.0097756385803223, "Pretrain/Loss (Raw)": 1.9694819450378418, "Pretrain/Step": 3656, "Pretrain/Step Time": 9.343562182039022} +{"Pretrain/Learning Rate": 3.5331287410900246e-05, "Pretrain/Loss": 2.0097241401672363, "Pretrain/Loss (Raw)": 2.1395342350006104, "Pretrain/Step": 3657, "Pretrain/Step Time": 9.342166233807802} +{"Pretrain/Learning Rate": 3.532355579308043e-05, "Pretrain/Loss": 2.010180950164795, "Pretrain/Loss (Raw)": 2.0551586151123047, "Pretrain/Step": 3658, "Pretrain/Step Time": 9.347140487283468} +{"Pretrain/Learning Rate": 3.531582298469952e-05, "Pretrain/Loss": 2.011699676513672, "Pretrain/Loss (Raw)": 2.206131935119629, "Pretrain/Step": 3659, "Pretrain/Step Time": 9.349332531914115} +{"Pretrain/Learning Rate": 3.530808898664928e-05, "Pretrain/Loss": 2.009584665298462, "Pretrain/Loss (Raw)": 1.6896766424179077, "Pretrain/Step": 3660, "Pretrain/Step Time": 9.359627407044172} +{"Pretrain/Learning Rate": 3.530035379982166e-05, "Pretrain/Loss": 2.0102179050445557, "Pretrain/Loss (Raw)": 1.9653912782669067, "Pretrain/Step": 3661, "Pretrain/Step Time": 9.36212907731533} +{"Pretrain/Learning Rate": 3.5292617425108694e-05, "Pretrain/Loss": 2.0112462043762207, "Pretrain/Loss (Raw)": 2.1382102966308594, "Pretrain/Step": 3662, "Pretrain/Step Time": 9.357451479882002} +{"Pretrain/Learning Rate": 3.5284879863402585e-05, "Pretrain/Loss": 2.0116171836853027, "Pretrain/Loss (Raw)": 2.065511465072632, "Pretrain/Step": 3663, "Pretrain/Step Time": 9.35814537666738} +{"Pretrain/Learning Rate": 3.527714111559567e-05, "Pretrain/Loss": 2.0131335258483887, "Pretrain/Loss (Raw)": 2.0139856338500977, "Pretrain/Step": 3664, "Pretrain/Step Time": 9.359564121812582} +{"Pretrain/Learning Rate": 3.526940118258041e-05, "Pretrain/Loss": 2.010796546936035, "Pretrain/Loss (Raw)": 1.933448076248169, "Pretrain/Step": 3665, "Pretrain/Step Time": 9.360514653846622} +{"Pretrain/Learning Rate": 3.526166006524942e-05, "Pretrain/Loss": 2.010236978530884, "Pretrain/Loss (Raw)": 1.9929442405700684, "Pretrain/Step": 3666, "Pretrain/Step Time": 9.351391652598977} +{"Pretrain/Learning Rate": 3.525391776449544e-05, "Pretrain/Loss": 2.01163911819458, "Pretrain/Loss (Raw)": 2.021699905395508, "Pretrain/Step": 3667, "Pretrain/Step Time": 9.350732769817114} +{"Pretrain/Learning Rate": 3.5246174281211344e-05, "Pretrain/Loss": 2.0095763206481934, "Pretrain/Loss (Raw)": 1.7507413625717163, "Pretrain/Step": 3668, "Pretrain/Step Time": 9.358286548405886} +{"Pretrain/Learning Rate": 3.523842961629014e-05, "Pretrain/Loss": 2.009979724884033, "Pretrain/Loss (Raw)": 2.0457379817962646, "Pretrain/Step": 3669, "Pretrain/Step Time": 9.34900344349444} +{"Pretrain/Learning Rate": 3.5230683770624987e-05, "Pretrain/Loss": 2.0092897415161133, "Pretrain/Loss (Raw)": 2.101677417755127, "Pretrain/Step": 3670, "Pretrain/Step Time": 9.353154636919498} +{"Pretrain/Learning Rate": 3.522293674510918e-05, "Pretrain/Loss": 2.008441925048828, "Pretrain/Loss (Raw)": 1.7983344793319702, "Pretrain/Step": 3671, "Pretrain/Step Time": 9.350386887788773} +{"Pretrain/Learning Rate": 3.5215188540636134e-05, "Pretrain/Loss": 2.009734630584717, "Pretrain/Loss (Raw)": 2.1300642490386963, "Pretrain/Step": 3672, "Pretrain/Step Time": 9.347553921863437} +{"Pretrain/Learning Rate": 3.520743915809941e-05, "Pretrain/Loss": 2.009204626083374, "Pretrain/Loss (Raw)": 2.1203958988189697, "Pretrain/Step": 3673, "Pretrain/Step Time": 9.344758683815598} +{"Pretrain/Learning Rate": 3.51996885983927e-05, "Pretrain/Loss": 2.0069587230682373, "Pretrain/Loss (Raw)": 1.9109251499176025, "Pretrain/Step": 3674, "Pretrain/Step Time": 9.346223009750247} +{"Pretrain/Learning Rate": 3.519193686240984e-05, "Pretrain/Loss": 2.0077767372131348, "Pretrain/Loss (Raw)": 1.878041386604309, "Pretrain/Step": 3675, "Pretrain/Step Time": 9.348229676485062} +{"Pretrain/Learning Rate": 3.51841839510448e-05, "Pretrain/Loss": 2.007065773010254, "Pretrain/Loss (Raw)": 1.9745984077453613, "Pretrain/Step": 3676, "Pretrain/Step Time": 9.343692837283015} +{"Pretrain/Learning Rate": 3.517642986519167e-05, "Pretrain/Loss": 2.007206916809082, "Pretrain/Loss (Raw)": 2.1003475189208984, "Pretrain/Step": 3677, "Pretrain/Step Time": 9.348138626664877} +{"Pretrain/Learning Rate": 3.51686746057447e-05, "Pretrain/Loss": 2.0102245807647705, "Pretrain/Loss (Raw)": 2.050840377807617, "Pretrain/Step": 3678, "Pretrain/Step Time": 9.348708031699061} +{"Pretrain/Learning Rate": 3.516091817359825e-05, "Pretrain/Loss": 2.0126266479492188, "Pretrain/Loss (Raw)": 2.0352001190185547, "Pretrain/Step": 3679, "Pretrain/Step Time": 9.351873705163598} +{"Pretrain/Learning Rate": 3.515316056964684e-05, "Pretrain/Loss": 2.0113110542297363, "Pretrain/Loss (Raw)": 1.9585627317428589, "Pretrain/Step": 3680, "Pretrain/Step Time": 9.348700335249305} +{"Pretrain/Learning Rate": 3.5145401794785116e-05, "Pretrain/Loss": 2.0123109817504883, "Pretrain/Loss (Raw)": 2.0905749797821045, "Pretrain/Step": 3681, "Pretrain/Step Time": 9.399852082133293} +{"Pretrain/Learning Rate": 3.5137641849907844e-05, "Pretrain/Loss": 2.0137860774993896, "Pretrain/Loss (Raw)": 2.1259262561798096, "Pretrain/Step": 3682, "Pretrain/Step Time": 9.393255930393934} +{"Pretrain/Learning Rate": 3.5129880735909945e-05, "Pretrain/Loss": 2.0141916275024414, "Pretrain/Loss (Raw)": 2.094393491744995, "Pretrain/Step": 3683, "Pretrain/Step Time": 9.39962163567543} +{"Pretrain/Learning Rate": 3.512211845368647e-05, "Pretrain/Loss": 2.014613389968872, "Pretrain/Loss (Raw)": 2.028993844985962, "Pretrain/Step": 3684, "Pretrain/Step Time": 9.40221786312759} +{"Pretrain/Learning Rate": 3.511435500413259e-05, "Pretrain/Loss": 2.0125465393066406, "Pretrain/Loss (Raw)": 1.8984992504119873, "Pretrain/Step": 3685, "Pretrain/Step Time": 9.402251988649368} +{"Pretrain/Learning Rate": 3.510659038814364e-05, "Pretrain/Loss": 2.013178825378418, "Pretrain/Loss (Raw)": 2.0837554931640625, "Pretrain/Step": 3686, "Pretrain/Step Time": 9.38886678405106} +{"Pretrain/Learning Rate": 3.509882460661506e-05, "Pretrain/Loss": 2.0130538940429688, "Pretrain/Loss (Raw)": 2.0844762325286865, "Pretrain/Step": 3687, "Pretrain/Step Time": 9.39132278971374} +{"Pretrain/Learning Rate": 3.5091057660442434e-05, "Pretrain/Loss": 2.0119681358337402, "Pretrain/Loss (Raw)": 1.8591184616088867, "Pretrain/Step": 3688, "Pretrain/Step Time": 9.39174940995872} +{"Pretrain/Learning Rate": 3.5083289550521495e-05, "Pretrain/Loss": 2.0123534202575684, "Pretrain/Loss (Raw)": 2.0121750831604004, "Pretrain/Step": 3689, "Pretrain/Step Time": 9.399860266596079} +{"Pretrain/Learning Rate": 3.507552027774809e-05, "Pretrain/Loss": 2.0136499404907227, "Pretrain/Loss (Raw)": 2.0334603786468506, "Pretrain/Step": 3690, "Pretrain/Step Time": 9.402136409655213} +{"Pretrain/Learning Rate": 3.5067749843018205e-05, "Pretrain/Loss": 2.013511896133423, "Pretrain/Loss (Raw)": 2.214461088180542, "Pretrain/Step": 3691, "Pretrain/Step Time": 9.401651728898287} +{"Pretrain/Learning Rate": 3.5059978247227965e-05, "Pretrain/Loss": 2.0125110149383545, "Pretrain/Loss (Raw)": 1.938565731048584, "Pretrain/Step": 3692, "Pretrain/Step Time": 9.399515835568309} +{"Pretrain/Learning Rate": 3.505220549127364e-05, "Pretrain/Loss": 2.0124950408935547, "Pretrain/Loss (Raw)": 2.0505664348602295, "Pretrain/Step": 3693, "Pretrain/Step Time": 9.40059620141983} +{"Pretrain/Learning Rate": 3.50444315760516e-05, "Pretrain/Loss": 2.0119528770446777, "Pretrain/Loss (Raw)": 1.9409202337265015, "Pretrain/Step": 3694, "Pretrain/Step Time": 9.394076224416494} +{"Pretrain/Learning Rate": 3.503665650245838e-05, "Pretrain/Loss": 2.0127148628234863, "Pretrain/Loss (Raw)": 2.022097587585449, "Pretrain/Step": 3695, "Pretrain/Step Time": 9.396932777017355} +{"Pretrain/Learning Rate": 3.502888027139065e-05, "Pretrain/Loss": 2.0150232315063477, "Pretrain/Loss (Raw)": 2.1062958240509033, "Pretrain/Step": 3696, "Pretrain/Step Time": 9.32709557004273} +{"Pretrain/Learning Rate": 3.502110288374517e-05, "Pretrain/Loss": 2.0155982971191406, "Pretrain/Loss (Raw)": 2.0321860313415527, "Pretrain/Step": 3697, "Pretrain/Step Time": 9.33057575672865} +{"Pretrain/Learning Rate": 3.50133243404189e-05, "Pretrain/Loss": 2.0155203342437744, "Pretrain/Loss (Raw)": 2.067819356918335, "Pretrain/Step": 3698, "Pretrain/Step Time": 9.331868896260858} +{"Pretrain/Learning Rate": 3.5005544642308874e-05, "Pretrain/Loss": 2.0161890983581543, "Pretrain/Loss (Raw)": 2.03944730758667, "Pretrain/Step": 3699, "Pretrain/Step Time": 9.324686786159873} +{"Pretrain/Learning Rate": 3.49977637903123e-05, "Pretrain/Loss": 2.01708984375, "Pretrain/Loss (Raw)": 2.0583598613739014, "Pretrain/Step": 3700, "Pretrain/Step Time": 9.321838924661279} +{"Pretrain/Learning Rate": 3.4989981785326485e-05, "Pretrain/Loss": 2.015072822570801, "Pretrain/Loss (Raw)": 1.934488296508789, "Pretrain/Step": 3701, "Pretrain/Step Time": 9.321192905306816} +{"Pretrain/Learning Rate": 3.498219862824891e-05, "Pretrain/Loss": 2.014799118041992, "Pretrain/Loss (Raw)": 1.959206461906433, "Pretrain/Step": 3702, "Pretrain/Step Time": 9.321094373241067} +{"Pretrain/Learning Rate": 3.497441431997714e-05, "Pretrain/Loss": 2.014068841934204, "Pretrain/Loss (Raw)": 1.784230351448059, "Pretrain/Step": 3703, "Pretrain/Step Time": 9.320636339485645} +{"Pretrain/Learning Rate": 3.4966628861408914e-05, "Pretrain/Loss": 2.012463092803955, "Pretrain/Loss (Raw)": 2.0827314853668213, "Pretrain/Step": 3704, "Pretrain/Step Time": 9.33378753438592} +{"Pretrain/Learning Rate": 3.495884225344208e-05, "Pretrain/Loss": 2.014418125152588, "Pretrain/Loss (Raw)": 2.1154885292053223, "Pretrain/Step": 3705, "Pretrain/Step Time": 9.334479687735438} +{"Pretrain/Learning Rate": 3.495105449697463e-05, "Pretrain/Loss": 2.0140297412872314, "Pretrain/Loss (Raw)": 1.9297786951065063, "Pretrain/Step": 3706, "Pretrain/Step Time": 9.338471915572882} +{"Pretrain/Learning Rate": 3.494326559290469e-05, "Pretrain/Loss": 2.0154099464416504, "Pretrain/Loss (Raw)": 2.173787832260132, "Pretrain/Step": 3707, "Pretrain/Step Time": 9.348906641826034} +{"Pretrain/Learning Rate": 3.4935475542130505e-05, "Pretrain/Loss": 2.016540050506592, "Pretrain/Loss (Raw)": 2.1482527256011963, "Pretrain/Step": 3708, "Pretrain/Step Time": 9.343696121126413} +{"Pretrain/Learning Rate": 3.492768434555046e-05, "Pretrain/Loss": 2.0164685249328613, "Pretrain/Loss (Raw)": 2.168027877807617, "Pretrain/Step": 3709, "Pretrain/Step Time": 9.346368849277496} +{"Pretrain/Learning Rate": 3.4919892004063084e-05, "Pretrain/Loss": 2.01461124420166, "Pretrain/Loss (Raw)": 1.864249348640442, "Pretrain/Step": 3710, "Pretrain/Step Time": 9.344433715566993} +{"Pretrain/Learning Rate": 3.491209851856701e-05, "Pretrain/Loss": 2.0154383182525635, "Pretrain/Loss (Raw)": 2.051199197769165, "Pretrain/Step": 3711, "Pretrain/Step Time": 9.340044999495149} +{"Pretrain/Learning Rate": 3.490430388996103e-05, "Pretrain/Loss": 2.013789176940918, "Pretrain/Loss (Raw)": 1.841965675354004, "Pretrain/Step": 3712, "Pretrain/Step Time": 9.342438401654363} +{"Pretrain/Learning Rate": 3.4896508119144056e-05, "Pretrain/Loss": 2.0118675231933594, "Pretrain/Loss (Raw)": 1.8915197849273682, "Pretrain/Step": 3713, "Pretrain/Step Time": 9.346155250445008} +{"Pretrain/Learning Rate": 3.4888711207015124e-05, "Pretrain/Loss": 2.0122294425964355, "Pretrain/Loss (Raw)": 2.0584795475006104, "Pretrain/Step": 3714, "Pretrain/Step Time": 10.005266236141324} +{"Pretrain/Learning Rate": 3.488091315447343e-05, "Pretrain/Loss": 2.0101418495178223, "Pretrain/Loss (Raw)": 1.7840732336044312, "Pretrain/Step": 3715, "Pretrain/Step Time": 10.00560393370688} +{"Pretrain/Learning Rate": 3.487311396241826e-05, "Pretrain/Loss": 2.0071163177490234, "Pretrain/Loss (Raw)": 1.660967230796814, "Pretrain/Step": 3716, "Pretrain/Step Time": 10.004954647272825} +{"Pretrain/Learning Rate": 3.486531363174908e-05, "Pretrain/Loss": 2.0080502033233643, "Pretrain/Loss (Raw)": 2.082841396331787, "Pretrain/Step": 3717, "Pretrain/Step Time": 10.004065131768584} +{"Pretrain/Learning Rate": 3.4857512163365424e-05, "Pretrain/Loss": 2.0078351497650146, "Pretrain/Loss (Raw)": 2.0519227981567383, "Pretrain/Step": 3718, "Pretrain/Step Time": 10.000927744433284} +{"Pretrain/Learning Rate": 3.484970955816703e-05, "Pretrain/Loss": 2.010014057159424, "Pretrain/Loss (Raw)": 2.216975212097168, "Pretrain/Step": 3719, "Pretrain/Step Time": 10.001297375187278} +{"Pretrain/Learning Rate": 3.484190581705371e-05, "Pretrain/Loss": 2.0154523849487305, "Pretrain/Loss (Raw)": 2.2814831733703613, "Pretrain/Step": 3720, "Pretrain/Step Time": 9.995901448652148} +{"Pretrain/Learning Rate": 3.483410094092543e-05, "Pretrain/Loss": 2.0141234397888184, "Pretrain/Loss (Raw)": 2.021926164627075, "Pretrain/Step": 3721, "Pretrain/Step Time": 10.002537770196795} +{"Pretrain/Learning Rate": 3.48262949306823e-05, "Pretrain/Loss": 2.01385498046875, "Pretrain/Loss (Raw)": 2.067519187927246, "Pretrain/Step": 3722, "Pretrain/Step Time": 10.00243797712028} +{"Pretrain/Learning Rate": 3.481848778722453e-05, "Pretrain/Loss": 2.012115955352783, "Pretrain/Loss (Raw)": 1.9566974639892578, "Pretrain/Step": 3723, "Pretrain/Step Time": 10.000512531027198} +{"Pretrain/Learning Rate": 3.4810679511452484e-05, "Pretrain/Loss": 2.013850212097168, "Pretrain/Loss (Raw)": 1.9178982973098755, "Pretrain/Step": 3724, "Pretrain/Step Time": 9.99349539540708} +{"Pretrain/Learning Rate": 3.480287010426664e-05, "Pretrain/Loss": 2.0151138305664062, "Pretrain/Loss (Raw)": 2.1505234241485596, "Pretrain/Step": 3725, "Pretrain/Step Time": 9.997988699004054} +{"Pretrain/Learning Rate": 3.479505956656764e-05, "Pretrain/Loss": 2.01332950592041, "Pretrain/Loss (Raw)": 1.9354547262191772, "Pretrain/Step": 3726, "Pretrain/Step Time": 9.99756583571434} +{"Pretrain/Learning Rate": 3.47872478992562e-05, "Pretrain/Loss": 2.013916492462158, "Pretrain/Loss (Raw)": 2.0467395782470703, "Pretrain/Step": 3727, "Pretrain/Step Time": 9.993891121819615} +{"Pretrain/Learning Rate": 3.477943510323322e-05, "Pretrain/Loss": 2.013423442840576, "Pretrain/Loss (Raw)": 2.0325582027435303, "Pretrain/Step": 3728, "Pretrain/Step Time": 9.988251948729157} +{"Pretrain/Learning Rate": 3.4771621179399696e-05, "Pretrain/Loss": 2.014519214630127, "Pretrain/Loss (Raw)": 2.297495126724243, "Pretrain/Step": 3729, "Pretrain/Step Time": 9.986962754279375} +{"Pretrain/Learning Rate": 3.476380612865679e-05, "Pretrain/Loss": 2.0149176120758057, "Pretrain/Loss (Raw)": 2.051612615585327, "Pretrain/Step": 3730, "Pretrain/Step Time": 9.987513357773423} +{"Pretrain/Learning Rate": 3.475598995190572e-05, "Pretrain/Loss": 2.0132083892822266, "Pretrain/Loss (Raw)": 1.9574780464172363, "Pretrain/Step": 3731, "Pretrain/Step Time": 9.989519445225596} +{"Pretrain/Learning Rate": 3.4748172650047945e-05, "Pretrain/Loss": 2.014554738998413, "Pretrain/Loss (Raw)": 2.1305484771728516, "Pretrain/Step": 3732, "Pretrain/Step Time": 9.88677161745727} +{"Pretrain/Learning Rate": 3.474035422398496e-05, "Pretrain/Loss": 2.013124465942383, "Pretrain/Loss (Raw)": 1.873460054397583, "Pretrain/Step": 3733, "Pretrain/Step Time": 9.882034547626972} +{"Pretrain/Learning Rate": 3.473253467461842e-05, "Pretrain/Loss": 2.0129528045654297, "Pretrain/Loss (Raw)": 2.02380108833313, "Pretrain/Step": 3734, "Pretrain/Step Time": 9.881875034421682} +{"Pretrain/Learning Rate": 3.4724714002850125e-05, "Pretrain/Loss": 2.0141711235046387, "Pretrain/Loss (Raw)": 2.1508102416992188, "Pretrain/Step": 3735, "Pretrain/Step Time": 9.872725043445826} +{"Pretrain/Learning Rate": 3.471689220958198e-05, "Pretrain/Loss": 2.0127243995666504, "Pretrain/Loss (Raw)": 1.8367401361465454, "Pretrain/Step": 3736, "Pretrain/Step Time": 9.867635874077678} +{"Pretrain/Learning Rate": 3.470906929571605e-05, "Pretrain/Loss": 2.0124452114105225, "Pretrain/Loss (Raw)": 2.0379045009613037, "Pretrain/Step": 3737, "Pretrain/Step Time": 9.859617784619331} +{"Pretrain/Learning Rate": 3.470124526215449e-05, "Pretrain/Loss": 2.0117783546447754, "Pretrain/Loss (Raw)": 1.8686453104019165, "Pretrain/Step": 3738, "Pretrain/Step Time": 9.863652881234884} +{"Pretrain/Learning Rate": 3.469342010979962e-05, "Pretrain/Loss": 2.012045383453369, "Pretrain/Loss (Raw)": 1.9814257621765137, "Pretrain/Step": 3739, "Pretrain/Step Time": 9.862546106800437} +{"Pretrain/Learning Rate": 3.4685593839553856e-05, "Pretrain/Loss": 2.014806032180786, "Pretrain/Loss (Raw)": 2.272075653076172, "Pretrain/Step": 3740, "Pretrain/Step Time": 9.866185555234551} +{"Pretrain/Learning Rate": 3.467776645231978e-05, "Pretrain/Loss": 2.0146727561950684, "Pretrain/Loss (Raw)": 1.9724184274673462, "Pretrain/Step": 3741, "Pretrain/Step Time": 9.865926310420036} +{"Pretrain/Learning Rate": 3.466993794900007e-05, "Pretrain/Loss": 2.0155577659606934, "Pretrain/Loss (Raw)": 2.1680009365081787, "Pretrain/Step": 3742, "Pretrain/Step Time": 9.868329556658864} +{"Pretrain/Learning Rate": 3.466210833049755e-05, "Pretrain/Loss": 2.0148797035217285, "Pretrain/Loss (Raw)": 1.9461640119552612, "Pretrain/Step": 3743, "Pretrain/Step Time": 9.861009079962969} +{"Pretrain/Learning Rate": 3.465427759771516e-05, "Pretrain/Loss": 2.0120859146118164, "Pretrain/Loss (Raw)": 1.6768832206726074, "Pretrain/Step": 3744, "Pretrain/Step Time": 9.863737434148788} +{"Pretrain/Learning Rate": 3.464644575155599e-05, "Pretrain/Loss": 2.0119717121124268, "Pretrain/Loss (Raw)": 2.0332086086273193, "Pretrain/Step": 3745, "Pretrain/Step Time": 9.865499740466475} +{"Pretrain/Learning Rate": 3.463861279292324e-05, "Pretrain/Loss": 2.0113282203674316, "Pretrain/Loss (Raw)": 2.0304739475250244, "Pretrain/Step": 3746, "Pretrain/Step Time": 9.871928606182337} +{"Pretrain/Learning Rate": 3.4630778722720244e-05, "Pretrain/Loss": 2.0130550861358643, "Pretrain/Loss (Raw)": 2.167506217956543, "Pretrain/Step": 3747, "Pretrain/Step Time": 9.871214544400573} +{"Pretrain/Learning Rate": 3.462294354185046e-05, "Pretrain/Loss": 2.013075590133667, "Pretrain/Loss (Raw)": 2.102627754211426, "Pretrain/Step": 3748, "Pretrain/Step Time": 9.864620881155133} +{"Pretrain/Learning Rate": 3.4615107251217496e-05, "Pretrain/Loss": 2.0113914012908936, "Pretrain/Loss (Raw)": 1.910508632659912, "Pretrain/Step": 3749, "Pretrain/Step Time": 9.871930617839098} +{"Pretrain/Learning Rate": 3.460726985172504e-05, "Pretrain/Loss": 2.0141634941101074, "Pretrain/Loss (Raw)": 2.059185743331909, "Pretrain/Step": 3750, "Pretrain/Step Time": 9.877748060971498} +{"Pretrain/Learning Rate": 3.4599431344276966e-05, "Pretrain/Loss": 2.015984058380127, "Pretrain/Loss (Raw)": 2.1169300079345703, "Pretrain/Step": 3751, "Pretrain/Step Time": 9.873643349856138} +{"Pretrain/Learning Rate": 3.459159172977723e-05, "Pretrain/Loss": 2.0130348205566406, "Pretrain/Loss (Raw)": 1.7918834686279297, "Pretrain/Step": 3752, "Pretrain/Step Time": 9.872362293303013} +{"Pretrain/Learning Rate": 3.4583751009129936e-05, "Pretrain/Loss": 2.012643814086914, "Pretrain/Loss (Raw)": 1.8553706407546997, "Pretrain/Step": 3753, "Pretrain/Step Time": 9.874815559014678} +{"Pretrain/Learning Rate": 3.457590918323932e-05, "Pretrain/Loss": 2.0113677978515625, "Pretrain/Loss (Raw)": 2.1336326599121094, "Pretrain/Step": 3754, "Pretrain/Step Time": 9.869781976565719} +{"Pretrain/Learning Rate": 3.4568066253009736e-05, "Pretrain/Loss": 2.009199619293213, "Pretrain/Loss (Raw)": 1.926893711090088, "Pretrain/Step": 3755, "Pretrain/Step Time": 9.873504703864455} +{"Pretrain/Learning Rate": 3.456022221934566e-05, "Pretrain/Loss": 2.0078630447387695, "Pretrain/Loss (Raw)": 1.9588764905929565, "Pretrain/Step": 3756, "Pretrain/Step Time": 9.866357928141952} +{"Pretrain/Learning Rate": 3.455237708315171e-05, "Pretrain/Loss": 2.0072078704833984, "Pretrain/Loss (Raw)": 1.9692554473876953, "Pretrain/Step": 3757, "Pretrain/Step Time": 9.865426080301404} +{"Pretrain/Learning Rate": 3.454453084533262e-05, "Pretrain/Loss": 2.008549690246582, "Pretrain/Loss (Raw)": 2.1365740299224854, "Pretrain/Step": 3758, "Pretrain/Step Time": 9.857402736321092} +{"Pretrain/Learning Rate": 3.453668350679327e-05, "Pretrain/Loss": 2.009817600250244, "Pretrain/Loss (Raw)": 2.1554224491119385, "Pretrain/Step": 3759, "Pretrain/Step Time": 9.856962136924267} +{"Pretrain/Learning Rate": 3.4528835068438625e-05, "Pretrain/Loss": 2.0085501670837402, "Pretrain/Loss (Raw)": 2.0337975025177, "Pretrain/Step": 3760, "Pretrain/Step Time": 9.864257358014584} +{"Pretrain/Learning Rate": 3.452098553117382e-05, "Pretrain/Loss": 2.0051560401916504, "Pretrain/Loss (Raw)": 1.6632713079452515, "Pretrain/Step": 3761, "Pretrain/Step Time": 9.860960718244314} +{"Pretrain/Learning Rate": 3.4513134895904105e-05, "Pretrain/Loss": 2.003818988800049, "Pretrain/Loss (Raw)": 1.9858767986297607, "Pretrain/Step": 3762, "Pretrain/Step Time": 9.8672004211694} +{"Pretrain/Learning Rate": 3.450528316353484e-05, "Pretrain/Loss": 2.009092330932617, "Pretrain/Loss (Raw)": 2.3491079807281494, "Pretrain/Step": 3763, "Pretrain/Step Time": 9.867523798719049} +{"Pretrain/Learning Rate": 3.4497430334971534e-05, "Pretrain/Loss": 2.008481740951538, "Pretrain/Loss (Raw)": 1.7741382122039795, "Pretrain/Step": 3764, "Pretrain/Step Time": 9.870008362457156} +{"Pretrain/Learning Rate": 3.448957641111981e-05, "Pretrain/Loss": 2.0073447227478027, "Pretrain/Loss (Raw)": 1.9634628295898438, "Pretrain/Step": 3765, "Pretrain/Step Time": 9.879635060206056} +{"Pretrain/Learning Rate": 3.4481721392885414e-05, "Pretrain/Loss": 2.0062713623046875, "Pretrain/Loss (Raw)": 2.005469799041748, "Pretrain/Step": 3766, "Pretrain/Step Time": 9.873753586784005} +{"Pretrain/Learning Rate": 3.447386528117423e-05, "Pretrain/Loss": 2.007845878601074, "Pretrain/Loss (Raw)": 2.067333459854126, "Pretrain/Step": 3767, "Pretrain/Step Time": 9.868891136720777} +{"Pretrain/Learning Rate": 3.446600807689226e-05, "Pretrain/Loss": 2.00838565826416, "Pretrain/Loss (Raw)": 2.019310712814331, "Pretrain/Step": 3768, "Pretrain/Step Time": 9.87157586030662} +{"Pretrain/Learning Rate": 3.4458149780945636e-05, "Pretrain/Loss": 2.007927417755127, "Pretrain/Loss (Raw)": 2.1141109466552734, "Pretrain/Step": 3769, "Pretrain/Step Time": 9.869263332337141} +{"Pretrain/Learning Rate": 3.4450290394240606e-05, "Pretrain/Loss": 2.0080478191375732, "Pretrain/Loss (Raw)": 1.9848499298095703, "Pretrain/Step": 3770, "Pretrain/Step Time": 9.878944538533688} +{"Pretrain/Learning Rate": 3.444242991768356e-05, "Pretrain/Loss": 2.0079991817474365, "Pretrain/Loss (Raw)": 2.146651268005371, "Pretrain/Step": 3771, "Pretrain/Step Time": 9.879642777144909} +{"Pretrain/Learning Rate": 3.4434568352181e-05, "Pretrain/Loss": 2.0084142684936523, "Pretrain/Loss (Raw)": 2.1516835689544678, "Pretrain/Step": 3772, "Pretrain/Step Time": 9.722431510686874} +{"Pretrain/Learning Rate": 3.442670569863956e-05, "Pretrain/Loss": 2.012009859085083, "Pretrain/Loss (Raw)": 1.9181480407714844, "Pretrain/Step": 3773, "Pretrain/Step Time": 9.724004799500108} +{"Pretrain/Learning Rate": 3.4418841957965995e-05, "Pretrain/Loss": 2.013296127319336, "Pretrain/Loss (Raw)": 2.2148938179016113, "Pretrain/Step": 3774, "Pretrain/Step Time": 9.722174666821957} +{"Pretrain/Learning Rate": 3.44109771310672e-05, "Pretrain/Loss": 2.0101277828216553, "Pretrain/Loss (Raw)": 1.8004871606826782, "Pretrain/Step": 3775, "Pretrain/Step Time": 9.717222139239311} +{"Pretrain/Learning Rate": 3.440311121885018e-05, "Pretrain/Loss": 2.009459972381592, "Pretrain/Loss (Raw)": 2.088124990463257, "Pretrain/Step": 3776, "Pretrain/Step Time": 9.719836186617613} +{"Pretrain/Learning Rate": 3.4395244222222054e-05, "Pretrain/Loss": 2.012202501296997, "Pretrain/Loss (Raw)": 2.109025001525879, "Pretrain/Step": 3777, "Pretrain/Step Time": 9.722499158233404} +{"Pretrain/Learning Rate": 3.43873761420901e-05, "Pretrain/Loss": 2.0156359672546387, "Pretrain/Loss (Raw)": 2.138349771499634, "Pretrain/Step": 3778, "Pretrain/Step Time": 9.721236379817128} +{"Pretrain/Learning Rate": 3.4379506979361694e-05, "Pretrain/Loss": 2.0141425132751465, "Pretrain/Loss (Raw)": 1.6833010911941528, "Pretrain/Step": 3779, "Pretrain/Step Time": 9.724815282970667} +{"Pretrain/Learning Rate": 3.437163673494434e-05, "Pretrain/Loss": 2.015528440475464, "Pretrain/Loss (Raw)": 2.1477930545806885, "Pretrain/Step": 3780, "Pretrain/Step Time": 9.724819069728255} +{"Pretrain/Learning Rate": 3.436376540974568e-05, "Pretrain/Loss": 2.01356840133667, "Pretrain/Loss (Raw)": 1.9629135131835938, "Pretrain/Step": 3781, "Pretrain/Step Time": 9.71915189921856} +{"Pretrain/Learning Rate": 3.4355893004673476e-05, "Pretrain/Loss": 2.016235828399658, "Pretrain/Loss (Raw)": 2.0808706283569336, "Pretrain/Step": 3782, "Pretrain/Step Time": 9.50321290642023} +{"Pretrain/Learning Rate": 3.4348019520635587e-05, "Pretrain/Loss": 2.0166497230529785, "Pretrain/Loss (Raw)": 2.0946567058563232, "Pretrain/Step": 3783, "Pretrain/Step Time": 9.502169461920857} +{"Pretrain/Learning Rate": 3.434014495854006e-05, "Pretrain/Loss": 2.017134189605713, "Pretrain/Loss (Raw)": 2.031503677368164, "Pretrain/Step": 3784, "Pretrain/Step Time": 9.475660160183907} +{"Pretrain/Learning Rate": 3.4332269319294984e-05, "Pretrain/Loss": 2.0142195224761963, "Pretrain/Loss (Raw)": 1.7664517164230347, "Pretrain/Step": 3785, "Pretrain/Step Time": 9.483556972816586} +{"Pretrain/Learning Rate": 3.432439260380865e-05, "Pretrain/Loss": 2.0128860473632812, "Pretrain/Loss (Raw)": 1.8844952583312988, "Pretrain/Step": 3786, "Pretrain/Step Time": 9.478253277018666} +{"Pretrain/Learning Rate": 3.4316514812989406e-05, "Pretrain/Loss": 2.0128705501556396, "Pretrain/Loss (Raw)": 2.2041187286376953, "Pretrain/Step": 3787, "Pretrain/Step Time": 9.478498140349984} +{"Pretrain/Learning Rate": 3.4308635947745796e-05, "Pretrain/Loss": 2.0142626762390137, "Pretrain/Loss (Raw)": 1.8678486347198486, "Pretrain/Step": 3788, "Pretrain/Step Time": 9.47768366895616} +{"Pretrain/Learning Rate": 3.43007560089864e-05, "Pretrain/Loss": 2.0136795043945312, "Pretrain/Loss (Raw)": 1.8907405138015747, "Pretrain/Step": 3789, "Pretrain/Step Time": 9.471393724903464} +{"Pretrain/Learning Rate": 3.429287499762001e-05, "Pretrain/Loss": 2.012814998626709, "Pretrain/Loss (Raw)": 2.027611494064331, "Pretrain/Step": 3790, "Pretrain/Step Time": 9.47018263861537} +{"Pretrain/Learning Rate": 3.428499291455548e-05, "Pretrain/Loss": 2.009572982788086, "Pretrain/Loss (Raw)": 1.6505354642868042, "Pretrain/Step": 3791, "Pretrain/Step Time": 9.46724203787744} +{"Pretrain/Learning Rate": 3.427710976070182e-05, "Pretrain/Loss": 2.0098373889923096, "Pretrain/Loss (Raw)": 2.0477962493896484, "Pretrain/Step": 3792, "Pretrain/Step Time": 9.466704377904534} +{"Pretrain/Learning Rate": 3.426922553696814e-05, "Pretrain/Loss": 2.0105843544006348, "Pretrain/Loss (Raw)": 2.0290679931640625, "Pretrain/Step": 3793, "Pretrain/Step Time": 9.465306539088488} +{"Pretrain/Learning Rate": 3.426134024426371e-05, "Pretrain/Loss": 2.0082931518554688, "Pretrain/Loss (Raw)": 1.6996581554412842, "Pretrain/Step": 3794, "Pretrain/Step Time": 9.46450993977487} +{"Pretrain/Learning Rate": 3.425345388349786e-05, "Pretrain/Loss": 2.007439136505127, "Pretrain/Loss (Raw)": 1.9124201536178589, "Pretrain/Step": 3795, "Pretrain/Step Time": 9.46836944296956} +{"Pretrain/Learning Rate": 3.4245566455580116e-05, "Pretrain/Loss": 2.0096631050109863, "Pretrain/Loss (Raw)": 2.035372495651245, "Pretrain/Step": 3796, "Pretrain/Step Time": 9.464759247377515} +{"Pretrain/Learning Rate": 3.423767796142008e-05, "Pretrain/Loss": 2.007805347442627, "Pretrain/Loss (Raw)": 1.80794358253479, "Pretrain/Step": 3797, "Pretrain/Step Time": 9.464593360200524} +{"Pretrain/Learning Rate": 3.422978840192749e-05, "Pretrain/Loss": 2.007781505584717, "Pretrain/Loss (Raw)": 2.098637342453003, "Pretrain/Step": 3798, "Pretrain/Step Time": 9.460006885230541} +{"Pretrain/Learning Rate": 3.4221897778012214e-05, "Pretrain/Loss": 2.006397247314453, "Pretrain/Loss (Raw)": 1.6211535930633545, "Pretrain/Step": 3799, "Pretrain/Step Time": 9.45897009037435} +{"Pretrain/Learning Rate": 3.421400609058423e-05, "Pretrain/Loss": 2.004228115081787, "Pretrain/Loss (Raw)": 1.8524259328842163, "Pretrain/Step": 3800, "Pretrain/Step Time": 9.458837162703276} +{"Pretrain/Learning Rate": 3.420611334055365e-05, "Pretrain/Loss": 1.9998564720153809, "Pretrain/Loss (Raw)": 1.5608160495758057, "Pretrain/Step": 3801, "Pretrain/Step Time": 9.46295746229589} +{"Pretrain/Learning Rate": 3.4198219528830675e-05, "Pretrain/Loss": 2.001993417739868, "Pretrain/Loss (Raw)": 2.184450387954712, "Pretrain/Step": 3802, "Pretrain/Step Time": 9.470241105183959} +{"Pretrain/Learning Rate": 3.4190324656325704e-05, "Pretrain/Loss": 2.001201629638672, "Pretrain/Loss (Raw)": 1.7766846418380737, "Pretrain/Step": 3803, "Pretrain/Step Time": 9.468009248375893} +{"Pretrain/Learning Rate": 3.418242872394919e-05, "Pretrain/Loss": 2.0026071071624756, "Pretrain/Loss (Raw)": 2.154489278793335, "Pretrain/Step": 3804, "Pretrain/Step Time": 9.470717730000615} +{"Pretrain/Learning Rate": 3.417453173261171e-05, "Pretrain/Loss": 2.002591609954834, "Pretrain/Loss (Raw)": 2.0983879566192627, "Pretrain/Step": 3805, "Pretrain/Step Time": 9.469645412638783} +{"Pretrain/Learning Rate": 3.4166633683224015e-05, "Pretrain/Loss": 2.0034379959106445, "Pretrain/Loss (Raw)": 2.159144878387451, "Pretrain/Step": 3806, "Pretrain/Step Time": 9.466399505734444} +{"Pretrain/Learning Rate": 3.4158734576696915e-05, "Pretrain/Loss": 2.002114772796631, "Pretrain/Loss (Raw)": 1.8658536672592163, "Pretrain/Step": 3807, "Pretrain/Step Time": 9.461949063465} +{"Pretrain/Learning Rate": 3.4150834413941394e-05, "Pretrain/Loss": 2.001577615737915, "Pretrain/Loss (Raw)": 1.8897950649261475, "Pretrain/Step": 3808, "Pretrain/Step Time": 9.475449858233333} +{"Pretrain/Learning Rate": 3.414293319586853e-05, "Pretrain/Loss": 2.0012197494506836, "Pretrain/Loss (Raw)": 2.0447659492492676, "Pretrain/Step": 3809, "Pretrain/Step Time": 9.42093000933528} +{"Pretrain/Learning Rate": 3.4135030923389525e-05, "Pretrain/Loss": 2.0013039112091064, "Pretrain/Loss (Raw)": 2.1367149353027344, "Pretrain/Step": 3810, "Pretrain/Step Time": 9.424891294911504} +{"Pretrain/Learning Rate": 3.412712759741571e-05, "Pretrain/Loss": 2.0018434524536133, "Pretrain/Loss (Raw)": 2.163470506668091, "Pretrain/Step": 3811, "Pretrain/Step Time": 9.418010825291276} +{"Pretrain/Learning Rate": 3.411922321885853e-05, "Pretrain/Loss": 2.0036203861236572, "Pretrain/Loss (Raw)": 2.2564196586608887, "Pretrain/Step": 3812, "Pretrain/Step Time": 9.419990742579103} +{"Pretrain/Learning Rate": 3.411131778862955e-05, "Pretrain/Loss": 2.0064048767089844, "Pretrain/Loss (Raw)": 2.254934787750244, "Pretrain/Step": 3813, "Pretrain/Step Time": 9.425196981057525} +{"Pretrain/Learning Rate": 3.4103411307640475e-05, "Pretrain/Loss": 2.0056636333465576, "Pretrain/Loss (Raw)": 1.9888627529144287, "Pretrain/Step": 3814, "Pretrain/Step Time": 9.413488198071718} +{"Pretrain/Learning Rate": 3.409550377680311e-05, "Pretrain/Loss": 2.005413293838501, "Pretrain/Loss (Raw)": 2.052441358566284, "Pretrain/Step": 3815, "Pretrain/Step Time": 9.412311716005206} +{"Pretrain/Learning Rate": 3.408759519702939e-05, "Pretrain/Loss": 2.0056650638580322, "Pretrain/Loss (Raw)": 1.8913257122039795, "Pretrain/Step": 3816, "Pretrain/Step Time": 9.415305834263563} +{"Pretrain/Learning Rate": 3.407968556923137e-05, "Pretrain/Loss": 2.003035068511963, "Pretrain/Loss (Raw)": 1.6755361557006836, "Pretrain/Step": 3817, "Pretrain/Step Time": 9.416439287364483} +{"Pretrain/Learning Rate": 3.407177489432123e-05, "Pretrain/Loss": 2.0028605461120605, "Pretrain/Loss (Raw)": 2.011147975921631, "Pretrain/Step": 3818, "Pretrain/Step Time": 9.417906235903502} +{"Pretrain/Learning Rate": 3.406386317321126e-05, "Pretrain/Loss": 2.0018985271453857, "Pretrain/Loss (Raw)": 2.0912981033325195, "Pretrain/Step": 3819, "Pretrain/Step Time": 9.41456251963973} +{"Pretrain/Learning Rate": 3.4055950406813875e-05, "Pretrain/Loss": 2.0026695728302, "Pretrain/Loss (Raw)": 2.037266969680786, "Pretrain/Step": 3820, "Pretrain/Step Time": 9.419203901663423} +{"Pretrain/Learning Rate": 3.404803659604162e-05, "Pretrain/Loss": 2.002683639526367, "Pretrain/Loss (Raw)": 2.052394390106201, "Pretrain/Step": 3821, "Pretrain/Step Time": 9.414728920906782} +{"Pretrain/Learning Rate": 3.4040121741807146e-05, "Pretrain/Loss": 2.001683235168457, "Pretrain/Loss (Raw)": 1.8128093481063843, "Pretrain/Step": 3822, "Pretrain/Step Time": 9.417589917778969} +{"Pretrain/Learning Rate": 3.403220584502323e-05, "Pretrain/Loss": 1.9997646808624268, "Pretrain/Loss (Raw)": 1.7765685319900513, "Pretrain/Step": 3823, "Pretrain/Step Time": 9.4157341606915} +{"Pretrain/Learning Rate": 3.402428890660279e-05, "Pretrain/Loss": 1.9972014427185059, "Pretrain/Loss (Raw)": 1.7781834602355957, "Pretrain/Step": 3824, "Pretrain/Step Time": 9.42592609860003} +{"Pretrain/Learning Rate": 3.401637092745882e-05, "Pretrain/Loss": 1.9965347051620483, "Pretrain/Loss (Raw)": 1.9468547105789185, "Pretrain/Step": 3825, "Pretrain/Step Time": 9.43001020140946} +{"Pretrain/Learning Rate": 3.4008451908504457e-05, "Pretrain/Loss": 1.9978697299957275, "Pretrain/Loss (Raw)": 2.238701343536377, "Pretrain/Step": 3826, "Pretrain/Step Time": 9.438728025183082} +{"Pretrain/Learning Rate": 3.400053185065298e-05, "Pretrain/Loss": 1.997854471206665, "Pretrain/Loss (Raw)": 2.0374841690063477, "Pretrain/Step": 3827, "Pretrain/Step Time": 9.433614801615477} +{"Pretrain/Learning Rate": 3.399261075481776e-05, "Pretrain/Loss": 1.997281789779663, "Pretrain/Loss (Raw)": 1.985067367553711, "Pretrain/Step": 3828, "Pretrain/Step Time": 9.430341055616736} +{"Pretrain/Learning Rate": 3.39846886219123e-05, "Pretrain/Loss": 1.9989523887634277, "Pretrain/Loss (Raw)": 2.148324489593506, "Pretrain/Step": 3829, "Pretrain/Step Time": 9.428968131542206} +{"Pretrain/Learning Rate": 3.3976765452850194e-05, "Pretrain/Loss": 1.9996196031570435, "Pretrain/Loss (Raw)": 2.0445973873138428, "Pretrain/Step": 3830, "Pretrain/Step Time": 9.43207062408328} +{"Pretrain/Learning Rate": 3.3968841248545214e-05, "Pretrain/Loss": 2.002288341522217, "Pretrain/Loss (Raw)": 2.1258420944213867, "Pretrain/Step": 3831, "Pretrain/Step Time": 9.43008198402822} +{"Pretrain/Learning Rate": 3.396091600991118e-05, "Pretrain/Loss": 2.0002570152282715, "Pretrain/Loss (Raw)": 1.8227041959762573, "Pretrain/Step": 3832, "Pretrain/Step Time": 9.413572814315557} +{"Pretrain/Learning Rate": 3.39529897378621e-05, "Pretrain/Loss": 1.998795747756958, "Pretrain/Loss (Raw)": 1.9284635782241821, "Pretrain/Step": 3833, "Pretrain/Step Time": 9.412743255496025} +{"Pretrain/Learning Rate": 3.3945062433312055e-05, "Pretrain/Loss": 1.9995508193969727, "Pretrain/Loss (Raw)": 2.0264101028442383, "Pretrain/Step": 3834, "Pretrain/Step Time": 9.407745422795415} +{"Pretrain/Learning Rate": 3.3937134097175256e-05, "Pretrain/Loss": 1.9994760751724243, "Pretrain/Loss (Raw)": 2.16422700881958, "Pretrain/Step": 3835, "Pretrain/Step Time": 9.39623511955142} +{"Pretrain/Learning Rate": 3.392920473036604e-05, "Pretrain/Loss": 1.9978817701339722, "Pretrain/Loss (Raw)": 1.9441978931427002, "Pretrain/Step": 3836, "Pretrain/Step Time": 9.396749261766672} +{"Pretrain/Learning Rate": 3.392127433379886e-05, "Pretrain/Loss": 1.995431661605835, "Pretrain/Loss (Raw)": 1.8544063568115234, "Pretrain/Step": 3837, "Pretrain/Step Time": 9.394547827541828} +{"Pretrain/Learning Rate": 3.391334290838829e-05, "Pretrain/Loss": 1.9955973625183105, "Pretrain/Loss (Raw)": 1.8854433298110962, "Pretrain/Step": 3838, "Pretrain/Step Time": 9.394334251061082} +{"Pretrain/Learning Rate": 3.3905410455049e-05, "Pretrain/Loss": 1.9944344758987427, "Pretrain/Loss (Raw)": 1.9023667573928833, "Pretrain/Step": 3839, "Pretrain/Step Time": 9.395327486097813} +{"Pretrain/Learning Rate": 3.389747697469583e-05, "Pretrain/Loss": 1.9952552318572998, "Pretrain/Loss (Raw)": 1.9470025300979614, "Pretrain/Step": 3840, "Pretrain/Step Time": 9.39480528049171} +{"Pretrain/Learning Rate": 3.388954246824367e-05, "Pretrain/Loss": 1.9948127269744873, "Pretrain/Loss (Raw)": 1.8348965644836426, "Pretrain/Step": 3841, "Pretrain/Step Time": 9.39064490608871} +{"Pretrain/Learning Rate": 3.3881606936607604e-05, "Pretrain/Loss": 1.992363452911377, "Pretrain/Loss (Raw)": 1.7449686527252197, "Pretrain/Step": 3842, "Pretrain/Step Time": 8.727565862238407} +{"Pretrain/Learning Rate": 3.387367038070275e-05, "Pretrain/Loss": 1.9955203533172607, "Pretrain/Loss (Raw)": 2.188152551651001, "Pretrain/Step": 3843, "Pretrain/Step Time": 8.73448391072452} +{"Pretrain/Learning Rate": 3.386573280144444e-05, "Pretrain/Loss": 1.9979768991470337, "Pretrain/Loss (Raw)": 1.9754093885421753, "Pretrain/Step": 3844, "Pretrain/Step Time": 8.735287437215447} +{"Pretrain/Learning Rate": 3.385779419974803e-05, "Pretrain/Loss": 1.998876929283142, "Pretrain/Loss (Raw)": 2.1980466842651367, "Pretrain/Step": 3845, "Pretrain/Step Time": 8.736748397350311} +{"Pretrain/Learning Rate": 3.384985457652906e-05, "Pretrain/Loss": 1.999001383781433, "Pretrain/Loss (Raw)": 2.067854881286621, "Pretrain/Step": 3846, "Pretrain/Step Time": 8.734854470938444} +{"Pretrain/Learning Rate": 3.384191393270316e-05, "Pretrain/Loss": 1.996690034866333, "Pretrain/Loss (Raw)": 1.9211221933364868, "Pretrain/Step": 3847, "Pretrain/Step Time": 8.736895522102714} +{"Pretrain/Learning Rate": 3.383397226918607e-05, "Pretrain/Loss": 1.9952094554901123, "Pretrain/Loss (Raw)": 2.0919666290283203, "Pretrain/Step": 3848, "Pretrain/Step Time": 8.7412218041718} +{"Pretrain/Learning Rate": 3.382602958689369e-05, "Pretrain/Loss": 1.9936742782592773, "Pretrain/Loss (Raw)": 1.8254122734069824, "Pretrain/Step": 3849, "Pretrain/Step Time": 8.733166644349694} +{"Pretrain/Learning Rate": 3.381808588674197e-05, "Pretrain/Loss": 1.991631269454956, "Pretrain/Loss (Raw)": 1.8060088157653809, "Pretrain/Step": 3850, "Pretrain/Step Time": 8.731430765241385} +{"Pretrain/Learning Rate": 3.381014116964705e-05, "Pretrain/Loss": 1.9901798963546753, "Pretrain/Loss (Raw)": 1.7709296941757202, "Pretrain/Step": 3851, "Pretrain/Step Time": 8.735595082864165} +{"Pretrain/Learning Rate": 3.380219543652512e-05, "Pretrain/Loss": 1.9907283782958984, "Pretrain/Loss (Raw)": 1.9881137609481812, "Pretrain/Step": 3852, "Pretrain/Step Time": 8.738209651783109} +{"Pretrain/Learning Rate": 3.379424868829254e-05, "Pretrain/Loss": 1.9901707172393799, "Pretrain/Loss (Raw)": 2.079144239425659, "Pretrain/Step": 3853, "Pretrain/Step Time": 8.740068703889847} +{"Pretrain/Learning Rate": 3.378630092586576e-05, "Pretrain/Loss": 1.9912976026535034, "Pretrain/Loss (Raw)": 2.0796797275543213, "Pretrain/Step": 3854, "Pretrain/Step Time": 8.74215760268271} +{"Pretrain/Learning Rate": 3.377835215016136e-05, "Pretrain/Loss": 1.991660714149475, "Pretrain/Loss (Raw)": 2.093230724334717, "Pretrain/Step": 3855, "Pretrain/Step Time": 8.748425748199224} +{"Pretrain/Learning Rate": 3.3770402362096024e-05, "Pretrain/Loss": 1.990154504776001, "Pretrain/Loss (Raw)": 1.8397469520568848, "Pretrain/Step": 3856, "Pretrain/Step Time": 8.75658743083477} +{"Pretrain/Learning Rate": 3.3762451562586565e-05, "Pretrain/Loss": 1.987477421760559, "Pretrain/Loss (Raw)": 1.9548375606536865, "Pretrain/Step": 3857, "Pretrain/Step Time": 8.757033793255687} +{"Pretrain/Learning Rate": 3.3754499752549885e-05, "Pretrain/Loss": 1.9886270761489868, "Pretrain/Loss (Raw)": 2.198760986328125, "Pretrain/Step": 3858, "Pretrain/Step Time": 8.756179790943861} +{"Pretrain/Learning Rate": 3.374654693290306e-05, "Pretrain/Loss": 1.987558364868164, "Pretrain/Loss (Raw)": 1.8206896781921387, "Pretrain/Step": 3859, "Pretrain/Step Time": 8.758707286790013} +{"Pretrain/Learning Rate": 3.373859310456321e-05, "Pretrain/Loss": 1.9877666234970093, "Pretrain/Loss (Raw)": 2.15720796585083, "Pretrain/Step": 3860, "Pretrain/Step Time": 8.75707589648664} +{"Pretrain/Learning Rate": 3.373063826844764e-05, "Pretrain/Loss": 1.9902024269104004, "Pretrain/Loss (Raw)": 2.185248851776123, "Pretrain/Step": 3861, "Pretrain/Step Time": 8.759966287761927} +{"Pretrain/Learning Rate": 3.3722682425473715e-05, "Pretrain/Loss": 1.9902154207229614, "Pretrain/Loss (Raw)": 2.025470018386841, "Pretrain/Step": 3862, "Pretrain/Step Time": 8.758774043992162} +{"Pretrain/Learning Rate": 3.371472557655896e-05, "Pretrain/Loss": 1.988267421722412, "Pretrain/Loss (Raw)": 1.901465892791748, "Pretrain/Step": 3863, "Pretrain/Step Time": 8.763809585943818} +{"Pretrain/Learning Rate": 3.370676772262098e-05, "Pretrain/Loss": 1.9897862672805786, "Pretrain/Loss (Raw)": 2.0311410427093506, "Pretrain/Step": 3864, "Pretrain/Step Time": 8.769827093929052} +{"Pretrain/Learning Rate": 3.369880886457751e-05, "Pretrain/Loss": 1.9903786182403564, "Pretrain/Loss (Raw)": 2.1137311458587646, "Pretrain/Step": 3865, "Pretrain/Step Time": 8.767114678397775} +{"Pretrain/Learning Rate": 3.369084900334643e-05, "Pretrain/Loss": 1.9900577068328857, "Pretrain/Loss (Raw)": 1.827564001083374, "Pretrain/Step": 3866, "Pretrain/Step Time": 8.768035126850009} +{"Pretrain/Learning Rate": 3.368288813984568e-05, "Pretrain/Loss": 1.989620566368103, "Pretrain/Loss (Raw)": 1.9254624843597412, "Pretrain/Step": 3867, "Pretrain/Step Time": 8.769574804231524} +{"Pretrain/Learning Rate": 3.3674926274993356e-05, "Pretrain/Loss": 1.9867398738861084, "Pretrain/Loss (Raw)": 1.9033535718917847, "Pretrain/Step": 3868, "Pretrain/Step Time": 8.767257930710912} +{"Pretrain/Learning Rate": 3.3666963409707655e-05, "Pretrain/Loss": 1.9880212545394897, "Pretrain/Loss (Raw)": 2.1364333629608154, "Pretrain/Step": 3869, "Pretrain/Step Time": 8.768429458141327} +{"Pretrain/Learning Rate": 3.36589995449069e-05, "Pretrain/Loss": 1.9859075546264648, "Pretrain/Loss (Raw)": 1.8974449634552002, "Pretrain/Step": 3870, "Pretrain/Step Time": 8.773309875279665} +{"Pretrain/Learning Rate": 3.36510346815095e-05, "Pretrain/Loss": 1.9884997606277466, "Pretrain/Loss (Raw)": 2.2779760360717773, "Pretrain/Step": 3871, "Pretrain/Step Time": 8.77349816262722} +{"Pretrain/Learning Rate": 3.3643068820434035e-05, "Pretrain/Loss": 1.9937779903411865, "Pretrain/Loss (Raw)": 2.3524885177612305, "Pretrain/Step": 3872, "Pretrain/Step Time": 8.776142053306103} +{"Pretrain/Learning Rate": 3.363510196259913e-05, "Pretrain/Loss": 1.9944111108779907, "Pretrain/Loss (Raw)": 2.1142566204071045, "Pretrain/Step": 3873, "Pretrain/Step Time": 8.772340359166265} +{"Pretrain/Learning Rate": 3.362713410892359e-05, "Pretrain/Loss": 1.9949288368225098, "Pretrain/Loss (Raw)": 2.0967295169830322, "Pretrain/Step": 3874, "Pretrain/Step Time": 8.769337745383382} +{"Pretrain/Learning Rate": 3.361916526032628e-05, "Pretrain/Loss": 1.9943240880966187, "Pretrain/Loss (Raw)": 2.090102195739746, "Pretrain/Step": 3875, "Pretrain/Step Time": 8.769249584525824} +{"Pretrain/Learning Rate": 3.361119541772622e-05, "Pretrain/Loss": 1.9928107261657715, "Pretrain/Loss (Raw)": 1.9089275598526, "Pretrain/Step": 3876, "Pretrain/Step Time": 8.772354347631335} +{"Pretrain/Learning Rate": 3.360322458204253e-05, "Pretrain/Loss": 1.9903481006622314, "Pretrain/Loss (Raw)": 1.5952942371368408, "Pretrain/Step": 3877, "Pretrain/Step Time": 8.76598815061152} +{"Pretrain/Learning Rate": 3.3595252754194445e-05, "Pretrain/Loss": 1.9903556108474731, "Pretrain/Loss (Raw)": 2.0601537227630615, "Pretrain/Step": 3878, "Pretrain/Step Time": 8.765388341620564} +{"Pretrain/Learning Rate": 3.3587279935101306e-05, "Pretrain/Loss": 1.9897775650024414, "Pretrain/Loss (Raw)": 2.042922258377075, "Pretrain/Step": 3879, "Pretrain/Step Time": 8.770081773400307} +{"Pretrain/Learning Rate": 3.357930612568258e-05, "Pretrain/Loss": 1.9889925718307495, "Pretrain/Loss (Raw)": 1.6914058923721313, "Pretrain/Step": 3880, "Pretrain/Step Time": 8.769926251843572} +{"Pretrain/Learning Rate": 3.3571331326857844e-05, "Pretrain/Loss": 1.9901753664016724, "Pretrain/Loss (Raw)": 2.0067763328552246, "Pretrain/Step": 3881, "Pretrain/Step Time": 8.772376349195838} +{"Pretrain/Learning Rate": 3.3563355539546795e-05, "Pretrain/Loss": 1.989516019821167, "Pretrain/Loss (Raw)": 2.0492265224456787, "Pretrain/Step": 3882, "Pretrain/Step Time": 8.77572113648057} +{"Pretrain/Learning Rate": 3.355537876466923e-05, "Pretrain/Loss": 1.9911937713623047, "Pretrain/Loss (Raw)": 2.1416397094726562, "Pretrain/Step": 3883, "Pretrain/Step Time": 8.775030955672264} +{"Pretrain/Learning Rate": 3.354740100314506e-05, "Pretrain/Loss": 1.9919110536575317, "Pretrain/Loss (Raw)": 2.050698757171631, "Pretrain/Step": 3884, "Pretrain/Step Time": 8.777329100295901} +{"Pretrain/Learning Rate": 3.3539422255894345e-05, "Pretrain/Loss": 1.9912409782409668, "Pretrain/Loss (Raw)": 1.8834940195083618, "Pretrain/Step": 3885, "Pretrain/Step Time": 8.771690413355827} +{"Pretrain/Learning Rate": 3.353144252383721e-05, "Pretrain/Loss": 1.9906822443008423, "Pretrain/Loss (Raw)": 2.0650558471679688, "Pretrain/Step": 3886, "Pretrain/Step Time": 8.770679119974375} +{"Pretrain/Learning Rate": 3.3523461807893925e-05, "Pretrain/Loss": 1.9904226064682007, "Pretrain/Loss (Raw)": 2.1221747398376465, "Pretrain/Step": 3887, "Pretrain/Step Time": 8.778079103678465} +{"Pretrain/Learning Rate": 3.351548010898486e-05, "Pretrain/Loss": 1.9887863397598267, "Pretrain/Loss (Raw)": 1.8243684768676758, "Pretrain/Step": 3888, "Pretrain/Step Time": 8.76828233525157} +{"Pretrain/Learning Rate": 3.35074974280305e-05, "Pretrain/Loss": 1.9912257194519043, "Pretrain/Loss (Raw)": 1.975506067276001, "Pretrain/Step": 3889, "Pretrain/Step Time": 8.77617715485394} +{"Pretrain/Learning Rate": 3.349951376595145e-05, "Pretrain/Loss": 1.9905908107757568, "Pretrain/Loss (Raw)": 1.9046086072921753, "Pretrain/Step": 3890, "Pretrain/Step Time": 8.769242394715548} +{"Pretrain/Learning Rate": 3.3491529123668425e-05, "Pretrain/Loss": 1.987868070602417, "Pretrain/Loss (Raw)": 2.000581979751587, "Pretrain/Step": 3891, "Pretrain/Step Time": 8.7681402284652} +{"Pretrain/Learning Rate": 3.348354350210224e-05, "Pretrain/Loss": 1.9883270263671875, "Pretrain/Loss (Raw)": 1.8329111337661743, "Pretrain/Step": 3892, "Pretrain/Step Time": 8.768229402601719} +{"Pretrain/Learning Rate": 3.347555690217385e-05, "Pretrain/Loss": 1.9890365600585938, "Pretrain/Loss (Raw)": 2.0542731285095215, "Pretrain/Step": 3893, "Pretrain/Step Time": 8.75826589204371} +{"Pretrain/Learning Rate": 3.34675693248043e-05, "Pretrain/Loss": 1.9886837005615234, "Pretrain/Loss (Raw)": 1.960310935974121, "Pretrain/Step": 3894, "Pretrain/Step Time": 8.766970824450254} +{"Pretrain/Learning Rate": 3.3459580770914744e-05, "Pretrain/Loss": 1.9877281188964844, "Pretrain/Loss (Raw)": 1.9450135231018066, "Pretrain/Step": 3895, "Pretrain/Step Time": 8.769990857690573} +{"Pretrain/Learning Rate": 3.3451591241426486e-05, "Pretrain/Loss": 1.9879437685012817, "Pretrain/Loss (Raw)": 2.046916961669922, "Pretrain/Step": 3896, "Pretrain/Step Time": 8.77218915708363} +{"Pretrain/Learning Rate": 3.3443600737260885e-05, "Pretrain/Loss": 1.9897537231445312, "Pretrain/Loss (Raw)": 2.3457820415496826, "Pretrain/Step": 3897, "Pretrain/Step Time": 8.768332563340664} +{"Pretrain/Learning Rate": 3.343560925933947e-05, "Pretrain/Loss": 1.9900667667388916, "Pretrain/Loss (Raw)": 2.0249032974243164, "Pretrain/Step": 3898, "Pretrain/Step Time": 8.75926493294537} +{"Pretrain/Learning Rate": 3.342761680858385e-05, "Pretrain/Loss": 1.989565372467041, "Pretrain/Loss (Raw)": 2.0824830532073975, "Pretrain/Step": 3899, "Pretrain/Step Time": 8.75574372522533} +{"Pretrain/Learning Rate": 3.3419623385915736e-05, "Pretrain/Loss": 1.9871714115142822, "Pretrain/Loss (Raw)": 1.8452684879302979, "Pretrain/Step": 3900, "Pretrain/Step Time": 8.764828039333224} +{"Pretrain/Learning Rate": 3.3411628992256984e-05, "Pretrain/Loss": 1.987569808959961, "Pretrain/Loss (Raw)": 1.9691389799118042, "Pretrain/Step": 3901, "Pretrain/Step Time": 8.765111932531} +{"Pretrain/Learning Rate": 3.340363362852954e-05, "Pretrain/Loss": 1.9846305847167969, "Pretrain/Loss (Raw)": 1.8386754989624023, "Pretrain/Step": 3902, "Pretrain/Step Time": 8.767867092043161} +{"Pretrain/Learning Rate": 3.339563729565547e-05, "Pretrain/Loss": 1.985656499862671, "Pretrain/Loss (Raw)": 1.93179452419281, "Pretrain/Step": 3903, "Pretrain/Step Time": 8.766517275944352} +{"Pretrain/Learning Rate": 3.3387639994556934e-05, "Pretrain/Loss": 1.9875730276107788, "Pretrain/Loss (Raw)": 2.3334462642669678, "Pretrain/Step": 3904, "Pretrain/Step Time": 8.76570344902575} +{"Pretrain/Learning Rate": 3.337964172615624e-05, "Pretrain/Loss": 1.9889742136001587, "Pretrain/Loss (Raw)": 2.28836989402771, "Pretrain/Step": 3905, "Pretrain/Step Time": 8.763995219022036} +{"Pretrain/Learning Rate": 3.337164249137577e-05, "Pretrain/Loss": 1.9907076358795166, "Pretrain/Loss (Raw)": 2.360227584838867, "Pretrain/Step": 3906, "Pretrain/Step Time": 8.777902575209737} +{"Pretrain/Learning Rate": 3.3363642291138046e-05, "Pretrain/Loss": 1.993866205215454, "Pretrain/Loss (Raw)": 2.0876100063323975, "Pretrain/Step": 3907, "Pretrain/Step Time": 8.774300681427121} +{"Pretrain/Learning Rate": 3.3355641126365676e-05, "Pretrain/Loss": 1.993384599685669, "Pretrain/Loss (Raw)": 2.0861282348632812, "Pretrain/Step": 3908, "Pretrain/Step Time": 8.774786163121462} +{"Pretrain/Learning Rate": 3.33476389979814e-05, "Pretrain/Loss": 1.9935762882232666, "Pretrain/Loss (Raw)": 1.9874597787857056, "Pretrain/Step": 3909, "Pretrain/Step Time": 8.777073128148913} +{"Pretrain/Learning Rate": 3.3339635906908064e-05, "Pretrain/Loss": 1.992856740951538, "Pretrain/Loss (Raw)": 1.9887615442276, "Pretrain/Step": 3910, "Pretrain/Step Time": 8.77641548961401} +{"Pretrain/Learning Rate": 3.3331631854068616e-05, "Pretrain/Loss": 1.9939155578613281, "Pretrain/Loss (Raw)": 2.230193614959717, "Pretrain/Step": 3911, "Pretrain/Step Time": 8.783920053392649} +{"Pretrain/Learning Rate": 3.3323626840386115e-05, "Pretrain/Loss": 1.9933356046676636, "Pretrain/Loss (Raw)": 1.9572802782058716, "Pretrain/Step": 3912, "Pretrain/Step Time": 8.785968853160739} +{"Pretrain/Learning Rate": 3.3315620866783755e-05, "Pretrain/Loss": 1.995381474494934, "Pretrain/Loss (Raw)": 2.0283195972442627, "Pretrain/Step": 3913, "Pretrain/Step Time": 8.777864998206496} +{"Pretrain/Learning Rate": 3.33076139341848e-05, "Pretrain/Loss": 1.9968587160110474, "Pretrain/Loss (Raw)": 2.073563575744629, "Pretrain/Step": 3914, "Pretrain/Step Time": 8.781445799395442} +{"Pretrain/Learning Rate": 3.329960604351267e-05, "Pretrain/Loss": 1.994571328163147, "Pretrain/Loss (Raw)": 1.9113600254058838, "Pretrain/Step": 3915, "Pretrain/Step Time": 8.792452277615666} +{"Pretrain/Learning Rate": 3.329159719569085e-05, "Pretrain/Loss": 1.9969475269317627, "Pretrain/Loss (Raw)": 2.171976089477539, "Pretrain/Step": 3916, "Pretrain/Step Time": 8.784337557852268} +{"Pretrain/Learning Rate": 3.328358739164299e-05, "Pretrain/Loss": 1.9978973865509033, "Pretrain/Loss (Raw)": 2.0123369693756104, "Pretrain/Step": 3917, "Pretrain/Step Time": 8.786631872877479} +{"Pretrain/Learning Rate": 3.327557663229278e-05, "Pretrain/Loss": 1.9976834058761597, "Pretrain/Loss (Raw)": 2.0002150535583496, "Pretrain/Step": 3918, "Pretrain/Step Time": 8.786667125299573} +{"Pretrain/Learning Rate": 3.326756491856409e-05, "Pretrain/Loss": 2.001347541809082, "Pretrain/Loss (Raw)": 2.1195597648620605, "Pretrain/Step": 3919, "Pretrain/Step Time": 8.795858716592193} +{"Pretrain/Learning Rate": 3.325955225138085e-05, "Pretrain/Loss": 2.002070426940918, "Pretrain/Loss (Raw)": 2.140313148498535, "Pretrain/Step": 3920, "Pretrain/Step Time": 8.793629063293338} +{"Pretrain/Learning Rate": 3.3251538631667125e-05, "Pretrain/Loss": 2.0011701583862305, "Pretrain/Loss (Raw)": 1.9138351678848267, "Pretrain/Step": 3921, "Pretrain/Step Time": 8.793107446283102} +{"Pretrain/Learning Rate": 3.324352406034707e-05, "Pretrain/Loss": 2.003610849380493, "Pretrain/Loss (Raw)": 2.0120534896850586, "Pretrain/Step": 3922, "Pretrain/Step Time": 8.804758127778769} +{"Pretrain/Learning Rate": 3.3235508538344996e-05, "Pretrain/Loss": 2.0049195289611816, "Pretrain/Loss (Raw)": 2.0799367427825928, "Pretrain/Step": 3923, "Pretrain/Step Time": 8.802402798086405} +{"Pretrain/Learning Rate": 3.322749206658526e-05, "Pretrain/Loss": 2.0045156478881836, "Pretrain/Loss (Raw)": 1.9836647510528564, "Pretrain/Step": 3924, "Pretrain/Step Time": 8.800198329612613} +{"Pretrain/Learning Rate": 3.3219474645992366e-05, "Pretrain/Loss": 2.005988121032715, "Pretrain/Loss (Raw)": 1.9964427947998047, "Pretrain/Step": 3925, "Pretrain/Step Time": 8.80380491539836} +{"Pretrain/Learning Rate": 3.3211456277490926e-05, "Pretrain/Loss": 2.0054540634155273, "Pretrain/Loss (Raw)": 2.030251979827881, "Pretrain/Step": 3926, "Pretrain/Step Time": 8.805119767785072} +{"Pretrain/Learning Rate": 3.3203436962005655e-05, "Pretrain/Loss": 2.0088610649108887, "Pretrain/Loss (Raw)": 2.0572731494903564, "Pretrain/Step": 3927, "Pretrain/Step Time": 8.806420287117362} +{"Pretrain/Learning Rate": 3.3195416700461385e-05, "Pretrain/Loss": 2.0111920833587646, "Pretrain/Loss (Raw)": 2.1507956981658936, "Pretrain/Step": 3928, "Pretrain/Step Time": 8.807405535131693} +{"Pretrain/Learning Rate": 3.318739549378304e-05, "Pretrain/Loss": 2.0144832134246826, "Pretrain/Loss (Raw)": 1.9820828437805176, "Pretrain/Step": 3929, "Pretrain/Step Time": 8.80535177513957} +{"Pretrain/Learning Rate": 3.317937334289566e-05, "Pretrain/Loss": 2.0129222869873047, "Pretrain/Loss (Raw)": 1.9846619367599487, "Pretrain/Step": 3930, "Pretrain/Step Time": 8.799803515896201} +{"Pretrain/Learning Rate": 3.317135024872442e-05, "Pretrain/Loss": 2.0155115127563477, "Pretrain/Loss (Raw)": 2.1080832481384277, "Pretrain/Step": 3931, "Pretrain/Step Time": 8.801012493669987} +{"Pretrain/Learning Rate": 3.3163326212194546e-05, "Pretrain/Loss": 2.0154240131378174, "Pretrain/Loss (Raw)": 2.1433048248291016, "Pretrain/Step": 3932, "Pretrain/Step Time": 8.797054428607225} +{"Pretrain/Learning Rate": 3.315530123423143e-05, "Pretrain/Loss": 2.018390655517578, "Pretrain/Loss (Raw)": 2.478119134902954, "Pretrain/Step": 3933, "Pretrain/Step Time": 8.797755664214492} +{"Pretrain/Learning Rate": 3.314727531576055e-05, "Pretrain/Loss": 2.018345355987549, "Pretrain/Loss (Raw)": 2.1533420085906982, "Pretrain/Step": 3934, "Pretrain/Step Time": 8.79852182045579} +{"Pretrain/Learning Rate": 3.3139248457707495e-05, "Pretrain/Loss": 2.017083168029785, "Pretrain/Loss (Raw)": 1.70432448387146, "Pretrain/Step": 3935, "Pretrain/Step Time": 8.808874340727925} +{"Pretrain/Learning Rate": 3.313122066099794e-05, "Pretrain/Loss": 2.0189309120178223, "Pretrain/Loss (Raw)": 2.1262545585632324, "Pretrain/Step": 3936, "Pretrain/Step Time": 8.801076889038086} +{"Pretrain/Learning Rate": 3.312319192655772e-05, "Pretrain/Loss": 2.0191917419433594, "Pretrain/Loss (Raw)": 2.078166961669922, "Pretrain/Step": 3937, "Pretrain/Step Time": 8.805497279390693} +{"Pretrain/Learning Rate": 3.311516225531271e-05, "Pretrain/Loss": 2.019122838973999, "Pretrain/Loss (Raw)": 2.127903938293457, "Pretrain/Step": 3938, "Pretrain/Step Time": 8.805087631568313} +{"Pretrain/Learning Rate": 3.3107131648188966e-05, "Pretrain/Loss": 2.0189576148986816, "Pretrain/Loss (Raw)": 2.1423158645629883, "Pretrain/Step": 3939, "Pretrain/Step Time": 8.806603526696563} +{"Pretrain/Learning Rate": 3.309910010611259e-05, "Pretrain/Loss": 2.015148639678955, "Pretrain/Loss (Raw)": 1.7688552141189575, "Pretrain/Step": 3940, "Pretrain/Step Time": 8.802230732515454} +{"Pretrain/Learning Rate": 3.3091067630009834e-05, "Pretrain/Loss": 2.0133066177368164, "Pretrain/Loss (Raw)": 2.019167423248291, "Pretrain/Step": 3941, "Pretrain/Step Time": 8.800386771559715} +{"Pretrain/Learning Rate": 3.3083034220807016e-05, "Pretrain/Loss": 2.0129148960113525, "Pretrain/Loss (Raw)": 1.9387304782867432, "Pretrain/Step": 3942, "Pretrain/Step Time": 8.801499454304576} +{"Pretrain/Learning Rate": 3.307499987943062e-05, "Pretrain/Loss": 2.0132107734680176, "Pretrain/Loss (Raw)": 2.0903139114379883, "Pretrain/Step": 3943, "Pretrain/Step Time": 8.811243616044521} +{"Pretrain/Learning Rate": 3.3066964606807175e-05, "Pretrain/Loss": 2.0136234760284424, "Pretrain/Loss (Raw)": 1.944145679473877, "Pretrain/Step": 3944, "Pretrain/Step Time": 8.805228278040886} +{"Pretrain/Learning Rate": 3.3058928403863364e-05, "Pretrain/Loss": 2.0151822566986084, "Pretrain/Loss (Raw)": 1.8750613927841187, "Pretrain/Step": 3945, "Pretrain/Step Time": 8.800081837922335} +{"Pretrain/Learning Rate": 3.305089127152596e-05, "Pretrain/Loss": 2.015011787414551, "Pretrain/Loss (Raw)": 1.9893553256988525, "Pretrain/Step": 3946, "Pretrain/Step Time": 8.801982814446092} +{"Pretrain/Learning Rate": 3.304285321072183e-05, "Pretrain/Loss": 2.011782646179199, "Pretrain/Loss (Raw)": 1.6779221296310425, "Pretrain/Step": 3947, "Pretrain/Step Time": 8.803969798609614} +{"Pretrain/Learning Rate": 3.303481422237797e-05, "Pretrain/Loss": 2.01411509513855, "Pretrain/Loss (Raw)": 2.3358564376831055, "Pretrain/Step": 3948, "Pretrain/Step Time": 8.813591167330742} +{"Pretrain/Learning Rate": 3.3026774307421476e-05, "Pretrain/Loss": 2.0110135078430176, "Pretrain/Loss (Raw)": 1.6553953886032104, "Pretrain/Step": 3949, "Pretrain/Step Time": 8.81934493035078} +{"Pretrain/Learning Rate": 3.301873346677954e-05, "Pretrain/Loss": 2.013326644897461, "Pretrain/Loss (Raw)": 2.108894109725952, "Pretrain/Step": 3950, "Pretrain/Step Time": 8.817895740270615} +{"Pretrain/Learning Rate": 3.301069170137948e-05, "Pretrain/Loss": 2.0168113708496094, "Pretrain/Loss (Raw)": 2.222609519958496, "Pretrain/Step": 3951, "Pretrain/Step Time": 8.813502237200737} +{"Pretrain/Learning Rate": 3.3002649012148704e-05, "Pretrain/Loss": 2.019028663635254, "Pretrain/Loss (Raw)": 2.0619707107543945, "Pretrain/Step": 3952, "Pretrain/Step Time": 8.804544188082218} +{"Pretrain/Learning Rate": 3.2994605400014736e-05, "Pretrain/Loss": 2.0200653076171875, "Pretrain/Loss (Raw)": 2.0795533657073975, "Pretrain/Step": 3953, "Pretrain/Step Time": 8.80319795012474} +{"Pretrain/Learning Rate": 3.29865608659052e-05, "Pretrain/Loss": 2.0183913707733154, "Pretrain/Loss (Raw)": 2.0244367122650146, "Pretrain/Step": 3954, "Pretrain/Step Time": 8.795643609017134} +{"Pretrain/Learning Rate": 3.297851541074782e-05, "Pretrain/Loss": 2.0178565979003906, "Pretrain/Loss (Raw)": 1.9690618515014648, "Pretrain/Step": 3955, "Pretrain/Step Time": 8.797537215054035} +{"Pretrain/Learning Rate": 3.297046903547046e-05, "Pretrain/Loss": 2.018460273742676, "Pretrain/Loss (Raw)": 2.0622968673706055, "Pretrain/Step": 3956, "Pretrain/Step Time": 8.800577875226736} +{"Pretrain/Learning Rate": 3.296242174100105e-05, "Pretrain/Loss": 2.018345832824707, "Pretrain/Loss (Raw)": 2.133692979812622, "Pretrain/Step": 3957, "Pretrain/Step Time": 8.801973281428218} +{"Pretrain/Learning Rate": 3.2954373528267646e-05, "Pretrain/Loss": 2.0170669555664062, "Pretrain/Loss (Raw)": 1.8808923959732056, "Pretrain/Step": 3958, "Pretrain/Step Time": 8.802800085395575} +{"Pretrain/Learning Rate": 3.29463243981984e-05, "Pretrain/Loss": 2.0163626670837402, "Pretrain/Loss (Raw)": 2.035717010498047, "Pretrain/Step": 3959, "Pretrain/Step Time": 8.80312741175294} +{"Pretrain/Learning Rate": 3.2938274351721587e-05, "Pretrain/Loss": 2.0167675018310547, "Pretrain/Loss (Raw)": 1.8745018243789673, "Pretrain/Step": 3960, "Pretrain/Step Time": 8.80097977258265} +{"Pretrain/Learning Rate": 3.2930223389765566e-05, "Pretrain/Loss": 2.0181632041931152, "Pretrain/Loss (Raw)": 2.107106924057007, "Pretrain/Step": 3961, "Pretrain/Step Time": 8.795209433883429} +{"Pretrain/Learning Rate": 3.292217151325882e-05, "Pretrain/Loss": 2.017509937286377, "Pretrain/Loss (Raw)": 1.942817211151123, "Pretrain/Step": 3962, "Pretrain/Step Time": 8.804820278659463} +{"Pretrain/Learning Rate": 3.2914118723129916e-05, "Pretrain/Loss": 2.018176794052124, "Pretrain/Loss (Raw)": 2.2495648860931396, "Pretrain/Step": 3963, "Pretrain/Step Time": 8.810803201049566} +{"Pretrain/Learning Rate": 3.2906065020307545e-05, "Pretrain/Loss": 2.0186619758605957, "Pretrain/Loss (Raw)": 2.0063228607177734, "Pretrain/Step": 3964, "Pretrain/Step Time": 8.816400492563844} +{"Pretrain/Learning Rate": 3.289801040572051e-05, "Pretrain/Loss": 2.018808126449585, "Pretrain/Loss (Raw)": 1.8731014728546143, "Pretrain/Step": 3965, "Pretrain/Step Time": 8.814806969836354} +{"Pretrain/Learning Rate": 3.288995488029769e-05, "Pretrain/Loss": 2.018991470336914, "Pretrain/Loss (Raw)": 1.9089146852493286, "Pretrain/Step": 3966, "Pretrain/Step Time": 8.814886346459389} +{"Pretrain/Learning Rate": 3.288189844496811e-05, "Pretrain/Loss": 2.02083683013916, "Pretrain/Loss (Raw)": 2.138533353805542, "Pretrain/Step": 3967, "Pretrain/Step Time": 8.813943032175303} +{"Pretrain/Learning Rate": 3.287384110066084e-05, "Pretrain/Loss": 2.020890235900879, "Pretrain/Loss (Raw)": 1.9538880586624146, "Pretrain/Step": 3968, "Pretrain/Step Time": 8.8149473965168} +{"Pretrain/Learning Rate": 3.286578284830513e-05, "Pretrain/Loss": 2.019402503967285, "Pretrain/Loss (Raw)": 1.6444679498672485, "Pretrain/Step": 3969, "Pretrain/Step Time": 8.81649492867291} +{"Pretrain/Learning Rate": 3.2857723688830264e-05, "Pretrain/Loss": 2.017918825149536, "Pretrain/Loss (Raw)": 1.5550286769866943, "Pretrain/Step": 3970, "Pretrain/Step Time": 8.817765407264233} +{"Pretrain/Learning Rate": 3.284966362316568e-05, "Pretrain/Loss": 2.015657901763916, "Pretrain/Loss (Raw)": 1.8987672328948975, "Pretrain/Step": 3971, "Pretrain/Step Time": 8.822624415159225} +{"Pretrain/Learning Rate": 3.28416026522409e-05, "Pretrain/Loss": 2.0153656005859375, "Pretrain/Loss (Raw)": 1.9379727840423584, "Pretrain/Step": 3972, "Pretrain/Step Time": 8.82324042916298} +{"Pretrain/Learning Rate": 3.283354077698555e-05, "Pretrain/Loss": 2.0144917964935303, "Pretrain/Loss (Raw)": 2.0862228870391846, "Pretrain/Step": 3973, "Pretrain/Step Time": 8.821210777387023} +{"Pretrain/Learning Rate": 3.2825477998329366e-05, "Pretrain/Loss": 2.0140507221221924, "Pretrain/Loss (Raw)": 2.0113799571990967, "Pretrain/Step": 3974, "Pretrain/Step Time": 8.824647860601544} +{"Pretrain/Learning Rate": 3.281741431720219e-05, "Pretrain/Loss": 2.015157461166382, "Pretrain/Loss (Raw)": 2.0628035068511963, "Pretrain/Step": 3975, "Pretrain/Step Time": 8.819752281531692} +{"Pretrain/Learning Rate": 3.280934973453395e-05, "Pretrain/Loss": 2.0154128074645996, "Pretrain/Loss (Raw)": 2.1246464252471924, "Pretrain/Step": 3976, "Pretrain/Step Time": 8.823997784405947} +{"Pretrain/Learning Rate": 3.28012842512547e-05, "Pretrain/Loss": 2.017322540283203, "Pretrain/Loss (Raw)": 2.069840669631958, "Pretrain/Step": 3977, "Pretrain/Step Time": 8.822095131501555} +{"Pretrain/Learning Rate": 3.279321786829459e-05, "Pretrain/Loss": 2.019284248352051, "Pretrain/Loss (Raw)": 2.057128667831421, "Pretrain/Step": 3978, "Pretrain/Step Time": 8.823327004909515} +{"Pretrain/Learning Rate": 3.278515058658387e-05, "Pretrain/Loss": 2.0235910415649414, "Pretrain/Loss (Raw)": 2.3221940994262695, "Pretrain/Step": 3979, "Pretrain/Step Time": 8.830395927652717} +{"Pretrain/Learning Rate": 3.27770824070529e-05, "Pretrain/Loss": 2.0233869552612305, "Pretrain/Loss (Raw)": 1.9619711637496948, "Pretrain/Step": 3980, "Pretrain/Step Time": 8.834749531000853} +{"Pretrain/Learning Rate": 3.276901333063215e-05, "Pretrain/Loss": 2.022764205932617, "Pretrain/Loss (Raw)": 1.9994546175003052, "Pretrain/Step": 3981, "Pretrain/Step Time": 8.82810222916305} +{"Pretrain/Learning Rate": 3.276094335825217e-05, "Pretrain/Loss": 2.022451162338257, "Pretrain/Loss (Raw)": 2.0395963191986084, "Pretrain/Step": 3982, "Pretrain/Step Time": 8.830695539712906} +{"Pretrain/Learning Rate": 3.2752872490843626e-05, "Pretrain/Loss": 2.02116060256958, "Pretrain/Loss (Raw)": 1.9280595779418945, "Pretrain/Step": 3983, "Pretrain/Step Time": 8.825326768681407} +{"Pretrain/Learning Rate": 3.274480072933729e-05, "Pretrain/Loss": 2.0211715698242188, "Pretrain/Loss (Raw)": 1.8411383628845215, "Pretrain/Step": 3984, "Pretrain/Step Time": 8.815325355157256} +{"Pretrain/Learning Rate": 3.273672807466405e-05, "Pretrain/Loss": 2.0225727558135986, "Pretrain/Loss (Raw)": 2.1341969966888428, "Pretrain/Step": 3985, "Pretrain/Step Time": 8.816288318485022} +{"Pretrain/Learning Rate": 3.272865452775487e-05, "Pretrain/Loss": 2.0213005542755127, "Pretrain/Loss (Raw)": 2.0359086990356445, "Pretrain/Step": 3986, "Pretrain/Step Time": 8.816497717052698} +{"Pretrain/Learning Rate": 3.272058008954083e-05, "Pretrain/Loss": 2.022589683532715, "Pretrain/Loss (Raw)": 1.9856940507888794, "Pretrain/Step": 3987, "Pretrain/Step Time": 8.81637104228139} +{"Pretrain/Learning Rate": 3.271250476095311e-05, "Pretrain/Loss": 2.0213871002197266, "Pretrain/Loss (Raw)": 2.003309965133667, "Pretrain/Step": 3988, "Pretrain/Step Time": 8.818635480478406} +{"Pretrain/Learning Rate": 3.2704428542923e-05, "Pretrain/Loss": 2.0196452140808105, "Pretrain/Loss (Raw)": 1.962281584739685, "Pretrain/Step": 3989, "Pretrain/Step Time": 8.816894114017487} +{"Pretrain/Learning Rate": 3.269635143638188e-05, "Pretrain/Loss": 2.02010440826416, "Pretrain/Loss (Raw)": 2.0842061042785645, "Pretrain/Step": 3990, "Pretrain/Step Time": 8.817508233711123} +{"Pretrain/Learning Rate": 3.2688273442261255e-05, "Pretrain/Loss": 2.0202012062072754, "Pretrain/Loss (Raw)": 1.913891315460205, "Pretrain/Step": 3991, "Pretrain/Step Time": 8.816450027748942} +{"Pretrain/Learning Rate": 3.26801945614927e-05, "Pretrain/Loss": 2.019160270690918, "Pretrain/Loss (Raw)": 1.8978826999664307, "Pretrain/Step": 3992, "Pretrain/Step Time": 8.817118598148227} +{"Pretrain/Learning Rate": 3.2672114795007926e-05, "Pretrain/Loss": 2.018996238708496, "Pretrain/Loss (Raw)": 2.092761754989624, "Pretrain/Step": 3993, "Pretrain/Step Time": 8.819647124037147} +{"Pretrain/Learning Rate": 3.266403414373872e-05, "Pretrain/Loss": 2.0199713706970215, "Pretrain/Loss (Raw)": 1.9523383378982544, "Pretrain/Step": 3994, "Pretrain/Step Time": 8.823258323594928} +{"Pretrain/Learning Rate": 3.265595260861698e-05, "Pretrain/Loss": 2.019491672515869, "Pretrain/Loss (Raw)": 1.864080786705017, "Pretrain/Step": 3995, "Pretrain/Step Time": 8.819259693846107} +{"Pretrain/Learning Rate": 3.264787019057471e-05, "Pretrain/Loss": 2.02009916305542, "Pretrain/Loss (Raw)": 1.9811056852340698, "Pretrain/Step": 3996, "Pretrain/Step Time": 8.819965513423085} +{"Pretrain/Learning Rate": 3.2639786890544014e-05, "Pretrain/Loss": 2.0200071334838867, "Pretrain/Loss (Raw)": 2.124677896499634, "Pretrain/Step": 3997, "Pretrain/Step Time": 8.820061348378658} +{"Pretrain/Learning Rate": 3.263170270945709e-05, "Pretrain/Loss": 2.0209012031555176, "Pretrain/Loss (Raw)": 2.0118770599365234, "Pretrain/Step": 3998, "Pretrain/Step Time": 8.808358203619719} +{"Pretrain/Learning Rate": 3.262361764824625e-05, "Pretrain/Loss": 2.0183053016662598, "Pretrain/Loss (Raw)": 1.9457004070281982, "Pretrain/Step": 3999, "Pretrain/Step Time": 8.815941255539656} +{"Pretrain/Learning Rate": 3.26155317078439e-05, "Pretrain/Loss": 2.0160317420959473, "Pretrain/Loss (Raw)": 2.061465263366699, "Pretrain/Step": 4000, "Pretrain/Step Time": 8.812732007354498} +{"Pretrain/Learning Rate": 3.260744488918254e-05, "Pretrain/Loss": 2.012190341949463, "Pretrain/Loss (Raw)": 1.622546672821045, "Pretrain/Step": 4001, "Pretrain/Step Time": 8.809645229950547} +{"Pretrain/Learning Rate": 3.25993571931948e-05, "Pretrain/Loss": 2.0115814208984375, "Pretrain/Loss (Raw)": 2.0187783241271973, "Pretrain/Step": 4002, "Pretrain/Step Time": 8.814831275492907} +{"Pretrain/Learning Rate": 3.259126862081337e-05, "Pretrain/Loss": 2.0106453895568848, "Pretrain/Loss (Raw)": 1.970306158065796, "Pretrain/Step": 4003, "Pretrain/Step Time": 8.812315247952938} +{"Pretrain/Learning Rate": 3.258317917297108e-05, "Pretrain/Loss": 2.0119285583496094, "Pretrain/Loss (Raw)": 2.073178768157959, "Pretrain/Step": 4004, "Pretrain/Step Time": 8.810533175244927} +{"Pretrain/Learning Rate": 3.2575088850600826e-05, "Pretrain/Loss": 2.0150270462036133, "Pretrain/Loss (Raw)": 1.9919068813323975, "Pretrain/Step": 4005, "Pretrain/Step Time": 8.816263688728213} +{"Pretrain/Learning Rate": 3.2566997654635634e-05, "Pretrain/Loss": 2.012571334838867, "Pretrain/Loss (Raw)": 1.745800256729126, "Pretrain/Step": 4006, "Pretrain/Step Time": 8.80995012074709} +{"Pretrain/Learning Rate": 3.2558905586008616e-05, "Pretrain/Loss": 2.01312518119812, "Pretrain/Loss (Raw)": 2.113821268081665, "Pretrain/Step": 4007, "Pretrain/Step Time": 8.807514002546668} +{"Pretrain/Learning Rate": 3.2550812645652985e-05, "Pretrain/Loss": 2.0155298709869385, "Pretrain/Loss (Raw)": 1.999205231666565, "Pretrain/Step": 4008, "Pretrain/Step Time": 8.808523423969746} +{"Pretrain/Learning Rate": 3.2542718834502056e-05, "Pretrain/Loss": 2.0168044567108154, "Pretrain/Loss (Raw)": 2.1699228286743164, "Pretrain/Step": 4009, "Pretrain/Step Time": 8.808774940669537} +{"Pretrain/Learning Rate": 3.253462415348926e-05, "Pretrain/Loss": 2.0153775215148926, "Pretrain/Loss (Raw)": 1.866594672203064, "Pretrain/Step": 4010, "Pretrain/Step Time": 8.807940017431974} +{"Pretrain/Learning Rate": 3.252652860354809e-05, "Pretrain/Loss": 2.010352373123169, "Pretrain/Loss (Raw)": 1.4983999729156494, "Pretrain/Step": 4011, "Pretrain/Step Time": 8.813853055238724} +{"Pretrain/Learning Rate": 3.2518432185612184e-05, "Pretrain/Loss": 2.0105464458465576, "Pretrain/Loss (Raw)": 2.0755422115325928, "Pretrain/Step": 4012, "Pretrain/Step Time": 8.811610516160727} +{"Pretrain/Learning Rate": 3.2510334900615254e-05, "Pretrain/Loss": 2.0118448734283447, "Pretrain/Loss (Raw)": 2.0496914386749268, "Pretrain/Step": 4013, "Pretrain/Step Time": 8.817594001069665} +{"Pretrain/Learning Rate": 3.25022367494911e-05, "Pretrain/Loss": 2.0114903450012207, "Pretrain/Loss (Raw)": 2.0196917057037354, "Pretrain/Step": 4014, "Pretrain/Step Time": 8.814776392653584} +{"Pretrain/Learning Rate": 3.2494137733173666e-05, "Pretrain/Loss": 2.0106780529022217, "Pretrain/Loss (Raw)": 2.0182087421417236, "Pretrain/Step": 4015, "Pretrain/Step Time": 8.80773962289095} +{"Pretrain/Learning Rate": 3.2486037852596946e-05, "Pretrain/Loss": 2.0115561485290527, "Pretrain/Loss (Raw)": 1.9367512464523315, "Pretrain/Step": 4016, "Pretrain/Step Time": 8.811407456174493} +{"Pretrain/Learning Rate": 3.247793710869507e-05, "Pretrain/Loss": 2.0090880393981934, "Pretrain/Loss (Raw)": 1.659597396850586, "Pretrain/Step": 4017, "Pretrain/Step Time": 8.806424595415592} +{"Pretrain/Learning Rate": 3.2469835502402246e-05, "Pretrain/Loss": 2.0104892253875732, "Pretrain/Loss (Raw)": 2.083951711654663, "Pretrain/Step": 4018, "Pretrain/Step Time": 8.809088300913572} +{"Pretrain/Learning Rate": 3.2461733034652794e-05, "Pretrain/Loss": 2.008452892303467, "Pretrain/Loss (Raw)": 1.7399346828460693, "Pretrain/Step": 4019, "Pretrain/Step Time": 8.81037979759276} +{"Pretrain/Learning Rate": 3.245362970638113e-05, "Pretrain/Loss": 2.010221004486084, "Pretrain/Loss (Raw)": 2.0592215061187744, "Pretrain/Step": 4020, "Pretrain/Step Time": 8.811407674103975} +{"Pretrain/Learning Rate": 3.244552551852176e-05, "Pretrain/Loss": 2.0116615295410156, "Pretrain/Loss (Raw)": 2.2386715412139893, "Pretrain/Step": 4021, "Pretrain/Step Time": 8.811804806813598} +{"Pretrain/Learning Rate": 3.24374204720093e-05, "Pretrain/Loss": 2.010746955871582, "Pretrain/Loss (Raw)": 1.8432395458221436, "Pretrain/Step": 4022, "Pretrain/Step Time": 8.806857407093048} +{"Pretrain/Learning Rate": 3.242931456777848e-05, "Pretrain/Loss": 2.01059889793396, "Pretrain/Loss (Raw)": 1.9260563850402832, "Pretrain/Step": 4023, "Pretrain/Step Time": 8.809357220306993} +{"Pretrain/Learning Rate": 3.242120780676408e-05, "Pretrain/Loss": 2.0116448402404785, "Pretrain/Loss (Raw)": 2.1808109283447266, "Pretrain/Step": 4024, "Pretrain/Step Time": 8.802784750238061} +{"Pretrain/Learning Rate": 3.2413100189901036e-05, "Pretrain/Loss": 2.010204553604126, "Pretrain/Loss (Raw)": 2.1614253520965576, "Pretrain/Step": 4025, "Pretrain/Step Time": 8.802111512050033} +{"Pretrain/Learning Rate": 3.2404991718124346e-05, "Pretrain/Loss": 2.010003089904785, "Pretrain/Loss (Raw)": 1.9990826845169067, "Pretrain/Step": 4026, "Pretrain/Step Time": 8.801018783822656} +{"Pretrain/Learning Rate": 3.239688239236911e-05, "Pretrain/Loss": 2.009993553161621, "Pretrain/Loss (Raw)": 2.081273317337036, "Pretrain/Step": 4027, "Pretrain/Step Time": 8.806877875700593} +{"Pretrain/Learning Rate": 3.238877221357054e-05, "Pretrain/Loss": 2.0096116065979004, "Pretrain/Loss (Raw)": 1.7964057922363281, "Pretrain/Step": 4028, "Pretrain/Step Time": 8.798958031460643} +{"Pretrain/Learning Rate": 3.2380661182663956e-05, "Pretrain/Loss": 2.01070499420166, "Pretrain/Loss (Raw)": 2.1090939044952393, "Pretrain/Step": 4029, "Pretrain/Step Time": 8.800354244187474} +{"Pretrain/Learning Rate": 3.237254930058474e-05, "Pretrain/Loss": 2.01409912109375, "Pretrain/Loss (Raw)": 2.273130178451538, "Pretrain/Step": 4030, "Pretrain/Step Time": 8.797232188284397} +{"Pretrain/Learning Rate": 3.236443656826839e-05, "Pretrain/Loss": 2.014469623565674, "Pretrain/Loss (Raw)": 1.9791934490203857, "Pretrain/Step": 4031, "Pretrain/Step Time": 8.8020065035671} +{"Pretrain/Learning Rate": 3.235632298665052e-05, "Pretrain/Loss": 2.01296329498291, "Pretrain/Loss (Raw)": 2.1406633853912354, "Pretrain/Step": 4032, "Pretrain/Step Time": 8.80311550758779} +{"Pretrain/Learning Rate": 3.234820855666681e-05, "Pretrain/Loss": 2.010378122329712, "Pretrain/Loss (Raw)": 1.9574378728866577, "Pretrain/Step": 4033, "Pretrain/Step Time": 8.803621586412191} +{"Pretrain/Learning Rate": 3.234009327925308e-05, "Pretrain/Loss": 2.008784770965576, "Pretrain/Loss (Raw)": 2.1562623977661133, "Pretrain/Step": 4034, "Pretrain/Step Time": 8.793596157804132} +{"Pretrain/Learning Rate": 3.23319771553452e-05, "Pretrain/Loss": 2.006944417953491, "Pretrain/Loss (Raw)": 1.8520934581756592, "Pretrain/Step": 4035, "Pretrain/Step Time": 8.794523041695356} +{"Pretrain/Learning Rate": 3.232386018587916e-05, "Pretrain/Loss": 2.0053772926330566, "Pretrain/Loss (Raw)": 1.8855249881744385, "Pretrain/Step": 4036, "Pretrain/Step Time": 8.79862143099308} +{"Pretrain/Learning Rate": 3.2315742371791046e-05, "Pretrain/Loss": 2.0037920475006104, "Pretrain/Loss (Raw)": 1.7845381498336792, "Pretrain/Step": 4037, "Pretrain/Step Time": 8.800686724483967} +{"Pretrain/Learning Rate": 3.230762371401705e-05, "Pretrain/Loss": 2.0042624473571777, "Pretrain/Loss (Raw)": 2.0489799976348877, "Pretrain/Step": 4038, "Pretrain/Step Time": 8.802110202610493} +{"Pretrain/Learning Rate": 3.2299504213493464e-05, "Pretrain/Loss": 2.002790927886963, "Pretrain/Loss (Raw)": 2.0418217182159424, "Pretrain/Step": 4039, "Pretrain/Step Time": 8.799051327630877} +{"Pretrain/Learning Rate": 3.229138387115665e-05, "Pretrain/Loss": 2.00268816947937, "Pretrain/Loss (Raw)": 1.9441494941711426, "Pretrain/Step": 4040, "Pretrain/Step Time": 8.800887009128928} +{"Pretrain/Learning Rate": 3.228326268794309e-05, "Pretrain/Loss": 2.0025248527526855, "Pretrain/Loss (Raw)": 2.0074028968811035, "Pretrain/Step": 4041, "Pretrain/Step Time": 8.806789373978972} +{"Pretrain/Learning Rate": 3.227514066478936e-05, "Pretrain/Loss": 2.0011682510375977, "Pretrain/Loss (Raw)": 1.8999125957489014, "Pretrain/Step": 4042, "Pretrain/Step Time": 8.807457778602839} +{"Pretrain/Learning Rate": 3.226701780263212e-05, "Pretrain/Loss": 2.0035336017608643, "Pretrain/Loss (Raw)": 2.2141377925872803, "Pretrain/Step": 4043, "Pretrain/Step Time": 8.795589478686452} +{"Pretrain/Learning Rate": 3.225889410240815e-05, "Pretrain/Loss": 2.0018410682678223, "Pretrain/Loss (Raw)": 1.9553550481796265, "Pretrain/Step": 4044, "Pretrain/Step Time": 8.799383318051696} +{"Pretrain/Learning Rate": 3.2250769565054305e-05, "Pretrain/Loss": 2.0025880336761475, "Pretrain/Loss (Raw)": 2.1079156398773193, "Pretrain/Step": 4045, "Pretrain/Step Time": 8.798725046217442} +{"Pretrain/Learning Rate": 3.2242644191507545e-05, "Pretrain/Loss": 2.002565383911133, "Pretrain/Loss (Raw)": 1.997347354888916, "Pretrain/Step": 4046, "Pretrain/Step Time": 8.802178023383021} +{"Pretrain/Learning Rate": 3.223451798270493e-05, "Pretrain/Loss": 1.9993698596954346, "Pretrain/Loss (Raw)": 1.7105038166046143, "Pretrain/Step": 4047, "Pretrain/Step Time": 8.793247183784842} +{"Pretrain/Learning Rate": 3.222639093958361e-05, "Pretrain/Loss": 1.9973342418670654, "Pretrain/Loss (Raw)": 1.8797636032104492, "Pretrain/Step": 4048, "Pretrain/Step Time": 8.808747619390488} +{"Pretrain/Learning Rate": 3.2218263063080836e-05, "Pretrain/Loss": 1.9981355667114258, "Pretrain/Loss (Raw)": 2.01639986038208, "Pretrain/Step": 4049, "Pretrain/Step Time": 8.808553475886583} +{"Pretrain/Learning Rate": 3.221013435413395e-05, "Pretrain/Loss": 1.9980660676956177, "Pretrain/Loss (Raw)": 2.0031521320343018, "Pretrain/Step": 4050, "Pretrain/Step Time": 8.803032448515296} +{"Pretrain/Learning Rate": 3.220200481368039e-05, "Pretrain/Loss": 1.9962849617004395, "Pretrain/Loss (Raw)": 1.851971983909607, "Pretrain/Step": 4051, "Pretrain/Step Time": 8.80719168484211} +{"Pretrain/Learning Rate": 3.219387444265771e-05, "Pretrain/Loss": 1.9971659183502197, "Pretrain/Loss (Raw)": 2.0964300632476807, "Pretrain/Step": 4052, "Pretrain/Step Time": 8.810859320685267} +{"Pretrain/Learning Rate": 3.2185743242003524e-05, "Pretrain/Loss": 1.9971593618392944, "Pretrain/Loss (Raw)": 1.9955884218215942, "Pretrain/Step": 4053, "Pretrain/Step Time": 8.810390282422304} +{"Pretrain/Learning Rate": 3.217761121265557e-05, "Pretrain/Loss": 1.9969537258148193, "Pretrain/Loss (Raw)": 2.0039284229278564, "Pretrain/Step": 4054, "Pretrain/Step Time": 8.811814678832889} +{"Pretrain/Learning Rate": 3.2169478355551665e-05, "Pretrain/Loss": 1.9969919919967651, "Pretrain/Loss (Raw)": 2.0621683597564697, "Pretrain/Step": 4055, "Pretrain/Step Time": 8.81282825767994} +{"Pretrain/Learning Rate": 3.216134467162973e-05, "Pretrain/Loss": 1.99735426902771, "Pretrain/Loss (Raw)": 2.197173833847046, "Pretrain/Step": 4056, "Pretrain/Step Time": 8.81018647365272} +{"Pretrain/Learning Rate": 3.215321016182779e-05, "Pretrain/Loss": 1.998977780342102, "Pretrain/Loss (Raw)": 2.189894437789917, "Pretrain/Step": 4057, "Pretrain/Step Time": 8.816666346043348} +{"Pretrain/Learning Rate": 3.2145074827083946e-05, "Pretrain/Loss": 1.9994131326675415, "Pretrain/Loss (Raw)": 2.0403780937194824, "Pretrain/Step": 4058, "Pretrain/Step Time": 8.815043115988374} +{"Pretrain/Learning Rate": 3.21369386683364e-05, "Pretrain/Loss": 1.9985201358795166, "Pretrain/Loss (Raw)": 1.9937843084335327, "Pretrain/Step": 4059, "Pretrain/Step Time": 8.813653726130724} +{"Pretrain/Learning Rate": 3.212880168652346e-05, "Pretrain/Loss": 1.9967992305755615, "Pretrain/Loss (Raw)": 1.9230225086212158, "Pretrain/Step": 4060, "Pretrain/Step Time": 8.814560672268271} +{"Pretrain/Learning Rate": 3.2120663882583514e-05, "Pretrain/Loss": 1.9932823181152344, "Pretrain/Loss (Raw)": 2.0279741287231445, "Pretrain/Step": 4061, "Pretrain/Step Time": 8.812042731791735} +{"Pretrain/Learning Rate": 3.2112525257455064e-05, "Pretrain/Loss": 1.9896693229675293, "Pretrain/Loss (Raw)": 1.690871238708496, "Pretrain/Step": 4062, "Pretrain/Step Time": 8.810954289510846} +{"Pretrain/Learning Rate": 3.210438581207667e-05, "Pretrain/Loss": 1.9942724704742432, "Pretrain/Loss (Raw)": 2.2935233116149902, "Pretrain/Step": 4063, "Pretrain/Step Time": 8.805048311129212} +{"Pretrain/Learning Rate": 3.209624554738704e-05, "Pretrain/Loss": 1.9938255548477173, "Pretrain/Loss (Raw)": 2.069039821624756, "Pretrain/Step": 4064, "Pretrain/Step Time": 8.802440578117967} +{"Pretrain/Learning Rate": 3.208810446432493e-05, "Pretrain/Loss": 1.9919828176498413, "Pretrain/Loss (Raw)": 1.842301368713379, "Pretrain/Step": 4065, "Pretrain/Step Time": 8.804144760593772} +{"Pretrain/Learning Rate": 3.207996256382922e-05, "Pretrain/Loss": 1.9911011457443237, "Pretrain/Loss (Raw)": 2.0150437355041504, "Pretrain/Step": 4066, "Pretrain/Step Time": 8.803237345069647} +{"Pretrain/Learning Rate": 3.207181984683886e-05, "Pretrain/Loss": 1.9913451671600342, "Pretrain/Loss (Raw)": 2.1735689640045166, "Pretrain/Step": 4067, "Pretrain/Step Time": 8.814899493008852} +{"Pretrain/Learning Rate": 3.2063676314292914e-05, "Pretrain/Loss": 1.99310302734375, "Pretrain/Loss (Raw)": 1.9938292503356934, "Pretrain/Step": 4068, "Pretrain/Step Time": 8.8212506249547} +{"Pretrain/Learning Rate": 3.205553196713052e-05, "Pretrain/Loss": 1.9940900802612305, "Pretrain/Loss (Raw)": 2.1455342769622803, "Pretrain/Step": 4069, "Pretrain/Step Time": 8.815252339467406} +{"Pretrain/Learning Rate": 3.204738680629094e-05, "Pretrain/Loss": 1.994864583015442, "Pretrain/Loss (Raw)": 2.037864923477173, "Pretrain/Step": 4070, "Pretrain/Step Time": 8.818809017539024} +{"Pretrain/Learning Rate": 3.2039240832713516e-05, "Pretrain/Loss": 1.9933242797851562, "Pretrain/Loss (Raw)": 1.8931488990783691, "Pretrain/Step": 4071, "Pretrain/Step Time": 8.814125521108508} +{"Pretrain/Learning Rate": 3.203109404733765e-05, "Pretrain/Loss": 1.994455337524414, "Pretrain/Loss (Raw)": 2.0889241695404053, "Pretrain/Step": 4072, "Pretrain/Step Time": 8.817171327769756} +{"Pretrain/Learning Rate": 3.20229464511029e-05, "Pretrain/Loss": 1.9961705207824707, "Pretrain/Loss (Raw)": 2.0946028232574463, "Pretrain/Step": 4073, "Pretrain/Step Time": 8.813670467585325} +{"Pretrain/Learning Rate": 3.2014798044948866e-05, "Pretrain/Loss": 1.996925950050354, "Pretrain/Loss (Raw)": 2.0860495567321777, "Pretrain/Step": 4074, "Pretrain/Step Time": 8.81114269606769} +{"Pretrain/Learning Rate": 3.2006648829815265e-05, "Pretrain/Loss": 1.9996657371520996, "Pretrain/Loss (Raw)": 2.0286219120025635, "Pretrain/Step": 4075, "Pretrain/Step Time": 8.813146973028779} +{"Pretrain/Learning Rate": 3.1998498806641907e-05, "Pretrain/Loss": 1.9970213174819946, "Pretrain/Loss (Raw)": 1.9973537921905518, "Pretrain/Step": 4076, "Pretrain/Step Time": 8.80041678622365} +{"Pretrain/Learning Rate": 3.19903479763687e-05, "Pretrain/Loss": 1.9980275630950928, "Pretrain/Loss (Raw)": 1.784223198890686, "Pretrain/Step": 4077, "Pretrain/Step Time": 8.800094665959477} +{"Pretrain/Learning Rate": 3.19821963399356e-05, "Pretrain/Loss": 1.997576355934143, "Pretrain/Loss (Raw)": 2.0511276721954346, "Pretrain/Step": 4078, "Pretrain/Step Time": 8.800016425549984} +{"Pretrain/Learning Rate": 3.1974043898282744e-05, "Pretrain/Loss": 1.9937365055084229, "Pretrain/Loss (Raw)": 1.7311092615127563, "Pretrain/Step": 4079, "Pretrain/Step Time": 8.805684793740511} +{"Pretrain/Learning Rate": 3.196589065235026e-05, "Pretrain/Loss": 1.9928197860717773, "Pretrain/Loss (Raw)": 1.94461190700531, "Pretrain/Step": 4080, "Pretrain/Step Time": 8.80345168337226} +{"Pretrain/Learning Rate": 3.195773660307846e-05, "Pretrain/Loss": 1.9916540384292603, "Pretrain/Loss (Raw)": 1.9303537607192993, "Pretrain/Step": 4081, "Pretrain/Step Time": 8.800357250496745} +{"Pretrain/Learning Rate": 3.1949581751407676e-05, "Pretrain/Loss": 1.993039846420288, "Pretrain/Loss (Raw)": 2.2018048763275146, "Pretrain/Step": 4082, "Pretrain/Step Time": 8.805040577426553} +{"Pretrain/Learning Rate": 3.1941426098278383e-05, "Pretrain/Loss": 1.9956960678100586, "Pretrain/Loss (Raw)": 2.3090691566467285, "Pretrain/Step": 4083, "Pretrain/Step Time": 8.809342332184315} +{"Pretrain/Learning Rate": 3.193326964463112e-05, "Pretrain/Loss": 1.9945297241210938, "Pretrain/Loss (Raw)": 1.9129983186721802, "Pretrain/Step": 4084, "Pretrain/Step Time": 8.804581984877586} +{"Pretrain/Learning Rate": 3.192511239140653e-05, "Pretrain/Loss": 1.9929184913635254, "Pretrain/Loss (Raw)": 1.9274744987487793, "Pretrain/Step": 4085, "Pretrain/Step Time": 8.804501699283719} +{"Pretrain/Learning Rate": 3.1916954339545355e-05, "Pretrain/Loss": 1.9935146570205688, "Pretrain/Loss (Raw)": 1.9571856260299683, "Pretrain/Step": 4086, "Pretrain/Step Time": 8.806660989299417} +{"Pretrain/Learning Rate": 3.19087954899884e-05, "Pretrain/Loss": 1.9890282154083252, "Pretrain/Loss (Raw)": 1.461463212966919, "Pretrain/Step": 4087, "Pretrain/Step Time": 8.80629044212401} +{"Pretrain/Learning Rate": 3.190063584367661e-05, "Pretrain/Loss": 1.98789644241333, "Pretrain/Loss (Raw)": 1.7296311855316162, "Pretrain/Step": 4088, "Pretrain/Step Time": 8.81124198436737} +{"Pretrain/Learning Rate": 3.1892475401550956e-05, "Pretrain/Loss": 1.9878180027008057, "Pretrain/Loss (Raw)": 2.097050428390503, "Pretrain/Step": 4089, "Pretrain/Step Time": 8.813770340755582} +{"Pretrain/Learning Rate": 3.1884314164552576e-05, "Pretrain/Loss": 1.9878828525543213, "Pretrain/Loss (Raw)": 1.9511276483535767, "Pretrain/Step": 4090, "Pretrain/Step Time": 8.802149271592498} +{"Pretrain/Learning Rate": 3.187615213362264e-05, "Pretrain/Loss": 1.9849228858947754, "Pretrain/Loss (Raw)": 1.8706883192062378, "Pretrain/Step": 4091, "Pretrain/Step Time": 8.80055558308959} +{"Pretrain/Learning Rate": 3.186798930970244e-05, "Pretrain/Loss": 1.9851007461547852, "Pretrain/Loss (Raw)": 2.0290894508361816, "Pretrain/Step": 4092, "Pretrain/Step Time": 8.795421740040183} +{"Pretrain/Learning Rate": 3.185982569373335e-05, "Pretrain/Loss": 1.9858933687210083, "Pretrain/Loss (Raw)": 1.9745573997497559, "Pretrain/Step": 4093, "Pretrain/Step Time": 8.79799829237163} +{"Pretrain/Learning Rate": 3.185166128665684e-05, "Pretrain/Loss": 1.9882515668869019, "Pretrain/Loss (Raw)": 2.210765838623047, "Pretrain/Step": 4094, "Pretrain/Step Time": 8.803860543295741} +{"Pretrain/Learning Rate": 3.184349608941446e-05, "Pretrain/Loss": 1.9857653379440308, "Pretrain/Loss (Raw)": 1.820294737815857, "Pretrain/Step": 4095, "Pretrain/Step Time": 8.8069580886513} +{"Pretrain/Learning Rate": 3.183533010294787e-05, "Pretrain/Loss": 1.983506202697754, "Pretrain/Loss (Raw)": 1.6647368669509888, "Pretrain/Step": 4096, "Pretrain/Step Time": 8.80672038719058} +{"Pretrain/Learning Rate": 3.18271633281988e-05, "Pretrain/Loss": 1.9859603643417358, "Pretrain/Loss (Raw)": 1.9585931301116943, "Pretrain/Step": 4097, "Pretrain/Step Time": 8.807175401598215} +{"Pretrain/Learning Rate": 3.181899576610908e-05, "Pretrain/Loss": 1.989701747894287, "Pretrain/Loss (Raw)": 2.033914089202881, "Pretrain/Step": 4098, "Pretrain/Step Time": 8.808387134224176} +{"Pretrain/Learning Rate": 3.1810827417620634e-05, "Pretrain/Loss": 1.9909846782684326, "Pretrain/Loss (Raw)": 2.0629806518554688, "Pretrain/Step": 4099, "Pretrain/Step Time": 8.795978033915162} +{"Pretrain/Learning Rate": 3.1802658283675486e-05, "Pretrain/Loss": 1.9925599098205566, "Pretrain/Loss (Raw)": 2.139613389968872, "Pretrain/Step": 4100, "Pretrain/Step Time": 8.79912082850933} +{"Pretrain/Learning Rate": 3.179448836521573e-05, "Pretrain/Loss": 1.9937011003494263, "Pretrain/Loss (Raw)": 2.232283353805542, "Pretrain/Step": 4101, "Pretrain/Step Time": 8.799322685226798} +{"Pretrain/Learning Rate": 3.178631766318355e-05, "Pretrain/Loss": 1.9929296970367432, "Pretrain/Loss (Raw)": 1.9126408100128174, "Pretrain/Step": 4102, "Pretrain/Step Time": 8.80181503854692} +{"Pretrain/Learning Rate": 3.177814617852124e-05, "Pretrain/Loss": 1.9940814971923828, "Pretrain/Loss (Raw)": 2.2102370262145996, "Pretrain/Step": 4103, "Pretrain/Step Time": 8.804495992138982} +{"Pretrain/Learning Rate": 3.176997391217117e-05, "Pretrain/Loss": 1.9902948141098022, "Pretrain/Loss (Raw)": 1.6399567127227783, "Pretrain/Step": 4104, "Pretrain/Step Time": 8.805407457053661} +{"Pretrain/Learning Rate": 3.176180086507582e-05, "Pretrain/Loss": 1.9904625415802002, "Pretrain/Loss (Raw)": 2.0913102626800537, "Pretrain/Step": 4105, "Pretrain/Step Time": 8.806004468351603} +{"Pretrain/Learning Rate": 3.175362703817773e-05, "Pretrain/Loss": 1.9901962280273438, "Pretrain/Loss (Raw)": 2.023041248321533, "Pretrain/Step": 4106, "Pretrain/Step Time": 8.81010265648365} +{"Pretrain/Learning Rate": 3.1745452432419534e-05, "Pretrain/Loss": 1.9834880828857422, "Pretrain/Loss (Raw)": 1.4635376930236816, "Pretrain/Step": 4107, "Pretrain/Step Time": 8.798527840524912} +{"Pretrain/Learning Rate": 3.1737277048743984e-05, "Pretrain/Loss": 1.9851738214492798, "Pretrain/Loss (Raw)": 2.1777637004852295, "Pretrain/Step": 4108, "Pretrain/Step Time": 8.792814107611775} +{"Pretrain/Learning Rate": 3.17291008880939e-05, "Pretrain/Loss": 1.9857213497161865, "Pretrain/Loss (Raw)": 2.06952166557312, "Pretrain/Step": 4109, "Pretrain/Step Time": 8.794291136786342} +{"Pretrain/Learning Rate": 3.172092395141219e-05, "Pretrain/Loss": 1.985982894897461, "Pretrain/Loss (Raw)": 2.0730838775634766, "Pretrain/Step": 4110, "Pretrain/Step Time": 8.789449637755752} +{"Pretrain/Learning Rate": 3.171274623964186e-05, "Pretrain/Loss": 1.9834704399108887, "Pretrain/Loss (Raw)": 1.6064738035202026, "Pretrain/Step": 4111, "Pretrain/Step Time": 8.792888171970844} +{"Pretrain/Learning Rate": 3.170456775372601e-05, "Pretrain/Loss": 1.9841954708099365, "Pretrain/Loss (Raw)": 1.9339491128921509, "Pretrain/Step": 4112, "Pretrain/Step Time": 8.796917501837015} +{"Pretrain/Learning Rate": 3.1696388494607804e-05, "Pretrain/Loss": 1.9848918914794922, "Pretrain/Loss (Raw)": 2.2233331203460693, "Pretrain/Step": 4113, "Pretrain/Step Time": 8.79359320551157} +{"Pretrain/Learning Rate": 3.168820846323053e-05, "Pretrain/Loss": 1.98458731174469, "Pretrain/Loss (Raw)": 1.996915578842163, "Pretrain/Step": 4114, "Pretrain/Step Time": 8.795940415933728} +{"Pretrain/Learning Rate": 3.1680027660537524e-05, "Pretrain/Loss": 1.9841554164886475, "Pretrain/Loss (Raw)": 1.930407166481018, "Pretrain/Step": 4115, "Pretrain/Step Time": 8.795271325856447} +{"Pretrain/Learning Rate": 3.167184608747227e-05, "Pretrain/Loss": 1.9841837882995605, "Pretrain/Loss (Raw)": 2.0069618225097656, "Pretrain/Step": 4116, "Pretrain/Step Time": 8.794771866872907} +{"Pretrain/Learning Rate": 3.1663663744978276e-05, "Pretrain/Loss": 1.9837075471878052, "Pretrain/Loss (Raw)": 1.9012973308563232, "Pretrain/Step": 4117, "Pretrain/Step Time": 8.793826406821609} +{"Pretrain/Learning Rate": 3.165548063399919e-05, "Pretrain/Loss": 1.9803781509399414, "Pretrain/Loss (Raw)": 1.6580569744110107, "Pretrain/Step": 4118, "Pretrain/Step Time": 8.794561546295881} +{"Pretrain/Learning Rate": 3.1647296755478694e-05, "Pretrain/Loss": 1.982043743133545, "Pretrain/Loss (Raw)": 2.127087354660034, "Pretrain/Step": 4119, "Pretrain/Step Time": 8.79084587842226} +{"Pretrain/Learning Rate": 3.163911211036063e-05, "Pretrain/Loss": 1.9832956790924072, "Pretrain/Loss (Raw)": 2.058135509490967, "Pretrain/Step": 4120, "Pretrain/Step Time": 8.788534140214324} +{"Pretrain/Learning Rate": 3.163092669958887e-05, "Pretrain/Loss": 1.9823222160339355, "Pretrain/Loss (Raw)": 1.9681519269943237, "Pretrain/Step": 4121, "Pretrain/Step Time": 8.78636321797967} +{"Pretrain/Learning Rate": 3.16227405241074e-05, "Pretrain/Loss": 1.9816310405731201, "Pretrain/Loss (Raw)": 1.8638561964035034, "Pretrain/Step": 4122, "Pretrain/Step Time": 8.779353404417634} +{"Pretrain/Learning Rate": 3.161455358486028e-05, "Pretrain/Loss": 1.9829380512237549, "Pretrain/Loss (Raw)": 2.0313985347747803, "Pretrain/Step": 4123, "Pretrain/Step Time": 8.7771115899086} +{"Pretrain/Learning Rate": 3.160636588279167e-05, "Pretrain/Loss": 1.9843147993087769, "Pretrain/Loss (Raw)": 2.157334566116333, "Pretrain/Step": 4124, "Pretrain/Step Time": 8.778081139549613} +{"Pretrain/Learning Rate": 3.159817741884582e-05, "Pretrain/Loss": 1.9842382669448853, "Pretrain/Loss (Raw)": 2.114863157272339, "Pretrain/Step": 4125, "Pretrain/Step Time": 8.77542189694941} +{"Pretrain/Learning Rate": 3.1589988193967056e-05, "Pretrain/Loss": 1.9852941036224365, "Pretrain/Loss (Raw)": 2.1470305919647217, "Pretrain/Step": 4126, "Pretrain/Step Time": 8.779348781332374} +{"Pretrain/Learning Rate": 3.15817982090998e-05, "Pretrain/Loss": 1.9856433868408203, "Pretrain/Loss (Raw)": 1.9904032945632935, "Pretrain/Step": 4127, "Pretrain/Step Time": 8.778363823890686} +{"Pretrain/Learning Rate": 3.157360746518857e-05, "Pretrain/Loss": 1.986566424369812, "Pretrain/Loss (Raw)": 2.1796257495880127, "Pretrain/Step": 4128, "Pretrain/Step Time": 8.778208240866661} +{"Pretrain/Learning Rate": 3.1565415963177944e-05, "Pretrain/Loss": 1.9899959564208984, "Pretrain/Loss (Raw)": 2.061521291732788, "Pretrain/Step": 4129, "Pretrain/Step Time": 8.782356642186642} +{"Pretrain/Learning Rate": 3.1557223704012606e-05, "Pretrain/Loss": 1.989274263381958, "Pretrain/Loss (Raw)": 1.9263887405395508, "Pretrain/Step": 4130, "Pretrain/Step Time": 8.774365846067667} +{"Pretrain/Learning Rate": 3.154903068863734e-05, "Pretrain/Loss": 1.9881293773651123, "Pretrain/Loss (Raw)": 1.8237818479537964, "Pretrain/Step": 4131, "Pretrain/Step Time": 8.776229111477733} +{"Pretrain/Learning Rate": 3.154083691799699e-05, "Pretrain/Loss": 1.9887111186981201, "Pretrain/Loss (Raw)": 2.1476364135742188, "Pretrain/Step": 4132, "Pretrain/Step Time": 8.778118474408984} +{"Pretrain/Learning Rate": 3.1532642393036506e-05, "Pretrain/Loss": 1.9850540161132812, "Pretrain/Loss (Raw)": 1.5237836837768555, "Pretrain/Step": 4133, "Pretrain/Step Time": 8.77288718521595} +{"Pretrain/Learning Rate": 3.1524447114700914e-05, "Pretrain/Loss": 1.9873661994934082, "Pretrain/Loss (Raw)": 2.0417673587799072, "Pretrain/Step": 4134, "Pretrain/Step Time": 8.77334233187139} +{"Pretrain/Learning Rate": 3.151625108393534e-05, "Pretrain/Loss": 1.9866559505462646, "Pretrain/Loss (Raw)": 2.022914409637451, "Pretrain/Step": 4135, "Pretrain/Step Time": 8.77104433439672} +{"Pretrain/Learning Rate": 3.150805430168499e-05, "Pretrain/Loss": 1.9865442514419556, "Pretrain/Loss (Raw)": 1.9849028587341309, "Pretrain/Step": 4136, "Pretrain/Step Time": 8.767790647223592} +{"Pretrain/Learning Rate": 3.149985676889515e-05, "Pretrain/Loss": 1.9845359325408936, "Pretrain/Loss (Raw)": 1.9128496646881104, "Pretrain/Step": 4137, "Pretrain/Step Time": 8.766103081405163} +{"Pretrain/Learning Rate": 3.14916584865112e-05, "Pretrain/Loss": 1.9832603931427002, "Pretrain/Loss (Raw)": 1.7033286094665527, "Pretrain/Step": 4138, "Pretrain/Step Time": 8.761431926861405} +{"Pretrain/Learning Rate": 3.1483459455478603e-05, "Pretrain/Loss": 1.9868706464767456, "Pretrain/Loss (Raw)": 1.9605202674865723, "Pretrain/Step": 4139, "Pretrain/Step Time": 8.754303490743041} +{"Pretrain/Learning Rate": 3.147525967674291e-05, "Pretrain/Loss": 1.9869271516799927, "Pretrain/Loss (Raw)": 2.0827760696411133, "Pretrain/Step": 4140, "Pretrain/Step Time": 8.756163567304611} +{"Pretrain/Learning Rate": 3.146705915124976e-05, "Pretrain/Loss": 1.9856271743774414, "Pretrain/Loss (Raw)": 1.8832883834838867, "Pretrain/Step": 4141, "Pretrain/Step Time": 8.753230454400182} +{"Pretrain/Learning Rate": 3.145885787994487e-05, "Pretrain/Loss": 1.9861481189727783, "Pretrain/Loss (Raw)": 2.0863921642303467, "Pretrain/Step": 4142, "Pretrain/Step Time": 8.756342785432935} +{"Pretrain/Learning Rate": 3.1450655863774056e-05, "Pretrain/Loss": 1.9855670928955078, "Pretrain/Loss (Raw)": 1.943821668624878, "Pretrain/Step": 4143, "Pretrain/Step Time": 8.759149689227343} +{"Pretrain/Learning Rate": 3.144245310368321e-05, "Pretrain/Loss": 1.9865046739578247, "Pretrain/Loss (Raw)": 2.056776285171509, "Pretrain/Step": 4144, "Pretrain/Step Time": 8.752532068639994} +{"Pretrain/Learning Rate": 3.1434249600618315e-05, "Pretrain/Loss": 1.989626169204712, "Pretrain/Loss (Raw)": 2.0591259002685547, "Pretrain/Step": 4145, "Pretrain/Step Time": 8.752675028517842} +{"Pretrain/Learning Rate": 3.142604535552544e-05, "Pretrain/Loss": 1.9890916347503662, "Pretrain/Loss (Raw)": 2.0155441761016846, "Pretrain/Step": 4146, "Pretrain/Step Time": 8.75358566828072} +{"Pretrain/Learning Rate": 3.1417840369350735e-05, "Pretrain/Loss": 1.991835355758667, "Pretrain/Loss (Raw)": 2.091130495071411, "Pretrain/Step": 4147, "Pretrain/Step Time": 8.752706915140152} +{"Pretrain/Learning Rate": 3.140963464304043e-05, "Pretrain/Loss": 1.9916834831237793, "Pretrain/Loss (Raw)": 2.0397796630859375, "Pretrain/Step": 4148, "Pretrain/Step Time": 8.751933973282576} +{"Pretrain/Learning Rate": 3.140142817754086e-05, "Pretrain/Loss": 1.988950490951538, "Pretrain/Loss (Raw)": 1.8888550996780396, "Pretrain/Step": 4149, "Pretrain/Step Time": 8.754452859982848} +{"Pretrain/Learning Rate": 3.1393220973798425e-05, "Pretrain/Loss": 1.9912766218185425, "Pretrain/Loss (Raw)": 2.1409733295440674, "Pretrain/Step": 4150, "Pretrain/Step Time": 8.750702017918229} +{"Pretrain/Learning Rate": 3.1385013032759623e-05, "Pretrain/Loss": 1.9919450283050537, "Pretrain/Loss (Raw)": 2.0116093158721924, "Pretrain/Step": 4151, "Pretrain/Step Time": 8.745832500979304} +{"Pretrain/Learning Rate": 3.137680435537104e-05, "Pretrain/Loss": 1.9903130531311035, "Pretrain/Loss (Raw)": 1.9719138145446777, "Pretrain/Step": 4152, "Pretrain/Step Time": 8.757641876116395} +{"Pretrain/Learning Rate": 3.136859494257931e-05, "Pretrain/Loss": 1.9901676177978516, "Pretrain/Loss (Raw)": 2.1428284645080566, "Pretrain/Step": 4153, "Pretrain/Step Time": 8.75386331230402} +{"Pretrain/Learning Rate": 3.136038479533122e-05, "Pretrain/Loss": 1.9911236763000488, "Pretrain/Loss (Raw)": 2.121445894241333, "Pretrain/Step": 4154, "Pretrain/Step Time": 8.758505804464221} +{"Pretrain/Learning Rate": 3.135217391457358e-05, "Pretrain/Loss": 1.9899370670318604, "Pretrain/Loss (Raw)": 1.929391622543335, "Pretrain/Step": 4155, "Pretrain/Step Time": 8.75339050963521} +{"Pretrain/Learning Rate": 3.1343962301253305e-05, "Pretrain/Loss": 1.9916692972183228, "Pretrain/Loss (Raw)": 2.0181195735931396, "Pretrain/Step": 4156, "Pretrain/Step Time": 8.756921019405127} +{"Pretrain/Learning Rate": 3.133574995631741e-05, "Pretrain/Loss": 1.9909685850143433, "Pretrain/Loss (Raw)": 2.019418478012085, "Pretrain/Step": 4157, "Pretrain/Step Time": 8.75585389137268} +{"Pretrain/Learning Rate": 3.132753688071297e-05, "Pretrain/Loss": 1.9877073764801025, "Pretrain/Loss (Raw)": 1.8557020425796509, "Pretrain/Step": 4158, "Pretrain/Step Time": 8.752477115020156} +{"Pretrain/Learning Rate": 3.1319323075387165e-05, "Pretrain/Loss": 1.9904334545135498, "Pretrain/Loss (Raw)": 2.328137159347534, "Pretrain/Step": 4159, "Pretrain/Step Time": 8.751835852861404} +{"Pretrain/Learning Rate": 3.131110854128724e-05, "Pretrain/Loss": 1.988084316253662, "Pretrain/Loss (Raw)": 1.8399521112442017, "Pretrain/Step": 4160, "Pretrain/Step Time": 8.748547721654177} +{"Pretrain/Learning Rate": 3.130289327936055e-05, "Pretrain/Loss": 1.9893929958343506, "Pretrain/Loss (Raw)": 2.1249632835388184, "Pretrain/Step": 4161, "Pretrain/Step Time": 8.750294202938676} +{"Pretrain/Learning Rate": 3.1294677290554494e-05, "Pretrain/Loss": 1.989102840423584, "Pretrain/Loss (Raw)": 2.1191110610961914, "Pretrain/Step": 4162, "Pretrain/Step Time": 8.753060506656766} +{"Pretrain/Learning Rate": 3.128646057581659e-05, "Pretrain/Loss": 1.992213249206543, "Pretrain/Loss (Raw)": 2.2502329349517822, "Pretrain/Step": 4163, "Pretrain/Step Time": 8.749646607786417} +{"Pretrain/Learning Rate": 3.1278243136094436e-05, "Pretrain/Loss": 1.994080662727356, "Pretrain/Loss (Raw)": 2.1245391368865967, "Pretrain/Step": 4164, "Pretrain/Step Time": 8.74762536585331} +{"Pretrain/Learning Rate": 3.1270024972335706e-05, "Pretrain/Loss": 1.9954311847686768, "Pretrain/Loss (Raw)": 1.9574143886566162, "Pretrain/Step": 4165, "Pretrain/Step Time": 8.744868950918317} +{"Pretrain/Learning Rate": 3.1261806085488144e-05, "Pretrain/Loss": 1.993518590927124, "Pretrain/Loss (Raw)": 1.804173469543457, "Pretrain/Step": 4166, "Pretrain/Step Time": 8.746927985921502} +{"Pretrain/Learning Rate": 3.1253586476499594e-05, "Pretrain/Loss": 1.991797924041748, "Pretrain/Loss (Raw)": 1.8215817213058472, "Pretrain/Step": 4167, "Pretrain/Step Time": 8.747046932578087} +{"Pretrain/Learning Rate": 3.124536614631799e-05, "Pretrain/Loss": 1.990795373916626, "Pretrain/Loss (Raw)": 1.8157975673675537, "Pretrain/Step": 4168, "Pretrain/Step Time": 8.743443932384253} +{"Pretrain/Learning Rate": 3.123714509589133e-05, "Pretrain/Loss": 1.9916484355926514, "Pretrain/Loss (Raw)": 2.116602659225464, "Pretrain/Step": 4169, "Pretrain/Step Time": 8.738011375069618} +{"Pretrain/Learning Rate": 3.122892332616771e-05, "Pretrain/Loss": 1.9914528131484985, "Pretrain/Loss (Raw)": 1.8748830556869507, "Pretrain/Step": 4170, "Pretrain/Step Time": 8.734225308522582} +{"Pretrain/Learning Rate": 3.12207008380953e-05, "Pretrain/Loss": 1.9893862009048462, "Pretrain/Loss (Raw)": 1.9496139287948608, "Pretrain/Step": 4171, "Pretrain/Step Time": 8.734385058283806} +{"Pretrain/Learning Rate": 3.121247763262235e-05, "Pretrain/Loss": 1.9898895025253296, "Pretrain/Loss (Raw)": 2.019768238067627, "Pretrain/Step": 4172, "Pretrain/Step Time": 8.727376705035567} +{"Pretrain/Learning Rate": 3.120425371069721e-05, "Pretrain/Loss": 1.9876619577407837, "Pretrain/Loss (Raw)": 1.8227975368499756, "Pretrain/Step": 4173, "Pretrain/Step Time": 8.732605870813131} +{"Pretrain/Learning Rate": 3.119602907326829e-05, "Pretrain/Loss": 1.9861689805984497, "Pretrain/Loss (Raw)": 1.8062427043914795, "Pretrain/Step": 4174, "Pretrain/Step Time": 8.728833999484777} +{"Pretrain/Learning Rate": 3.118780372128411e-05, "Pretrain/Loss": 1.9875688552856445, "Pretrain/Loss (Raw)": 1.8897053003311157, "Pretrain/Step": 4175, "Pretrain/Step Time": 8.728096008300781} +{"Pretrain/Learning Rate": 3.1179577655693245e-05, "Pretrain/Loss": 1.9883109331130981, "Pretrain/Loss (Raw)": 1.9747260808944702, "Pretrain/Step": 4176, "Pretrain/Step Time": 8.717620881274343} +{"Pretrain/Learning Rate": 3.1171350877444365e-05, "Pretrain/Loss": 1.987904667854309, "Pretrain/Loss (Raw)": 1.964391827583313, "Pretrain/Step": 4177, "Pretrain/Step Time": 8.717938320711255} +{"Pretrain/Learning Rate": 3.116312338748623e-05, "Pretrain/Loss": 1.9862697124481201, "Pretrain/Loss (Raw)": 1.7938987016677856, "Pretrain/Step": 4178, "Pretrain/Step Time": 8.712220100685954} +{"Pretrain/Learning Rate": 3.115489518676765e-05, "Pretrain/Loss": 1.987600326538086, "Pretrain/Loss (Raw)": 2.0222928524017334, "Pretrain/Step": 4179, "Pretrain/Step Time": 8.710405407473445} +{"Pretrain/Learning Rate": 3.1146666276237554e-05, "Pretrain/Loss": 1.9850728511810303, "Pretrain/Loss (Raw)": 1.7729023694992065, "Pretrain/Step": 4180, "Pretrain/Step Time": 8.706057148054242} +{"Pretrain/Learning Rate": 3.113843665684495e-05, "Pretrain/Loss": 1.9867093563079834, "Pretrain/Loss (Raw)": 2.2050628662109375, "Pretrain/Step": 4181, "Pretrain/Step Time": 8.703155180439353} +{"Pretrain/Learning Rate": 3.1130206329538905e-05, "Pretrain/Loss": 1.9869507551193237, "Pretrain/Loss (Raw)": 2.0348236560821533, "Pretrain/Step": 4182, "Pretrain/Step Time": 8.703731516376138} +{"Pretrain/Learning Rate": 3.112197529526857e-05, "Pretrain/Loss": 1.9857076406478882, "Pretrain/Loss (Raw)": 1.9030487537384033, "Pretrain/Step": 4183, "Pretrain/Step Time": 8.708608217537403} +{"Pretrain/Learning Rate": 3.11137435549832e-05, "Pretrain/Loss": 1.984346866607666, "Pretrain/Loss (Raw)": 2.022996187210083, "Pretrain/Step": 4184, "Pretrain/Step Time": 8.703949075192213} +{"Pretrain/Learning Rate": 3.110551110963212e-05, "Pretrain/Loss": 1.9840465784072876, "Pretrain/Loss (Raw)": 2.151451826095581, "Pretrain/Step": 4185, "Pretrain/Step Time": 8.695852851495147} +{"Pretrain/Learning Rate": 3.109727796016472e-05, "Pretrain/Loss": 1.9825828075408936, "Pretrain/Loss (Raw)": 1.8530129194259644, "Pretrain/Step": 4186, "Pretrain/Step Time": 8.695194702595472} +{"Pretrain/Learning Rate": 3.10890441075305e-05, "Pretrain/Loss": 1.9813202619552612, "Pretrain/Loss (Raw)": 1.8321938514709473, "Pretrain/Step": 4187, "Pretrain/Step Time": 8.705552840605378} +{"Pretrain/Learning Rate": 3.108080955267902e-05, "Pretrain/Loss": 1.9813597202301025, "Pretrain/Loss (Raw)": 1.9280766248703003, "Pretrain/Step": 4188, "Pretrain/Step Time": 8.70396506972611} +{"Pretrain/Learning Rate": 3.107257429655993e-05, "Pretrain/Loss": 1.9816758632659912, "Pretrain/Loss (Raw)": 2.0684380531311035, "Pretrain/Step": 4189, "Pretrain/Step Time": 8.706071170046926} +{"Pretrain/Learning Rate": 3.1064338340122953e-05, "Pretrain/Loss": 1.984250545501709, "Pretrain/Loss (Raw)": 2.0204238891601562, "Pretrain/Step": 4190, "Pretrain/Step Time": 8.708878573030233} +{"Pretrain/Learning Rate": 3.105610168431791e-05, "Pretrain/Loss": 1.9825191497802734, "Pretrain/Loss (Raw)": 2.07190203666687, "Pretrain/Step": 4191, "Pretrain/Step Time": 8.702343184500933} +{"Pretrain/Learning Rate": 3.1047864330094675e-05, "Pretrain/Loss": 1.9827945232391357, "Pretrain/Loss (Raw)": 2.1042890548706055, "Pretrain/Step": 4192, "Pretrain/Step Time": 8.706490140408278} +{"Pretrain/Learning Rate": 3.1039626278403234e-05, "Pretrain/Loss": 1.9839768409729004, "Pretrain/Loss (Raw)": 1.993627667427063, "Pretrain/Step": 4193, "Pretrain/Step Time": 8.700690126046538} +{"Pretrain/Learning Rate": 3.1031387530193626e-05, "Pretrain/Loss": 1.9854432344436646, "Pretrain/Loss (Raw)": 2.2027511596679688, "Pretrain/Step": 4194, "Pretrain/Step Time": 8.702374631538987} +{"Pretrain/Learning Rate": 3.1023148086415984e-05, "Pretrain/Loss": 1.9839712381362915, "Pretrain/Loss (Raw)": 1.985154151916504, "Pretrain/Step": 4195, "Pretrain/Step Time": 8.692895824089646} +{"Pretrain/Learning Rate": 3.101490794802053e-05, "Pretrain/Loss": 1.9843121767044067, "Pretrain/Loss (Raw)": 2.037477731704712, "Pretrain/Step": 4196, "Pretrain/Step Time": 8.691247586160898} +{"Pretrain/Learning Rate": 3.100666711595754e-05, "Pretrain/Loss": 1.9849021434783936, "Pretrain/Loss (Raw)": 2.221048593521118, "Pretrain/Step": 4197, "Pretrain/Step Time": 8.691634483635426} +{"Pretrain/Learning Rate": 3.09984255911774e-05, "Pretrain/Loss": 1.9797264337539673, "Pretrain/Loss (Raw)": 1.3753646612167358, "Pretrain/Step": 4198, "Pretrain/Step Time": 8.694295780733228} +{"Pretrain/Learning Rate": 3.099018337463056e-05, "Pretrain/Loss": 1.97661554813385, "Pretrain/Loss (Raw)": 1.494951605796814, "Pretrain/Step": 4199, "Pretrain/Step Time": 8.688814772292972} +{"Pretrain/Learning Rate": 3.0981940467267547e-05, "Pretrain/Loss": 1.9750850200653076, "Pretrain/Loss (Raw)": 1.8930186033248901, "Pretrain/Step": 4200, "Pretrain/Step Time": 8.687638910487294} +{"Pretrain/Learning Rate": 3.097369687003896e-05, "Pretrain/Loss": 1.9710025787353516, "Pretrain/Loss (Raw)": 1.5720405578613281, "Pretrain/Step": 4201, "Pretrain/Step Time": 8.686172936111689} +{"Pretrain/Learning Rate": 3.096545258389551e-05, "Pretrain/Loss": 1.9703848361968994, "Pretrain/Loss (Raw)": 2.0069940090179443, "Pretrain/Step": 4202, "Pretrain/Step Time": 8.687651405110955} +{"Pretrain/Learning Rate": 3.0957207609787945e-05, "Pretrain/Loss": 1.970110297203064, "Pretrain/Loss (Raw)": 1.9934779405593872, "Pretrain/Step": 4203, "Pretrain/Step Time": 8.68416159413755} +{"Pretrain/Learning Rate": 3.094896194866714e-05, "Pretrain/Loss": 1.968818187713623, "Pretrain/Loss (Raw)": 1.8319551944732666, "Pretrain/Step": 4204, "Pretrain/Step Time": 8.682486975565553} +{"Pretrain/Learning Rate": 3.094071560148401e-05, "Pretrain/Loss": 1.971944808959961, "Pretrain/Loss (Raw)": 2.1844470500946045, "Pretrain/Step": 4205, "Pretrain/Step Time": 8.680461319163442} +{"Pretrain/Learning Rate": 3.093246856918956e-05, "Pretrain/Loss": 1.9716260433197021, "Pretrain/Loss (Raw)": 2.01031494140625, "Pretrain/Step": 4206, "Pretrain/Step Time": 8.686441672965884} +{"Pretrain/Learning Rate": 3.092422085273488e-05, "Pretrain/Loss": 1.9744592905044556, "Pretrain/Loss (Raw)": 2.0937654972076416, "Pretrain/Step": 4207, "Pretrain/Step Time": 8.681278221309185} +{"Pretrain/Learning Rate": 3.091597245307114e-05, "Pretrain/Loss": 1.9729790687561035, "Pretrain/Loss (Raw)": 1.7551531791687012, "Pretrain/Step": 4208, "Pretrain/Step Time": 8.689264660701156} +{"Pretrain/Learning Rate": 3.0907723371149575e-05, "Pretrain/Loss": 1.9736685752868652, "Pretrain/Loss (Raw)": 2.0186028480529785, "Pretrain/Step": 4209, "Pretrain/Step Time": 8.686618436127901} +{"Pretrain/Learning Rate": 3.0899473607921513e-05, "Pretrain/Loss": 1.9727938175201416, "Pretrain/Loss (Raw)": 2.0898358821868896, "Pretrain/Step": 4210, "Pretrain/Step Time": 8.689964301884174} +{"Pretrain/Learning Rate": 3.0891223164338354e-05, "Pretrain/Loss": 1.9698491096496582, "Pretrain/Loss (Raw)": 1.9321343898773193, "Pretrain/Step": 4211, "Pretrain/Step Time": 8.68883772753179} +{"Pretrain/Learning Rate": 3.0882972041351585e-05, "Pretrain/Loss": 1.9707648754119873, "Pretrain/Loss (Raw)": 2.030233383178711, "Pretrain/Step": 4212, "Pretrain/Step Time": 8.688337536528707} +{"Pretrain/Learning Rate": 3.0874720239912744e-05, "Pretrain/Loss": 1.9715055227279663, "Pretrain/Loss (Raw)": 2.0222690105438232, "Pretrain/Step": 4213, "Pretrain/Step Time": 8.694344852119684} +{"Pretrain/Learning Rate": 3.0866467760973495e-05, "Pretrain/Loss": 1.9729194641113281, "Pretrain/Loss (Raw)": 2.138181686401367, "Pretrain/Step": 4214, "Pretrain/Step Time": 8.687324034050107} +{"Pretrain/Learning Rate": 3.0858214605485545e-05, "Pretrain/Loss": 1.977391242980957, "Pretrain/Loss (Raw)": 2.033829689025879, "Pretrain/Step": 4215, "Pretrain/Step Time": 8.685720203444362} +{"Pretrain/Learning Rate": 3.0849960774400667e-05, "Pretrain/Loss": 1.9776735305786133, "Pretrain/Loss (Raw)": 1.765785574913025, "Pretrain/Step": 4216, "Pretrain/Step Time": 8.680082304403186} +{"Pretrain/Learning Rate": 3.0841706268670756e-05, "Pretrain/Loss": 1.9766602516174316, "Pretrain/Loss (Raw)": 1.9673455953598022, "Pretrain/Step": 4217, "Pretrain/Step Time": 8.681991782039404} +{"Pretrain/Learning Rate": 3.083345108924775e-05, "Pretrain/Loss": 1.9746971130371094, "Pretrain/Loss (Raw)": 1.6998529434204102, "Pretrain/Step": 4218, "Pretrain/Step Time": 8.685911798849702} +{"Pretrain/Learning Rate": 3.082519523708368e-05, "Pretrain/Loss": 1.9726872444152832, "Pretrain/Loss (Raw)": 1.6134086847305298, "Pretrain/Step": 4219, "Pretrain/Step Time": 8.68732693977654} +{"Pretrain/Learning Rate": 3.081693871313064e-05, "Pretrain/Loss": 1.9734203815460205, "Pretrain/Loss (Raw)": 2.122934341430664, "Pretrain/Step": 4220, "Pretrain/Step Time": 8.68954604677856} +{"Pretrain/Learning Rate": 3.080868151834082e-05, "Pretrain/Loss": 1.9719892740249634, "Pretrain/Loss (Raw)": 1.791372299194336, "Pretrain/Step": 4221, "Pretrain/Step Time": 8.690596939995885} +{"Pretrain/Learning Rate": 3.080042365366648e-05, "Pretrain/Loss": 1.965857744216919, "Pretrain/Loss (Raw)": 1.425923228263855, "Pretrain/Step": 4222, "Pretrain/Step Time": 8.686096299439669} +{"Pretrain/Learning Rate": 3.079216512005994e-05, "Pretrain/Loss": 1.9651455879211426, "Pretrain/Loss (Raw)": 1.7291388511657715, "Pretrain/Step": 4223, "Pretrain/Step Time": 8.688236437737942} +{"Pretrain/Learning Rate": 3.078390591847363e-05, "Pretrain/Loss": 1.9687693119049072, "Pretrain/Loss (Raw)": 2.1285862922668457, "Pretrain/Step": 4224, "Pretrain/Step Time": 8.68488342128694} +{"Pretrain/Learning Rate": 3.077564604986004e-05, "Pretrain/Loss": 1.9687132835388184, "Pretrain/Loss (Raw)": 1.9514167308807373, "Pretrain/Step": 4225, "Pretrain/Step Time": 8.695671563968062} +{"Pretrain/Learning Rate": 3.076738551517173e-05, "Pretrain/Loss": 1.9686779975891113, "Pretrain/Loss (Raw)": 2.029404640197754, "Pretrain/Step": 4226, "Pretrain/Step Time": 8.695922149345279} +{"Pretrain/Learning Rate": 3.0759124315361344e-05, "Pretrain/Loss": 1.967965841293335, "Pretrain/Loss (Raw)": 1.9718167781829834, "Pretrain/Step": 4227, "Pretrain/Step Time": 8.69428457133472} +{"Pretrain/Learning Rate": 3.07508624513816e-05, "Pretrain/Loss": 1.9673869609832764, "Pretrain/Loss (Raw)": 2.065521240234375, "Pretrain/Step": 4228, "Pretrain/Step Time": 8.691988091915846} +{"Pretrain/Learning Rate": 3.0742599924185306e-05, "Pretrain/Loss": 1.9644421339035034, "Pretrain/Loss (Raw)": 1.8553380966186523, "Pretrain/Step": 4229, "Pretrain/Step Time": 8.698867933824658} +{"Pretrain/Learning Rate": 3.073433673472533e-05, "Pretrain/Loss": 1.9650115966796875, "Pretrain/Loss (Raw)": 1.985540509223938, "Pretrain/Step": 4230, "Pretrain/Step Time": 8.694462882354856} +{"Pretrain/Learning Rate": 3.072607288395461e-05, "Pretrain/Loss": 1.961625576019287, "Pretrain/Loss (Raw)": 1.7768089771270752, "Pretrain/Step": 4231, "Pretrain/Step Time": 8.698216699063778} +{"Pretrain/Learning Rate": 3.071780837282619e-05, "Pretrain/Loss": 1.9625492095947266, "Pretrain/Loss (Raw)": 1.7582074403762817, "Pretrain/Step": 4232, "Pretrain/Step Time": 8.699106207117438} +{"Pretrain/Learning Rate": 3.0709543202293164e-05, "Pretrain/Loss": 1.963354468345642, "Pretrain/Loss (Raw)": 2.194371461868286, "Pretrain/Step": 4233, "Pretrain/Step Time": 8.696292590349913} +{"Pretrain/Learning Rate": 3.070127737330871e-05, "Pretrain/Loss": 1.964927077293396, "Pretrain/Loss (Raw)": 2.224339246749878, "Pretrain/Step": 4234, "Pretrain/Step Time": 8.691492971032858} +{"Pretrain/Learning Rate": 3.069301088682609e-05, "Pretrain/Loss": 1.9674320220947266, "Pretrain/Loss (Raw)": 1.7841633558273315, "Pretrain/Step": 4235, "Pretrain/Step Time": 8.69646561704576} +{"Pretrain/Learning Rate": 3.068474374379863e-05, "Pretrain/Loss": 1.965010166168213, "Pretrain/Loss (Raw)": 1.8677723407745361, "Pretrain/Step": 4236, "Pretrain/Step Time": 8.69972083158791} +{"Pretrain/Learning Rate": 3.067647594517972e-05, "Pretrain/Loss": 1.9651988744735718, "Pretrain/Loss (Raw)": 2.093675136566162, "Pretrain/Step": 4237, "Pretrain/Step Time": 8.698229102417827} +{"Pretrain/Learning Rate": 3.0668207491922866e-05, "Pretrain/Loss": 1.9637359380722046, "Pretrain/Loss (Raw)": 1.8858262300491333, "Pretrain/Step": 4238, "Pretrain/Step Time": 8.715412318706512} +{"Pretrain/Learning Rate": 3.0659938384981616e-05, "Pretrain/Loss": 1.9683642387390137, "Pretrain/Loss (Raw)": 2.1988933086395264, "Pretrain/Step": 4239, "Pretrain/Step Time": 8.713444055989385} +{"Pretrain/Learning Rate": 3.0651668625309594e-05, "Pretrain/Loss": 1.970192551612854, "Pretrain/Loss (Raw)": 2.1679790019989014, "Pretrain/Step": 4240, "Pretrain/Step Time": 8.71187991462648} +{"Pretrain/Learning Rate": 3.0643398213860525e-05, "Pretrain/Loss": 1.9691216945648193, "Pretrain/Loss (Raw)": 2.086249589920044, "Pretrain/Step": 4241, "Pretrain/Step Time": 8.71731498464942} +{"Pretrain/Learning Rate": 3.0635127151588175e-05, "Pretrain/Loss": 1.9689182043075562, "Pretrain/Loss (Raw)": 1.9708796739578247, "Pretrain/Step": 4242, "Pretrain/Step Time": 8.719033053144813} +{"Pretrain/Learning Rate": 3.0626855439446405e-05, "Pretrain/Loss": 1.9694714546203613, "Pretrain/Loss (Raw)": 2.001214027404785, "Pretrain/Step": 4243, "Pretrain/Step Time": 8.716896196827292} +{"Pretrain/Learning Rate": 3.061858307838915e-05, "Pretrain/Loss": 1.9657304286956787, "Pretrain/Loss (Raw)": 1.5281199216842651, "Pretrain/Step": 4244, "Pretrain/Step Time": 8.7207405064255} +{"Pretrain/Learning Rate": 3.061031006937043e-05, "Pretrain/Loss": 1.9645172357559204, "Pretrain/Loss (Raw)": 1.7460111379623413, "Pretrain/Step": 4245, "Pretrain/Step Time": 8.724789820611477} +{"Pretrain/Learning Rate": 3.060203641334431e-05, "Pretrain/Loss": 1.9685198068618774, "Pretrain/Loss (Raw)": 2.170377016067505, "Pretrain/Step": 4246, "Pretrain/Step Time": 8.722035070881248} +{"Pretrain/Learning Rate": 3.059376211126495e-05, "Pretrain/Loss": 1.9679591655731201, "Pretrain/Loss (Raw)": 2.0553317070007324, "Pretrain/Step": 4247, "Pretrain/Step Time": 8.721892891451716} +{"Pretrain/Learning Rate": 3.058548716408658e-05, "Pretrain/Loss": 1.969340443611145, "Pretrain/Loss (Raw)": 2.2349390983581543, "Pretrain/Step": 4248, "Pretrain/Step Time": 8.720159333199263} +{"Pretrain/Learning Rate": 3.057721157276352e-05, "Pretrain/Loss": 1.969772458076477, "Pretrain/Loss (Raw)": 2.0234453678131104, "Pretrain/Step": 4249, "Pretrain/Step Time": 8.720970299094915} +{"Pretrain/Learning Rate": 3.056893533825014e-05, "Pretrain/Loss": 1.9720101356506348, "Pretrain/Loss (Raw)": 2.150291681289673, "Pretrain/Step": 4250, "Pretrain/Step Time": 8.72414026223123} +{"Pretrain/Learning Rate": 3.056065846150089e-05, "Pretrain/Loss": 1.9715923070907593, "Pretrain/Loss (Raw)": 1.977903127670288, "Pretrain/Step": 4251, "Pretrain/Step Time": 8.72622918151319} +{"Pretrain/Learning Rate": 3.0552380943470306e-05, "Pretrain/Loss": 1.9696882963180542, "Pretrain/Loss (Raw)": 1.9136242866516113, "Pretrain/Step": 4252, "Pretrain/Step Time": 8.724330488592386} +{"Pretrain/Learning Rate": 3.054410278511299e-05, "Pretrain/Loss": 1.9701238870620728, "Pretrain/Loss (Raw)": 2.1706154346466064, "Pretrain/Step": 4253, "Pretrain/Step Time": 8.730798127129674} +{"Pretrain/Learning Rate": 3.053582398738362e-05, "Pretrain/Loss": 1.9690961837768555, "Pretrain/Loss (Raw)": 2.015491008758545, "Pretrain/Step": 4254, "Pretrain/Step Time": 8.728688728064299} +{"Pretrain/Learning Rate": 3.052754455123693e-05, "Pretrain/Loss": 1.967925786972046, "Pretrain/Loss (Raw)": 1.840588092803955, "Pretrain/Step": 4255, "Pretrain/Step Time": 8.725003127008677} +{"Pretrain/Learning Rate": 3.051926447762776e-05, "Pretrain/Loss": 1.9652860164642334, "Pretrain/Loss (Raw)": 1.8417259454727173, "Pretrain/Step": 4256, "Pretrain/Step Time": 8.726474691182375} +{"Pretrain/Learning Rate": 3.0510983767511007e-05, "Pretrain/Loss": 1.965616226196289, "Pretrain/Loss (Raw)": 2.103797674179077, "Pretrain/Step": 4257, "Pretrain/Step Time": 8.723965061828494} +{"Pretrain/Learning Rate": 3.050270242184164e-05, "Pretrain/Loss": 1.9658784866333008, "Pretrain/Loss (Raw)": 1.9599523544311523, "Pretrain/Step": 4258, "Pretrain/Step Time": 8.726722806692123} +{"Pretrain/Learning Rate": 3.049442044157469e-05, "Pretrain/Loss": 1.9663853645324707, "Pretrain/Loss (Raw)": 1.8886786699295044, "Pretrain/Step": 4259, "Pretrain/Step Time": 8.729575723409653} +{"Pretrain/Learning Rate": 3.0486137827665296e-05, "Pretrain/Loss": 1.9657422304153442, "Pretrain/Loss (Raw)": 2.065314292907715, "Pretrain/Step": 4260, "Pretrain/Step Time": 8.725777519866824} +{"Pretrain/Learning Rate": 3.0477854581068626e-05, "Pretrain/Loss": 1.9701145887374878, "Pretrain/Loss (Raw)": 2.083439588546753, "Pretrain/Step": 4261, "Pretrain/Step Time": 8.729340525344014} +{"Pretrain/Learning Rate": 3.0469570702739958e-05, "Pretrain/Loss": 1.9701255559921265, "Pretrain/Loss (Raw)": 2.043165683746338, "Pretrain/Step": 4262, "Pretrain/Step Time": 8.72696227952838} +{"Pretrain/Learning Rate": 3.0461286193634626e-05, "Pretrain/Loss": 1.973388671875, "Pretrain/Loss (Raw)": 2.440596342086792, "Pretrain/Step": 4263, "Pretrain/Step Time": 8.731527633965015} +{"Pretrain/Learning Rate": 3.045300105470803e-05, "Pretrain/Loss": 1.9745012521743774, "Pretrain/Loss (Raw)": 2.1273193359375, "Pretrain/Step": 4264, "Pretrain/Step Time": 8.734467962756753} +{"Pretrain/Learning Rate": 3.0444715286915658e-05, "Pretrain/Loss": 1.974801778793335, "Pretrain/Loss (Raw)": 1.9513095617294312, "Pretrain/Step": 4265, "Pretrain/Step Time": 8.732994886115193} +{"Pretrain/Learning Rate": 3.0436428891213063e-05, "Pretrain/Loss": 1.9773122072219849, "Pretrain/Loss (Raw)": 2.0246660709381104, "Pretrain/Step": 4266, "Pretrain/Step Time": 8.734951812773943} +{"Pretrain/Learning Rate": 3.0428141868555875e-05, "Pretrain/Loss": 1.9798054695129395, "Pretrain/Loss (Raw)": 2.2796549797058105, "Pretrain/Step": 4267, "Pretrain/Step Time": 8.73773736692965} +{"Pretrain/Learning Rate": 3.0419854219899786e-05, "Pretrain/Loss": 1.9789890050888062, "Pretrain/Loss (Raw)": 1.9782754182815552, "Pretrain/Step": 4268, "Pretrain/Step Time": 8.738990511745214} +{"Pretrain/Learning Rate": 3.041156594620057e-05, "Pretrain/Loss": 1.9799494743347168, "Pretrain/Loss (Raw)": 2.006218910217285, "Pretrain/Step": 4269, "Pretrain/Step Time": 8.736025288701057} +{"Pretrain/Learning Rate": 3.0403277048414063e-05, "Pretrain/Loss": 1.9788811206817627, "Pretrain/Loss (Raw)": 1.949637532234192, "Pretrain/Step": 4270, "Pretrain/Step Time": 8.737858820706606} +{"Pretrain/Learning Rate": 3.0394987527496192e-05, "Pretrain/Loss": 1.9776568412780762, "Pretrain/Loss (Raw)": 1.7871365547180176, "Pretrain/Step": 4271, "Pretrain/Step Time": 8.737888261675835} +{"Pretrain/Learning Rate": 3.0386697384402935e-05, "Pretrain/Loss": 1.9772777557373047, "Pretrain/Loss (Raw)": 2.0082478523254395, "Pretrain/Step": 4272, "Pretrain/Step Time": 8.740876790136099} +{"Pretrain/Learning Rate": 3.0378406620090354e-05, "Pretrain/Loss": 1.9778989553451538, "Pretrain/Loss (Raw)": 2.1386349201202393, "Pretrain/Step": 4273, "Pretrain/Step Time": 8.740224933251739} +{"Pretrain/Learning Rate": 3.0370115235514574e-05, "Pretrain/Loss": 1.9782063961029053, "Pretrain/Loss (Raw)": 2.054896354675293, "Pretrain/Step": 4274, "Pretrain/Step Time": 8.745721891522408} +{"Pretrain/Learning Rate": 3.036182323163181e-05, "Pretrain/Loss": 1.977731704711914, "Pretrain/Loss (Raw)": 2.030367851257324, "Pretrain/Step": 4275, "Pretrain/Step Time": 8.74605580046773} +{"Pretrain/Learning Rate": 3.0353530609398313e-05, "Pretrain/Loss": 1.978215217590332, "Pretrain/Loss (Raw)": 2.1016721725463867, "Pretrain/Step": 4276, "Pretrain/Step Time": 8.744342543184757} +{"Pretrain/Learning Rate": 3.0345237369770448e-05, "Pretrain/Loss": 1.9768348932266235, "Pretrain/Loss (Raw)": 1.7121763229370117, "Pretrain/Step": 4277, "Pretrain/Step Time": 8.744910255074501} +{"Pretrain/Learning Rate": 3.0336943513704613e-05, "Pretrain/Loss": 1.976145625114441, "Pretrain/Loss (Raw)": 2.052745819091797, "Pretrain/Step": 4278, "Pretrain/Step Time": 8.744230659678578} +{"Pretrain/Learning Rate": 3.0328649042157315e-05, "Pretrain/Loss": 1.9763567447662354, "Pretrain/Loss (Raw)": 2.0386435985565186, "Pretrain/Step": 4279, "Pretrain/Step Time": 8.745591094717383} +{"Pretrain/Learning Rate": 3.0320353956085095e-05, "Pretrain/Loss": 1.9759933948516846, "Pretrain/Loss (Raw)": 1.925394892692566, "Pretrain/Step": 4280, "Pretrain/Step Time": 8.734143486246467} +{"Pretrain/Learning Rate": 3.0312058256444587e-05, "Pretrain/Loss": 1.9770562648773193, "Pretrain/Loss (Raw)": 2.278878688812256, "Pretrain/Step": 4281, "Pretrain/Step Time": 8.738275561481714} +{"Pretrain/Learning Rate": 3.0303761944192488e-05, "Pretrain/Loss": 1.9754447937011719, "Pretrain/Loss (Raw)": 1.9151756763458252, "Pretrain/Step": 4282, "Pretrain/Step Time": 8.731414021924138} +{"Pretrain/Learning Rate": 3.0295465020285567e-05, "Pretrain/Loss": 1.9778637886047363, "Pretrain/Loss (Raw)": 2.239011764526367, "Pretrain/Step": 4283, "Pretrain/Step Time": 8.735442116856575} +{"Pretrain/Learning Rate": 3.0287167485680672e-05, "Pretrain/Loss": 1.9778708219528198, "Pretrain/Loss (Raw)": 2.0190274715423584, "Pretrain/Step": 4284, "Pretrain/Step Time": 8.732809757813811} +{"Pretrain/Learning Rate": 3.0278869341334702e-05, "Pretrain/Loss": 1.978924036026001, "Pretrain/Loss (Raw)": 2.154233455657959, "Pretrain/Step": 4285, "Pretrain/Step Time": 8.729711135849357} +{"Pretrain/Learning Rate": 3.0270570588204655e-05, "Pretrain/Loss": 1.9803292751312256, "Pretrain/Loss (Raw)": 2.0355701446533203, "Pretrain/Step": 4286, "Pretrain/Step Time": 8.731883438304067} +{"Pretrain/Learning Rate": 3.0262271227247563e-05, "Pretrain/Loss": 1.9781782627105713, "Pretrain/Loss (Raw)": 2.052809953689575, "Pretrain/Step": 4287, "Pretrain/Step Time": 8.735023185610771} +{"Pretrain/Learning Rate": 3.025397125942056e-05, "Pretrain/Loss": 1.9805374145507812, "Pretrain/Loss (Raw)": 2.1419243812561035, "Pretrain/Step": 4288, "Pretrain/Step Time": 8.743647929280996} +{"Pretrain/Learning Rate": 3.0245670685680833e-05, "Pretrain/Loss": 1.9784891605377197, "Pretrain/Loss (Raw)": 1.8627930879592896, "Pretrain/Step": 4289, "Pretrain/Step Time": 8.74306513555348} +{"Pretrain/Learning Rate": 3.0237369506985646e-05, "Pretrain/Loss": 1.9775373935699463, "Pretrain/Loss (Raw)": 1.9972740411758423, "Pretrain/Step": 4290, "Pretrain/Step Time": 8.74194510653615} +{"Pretrain/Learning Rate": 3.022906772429232e-05, "Pretrain/Loss": 1.9754371643066406, "Pretrain/Loss (Raw)": 1.981399655342102, "Pretrain/Step": 4291, "Pretrain/Step Time": 8.741606157273054} +{"Pretrain/Learning Rate": 3.0220765338558278e-05, "Pretrain/Loss": 1.9739981889724731, "Pretrain/Loss (Raw)": 1.9403553009033203, "Pretrain/Step": 4292, "Pretrain/Step Time": 8.738538043573499} +{"Pretrain/Learning Rate": 3.021246235074096e-05, "Pretrain/Loss": 1.9739388227462769, "Pretrain/Loss (Raw)": 1.9498252868652344, "Pretrain/Step": 4293, "Pretrain/Step Time": 8.74029098637402} +{"Pretrain/Learning Rate": 3.0204158761797936e-05, "Pretrain/Loss": 1.9752392768859863, "Pretrain/Loss (Raw)": 1.9706215858459473, "Pretrain/Step": 4294, "Pretrain/Step Time": 8.735851012170315} +{"Pretrain/Learning Rate": 3.0195854572686793e-05, "Pretrain/Loss": 1.975161075592041, "Pretrain/Loss (Raw)": 1.8115652799606323, "Pretrain/Step": 4295, "Pretrain/Step Time": 8.734295662492514} +{"Pretrain/Learning Rate": 3.0187549784365214e-05, "Pretrain/Loss": 1.9763028621673584, "Pretrain/Loss (Raw)": 1.9619446992874146, "Pretrain/Step": 4296, "Pretrain/Step Time": 8.736323855817318} +{"Pretrain/Learning Rate": 3.0179244397790956e-05, "Pretrain/Loss": 1.9757773876190186, "Pretrain/Loss (Raw)": 2.0493569374084473, "Pretrain/Step": 4297, "Pretrain/Step Time": 8.735679620876908} +{"Pretrain/Learning Rate": 3.017093841392183e-05, "Pretrain/Loss": 1.978184700012207, "Pretrain/Loss (Raw)": 2.18300724029541, "Pretrain/Step": 4298, "Pretrain/Step Time": 8.738439373672009} +{"Pretrain/Learning Rate": 3.0162631833715715e-05, "Pretrain/Loss": 1.9793727397918701, "Pretrain/Loss (Raw)": 2.1016862392425537, "Pretrain/Step": 4299, "Pretrain/Step Time": 8.739931674674153} +{"Pretrain/Learning Rate": 3.0154324658130572e-05, "Pretrain/Loss": 1.9795012474060059, "Pretrain/Loss (Raw)": 2.0362110137939453, "Pretrain/Step": 4300, "Pretrain/Step Time": 8.744811333715916} +{"Pretrain/Learning Rate": 3.0146016888124423e-05, "Pretrain/Loss": 1.982048749923706, "Pretrain/Loss (Raw)": 2.14888596534729, "Pretrain/Step": 4301, "Pretrain/Step Time": 8.739833476021886} +{"Pretrain/Learning Rate": 3.013770852465535e-05, "Pretrain/Loss": 1.9831935167312622, "Pretrain/Loss (Raw)": 1.952772855758667, "Pretrain/Step": 4302, "Pretrain/Step Time": 8.740933883935213} +{"Pretrain/Learning Rate": 3.0129399568681533e-05, "Pretrain/Loss": 1.9836684465408325, "Pretrain/Loss (Raw)": 1.9504948854446411, "Pretrain/Step": 4303, "Pretrain/Step Time": 8.740689855068922} +{"Pretrain/Learning Rate": 3.0121090021161175e-05, "Pretrain/Loss": 1.98496675491333, "Pretrain/Loss (Raw)": 2.1409077644348145, "Pretrain/Step": 4304, "Pretrain/Step Time": 8.73935710825026} +{"Pretrain/Learning Rate": 3.0112779883052593e-05, "Pretrain/Loss": 1.9846618175506592, "Pretrain/Loss (Raw)": 1.9253695011138916, "Pretrain/Step": 4305, "Pretrain/Step Time": 8.745325043797493} +{"Pretrain/Learning Rate": 3.010446915531414e-05, "Pretrain/Loss": 1.9847438335418701, "Pretrain/Loss (Raw)": 1.8043742179870605, "Pretrain/Step": 4306, "Pretrain/Step Time": 8.747952498495579} +{"Pretrain/Learning Rate": 3.0096157838904247e-05, "Pretrain/Loss": 1.98349928855896, "Pretrain/Loss (Raw)": 1.8630175590515137, "Pretrain/Step": 4307, "Pretrain/Step Time": 8.745756326243281} +{"Pretrain/Learning Rate": 3.0087845934781424e-05, "Pretrain/Loss": 1.9845564365386963, "Pretrain/Loss (Raw)": 1.9082093238830566, "Pretrain/Step": 4308, "Pretrain/Step Time": 8.74558917246759} +{"Pretrain/Learning Rate": 3.0079533443904227e-05, "Pretrain/Loss": 1.9814130067825317, "Pretrain/Loss (Raw)": 1.80270254611969, "Pretrain/Step": 4309, "Pretrain/Step Time": 8.745063230395317} +{"Pretrain/Learning Rate": 3.0071220367231306e-05, "Pretrain/Loss": 1.9807138442993164, "Pretrain/Loss (Raw)": 1.9453257322311401, "Pretrain/Step": 4310, "Pretrain/Step Time": 8.74635011330247} +{"Pretrain/Learning Rate": 3.006290670572135e-05, "Pretrain/Loss": 1.9823328256607056, "Pretrain/Loss (Raw)": 2.110276937484741, "Pretrain/Step": 4311, "Pretrain/Step Time": 8.7432302813977} +{"Pretrain/Learning Rate": 3.0054592460333137e-05, "Pretrain/Loss": 1.9821593761444092, "Pretrain/Loss (Raw)": 2.0008034706115723, "Pretrain/Step": 4312, "Pretrain/Step Time": 8.74728457070887} +{"Pretrain/Learning Rate": 3.00462776320255e-05, "Pretrain/Loss": 1.9815479516983032, "Pretrain/Loss (Raw)": 2.0732011795043945, "Pretrain/Step": 4313, "Pretrain/Step Time": 8.747797396034002} +{"Pretrain/Learning Rate": 3.0037962221757354e-05, "Pretrain/Loss": 1.9820270538330078, "Pretrain/Loss (Raw)": 1.9143232107162476, "Pretrain/Step": 4314, "Pretrain/Step Time": 8.747899385169148} +{"Pretrain/Learning Rate": 3.0029646230487657e-05, "Pretrain/Loss": 1.9800688028335571, "Pretrain/Loss (Raw)": 1.5815370082855225, "Pretrain/Step": 4315, "Pretrain/Step Time": 8.737762043252587} +{"Pretrain/Learning Rate": 3.002132965917547e-05, "Pretrain/Loss": 1.9825900793075562, "Pretrain/Loss (Raw)": 2.250797748565674, "Pretrain/Step": 4316, "Pretrain/Step Time": 8.746738879010081} +{"Pretrain/Learning Rate": 3.001301250877987e-05, "Pretrain/Loss": 1.9823992252349854, "Pretrain/Loss (Raw)": 2.044013261795044, "Pretrain/Step": 4317, "Pretrain/Step Time": 8.7432023845613} +{"Pretrain/Learning Rate": 3.000469478026005e-05, "Pretrain/Loss": 1.9831016063690186, "Pretrain/Loss (Raw)": 2.1103265285491943, "Pretrain/Step": 4318, "Pretrain/Step Time": 8.742327865213156} +{"Pretrain/Learning Rate": 2.9996376474575244e-05, "Pretrain/Loss": 1.9821521043777466, "Pretrain/Loss (Raw)": 1.9503647089004517, "Pretrain/Step": 4319, "Pretrain/Step Time": 8.74626563116908} +{"Pretrain/Learning Rate": 2.9988057592684766e-05, "Pretrain/Loss": 1.9798798561096191, "Pretrain/Loss (Raw)": 1.8134485483169556, "Pretrain/Step": 4320, "Pretrain/Step Time": 8.74303357489407} +{"Pretrain/Learning Rate": 2.9979738135547973e-05, "Pretrain/Loss": 1.9800541400909424, "Pretrain/Loss (Raw)": 2.0159482955932617, "Pretrain/Step": 4321, "Pretrain/Step Time": 8.749640733003616} +{"Pretrain/Learning Rate": 2.9971418104124322e-05, "Pretrain/Loss": 1.9772018194198608, "Pretrain/Loss (Raw)": 1.837631106376648, "Pretrain/Step": 4322, "Pretrain/Step Time": 8.759987344965339} +{"Pretrain/Learning Rate": 2.9963097499373312e-05, "Pretrain/Loss": 1.9773844480514526, "Pretrain/Loss (Raw)": 2.0085370540618896, "Pretrain/Step": 4323, "Pretrain/Step Time": 8.753866072744131} +{"Pretrain/Learning Rate": 2.9954776322254495e-05, "Pretrain/Loss": 1.9757747650146484, "Pretrain/Loss (Raw)": 1.831433653831482, "Pretrain/Step": 4324, "Pretrain/Step Time": 8.75048273615539} +{"Pretrain/Learning Rate": 2.994645457372754e-05, "Pretrain/Loss": 1.972956657409668, "Pretrain/Loss (Raw)": 1.8603296279907227, "Pretrain/Step": 4325, "Pretrain/Step Time": 8.754927905276418} +{"Pretrain/Learning Rate": 2.9938132254752126e-05, "Pretrain/Loss": 1.979554533958435, "Pretrain/Loss (Raw)": 2.219895362854004, "Pretrain/Step": 4326, "Pretrain/Step Time": 8.748299518600106} +{"Pretrain/Learning Rate": 2.9929809366288035e-05, "Pretrain/Loss": 1.9809460639953613, "Pretrain/Loss (Raw)": 1.6730595827102661, "Pretrain/Step": 4327, "Pretrain/Step Time": 8.7500920612365} +{"Pretrain/Learning Rate": 2.99214859092951e-05, "Pretrain/Loss": 1.9823322296142578, "Pretrain/Loss (Raw)": 2.0704610347747803, "Pretrain/Step": 4328, "Pretrain/Step Time": 8.751059100031853} +{"Pretrain/Learning Rate": 2.9913161884733215e-05, "Pretrain/Loss": 1.9845197200775146, "Pretrain/Loss (Raw)": 1.852040410041809, "Pretrain/Step": 4329, "Pretrain/Step Time": 8.753190152347088} +{"Pretrain/Learning Rate": 2.9904837293562348e-05, "Pretrain/Loss": 1.9855296611785889, "Pretrain/Loss (Raw)": 2.136260509490967, "Pretrain/Step": 4330, "Pretrain/Step Time": 8.750306630507112} +{"Pretrain/Learning Rate": 2.989651213674254e-05, "Pretrain/Loss": 1.9857624769210815, "Pretrain/Loss (Raw)": 2.0232765674591064, "Pretrain/Step": 4331, "Pretrain/Step Time": 8.753645239397883} +{"Pretrain/Learning Rate": 2.988818641523387e-05, "Pretrain/Loss": 1.9854745864868164, "Pretrain/Loss (Raw)": 1.795115351676941, "Pretrain/Step": 4332, "Pretrain/Step Time": 8.755468936637044} +{"Pretrain/Learning Rate": 2.9879860129996517e-05, "Pretrain/Loss": 1.9828258752822876, "Pretrain/Loss (Raw)": 1.8454041481018066, "Pretrain/Step": 4333, "Pretrain/Step Time": 8.765298644080758} +{"Pretrain/Learning Rate": 2.9871533281990692e-05, "Pretrain/Loss": 1.9830436706542969, "Pretrain/Loss (Raw)": 2.0381853580474854, "Pretrain/Step": 4334, "Pretrain/Step Time": 8.76060733012855} +{"Pretrain/Learning Rate": 2.9863205872176703e-05, "Pretrain/Loss": 1.9814479351043701, "Pretrain/Loss (Raw)": 1.889509677886963, "Pretrain/Step": 4335, "Pretrain/Step Time": 8.771879078820348} +{"Pretrain/Learning Rate": 2.9854877901514884e-05, "Pretrain/Loss": 1.983016014099121, "Pretrain/Loss (Raw)": 1.955859899520874, "Pretrain/Step": 4336, "Pretrain/Step Time": 8.768483908846974} +{"Pretrain/Learning Rate": 2.9846549370965672e-05, "Pretrain/Loss": 1.982792615890503, "Pretrain/Loss (Raw)": 1.9900277853012085, "Pretrain/Step": 4337, "Pretrain/Step Time": 8.770398985594511} +{"Pretrain/Learning Rate": 2.9838220281489553e-05, "Pretrain/Loss": 1.9797465801239014, "Pretrain/Loss (Raw)": 1.6999510526657104, "Pretrain/Step": 4338, "Pretrain/Step Time": 8.761597147211432} +{"Pretrain/Learning Rate": 2.9829890634047068e-05, "Pretrain/Loss": 1.9829349517822266, "Pretrain/Loss (Raw)": 2.340222120285034, "Pretrain/Step": 4339, "Pretrain/Step Time": 8.758170047774911} +{"Pretrain/Learning Rate": 2.9821560429598844e-05, "Pretrain/Loss": 1.9832139015197754, "Pretrain/Loss (Raw)": 2.0659492015838623, "Pretrain/Step": 4340, "Pretrain/Step Time": 8.761124733835459} +{"Pretrain/Learning Rate": 2.9813229669105546e-05, "Pretrain/Loss": 1.9832251071929932, "Pretrain/Loss (Raw)": 2.0237085819244385, "Pretrain/Step": 4341, "Pretrain/Step Time": 8.757278544828296} +{"Pretrain/Learning Rate": 2.9804898353527928e-05, "Pretrain/Loss": 1.9839766025543213, "Pretrain/Loss (Raw)": 2.234358549118042, "Pretrain/Step": 4342, "Pretrain/Step Time": 8.754940258339047} +{"Pretrain/Learning Rate": 2.9796566483826777e-05, "Pretrain/Loss": 1.9841384887695312, "Pretrain/Loss (Raw)": 2.054560661315918, "Pretrain/Step": 4343, "Pretrain/Step Time": 8.759223628789186} +{"Pretrain/Learning Rate": 2.9788234060962988e-05, "Pretrain/Loss": 1.9873892068862915, "Pretrain/Loss (Raw)": 2.181879997253418, "Pretrain/Step": 4344, "Pretrain/Step Time": 8.76422412879765} +{"Pretrain/Learning Rate": 2.9779901085897478e-05, "Pretrain/Loss": 1.9876713752746582, "Pretrain/Loss (Raw)": 2.0034663677215576, "Pretrain/Step": 4345, "Pretrain/Step Time": 8.759763916954398} +{"Pretrain/Learning Rate": 2.9771567559591257e-05, "Pretrain/Loss": 1.9913088083267212, "Pretrain/Loss (Raw)": 2.1654465198516846, "Pretrain/Step": 4346, "Pretrain/Step Time": 8.7622115239501} +{"Pretrain/Learning Rate": 2.9763233483005383e-05, "Pretrain/Loss": 1.9953619241714478, "Pretrain/Loss (Raw)": 2.1322035789489746, "Pretrain/Step": 4347, "Pretrain/Step Time": 8.756713923066854} +{"Pretrain/Learning Rate": 2.975489885710097e-05, "Pretrain/Loss": 1.990039587020874, "Pretrain/Loss (Raw)": 1.4416812658309937, "Pretrain/Step": 4348, "Pretrain/Step Time": 8.76193132251501} +{"Pretrain/Learning Rate": 2.9746563682839225e-05, "Pretrain/Loss": 1.9928689002990723, "Pretrain/Loss (Raw)": 2.1535181999206543, "Pretrain/Step": 4349, "Pretrain/Step Time": 8.762860672548413} +{"Pretrain/Learning Rate": 2.9738227961181374e-05, "Pretrain/Loss": 1.996668815612793, "Pretrain/Loss (Raw)": 1.9123039245605469, "Pretrain/Step": 4350, "Pretrain/Step Time": 8.765246894210577} +{"Pretrain/Learning Rate": 2.972989169308876e-05, "Pretrain/Loss": 2.000467538833618, "Pretrain/Loss (Raw)": 2.215362787246704, "Pretrain/Step": 4351, "Pretrain/Step Time": 8.759029606357217} +{"Pretrain/Learning Rate": 2.9721554879522743e-05, "Pretrain/Loss": 1.9992671012878418, "Pretrain/Loss (Raw)": 1.9749516248703003, "Pretrain/Step": 4352, "Pretrain/Step Time": 8.765730660408735} +{"Pretrain/Learning Rate": 2.9713217521444774e-05, "Pretrain/Loss": 1.9989955425262451, "Pretrain/Loss (Raw)": 1.916656255722046, "Pretrain/Step": 4353, "Pretrain/Step Time": 8.752796271815896} +{"Pretrain/Learning Rate": 2.9704879619816346e-05, "Pretrain/Loss": 1.9969146251678467, "Pretrain/Loss (Raw)": 1.7630366086959839, "Pretrain/Step": 4354, "Pretrain/Step Time": 8.750849118456244} +{"Pretrain/Learning Rate": 2.969654117559903e-05, "Pretrain/Loss": 1.9982792139053345, "Pretrain/Loss (Raw)": 2.1464931964874268, "Pretrain/Step": 4355, "Pretrain/Step Time": 8.750769613310695} +{"Pretrain/Learning Rate": 2.9688202189754456e-05, "Pretrain/Loss": 1.9983837604522705, "Pretrain/Loss (Raw)": 2.0789060592651367, "Pretrain/Step": 4356, "Pretrain/Step Time": 8.749885940924287} +{"Pretrain/Learning Rate": 2.9679862663244317e-05, "Pretrain/Loss": 1.9990448951721191, "Pretrain/Loss (Raw)": 1.9399470090866089, "Pretrain/Step": 4357, "Pretrain/Step Time": 8.746826574206352} +{"Pretrain/Learning Rate": 2.9671522597030355e-05, "Pretrain/Loss": 1.9991604089736938, "Pretrain/Loss (Raw)": 2.000336170196533, "Pretrain/Step": 4358, "Pretrain/Step Time": 8.749145679175854} +{"Pretrain/Learning Rate": 2.9663181992074402e-05, "Pretrain/Loss": 2.001396656036377, "Pretrain/Loss (Raw)": 2.0630526542663574, "Pretrain/Step": 4359, "Pretrain/Step Time": 8.742510294541717} +{"Pretrain/Learning Rate": 2.9654840849338322e-05, "Pretrain/Loss": 2.0021023750305176, "Pretrain/Loss (Raw)": 1.848531723022461, "Pretrain/Step": 4360, "Pretrain/Step Time": 8.73781311698258} +{"Pretrain/Learning Rate": 2.964649916978407e-05, "Pretrain/Loss": 2.0006377696990967, "Pretrain/Loss (Raw)": 2.006913661956787, "Pretrain/Step": 4361, "Pretrain/Step Time": 8.740884212777019} +{"Pretrain/Learning Rate": 2.963815695437363e-05, "Pretrain/Loss": 1.9993232488632202, "Pretrain/Loss (Raw)": 2.0560896396636963, "Pretrain/Step": 4362, "Pretrain/Step Time": 8.743266750127077} +{"Pretrain/Learning Rate": 2.962981420406908e-05, "Pretrain/Loss": 1.9994919300079346, "Pretrain/Loss (Raw)": 1.8057414293289185, "Pretrain/Step": 4363, "Pretrain/Step Time": 8.742467567324638} +{"Pretrain/Learning Rate": 2.9621470919832538e-05, "Pretrain/Loss": 2.0007882118225098, "Pretrain/Loss (Raw)": 2.033684492111206, "Pretrain/Step": 4364, "Pretrain/Step Time": 8.73774280026555} +{"Pretrain/Learning Rate": 2.9613127102626187e-05, "Pretrain/Loss": 1.9995476007461548, "Pretrain/Loss (Raw)": 1.934902548789978, "Pretrain/Step": 4365, "Pretrain/Step Time": 8.744747525081038} +{"Pretrain/Learning Rate": 2.9604782753412292e-05, "Pretrain/Loss": 2.000293016433716, "Pretrain/Loss (Raw)": 1.9812287092208862, "Pretrain/Step": 4366, "Pretrain/Step Time": 8.728562882170081} +{"Pretrain/Learning Rate": 2.9596437873153137e-05, "Pretrain/Loss": 1.9996949434280396, "Pretrain/Loss (Raw)": 2.1223275661468506, "Pretrain/Step": 4367, "Pretrain/Step Time": 8.728702945634723} +{"Pretrain/Learning Rate": 2.9588092462811122e-05, "Pretrain/Loss": 1.9961376190185547, "Pretrain/Loss (Raw)": 1.7126514911651611, "Pretrain/Step": 4368, "Pretrain/Step Time": 8.729220371693373} +{"Pretrain/Learning Rate": 2.957974652334865e-05, "Pretrain/Loss": 1.996241807937622, "Pretrain/Loss (Raw)": 2.099574565887451, "Pretrain/Step": 4369, "Pretrain/Step Time": 8.727590590715408} +{"Pretrain/Learning Rate": 2.9571400055728242e-05, "Pretrain/Loss": 1.996311902999878, "Pretrain/Loss (Raw)": 1.9798665046691895, "Pretrain/Step": 4370, "Pretrain/Step Time": 8.726313628256321} +{"Pretrain/Learning Rate": 2.9563053060912426e-05, "Pretrain/Loss": 1.9950429201126099, "Pretrain/Loss (Raw)": 1.8387864828109741, "Pretrain/Step": 4371, "Pretrain/Step Time": 8.731122732162476} +{"Pretrain/Learning Rate": 2.9554705539863842e-05, "Pretrain/Loss": 1.9949666261672974, "Pretrain/Loss (Raw)": 1.5183521509170532, "Pretrain/Step": 4372, "Pretrain/Step Time": 8.728305729106069} +{"Pretrain/Learning Rate": 2.954635749354514e-05, "Pretrain/Loss": 1.9968030452728271, "Pretrain/Loss (Raw)": 1.9810634851455688, "Pretrain/Step": 4373, "Pretrain/Step Time": 8.722901253029704} +{"Pretrain/Learning Rate": 2.953800892291908e-05, "Pretrain/Loss": 1.9958339929580688, "Pretrain/Loss (Raw)": 2.0463476181030273, "Pretrain/Step": 4374, "Pretrain/Step Time": 8.724215026944876} +{"Pretrain/Learning Rate": 2.9529659828948442e-05, "Pretrain/Loss": 1.9948358535766602, "Pretrain/Loss (Raw)": 1.927564263343811, "Pretrain/Step": 4375, "Pretrain/Step Time": 8.727684957906604} +{"Pretrain/Learning Rate": 2.9521310212596087e-05, "Pretrain/Loss": 1.991723656654358, "Pretrain/Loss (Raw)": 1.836582064628601, "Pretrain/Step": 4376, "Pretrain/Step Time": 8.725939381867647} +{"Pretrain/Learning Rate": 2.951296007482493e-05, "Pretrain/Loss": 1.99241304397583, "Pretrain/Loss (Raw)": 2.1116766929626465, "Pretrain/Step": 4377, "Pretrain/Step Time": 8.73111037351191} +{"Pretrain/Learning Rate": 2.9504609416597956e-05, "Pretrain/Loss": 1.990368366241455, "Pretrain/Loss (Raw)": 1.8885871171951294, "Pretrain/Step": 4378, "Pretrain/Step Time": 8.726596139371395} +{"Pretrain/Learning Rate": 2.9496258238878198e-05, "Pretrain/Loss": 1.991141438484192, "Pretrain/Loss (Raw)": 2.076848268508911, "Pretrain/Step": 4379, "Pretrain/Step Time": 8.72746516764164} +{"Pretrain/Learning Rate": 2.9487906542628753e-05, "Pretrain/Loss": 1.9918110370635986, "Pretrain/Loss (Raw)": 1.9993385076522827, "Pretrain/Step": 4380, "Pretrain/Step Time": 8.731528578326106} +{"Pretrain/Learning Rate": 2.9479554328812775e-05, "Pretrain/Loss": 1.9900856018066406, "Pretrain/Loss (Raw)": 1.9497720003128052, "Pretrain/Step": 4381, "Pretrain/Step Time": 8.72729230299592} +{"Pretrain/Learning Rate": 2.9471201598393482e-05, "Pretrain/Loss": 1.9903535842895508, "Pretrain/Loss (Raw)": 2.04978346824646, "Pretrain/Step": 4382, "Pretrain/Step Time": 8.762691667303443} +{"Pretrain/Learning Rate": 2.946284835233416e-05, "Pretrain/Loss": 1.991978645324707, "Pretrain/Loss (Raw)": 2.048581123352051, "Pretrain/Step": 4383, "Pretrain/Step Time": 8.759803231805563} +{"Pretrain/Learning Rate": 2.945449459159813e-05, "Pretrain/Loss": 1.9927740097045898, "Pretrain/Loss (Raw)": 1.943537950515747, "Pretrain/Step": 4384, "Pretrain/Step Time": 8.761001603677869} +{"Pretrain/Learning Rate": 2.9446140317148795e-05, "Pretrain/Loss": 1.992121696472168, "Pretrain/Loss (Raw)": 2.020292043685913, "Pretrain/Step": 4385, "Pretrain/Step Time": 8.75988177023828} +{"Pretrain/Learning Rate": 2.9437785529949606e-05, "Pretrain/Loss": 1.993227481842041, "Pretrain/Loss (Raw)": 2.101498603820801, "Pretrain/Step": 4386, "Pretrain/Step Time": 8.758009046316147} +{"Pretrain/Learning Rate": 2.9429430230964084e-05, "Pretrain/Loss": 1.9935262203216553, "Pretrain/Loss (Raw)": 1.9269195795059204, "Pretrain/Step": 4387, "Pretrain/Step Time": 8.753480670973659} +{"Pretrain/Learning Rate": 2.9421074421155787e-05, "Pretrain/Loss": 1.991912603378296, "Pretrain/Loss (Raw)": 1.858783483505249, "Pretrain/Step": 4388, "Pretrain/Step Time": 8.757742950692773} +{"Pretrain/Learning Rate": 2.9412718101488364e-05, "Pretrain/Loss": 1.9933218955993652, "Pretrain/Loss (Raw)": 2.2638063430786133, "Pretrain/Step": 4389, "Pretrain/Step Time": 8.752573991194367} +{"Pretrain/Learning Rate": 2.9404361272925497e-05, "Pretrain/Loss": 1.9936187267303467, "Pretrain/Loss (Raw)": 2.081167697906494, "Pretrain/Step": 4390, "Pretrain/Step Time": 8.753647521138191} +{"Pretrain/Learning Rate": 2.939600393643092e-05, "Pretrain/Loss": 1.990621566772461, "Pretrain/Loss (Raw)": 2.0569612979888916, "Pretrain/Step": 4391, "Pretrain/Step Time": 8.75234591960907} +{"Pretrain/Learning Rate": 2.9387646092968468e-05, "Pretrain/Loss": 1.9902729988098145, "Pretrain/Loss (Raw)": 2.0827131271362305, "Pretrain/Step": 4392, "Pretrain/Step Time": 8.752588756382465} +{"Pretrain/Learning Rate": 2.9379287743501983e-05, "Pretrain/Loss": 1.9904080629348755, "Pretrain/Loss (Raw)": 1.9685956239700317, "Pretrain/Step": 4393, "Pretrain/Step Time": 8.749652948230505} +{"Pretrain/Learning Rate": 2.9370928888995407e-05, "Pretrain/Loss": 1.9904637336730957, "Pretrain/Loss (Raw)": 2.0317795276641846, "Pretrain/Step": 4394, "Pretrain/Step Time": 8.75183672644198} +{"Pretrain/Learning Rate": 2.936256953041271e-05, "Pretrain/Loss": 1.9867069721221924, "Pretrain/Loss (Raw)": 1.7987991571426392, "Pretrain/Step": 4395, "Pretrain/Step Time": 8.748662343248725} +{"Pretrain/Learning Rate": 2.935420966871795e-05, "Pretrain/Loss": 1.9878735542297363, "Pretrain/Loss (Raw)": 2.127592086791992, "Pretrain/Step": 4396, "Pretrain/Step Time": 8.74896671064198} +{"Pretrain/Learning Rate": 2.9345849304875195e-05, "Pretrain/Loss": 1.9878697395324707, "Pretrain/Loss (Raw)": 2.0057249069213867, "Pretrain/Step": 4397, "Pretrain/Step Time": 8.755243800580502} +{"Pretrain/Learning Rate": 2.9337488439848633e-05, "Pretrain/Loss": 1.986993432044983, "Pretrain/Loss (Raw)": 1.8374807834625244, "Pretrain/Step": 4398, "Pretrain/Step Time": 8.75283444300294} +{"Pretrain/Learning Rate": 2.9329127074602458e-05, "Pretrain/Loss": 1.9882311820983887, "Pretrain/Loss (Raw)": 1.9455583095550537, "Pretrain/Step": 4399, "Pretrain/Step Time": 8.748916909098625} +{"Pretrain/Learning Rate": 2.9320765210100952e-05, "Pretrain/Loss": 1.9868876934051514, "Pretrain/Loss (Raw)": 1.8363007307052612, "Pretrain/Step": 4400, "Pretrain/Step Time": 8.747357219457626} +{"Pretrain/Learning Rate": 2.931240284730844e-05, "Pretrain/Loss": 1.9835923910140991, "Pretrain/Loss (Raw)": 1.7168231010437012, "Pretrain/Step": 4401, "Pretrain/Step Time": 8.7476872112602} +{"Pretrain/Learning Rate": 2.9304039987189313e-05, "Pretrain/Loss": 1.9821031093597412, "Pretrain/Loss (Raw)": 1.8642771244049072, "Pretrain/Step": 4402, "Pretrain/Step Time": 8.74017545953393} +{"Pretrain/Learning Rate": 2.9295676630708013e-05, "Pretrain/Loss": 1.9803149700164795, "Pretrain/Loss (Raw)": 1.801479697227478, "Pretrain/Step": 4403, "Pretrain/Step Time": 8.74719494022429} +{"Pretrain/Learning Rate": 2.9287312778829047e-05, "Pretrain/Loss": 1.9802806377410889, "Pretrain/Loss (Raw)": 2.0972766876220703, "Pretrain/Step": 4404, "Pretrain/Step Time": 8.743891252204776} +{"Pretrain/Learning Rate": 2.9278948432516968e-05, "Pretrain/Loss": 1.9821679592132568, "Pretrain/Loss (Raw)": 1.9537450075149536, "Pretrain/Step": 4405, "Pretrain/Step Time": 8.742365999147296} +{"Pretrain/Learning Rate": 2.9270583592736385e-05, "Pretrain/Loss": 1.9800193309783936, "Pretrain/Loss (Raw)": 1.7777180671691895, "Pretrain/Step": 4406, "Pretrain/Step Time": 8.794908490031958} +{"Pretrain/Learning Rate": 2.9262218260451984e-05, "Pretrain/Loss": 1.9804909229278564, "Pretrain/Loss (Raw)": 2.099031686782837, "Pretrain/Step": 4407, "Pretrain/Step Time": 8.793656453490257} +{"Pretrain/Learning Rate": 2.9253852436628483e-05, "Pretrain/Loss": 1.983525276184082, "Pretrain/Loss (Raw)": 2.313788652420044, "Pretrain/Step": 4408, "Pretrain/Step Time": 8.795668363571167} +{"Pretrain/Learning Rate": 2.924548612223068e-05, "Pretrain/Loss": 1.9811688661575317, "Pretrain/Loss (Raw)": 1.9772621393203735, "Pretrain/Step": 4409, "Pretrain/Step Time": 8.79453738592565} +{"Pretrain/Learning Rate": 2.923711931822341e-05, "Pretrain/Loss": 1.980515718460083, "Pretrain/Loss (Raw)": 1.8315541744232178, "Pretrain/Step": 4410, "Pretrain/Step Time": 8.79686519689858} +{"Pretrain/Learning Rate": 2.9228752025571575e-05, "Pretrain/Loss": 1.979340672492981, "Pretrain/Loss (Raw)": 2.088618040084839, "Pretrain/Step": 4411, "Pretrain/Step Time": 8.801185144111514} +{"Pretrain/Learning Rate": 2.922038424524013e-05, "Pretrain/Loss": 1.9799755811691284, "Pretrain/Loss (Raw)": 2.100297451019287, "Pretrain/Step": 4412, "Pretrain/Step Time": 8.803267719224095} +{"Pretrain/Learning Rate": 2.9212015978194083e-05, "Pretrain/Loss": 1.9806432723999023, "Pretrain/Loss (Raw)": 2.239694118499756, "Pretrain/Step": 4413, "Pretrain/Step Time": 8.802364530041814} +{"Pretrain/Learning Rate": 2.920364722539851e-05, "Pretrain/Loss": 1.9802396297454834, "Pretrain/Loss (Raw)": 1.9839050769805908, "Pretrain/Step": 4414, "Pretrain/Step Time": 8.80321853235364} +{"Pretrain/Learning Rate": 2.9195277987818533e-05, "Pretrain/Loss": 1.9802398681640625, "Pretrain/Loss (Raw)": 2.0528368949890137, "Pretrain/Step": 4415, "Pretrain/Step Time": 8.802027154713869} +{"Pretrain/Learning Rate": 2.918690826641932e-05, "Pretrain/Loss": 1.9777944087982178, "Pretrain/Loss (Raw)": 1.8289207220077515, "Pretrain/Step": 4416, "Pretrain/Step Time": 8.798369478434324} +{"Pretrain/Learning Rate": 2.917853806216613e-05, "Pretrain/Loss": 1.9793672561645508, "Pretrain/Loss (Raw)": 2.064110040664673, "Pretrain/Step": 4417, "Pretrain/Step Time": 8.794331980869174} +{"Pretrain/Learning Rate": 2.9170167376024228e-05, "Pretrain/Loss": 1.9789425134658813, "Pretrain/Loss (Raw)": 1.9428930282592773, "Pretrain/Step": 4418, "Pretrain/Step Time": 8.795403521507978} +{"Pretrain/Learning Rate": 2.9161796208958974e-05, "Pretrain/Loss": 1.9778151512145996, "Pretrain/Loss (Raw)": 1.8371080160140991, "Pretrain/Step": 4419, "Pretrain/Step Time": 8.795385409146547} +{"Pretrain/Learning Rate": 2.9153424561935782e-05, "Pretrain/Loss": 1.9783220291137695, "Pretrain/Loss (Raw)": 2.0052318572998047, "Pretrain/Step": 4420, "Pretrain/Step Time": 8.794018890708685} +{"Pretrain/Learning Rate": 2.914505243592009e-05, "Pretrain/Loss": 1.9788479804992676, "Pretrain/Loss (Raw)": 2.017148733139038, "Pretrain/Step": 4421, "Pretrain/Step Time": 8.792906308546662} +{"Pretrain/Learning Rate": 2.913667983187742e-05, "Pretrain/Loss": 1.979682445526123, "Pretrain/Loss (Raw)": 2.0774309635162354, "Pretrain/Step": 4422, "Pretrain/Step Time": 8.79749834164977} +{"Pretrain/Learning Rate": 2.9128306750773338e-05, "Pretrain/Loss": 1.9817005395889282, "Pretrain/Loss (Raw)": 2.069883346557617, "Pretrain/Step": 4423, "Pretrain/Step Time": 8.799980353564024} +{"Pretrain/Learning Rate": 2.911993319357347e-05, "Pretrain/Loss": 1.98115873336792, "Pretrain/Loss (Raw)": 1.8925954103469849, "Pretrain/Step": 4424, "Pretrain/Step Time": 8.798617688938975} +{"Pretrain/Learning Rate": 2.911155916124349e-05, "Pretrain/Loss": 1.9806709289550781, "Pretrain/Loss (Raw)": 1.986915111541748, "Pretrain/Step": 4425, "Pretrain/Step Time": 8.80377389676869} +{"Pretrain/Learning Rate": 2.910318465474914e-05, "Pretrain/Loss": 1.9787209033966064, "Pretrain/Loss (Raw)": 1.9334157705307007, "Pretrain/Step": 4426, "Pretrain/Step Time": 8.799743965268135} +{"Pretrain/Learning Rate": 2.9094809675056188e-05, "Pretrain/Loss": 1.977271318435669, "Pretrain/Loss (Raw)": 1.9161341190338135, "Pretrain/Step": 4427, "Pretrain/Step Time": 8.799835413694382} +{"Pretrain/Learning Rate": 2.9086434223130504e-05, "Pretrain/Loss": 1.976799488067627, "Pretrain/Loss (Raw)": 1.975819706916809, "Pretrain/Step": 4428, "Pretrain/Step Time": 8.79696180485189} +{"Pretrain/Learning Rate": 2.9078058299937962e-05, "Pretrain/Loss": 1.97421395778656, "Pretrain/Loss (Raw)": 1.8179353475570679, "Pretrain/Step": 4429, "Pretrain/Step Time": 8.801965083926916} +{"Pretrain/Learning Rate": 2.9069681906444518e-05, "Pretrain/Loss": 1.9737248420715332, "Pretrain/Loss (Raw)": 1.8901653289794922, "Pretrain/Step": 4430, "Pretrain/Step Time": 8.799489252269268} +{"Pretrain/Learning Rate": 2.906130504361619e-05, "Pretrain/Loss": 1.9726061820983887, "Pretrain/Loss (Raw)": 1.8072983026504517, "Pretrain/Step": 4431, "Pretrain/Step Time": 8.80116306245327} +{"Pretrain/Learning Rate": 2.9052927712419013e-05, "Pretrain/Loss": 1.9716534614562988, "Pretrain/Loss (Raw)": 2.018965244293213, "Pretrain/Step": 4432, "Pretrain/Step Time": 8.79755343310535} +{"Pretrain/Learning Rate": 2.9044549913819124e-05, "Pretrain/Loss": 1.9732797145843506, "Pretrain/Loss (Raw)": 2.133526563644409, "Pretrain/Step": 4433, "Pretrain/Step Time": 8.790580982342362} +{"Pretrain/Learning Rate": 2.9036171648782672e-05, "Pretrain/Loss": 1.9754513502120972, "Pretrain/Loss (Raw)": 2.0823397636413574, "Pretrain/Step": 4434, "Pretrain/Step Time": 8.791053647175431} +{"Pretrain/Learning Rate": 2.9027792918275894e-05, "Pretrain/Loss": 1.9741718769073486, "Pretrain/Loss (Raw)": 1.6992405652999878, "Pretrain/Step": 4435, "Pretrain/Step Time": 8.790557121858} +{"Pretrain/Learning Rate": 2.9019413723265053e-05, "Pretrain/Loss": 1.973085880279541, "Pretrain/Loss (Raw)": 1.769202709197998, "Pretrain/Step": 4436, "Pretrain/Step Time": 8.79225991666317} +{"Pretrain/Learning Rate": 2.9011034064716485e-05, "Pretrain/Loss": 1.9733256101608276, "Pretrain/Loss (Raw)": 1.8333996534347534, "Pretrain/Step": 4437, "Pretrain/Step Time": 8.797620795667171} +{"Pretrain/Learning Rate": 2.9002653943596564e-05, "Pretrain/Loss": 1.9740296602249146, "Pretrain/Loss (Raw)": 2.035444974899292, "Pretrain/Step": 4438, "Pretrain/Step Time": 8.792882641777396} +{"Pretrain/Learning Rate": 2.8994273360871734e-05, "Pretrain/Loss": 1.973722219467163, "Pretrain/Loss (Raw)": 2.0709190368652344, "Pretrain/Step": 4439, "Pretrain/Step Time": 8.796761132776737} +{"Pretrain/Learning Rate": 2.898589231750847e-05, "Pretrain/Loss": 1.974382996559143, "Pretrain/Loss (Raw)": 2.0853919982910156, "Pretrain/Step": 4440, "Pretrain/Step Time": 8.799694212153554} +{"Pretrain/Learning Rate": 2.897751081447333e-05, "Pretrain/Loss": 1.9747405052185059, "Pretrain/Loss (Raw)": 2.1189606189727783, "Pretrain/Step": 4441, "Pretrain/Step Time": 8.797317462041974} +{"Pretrain/Learning Rate": 2.8969128852732896e-05, "Pretrain/Loss": 1.977205753326416, "Pretrain/Loss (Raw)": 2.229860305786133, "Pretrain/Step": 4442, "Pretrain/Step Time": 8.801215093582869} +{"Pretrain/Learning Rate": 2.896074643325382e-05, "Pretrain/Loss": 1.9795961380004883, "Pretrain/Loss (Raw)": 1.8875229358673096, "Pretrain/Step": 4443, "Pretrain/Step Time": 8.798561664298177} +{"Pretrain/Learning Rate": 2.8952363557002798e-05, "Pretrain/Loss": 1.978790044784546, "Pretrain/Loss (Raw)": 2.1475939750671387, "Pretrain/Step": 4444, "Pretrain/Step Time": 8.797784609720111} +{"Pretrain/Learning Rate": 2.89439802249466e-05, "Pretrain/Loss": 1.9756436347961426, "Pretrain/Loss (Raw)": 1.6413003206253052, "Pretrain/Step": 4445, "Pretrain/Step Time": 8.804615516215563} +{"Pretrain/Learning Rate": 2.8935596438052003e-05, "Pretrain/Loss": 1.9749114513397217, "Pretrain/Loss (Raw)": 2.016613006591797, "Pretrain/Step": 4446, "Pretrain/Step Time": 8.805209824815392} +{"Pretrain/Learning Rate": 2.8927212197285885e-05, "Pretrain/Loss": 1.9728338718414307, "Pretrain/Loss (Raw)": 1.684415578842163, "Pretrain/Step": 4447, "Pretrain/Step Time": 8.802377911284566} +{"Pretrain/Learning Rate": 2.8918827503615154e-05, "Pretrain/Loss": 1.9738383293151855, "Pretrain/Loss (Raw)": 1.9420164823532104, "Pretrain/Step": 4448, "Pretrain/Step Time": 8.80052281357348} +{"Pretrain/Learning Rate": 2.891044235800676e-05, "Pretrain/Loss": 1.9740850925445557, "Pretrain/Loss (Raw)": 2.047534704208374, "Pretrain/Step": 4449, "Pretrain/Step Time": 8.797907307744026} +{"Pretrain/Learning Rate": 2.8902056761427744e-05, "Pretrain/Loss": 1.9751746654510498, "Pretrain/Loss (Raw)": 1.9771100282669067, "Pretrain/Step": 4450, "Pretrain/Step Time": 8.787376180291176} +{"Pretrain/Learning Rate": 2.889367071484514e-05, "Pretrain/Loss": 1.9732253551483154, "Pretrain/Loss (Raw)": 1.7590214014053345, "Pretrain/Step": 4451, "Pretrain/Step Time": 8.78770344890654} +{"Pretrain/Learning Rate": 2.888528421922608e-05, "Pretrain/Loss": 1.9754936695098877, "Pretrain/Loss (Raw)": 2.1217732429504395, "Pretrain/Step": 4452, "Pretrain/Step Time": 8.790062177926302} +{"Pretrain/Learning Rate": 2.8876897275537744e-05, "Pretrain/Loss": 1.9770232439041138, "Pretrain/Loss (Raw)": 2.056112766265869, "Pretrain/Step": 4453, "Pretrain/Step Time": 8.785205477848649} +{"Pretrain/Learning Rate": 2.8868509884747348e-05, "Pretrain/Loss": 1.9758996963500977, "Pretrain/Loss (Raw)": 2.076080799102783, "Pretrain/Step": 4454, "Pretrain/Step Time": 8.788926977664232} +{"Pretrain/Learning Rate": 2.8860122047822154e-05, "Pretrain/Loss": 1.9780031442642212, "Pretrain/Loss (Raw)": 1.9422942399978638, "Pretrain/Step": 4455, "Pretrain/Step Time": 8.792111773043871} +{"Pretrain/Learning Rate": 2.88517337657295e-05, "Pretrain/Loss": 1.9784635305404663, "Pretrain/Loss (Raw)": 2.129396915435791, "Pretrain/Step": 4456, "Pretrain/Step Time": 8.789089247584343} +{"Pretrain/Learning Rate": 2.8843345039436758e-05, "Pretrain/Loss": 1.978137493133545, "Pretrain/Loss (Raw)": 1.810316801071167, "Pretrain/Step": 4457, "Pretrain/Step Time": 8.792164612561464} +{"Pretrain/Learning Rate": 2.8834955869911356e-05, "Pretrain/Loss": 1.978724718093872, "Pretrain/Loss (Raw)": 2.2114200592041016, "Pretrain/Step": 4458, "Pretrain/Step Time": 8.795865722000599} +{"Pretrain/Learning Rate": 2.8826566258120768e-05, "Pretrain/Loss": 1.980078935623169, "Pretrain/Loss (Raw)": 2.19661021232605, "Pretrain/Step": 4459, "Pretrain/Step Time": 8.799314023926854} +{"Pretrain/Learning Rate": 2.8818176205032533e-05, "Pretrain/Loss": 1.9810194969177246, "Pretrain/Loss (Raw)": 1.915515422821045, "Pretrain/Step": 4460, "Pretrain/Step Time": 8.797929460182786} +{"Pretrain/Learning Rate": 2.8809785711614228e-05, "Pretrain/Loss": 1.9824976921081543, "Pretrain/Loss (Raw)": 2.034623384475708, "Pretrain/Step": 4461, "Pretrain/Step Time": 8.792393397539854} +{"Pretrain/Learning Rate": 2.8801394778833475e-05, "Pretrain/Loss": 1.9825167655944824, "Pretrain/Loss (Raw)": 2.0406055450439453, "Pretrain/Step": 4462, "Pretrain/Step Time": 8.796559643000364} +{"Pretrain/Learning Rate": 2.879300340765797e-05, "Pretrain/Loss": 1.9834414720535278, "Pretrain/Loss (Raw)": 2.0078749656677246, "Pretrain/Step": 4463, "Pretrain/Step Time": 8.785525623708963} +{"Pretrain/Learning Rate": 2.8784611599055435e-05, "Pretrain/Loss": 1.9837099313735962, "Pretrain/Loss (Raw)": 1.9902312755584717, "Pretrain/Step": 4464, "Pretrain/Step Time": 8.783318040892482} +{"Pretrain/Learning Rate": 2.8776219353993662e-05, "Pretrain/Loss": 1.9843782186508179, "Pretrain/Loss (Raw)": 2.075561046600342, "Pretrain/Step": 4465, "Pretrain/Step Time": 8.78573533706367} +{"Pretrain/Learning Rate": 2.8767826673440467e-05, "Pretrain/Loss": 1.9845682382583618, "Pretrain/Loss (Raw)": 1.7242767810821533, "Pretrain/Step": 4466, "Pretrain/Step Time": 8.783506974577904} +{"Pretrain/Learning Rate": 2.8759433558363758e-05, "Pretrain/Loss": 1.9819087982177734, "Pretrain/Loss (Raw)": 1.9998130798339844, "Pretrain/Step": 4467, "Pretrain/Step Time": 8.786637213081121} +{"Pretrain/Learning Rate": 2.875104000973145e-05, "Pretrain/Loss": 1.9822211265563965, "Pretrain/Loss (Raw)": 2.105935573577881, "Pretrain/Step": 4468, "Pretrain/Step Time": 8.787510694935918} +{"Pretrain/Learning Rate": 2.874264602851154e-05, "Pretrain/Loss": 1.9829903841018677, "Pretrain/Loss (Raw)": 2.1221654415130615, "Pretrain/Step": 4469, "Pretrain/Step Time": 8.7831424549222} +{"Pretrain/Learning Rate": 2.8734251615672043e-05, "Pretrain/Loss": 1.9816919565200806, "Pretrain/Loss (Raw)": 2.0681636333465576, "Pretrain/Step": 4470, "Pretrain/Step Time": 8.790749909356236} +{"Pretrain/Learning Rate": 2.8725856772181058e-05, "Pretrain/Loss": 1.9793691635131836, "Pretrain/Loss (Raw)": 1.7572416067123413, "Pretrain/Step": 4471, "Pretrain/Step Time": 8.79096301086247} +{"Pretrain/Learning Rate": 2.8717461499006714e-05, "Pretrain/Loss": 1.9782383441925049, "Pretrain/Loss (Raw)": 2.037127733230591, "Pretrain/Step": 4472, "Pretrain/Step Time": 8.783873537555337} +{"Pretrain/Learning Rate": 2.8709065797117198e-05, "Pretrain/Loss": 1.977880835533142, "Pretrain/Loss (Raw)": 1.9577018022537231, "Pretrain/Step": 4473, "Pretrain/Step Time": 8.785105494782329} +{"Pretrain/Learning Rate": 2.8700669667480732e-05, "Pretrain/Loss": 1.9752631187438965, "Pretrain/Loss (Raw)": 1.830394983291626, "Pretrain/Step": 4474, "Pretrain/Step Time": 8.78424072638154} +{"Pretrain/Learning Rate": 2.86922731110656e-05, "Pretrain/Loss": 1.974963665008545, "Pretrain/Loss (Raw)": 2.0938568115234375, "Pretrain/Step": 4475, "Pretrain/Step Time": 8.784034280106425} +{"Pretrain/Learning Rate": 2.8683876128840138e-05, "Pretrain/Loss": 1.9789130687713623, "Pretrain/Loss (Raw)": 1.9472109079360962, "Pretrain/Step": 4476, "Pretrain/Step Time": 8.787171831354499} +{"Pretrain/Learning Rate": 2.8675478721772715e-05, "Pretrain/Loss": 1.977677583694458, "Pretrain/Loss (Raw)": 1.9953876733779907, "Pretrain/Step": 4477, "Pretrain/Step Time": 8.785397252067924} +{"Pretrain/Learning Rate": 2.866708089083177e-05, "Pretrain/Loss": 1.979645013809204, "Pretrain/Loss (Raw)": 2.1641287803649902, "Pretrain/Step": 4478, "Pretrain/Step Time": 8.783422488719225} +{"Pretrain/Learning Rate": 2.865868263698578e-05, "Pretrain/Loss": 1.978317379951477, "Pretrain/Loss (Raw)": 2.0454277992248535, "Pretrain/Step": 4479, "Pretrain/Step Time": 8.786087391898036} +{"Pretrain/Learning Rate": 2.8650283961203267e-05, "Pretrain/Loss": 1.9782683849334717, "Pretrain/Loss (Raw)": 1.968672275543213, "Pretrain/Step": 4480, "Pretrain/Step Time": 8.78118728660047} +{"Pretrain/Learning Rate": 2.86418848644528e-05, "Pretrain/Loss": 1.9797229766845703, "Pretrain/Loss (Raw)": 2.1028382778167725, "Pretrain/Step": 4481, "Pretrain/Step Time": 8.780303813517094} +{"Pretrain/Learning Rate": 2.8633485347703015e-05, "Pretrain/Loss": 1.9824395179748535, "Pretrain/Loss (Raw)": 2.110748052597046, "Pretrain/Step": 4482, "Pretrain/Step Time": 8.781284727156162} +{"Pretrain/Learning Rate": 2.8625085411922575e-05, "Pretrain/Loss": 1.9813566207885742, "Pretrain/Loss (Raw)": 2.0078980922698975, "Pretrain/Step": 4483, "Pretrain/Step Time": 8.784749813377857} +{"Pretrain/Learning Rate": 2.861668505808021e-05, "Pretrain/Loss": 1.9816206693649292, "Pretrain/Loss (Raw)": 2.1127023696899414, "Pretrain/Step": 4484, "Pretrain/Step Time": 8.79364661872387} +{"Pretrain/Learning Rate": 2.8608284287144675e-05, "Pretrain/Loss": 1.9815593957901, "Pretrain/Loss (Raw)": 1.9321054220199585, "Pretrain/Step": 4485, "Pretrain/Step Time": 8.791508799418807} +{"Pretrain/Learning Rate": 2.85998831000848e-05, "Pretrain/Loss": 1.9826604127883911, "Pretrain/Loss (Raw)": 2.1412649154663086, "Pretrain/Step": 4486, "Pretrain/Step Time": 8.795171609148383} +{"Pretrain/Learning Rate": 2.8591481497869433e-05, "Pretrain/Loss": 1.9824039936065674, "Pretrain/Loss (Raw)": 2.0302376747131348, "Pretrain/Step": 4487, "Pretrain/Step Time": 8.79469738341868} +{"Pretrain/Learning Rate": 2.8583079481467507e-05, "Pretrain/Loss": 1.9851248264312744, "Pretrain/Loss (Raw)": 2.196796417236328, "Pretrain/Step": 4488, "Pretrain/Step Time": 8.793556926771998} +{"Pretrain/Learning Rate": 2.857467705184797e-05, "Pretrain/Loss": 1.9834134578704834, "Pretrain/Loss (Raw)": 1.7878468036651611, "Pretrain/Step": 4489, "Pretrain/Step Time": 8.79104970023036} +{"Pretrain/Learning Rate": 2.856627420997982e-05, "Pretrain/Loss": 1.984048843383789, "Pretrain/Loss (Raw)": 2.1374220848083496, "Pretrain/Step": 4490, "Pretrain/Step Time": 8.791947176679969} +{"Pretrain/Learning Rate": 2.8557870956832132e-05, "Pretrain/Loss": 1.986072063446045, "Pretrain/Loss (Raw)": 2.06471586227417, "Pretrain/Step": 4491, "Pretrain/Step Time": 8.788235124200583} +{"Pretrain/Learning Rate": 2.8549467293374e-05, "Pretrain/Loss": 1.9860053062438965, "Pretrain/Loss (Raw)": 2.025141477584839, "Pretrain/Step": 4492, "Pretrain/Step Time": 8.79820260964334} +{"Pretrain/Learning Rate": 2.854106322057457e-05, "Pretrain/Loss": 1.9874272346496582, "Pretrain/Loss (Raw)": 2.116917848587036, "Pretrain/Step": 4493, "Pretrain/Step Time": 8.791348673403263} +{"Pretrain/Learning Rate": 2.8532658739403046e-05, "Pretrain/Loss": 1.9866526126861572, "Pretrain/Loss (Raw)": 1.8820652961730957, "Pretrain/Step": 4494, "Pretrain/Step Time": 8.792682250961661} +{"Pretrain/Learning Rate": 2.852425385082867e-05, "Pretrain/Loss": 1.9854490756988525, "Pretrain/Loss (Raw)": 1.9682916402816772, "Pretrain/Step": 4495, "Pretrain/Step Time": 8.791432010009885} +{"Pretrain/Learning Rate": 2.851584855582073e-05, "Pretrain/Loss": 1.9853429794311523, "Pretrain/Loss (Raw)": 1.6990588903427124, "Pretrain/Step": 4496, "Pretrain/Step Time": 8.788089459761977} +{"Pretrain/Learning Rate": 2.8507442855348577e-05, "Pretrain/Loss": 1.9860647916793823, "Pretrain/Loss (Raw)": 2.19195556640625, "Pretrain/Step": 4497, "Pretrain/Step Time": 8.786823054775596} +{"Pretrain/Learning Rate": 2.8499036750381576e-05, "Pretrain/Loss": 1.9849603176116943, "Pretrain/Loss (Raw)": 1.838494062423706, "Pretrain/Step": 4498, "Pretrain/Step Time": 8.797019125893712} +{"Pretrain/Learning Rate": 2.849063024188917e-05, "Pretrain/Loss": 1.985832929611206, "Pretrain/Loss (Raw)": 1.950485348701477, "Pretrain/Step": 4499, "Pretrain/Step Time": 8.790853802114725} +{"Pretrain/Learning Rate": 2.8482223330840836e-05, "Pretrain/Loss": 1.9907751083374023, "Pretrain/Loss (Raw)": 2.15094256401062, "Pretrain/Step": 4500, "Pretrain/Step Time": 8.790444411337376} +{"Pretrain/Learning Rate": 2.84738160182061e-05, "Pretrain/Loss": 1.9906272888183594, "Pretrain/Loss (Raw)": 1.962156057357788, "Pretrain/Step": 4501, "Pretrain/Step Time": 8.79264771193266} +{"Pretrain/Learning Rate": 2.8465408304954533e-05, "Pretrain/Loss": 1.9921094179153442, "Pretrain/Loss (Raw)": 2.2360453605651855, "Pretrain/Step": 4502, "Pretrain/Step Time": 8.797795306891203} +{"Pretrain/Learning Rate": 2.8457000192055748e-05, "Pretrain/Loss": 1.9924064874649048, "Pretrain/Loss (Raw)": 1.9656093120574951, "Pretrain/Step": 4503, "Pretrain/Step Time": 8.79654062539339} +{"Pretrain/Learning Rate": 2.8448591680479415e-05, "Pretrain/Loss": 1.9942805767059326, "Pretrain/Loss (Raw)": 2.076455593109131, "Pretrain/Step": 4504, "Pretrain/Step Time": 8.795668372884393} +{"Pretrain/Learning Rate": 2.8440182771195235e-05, "Pretrain/Loss": 1.991091251373291, "Pretrain/Loss (Raw)": 1.703452229499817, "Pretrain/Step": 4505, "Pretrain/Step Time": 8.79291277192533} +{"Pretrain/Learning Rate": 2.8431773465172972e-05, "Pretrain/Loss": 1.9929715394973755, "Pretrain/Loss (Raw)": 2.1292457580566406, "Pretrain/Step": 4506, "Pretrain/Step Time": 8.792734218761325} +{"Pretrain/Learning Rate": 2.8423363763382415e-05, "Pretrain/Loss": 1.9923681020736694, "Pretrain/Loss (Raw)": 1.9996224641799927, "Pretrain/Step": 4507, "Pretrain/Step Time": 8.802169717848301} +{"Pretrain/Learning Rate": 2.8414953666793426e-05, "Pretrain/Loss": 1.9928414821624756, "Pretrain/Loss (Raw)": 2.059926986694336, "Pretrain/Step": 4508, "Pretrain/Step Time": 8.796600243076682} +{"Pretrain/Learning Rate": 2.8406543176375882e-05, "Pretrain/Loss": 1.9929698705673218, "Pretrain/Loss (Raw)": 1.9662114381790161, "Pretrain/Step": 4509, "Pretrain/Step Time": 8.794149653986096} +{"Pretrain/Learning Rate": 2.839813229309973e-05, "Pretrain/Loss": 1.9939180612564087, "Pretrain/Loss (Raw)": 2.1711337566375732, "Pretrain/Step": 4510, "Pretrain/Step Time": 8.765588680282235} +{"Pretrain/Learning Rate": 2.8389721017934945e-05, "Pretrain/Loss": 1.991486668586731, "Pretrain/Loss (Raw)": 1.7373863458633423, "Pretrain/Step": 4511, "Pretrain/Step Time": 8.767704386264086} +{"Pretrain/Learning Rate": 2.8381309351851564e-05, "Pretrain/Loss": 1.9919781684875488, "Pretrain/Loss (Raw)": 2.006443977355957, "Pretrain/Step": 4512, "Pretrain/Step Time": 8.764412067830563} +{"Pretrain/Learning Rate": 2.837289729581965e-05, "Pretrain/Loss": 1.9931788444519043, "Pretrain/Loss (Raw)": 2.173969268798828, "Pretrain/Step": 4513, "Pretrain/Step Time": 8.769609374925494} +{"Pretrain/Learning Rate": 2.8364484850809337e-05, "Pretrain/Loss": 1.9923871755599976, "Pretrain/Loss (Raw)": 2.0001654624938965, "Pretrain/Step": 4514, "Pretrain/Step Time": 8.776110673323274} +{"Pretrain/Learning Rate": 2.835607201779077e-05, "Pretrain/Loss": 1.9910316467285156, "Pretrain/Loss (Raw)": 1.7534043788909912, "Pretrain/Step": 4515, "Pretrain/Step Time": 8.77691126614809} +{"Pretrain/Learning Rate": 2.834765879773416e-05, "Pretrain/Loss": 1.992997407913208, "Pretrain/Loss (Raw)": 2.1104276180267334, "Pretrain/Step": 4516, "Pretrain/Step Time": 8.772634221240878} +{"Pretrain/Learning Rate": 2.833924519160977e-05, "Pretrain/Loss": 1.9892483949661255, "Pretrain/Loss (Raw)": 1.7839218378067017, "Pretrain/Step": 4517, "Pretrain/Step Time": 8.778375554829836} +{"Pretrain/Learning Rate": 2.8330831200387885e-05, "Pretrain/Loss": 1.9883853197097778, "Pretrain/Loss (Raw)": 1.970683217048645, "Pretrain/Step": 4518, "Pretrain/Step Time": 8.778202384710312} +{"Pretrain/Learning Rate": 2.8322416825038855e-05, "Pretrain/Loss": 1.9882924556732178, "Pretrain/Loss (Raw)": 2.045090436935425, "Pretrain/Step": 4519, "Pretrain/Step Time": 8.784013396129012} +{"Pretrain/Learning Rate": 2.831400206653305e-05, "Pretrain/Loss": 1.988232135772705, "Pretrain/Loss (Raw)": 2.0749762058258057, "Pretrain/Step": 4520, "Pretrain/Step Time": 8.779838997870684} +{"Pretrain/Learning Rate": 2.830558692584092e-05, "Pretrain/Loss": 1.9896106719970703, "Pretrain/Loss (Raw)": 2.14506196975708, "Pretrain/Step": 4521, "Pretrain/Step Time": 8.784168591722846} +{"Pretrain/Learning Rate": 2.8297171403932928e-05, "Pretrain/Loss": 1.9874366521835327, "Pretrain/Loss (Raw)": 1.7534939050674438, "Pretrain/Step": 4522, "Pretrain/Step Time": 8.785967575386167} +{"Pretrain/Learning Rate": 2.8288755501779597e-05, "Pretrain/Loss": 1.9876431226730347, "Pretrain/Loss (Raw)": 1.8252453804016113, "Pretrain/Step": 4523, "Pretrain/Step Time": 8.78426731005311} +{"Pretrain/Learning Rate": 2.8280339220351475e-05, "Pretrain/Loss": 1.9864546060562134, "Pretrain/Loss (Raw)": 1.9754530191421509, "Pretrain/Step": 4524, "Pretrain/Step Time": 8.784662671387196} +{"Pretrain/Learning Rate": 2.8271922560619184e-05, "Pretrain/Loss": 1.987120509147644, "Pretrain/Loss (Raw)": 2.0909583568573, "Pretrain/Step": 4525, "Pretrain/Step Time": 8.781248960644007} +{"Pretrain/Learning Rate": 2.8263505523553357e-05, "Pretrain/Loss": 1.9892995357513428, "Pretrain/Loss (Raw)": 2.1163768768310547, "Pretrain/Step": 4526, "Pretrain/Step Time": 8.778928514569998} +{"Pretrain/Learning Rate": 2.8255088110124705e-05, "Pretrain/Loss": 1.9905441999435425, "Pretrain/Loss (Raw)": 2.10490083694458, "Pretrain/Step": 4527, "Pretrain/Step Time": 8.782011007890105} +{"Pretrain/Learning Rate": 2.8246670321303947e-05, "Pretrain/Loss": 1.9926416873931885, "Pretrain/Loss (Raw)": 2.1047778129577637, "Pretrain/Step": 4528, "Pretrain/Step Time": 8.780371295288205} +{"Pretrain/Learning Rate": 2.8238252158061873e-05, "Pretrain/Loss": 1.9966641664505005, "Pretrain/Loss (Raw)": 2.2316887378692627, "Pretrain/Step": 4529, "Pretrain/Step Time": 8.779852245002985} +{"Pretrain/Learning Rate": 2.8229833621369295e-05, "Pretrain/Loss": 1.9992313385009766, "Pretrain/Loss (Raw)": 2.1928927898406982, "Pretrain/Step": 4530, "Pretrain/Step Time": 8.789532927796245} +{"Pretrain/Learning Rate": 2.822141471219709e-05, "Pretrain/Loss": 2.0002810955047607, "Pretrain/Loss (Raw)": 1.9358408451080322, "Pretrain/Step": 4531, "Pretrain/Step Time": 8.78012197650969} +{"Pretrain/Learning Rate": 2.8212995431516163e-05, "Pretrain/Loss": 2.0048179626464844, "Pretrain/Loss (Raw)": 2.678007125854492, "Pretrain/Step": 4532, "Pretrain/Step Time": 8.78578631952405} +{"Pretrain/Learning Rate": 2.820457578029746e-05, "Pretrain/Loss": 2.005941390991211, "Pretrain/Loss (Raw)": 2.0975496768951416, "Pretrain/Step": 4533, "Pretrain/Step Time": 8.787995640188456} +{"Pretrain/Learning Rate": 2.8196155759511977e-05, "Pretrain/Loss": 2.0072367191314697, "Pretrain/Loss (Raw)": 1.9434971809387207, "Pretrain/Step": 4534, "Pretrain/Step Time": 8.739765817299485} +{"Pretrain/Learning Rate": 2.8187735370130745e-05, "Pretrain/Loss": 2.0072035789489746, "Pretrain/Loss (Raw)": 2.0948004722595215, "Pretrain/Step": 4535, "Pretrain/Step Time": 8.739303909242153} +{"Pretrain/Learning Rate": 2.8179314613124858e-05, "Pretrain/Loss": 2.0021581649780273, "Pretrain/Loss (Raw)": 1.667991042137146, "Pretrain/Step": 4536, "Pretrain/Step Time": 8.73658418469131} +{"Pretrain/Learning Rate": 2.817089348946542e-05, "Pretrain/Loss": 2.002424716949463, "Pretrain/Loss (Raw)": 2.011368751525879, "Pretrain/Step": 4537, "Pretrain/Step Time": 8.738496899604797} +{"Pretrain/Learning Rate": 2.8162472000123613e-05, "Pretrain/Loss": 2.0046751499176025, "Pretrain/Loss (Raw)": 2.119598388671875, "Pretrain/Step": 4538, "Pretrain/Step Time": 8.738828646019101} +{"Pretrain/Learning Rate": 2.8154050146070627e-05, "Pretrain/Loss": 2.00374436378479, "Pretrain/Loss (Raw)": 1.9694825410842896, "Pretrain/Step": 4539, "Pretrain/Step Time": 8.732071178033948} +{"Pretrain/Learning Rate": 2.814562792827772e-05, "Pretrain/Loss": 2.0021274089813232, "Pretrain/Loss (Raw)": 1.8933391571044922, "Pretrain/Step": 4540, "Pretrain/Step Time": 8.730999514460564} +{"Pretrain/Learning Rate": 2.8137205347716165e-05, "Pretrain/Loss": 2.0008978843688965, "Pretrain/Loss (Raw)": 2.0822999477386475, "Pretrain/Step": 4541, "Pretrain/Step Time": 8.730079792439938} +{"Pretrain/Learning Rate": 2.8128782405357312e-05, "Pretrain/Loss": 2.001051664352417, "Pretrain/Loss (Raw)": 2.003594160079956, "Pretrain/Step": 4542, "Pretrain/Step Time": 8.728817829862237} +{"Pretrain/Learning Rate": 2.812035910217254e-05, "Pretrain/Loss": 2.002455234527588, "Pretrain/Loss (Raw)": 2.2324726581573486, "Pretrain/Step": 4543, "Pretrain/Step Time": 8.72655027359724} +{"Pretrain/Learning Rate": 2.811193543913324e-05, "Pretrain/Loss": 2.0020666122436523, "Pretrain/Loss (Raw)": 1.7792129516601562, "Pretrain/Step": 4544, "Pretrain/Step Time": 8.721128642559052} +{"Pretrain/Learning Rate": 2.8103511417210886e-05, "Pretrain/Loss": 2.0012168884277344, "Pretrain/Loss (Raw)": 1.9553124904632568, "Pretrain/Step": 4545, "Pretrain/Step Time": 8.723136935383081} +{"Pretrain/Learning Rate": 2.809508703737697e-05, "Pretrain/Loss": 2.0023584365844727, "Pretrain/Loss (Raw)": 2.089024305343628, "Pretrain/Step": 4546, "Pretrain/Step Time": 8.720368959009647} +{"Pretrain/Learning Rate": 2.808666230060304e-05, "Pretrain/Loss": 2.003012180328369, "Pretrain/Loss (Raw)": 1.9207631349563599, "Pretrain/Step": 4547, "Pretrain/Step Time": 8.721723798662424} +{"Pretrain/Learning Rate": 2.8078237207860658e-05, "Pretrain/Loss": 2.002997875213623, "Pretrain/Loss (Raw)": 2.0034358501434326, "Pretrain/Step": 4548, "Pretrain/Step Time": 8.723944813013077} +{"Pretrain/Learning Rate": 2.806981176012146e-05, "Pretrain/Loss": 2.000800848007202, "Pretrain/Loss (Raw)": 1.7359143495559692, "Pretrain/Step": 4549, "Pretrain/Step Time": 8.725220024585724} +{"Pretrain/Learning Rate": 2.80613859583571e-05, "Pretrain/Loss": 1.9984427690505981, "Pretrain/Loss (Raw)": 1.7755968570709229, "Pretrain/Step": 4550, "Pretrain/Step Time": 8.723297107964754} +{"Pretrain/Learning Rate": 2.8052959803539298e-05, "Pretrain/Loss": 2.0015859603881836, "Pretrain/Loss (Raw)": 2.472233295440674, "Pretrain/Step": 4551, "Pretrain/Step Time": 8.71845306828618} +{"Pretrain/Learning Rate": 2.8044533296639774e-05, "Pretrain/Loss": 2.001110315322876, "Pretrain/Loss (Raw)": 1.8316985368728638, "Pretrain/Step": 4552, "Pretrain/Step Time": 8.720347197726369} +{"Pretrain/Learning Rate": 2.8036106438630327e-05, "Pretrain/Loss": 2.0014522075653076, "Pretrain/Loss (Raw)": 2.0306663513183594, "Pretrain/Step": 4553, "Pretrain/Step Time": 8.717055330052972} +{"Pretrain/Learning Rate": 2.802767923048278e-05, "Pretrain/Loss": 2.0045723915100098, "Pretrain/Loss (Raw)": 2.3328182697296143, "Pretrain/Step": 4554, "Pretrain/Step Time": 8.716139297932386} +{"Pretrain/Learning Rate": 2.8019251673168993e-05, "Pretrain/Loss": 2.004518985748291, "Pretrain/Loss (Raw)": 1.9092673063278198, "Pretrain/Step": 4555, "Pretrain/Step Time": 8.713297927752137} +{"Pretrain/Learning Rate": 2.8010823767660887e-05, "Pretrain/Loss": 2.0049285888671875, "Pretrain/Loss (Raw)": 2.0282838344573975, "Pretrain/Step": 4556, "Pretrain/Step Time": 8.715369397774339} +{"Pretrain/Learning Rate": 2.8002395514930385e-05, "Pretrain/Loss": 2.0062241554260254, "Pretrain/Loss (Raw)": 1.983770728111267, "Pretrain/Step": 4557, "Pretrain/Step Time": 8.710527701303363} +{"Pretrain/Learning Rate": 2.7993966915949493e-05, "Pretrain/Loss": 2.00549054145813, "Pretrain/Loss (Raw)": 1.7962377071380615, "Pretrain/Step": 4558, "Pretrain/Step Time": 8.714686904102564} +{"Pretrain/Learning Rate": 2.7985537971690216e-05, "Pretrain/Loss": 2.007378101348877, "Pretrain/Loss (Raw)": 2.048903465270996, "Pretrain/Step": 4559, "Pretrain/Step Time": 8.71690410003066} +{"Pretrain/Learning Rate": 2.7977108683124647e-05, "Pretrain/Loss": 2.006871461868286, "Pretrain/Loss (Raw)": 1.9541289806365967, "Pretrain/Step": 4560, "Pretrain/Step Time": 8.72252393513918} +{"Pretrain/Learning Rate": 2.7968679051224868e-05, "Pretrain/Loss": 2.0053772926330566, "Pretrain/Loss (Raw)": 1.9422659873962402, "Pretrain/Step": 4561, "Pretrain/Step Time": 8.722856517881155} +{"Pretrain/Learning Rate": 2.796024907696303e-05, "Pretrain/Loss": 2.0030436515808105, "Pretrain/Loss (Raw)": 1.7836196422576904, "Pretrain/Step": 4562, "Pretrain/Step Time": 8.718279588967562} +{"Pretrain/Learning Rate": 2.795181876131132e-05, "Pretrain/Loss": 2.0044870376586914, "Pretrain/Loss (Raw)": 1.88401198387146, "Pretrain/Step": 4563, "Pretrain/Step Time": 8.71838315948844} +{"Pretrain/Learning Rate": 2.7943388105241968e-05, "Pretrain/Loss": 2.0073018074035645, "Pretrain/Loss (Raw)": 2.1295127868652344, "Pretrain/Step": 4564, "Pretrain/Step Time": 8.724559966474771} +{"Pretrain/Learning Rate": 2.793495710972722e-05, "Pretrain/Loss": 2.008233070373535, "Pretrain/Loss (Raw)": 1.9525741338729858, "Pretrain/Step": 4565, "Pretrain/Step Time": 8.721794117242098} +{"Pretrain/Learning Rate": 2.79265257757394e-05, "Pretrain/Loss": 2.007230281829834, "Pretrain/Loss (Raw)": 1.907106876373291, "Pretrain/Step": 4566, "Pretrain/Step Time": 8.724663043394685} +{"Pretrain/Learning Rate": 2.7918094104250826e-05, "Pretrain/Loss": 2.004758834838867, "Pretrain/Loss (Raw)": 1.7545474767684937, "Pretrain/Step": 4567, "Pretrain/Step Time": 8.717207945883274} +{"Pretrain/Learning Rate": 2.7909662096233897e-05, "Pretrain/Loss": 2.0003809928894043, "Pretrain/Loss (Raw)": 1.525020956993103, "Pretrain/Step": 4568, "Pretrain/Step Time": 8.71744742617011} +{"Pretrain/Learning Rate": 2.7901229752661018e-05, "Pretrain/Loss": 2.000915050506592, "Pretrain/Loss (Raw)": 2.187356948852539, "Pretrain/Step": 4569, "Pretrain/Step Time": 8.717523334547877} +{"Pretrain/Learning Rate": 2.7892797074504656e-05, "Pretrain/Loss": 2.0009994506835938, "Pretrain/Loss (Raw)": 2.240670680999756, "Pretrain/Step": 4570, "Pretrain/Step Time": 8.71436313726008} +{"Pretrain/Learning Rate": 2.78843640627373e-05, "Pretrain/Loss": 2.00118088722229, "Pretrain/Loss (Raw)": 1.9107340574264526, "Pretrain/Step": 4571, "Pretrain/Step Time": 8.71552950143814} +{"Pretrain/Learning Rate": 2.7875930718331496e-05, "Pretrain/Loss": 2.0007457733154297, "Pretrain/Loss (Raw)": 2.0918612480163574, "Pretrain/Step": 4572, "Pretrain/Step Time": 8.710654255002737} +{"Pretrain/Learning Rate": 2.786749704225981e-05, "Pretrain/Loss": 2.001096248626709, "Pretrain/Loss (Raw)": 1.6861834526062012, "Pretrain/Step": 4573, "Pretrain/Step Time": 8.706684658303857} +{"Pretrain/Learning Rate": 2.785906303549485e-05, "Pretrain/Loss": 2.0012784004211426, "Pretrain/Loss (Raw)": 2.039935827255249, "Pretrain/Step": 4574, "Pretrain/Step Time": 8.708224276080728} +{"Pretrain/Learning Rate": 2.7850628699009268e-05, "Pretrain/Loss": 2.004329204559326, "Pretrain/Loss (Raw)": 2.074896812438965, "Pretrain/Step": 4575, "Pretrain/Step Time": 8.705551590770483} +{"Pretrain/Learning Rate": 2.7842194033775747e-05, "Pretrain/Loss": 2.0029444694519043, "Pretrain/Loss (Raw)": 1.7647998332977295, "Pretrain/Step": 4576, "Pretrain/Step Time": 8.708610137924552} +{"Pretrain/Learning Rate": 2.7833759040767027e-05, "Pretrain/Loss": 2.002957344055176, "Pretrain/Loss (Raw)": 2.049164295196533, "Pretrain/Step": 4577, "Pretrain/Step Time": 8.706424590200186} +{"Pretrain/Learning Rate": 2.7825323720955853e-05, "Pretrain/Loss": 2.0009889602661133, "Pretrain/Loss (Raw)": 1.7251633405685425, "Pretrain/Step": 4578, "Pretrain/Step Time": 8.706124104559422} +{"Pretrain/Learning Rate": 2.781688807531504e-05, "Pretrain/Loss": 2.002284526824951, "Pretrain/Loss (Raw)": 1.9248849153518677, "Pretrain/Step": 4579, "Pretrain/Step Time": 8.706375770270824} +{"Pretrain/Learning Rate": 2.7808452104817412e-05, "Pretrain/Loss": 2.0010740756988525, "Pretrain/Loss (Raw)": 1.966812014579773, "Pretrain/Step": 4580, "Pretrain/Step Time": 8.707052433863282} +{"Pretrain/Learning Rate": 2.7800015810435865e-05, "Pretrain/Loss": 2.0010433197021484, "Pretrain/Loss (Raw)": 2.0521626472473145, "Pretrain/Step": 4581, "Pretrain/Step Time": 8.715413704514503} +{"Pretrain/Learning Rate": 2.779157919314329e-05, "Pretrain/Loss": 1.9983618259429932, "Pretrain/Loss (Raw)": 1.732856035232544, "Pretrain/Step": 4582, "Pretrain/Step Time": 8.711441524326801} +{"Pretrain/Learning Rate": 2.7783142253912647e-05, "Pretrain/Loss": 1.9992320537567139, "Pretrain/Loss (Raw)": 2.0536935329437256, "Pretrain/Step": 4583, "Pretrain/Step Time": 8.70978120341897} +{"Pretrain/Learning Rate": 2.7774704993716937e-05, "Pretrain/Loss": 1.998785138130188, "Pretrain/Loss (Raw)": 2.07218074798584, "Pretrain/Step": 4584, "Pretrain/Step Time": 8.715087292715907} +{"Pretrain/Learning Rate": 2.776626741352916e-05, "Pretrain/Loss": 2.0003442764282227, "Pretrain/Loss (Raw)": 2.0099029541015625, "Pretrain/Step": 4585, "Pretrain/Step Time": 8.710536478087306} +{"Pretrain/Learning Rate": 2.7757829514322397e-05, "Pretrain/Loss": 1.9965417385101318, "Pretrain/Loss (Raw)": 1.7246925830841064, "Pretrain/Step": 4586, "Pretrain/Step Time": 8.704802796244621} +{"Pretrain/Learning Rate": 2.774939129706974e-05, "Pretrain/Loss": 1.9958302974700928, "Pretrain/Loss (Raw)": 2.1055426597595215, "Pretrain/Step": 4587, "Pretrain/Step Time": 8.700542211532593} +{"Pretrain/Learning Rate": 2.7740952762744322e-05, "Pretrain/Loss": 1.9945878982543945, "Pretrain/Loss (Raw)": 1.7564706802368164, "Pretrain/Step": 4588, "Pretrain/Step Time": 8.703229872509837} +{"Pretrain/Learning Rate": 2.7732513912319314e-05, "Pretrain/Loss": 1.9927468299865723, "Pretrain/Loss (Raw)": 1.7989745140075684, "Pretrain/Step": 4589, "Pretrain/Step Time": 8.69704538397491} +{"Pretrain/Learning Rate": 2.7724074746767926e-05, "Pretrain/Loss": 1.9934409856796265, "Pretrain/Loss (Raw)": 2.129465341567993, "Pretrain/Step": 4590, "Pretrain/Step Time": 8.691685101017356} +{"Pretrain/Learning Rate": 2.77156352670634e-05, "Pretrain/Loss": 1.9927618503570557, "Pretrain/Loss (Raw)": 1.9209343194961548, "Pretrain/Step": 4591, "Pretrain/Step Time": 8.688797244802117} +{"Pretrain/Learning Rate": 2.770719547417902e-05, "Pretrain/Loss": 1.9919723272323608, "Pretrain/Loss (Raw)": 1.8891807794570923, "Pretrain/Step": 4592, "Pretrain/Step Time": 8.685977853834629} +{"Pretrain/Learning Rate": 2.76987553690881e-05, "Pretrain/Loss": 1.9919228553771973, "Pretrain/Loss (Raw)": 2.069230318069458, "Pretrain/Step": 4593, "Pretrain/Step Time": 8.685485294088721} +{"Pretrain/Learning Rate": 2.7690314952764e-05, "Pretrain/Loss": 1.9942376613616943, "Pretrain/Loss (Raw)": 2.0205676555633545, "Pretrain/Step": 4594, "Pretrain/Step Time": 8.68370526842773} +{"Pretrain/Learning Rate": 2.7681874226180093e-05, "Pretrain/Loss": 1.9940321445465088, "Pretrain/Loss (Raw)": 1.9735132455825806, "Pretrain/Step": 4595, "Pretrain/Step Time": 8.686029879376292} +{"Pretrain/Learning Rate": 2.7673433190309823e-05, "Pretrain/Loss": 1.9934886693954468, "Pretrain/Loss (Raw)": 2.0363645553588867, "Pretrain/Step": 4596, "Pretrain/Step Time": 8.685924146324396} +{"Pretrain/Learning Rate": 2.766499184612663e-05, "Pretrain/Loss": 1.993685007095337, "Pretrain/Loss (Raw)": 2.1472997665405273, "Pretrain/Step": 4597, "Pretrain/Step Time": 8.68880264647305} +{"Pretrain/Learning Rate": 2.7656550194604026e-05, "Pretrain/Loss": 1.9927104711532593, "Pretrain/Loss (Raw)": 1.9434176683425903, "Pretrain/Step": 4598, "Pretrain/Step Time": 8.683575680479407} +{"Pretrain/Learning Rate": 2.7648108236715536e-05, "Pretrain/Loss": 1.990785837173462, "Pretrain/Loss (Raw)": 1.5108916759490967, "Pretrain/Step": 4599, "Pretrain/Step Time": 8.682403126731515} +{"Pretrain/Learning Rate": 2.7639665973434725e-05, "Pretrain/Loss": 1.988692283630371, "Pretrain/Loss (Raw)": 1.7691521644592285, "Pretrain/Step": 4600, "Pretrain/Step Time": 8.69063000753522} +{"Pretrain/Learning Rate": 2.7631223405735196e-05, "Pretrain/Loss": 1.9889789819717407, "Pretrain/Loss (Raw)": 1.994388461112976, "Pretrain/Step": 4601, "Pretrain/Step Time": 8.690345373004675} +{"Pretrain/Learning Rate": 2.7622780534590582e-05, "Pretrain/Loss": 1.9910047054290771, "Pretrain/Loss (Raw)": 2.089694023132324, "Pretrain/Step": 4602, "Pretrain/Step Time": 8.688556589186192} +{"Pretrain/Learning Rate": 2.7614337360974558e-05, "Pretrain/Loss": 1.9901902675628662, "Pretrain/Loss (Raw)": 1.9896076917648315, "Pretrain/Step": 4603, "Pretrain/Step Time": 8.690839394927025} +{"Pretrain/Learning Rate": 2.760589388586083e-05, "Pretrain/Loss": 1.9909911155700684, "Pretrain/Loss (Raw)": 2.049717664718628, "Pretrain/Step": 4604, "Pretrain/Step Time": 8.686659697443247} +{"Pretrain/Learning Rate": 2.7597450110223145e-05, "Pretrain/Loss": 1.99021315574646, "Pretrain/Loss (Raw)": 1.895807147026062, "Pretrain/Step": 4605, "Pretrain/Step Time": 8.684231955558062} +{"Pretrain/Learning Rate": 2.7589006035035264e-05, "Pretrain/Loss": 1.9908101558685303, "Pretrain/Loss (Raw)": 2.2405498027801514, "Pretrain/Step": 4606, "Pretrain/Step Time": 8.685104122385383} +{"Pretrain/Learning Rate": 2.7580561661271014e-05, "Pretrain/Loss": 1.989168405532837, "Pretrain/Loss (Raw)": 1.8352831602096558, "Pretrain/Step": 4607, "Pretrain/Step Time": 8.683100687339902} +{"Pretrain/Learning Rate": 2.7572116989904228e-05, "Pretrain/Loss": 1.9900643825531006, "Pretrain/Loss (Raw)": 2.0833611488342285, "Pretrain/Step": 4608, "Pretrain/Step Time": 8.681145390495658} +{"Pretrain/Learning Rate": 2.7563672021908797e-05, "Pretrain/Loss": 1.9901065826416016, "Pretrain/Loss (Raw)": 2.1082499027252197, "Pretrain/Step": 4609, "Pretrain/Step Time": 8.679278120398521} +{"Pretrain/Learning Rate": 2.7555226758258624e-05, "Pretrain/Loss": 1.9895159006118774, "Pretrain/Loss (Raw)": 2.0351312160491943, "Pretrain/Step": 4610, "Pretrain/Step Time": 8.678866609930992} +{"Pretrain/Learning Rate": 2.7546781199927667e-05, "Pretrain/Loss": 1.9892828464508057, "Pretrain/Loss (Raw)": 1.9780552387237549, "Pretrain/Step": 4611, "Pretrain/Step Time": 8.686399975791574} +{"Pretrain/Learning Rate": 2.7538335347889892e-05, "Pretrain/Loss": 1.989556074142456, "Pretrain/Loss (Raw)": 2.1476807594299316, "Pretrain/Step": 4612, "Pretrain/Step Time": 8.67833069525659} +{"Pretrain/Learning Rate": 2.752988920311933e-05, "Pretrain/Loss": 1.9921460151672363, "Pretrain/Loss (Raw)": 2.2636148929595947, "Pretrain/Step": 4613, "Pretrain/Step Time": 8.681985802948475} +{"Pretrain/Learning Rate": 2.7521442766590027e-05, "Pretrain/Loss": 1.9911837577819824, "Pretrain/Loss (Raw)": 2.0181117057800293, "Pretrain/Step": 4614, "Pretrain/Step Time": 8.674922697246075} +{"Pretrain/Learning Rate": 2.7512996039276055e-05, "Pretrain/Loss": 1.9927034378051758, "Pretrain/Loss (Raw)": 2.2247354984283447, "Pretrain/Step": 4615, "Pretrain/Step Time": 8.680019037798047} +{"Pretrain/Learning Rate": 2.7504549022151543e-05, "Pretrain/Loss": 1.9914069175720215, "Pretrain/Loss (Raw)": 2.030857563018799, "Pretrain/Step": 4616, "Pretrain/Step Time": 8.677552854642272} +{"Pretrain/Learning Rate": 2.749610171619063e-05, "Pretrain/Loss": 1.9956101179122925, "Pretrain/Loss (Raw)": 2.3258461952209473, "Pretrain/Step": 4617, "Pretrain/Step Time": 8.682814495638013} +{"Pretrain/Learning Rate": 2.748765412236751e-05, "Pretrain/Loss": 1.9933754205703735, "Pretrain/Loss (Raw)": 1.8513903617858887, "Pretrain/Step": 4618, "Pretrain/Step Time": 8.68041224218905} +{"Pretrain/Learning Rate": 2.747920624165639e-05, "Pretrain/Loss": 1.992305040359497, "Pretrain/Loss (Raw)": 1.9276992082595825, "Pretrain/Step": 4619, "Pretrain/Step Time": 8.681630896404386} +{"Pretrain/Learning Rate": 2.7470758075031533e-05, "Pretrain/Loss": 1.9913102388381958, "Pretrain/Loss (Raw)": 1.897806167602539, "Pretrain/Step": 4620, "Pretrain/Step Time": 8.680199012160301} +{"Pretrain/Learning Rate": 2.7462309623467204e-05, "Pretrain/Loss": 1.9904589653015137, "Pretrain/Loss (Raw)": 2.007962226867676, "Pretrain/Step": 4621, "Pretrain/Step Time": 8.690524071455002} +{"Pretrain/Learning Rate": 2.7453860887937732e-05, "Pretrain/Loss": 1.9905259609222412, "Pretrain/Loss (Raw)": 1.8906359672546387, "Pretrain/Step": 4622, "Pretrain/Step Time": 8.687335267663002} +{"Pretrain/Learning Rate": 2.7445411869417453e-05, "Pretrain/Loss": 1.9896886348724365, "Pretrain/Loss (Raw)": 1.8611034154891968, "Pretrain/Step": 4623, "Pretrain/Step Time": 8.689485363662243} +{"Pretrain/Learning Rate": 2.7436962568880752e-05, "Pretrain/Loss": 1.9890832901000977, "Pretrain/Loss (Raw)": 1.6215815544128418, "Pretrain/Step": 4624, "Pretrain/Step Time": 8.689532367512584} +{"Pretrain/Learning Rate": 2.7428512987302053e-05, "Pretrain/Loss": 1.9883309602737427, "Pretrain/Loss (Raw)": 2.0956692695617676, "Pretrain/Step": 4625, "Pretrain/Step Time": 8.693115064874291} +{"Pretrain/Learning Rate": 2.7420063125655787e-05, "Pretrain/Loss": 1.9894822835922241, "Pretrain/Loss (Raw)": 1.985864281654358, "Pretrain/Step": 4626, "Pretrain/Step Time": 8.68496529571712} +{"Pretrain/Learning Rate": 2.741161298491644e-05, "Pretrain/Loss": 1.988849401473999, "Pretrain/Loss (Raw)": 1.8694703578948975, "Pretrain/Step": 4627, "Pretrain/Step Time": 8.690566623583436} +{"Pretrain/Learning Rate": 2.7403162566058517e-05, "Pretrain/Loss": 1.989801049232483, "Pretrain/Loss (Raw)": 2.2727553844451904, "Pretrain/Step": 4628, "Pretrain/Step Time": 8.691991550847888} +{"Pretrain/Learning Rate": 2.7394711870056567e-05, "Pretrain/Loss": 1.990994930267334, "Pretrain/Loss (Raw)": 2.114975690841675, "Pretrain/Step": 4629, "Pretrain/Step Time": 8.690479155629873} +{"Pretrain/Learning Rate": 2.7386260897885156e-05, "Pretrain/Loss": 1.9887545108795166, "Pretrain/Loss (Raw)": 1.9492536783218384, "Pretrain/Step": 4630, "Pretrain/Step Time": 8.687101965770125} +{"Pretrain/Learning Rate": 2.73778096505189e-05, "Pretrain/Loss": 1.9883644580841064, "Pretrain/Loss (Raw)": 1.9157068729400635, "Pretrain/Step": 4631, "Pretrain/Step Time": 8.690844867378473} +{"Pretrain/Learning Rate": 2.7369358128932422e-05, "Pretrain/Loss": 1.9895119667053223, "Pretrain/Loss (Raw)": 2.223335027694702, "Pretrain/Step": 4632, "Pretrain/Step Time": 8.691780053079128} +{"Pretrain/Learning Rate": 2.7360906334100407e-05, "Pretrain/Loss": 1.9907552003860474, "Pretrain/Loss (Raw)": 1.862571358680725, "Pretrain/Step": 4633, "Pretrain/Step Time": 8.687424225732684} +{"Pretrain/Learning Rate": 2.7352454266997545e-05, "Pretrain/Loss": 1.991256594657898, "Pretrain/Loss (Raw)": 2.1934330463409424, "Pretrain/Step": 4634, "Pretrain/Step Time": 8.689953839406371} +{"Pretrain/Learning Rate": 2.734400192859857e-05, "Pretrain/Loss": 1.9907306432724, "Pretrain/Loss (Raw)": 1.9323009252548218, "Pretrain/Step": 4635, "Pretrain/Step Time": 8.679188687354326} +{"Pretrain/Learning Rate": 2.7335549319878252e-05, "Pretrain/Loss": 1.991348147392273, "Pretrain/Loss (Raw)": 2.1389646530151367, "Pretrain/Step": 4636, "Pretrain/Step Time": 8.688985148444772} +{"Pretrain/Learning Rate": 2.7327096441811383e-05, "Pretrain/Loss": 1.9925884008407593, "Pretrain/Loss (Raw)": 2.124962568283081, "Pretrain/Step": 4637, "Pretrain/Step Time": 8.690907191485167} +{"Pretrain/Learning Rate": 2.7318643295372776e-05, "Pretrain/Loss": 1.9916987419128418, "Pretrain/Loss (Raw)": 2.057255268096924, "Pretrain/Step": 4638, "Pretrain/Step Time": 8.683880330994725} +{"Pretrain/Learning Rate": 2.7310189881537307e-05, "Pretrain/Loss": 1.9941034317016602, "Pretrain/Loss (Raw)": 2.0451900959014893, "Pretrain/Step": 4639, "Pretrain/Step Time": 8.683769706636667} +{"Pretrain/Learning Rate": 2.7301736201279858e-05, "Pretrain/Loss": 1.994856834411621, "Pretrain/Loss (Raw)": 2.1028969287872314, "Pretrain/Step": 4640, "Pretrain/Step Time": 8.683549355715513} +{"Pretrain/Learning Rate": 2.7293282255575335e-05, "Pretrain/Loss": 1.994243860244751, "Pretrain/Loss (Raw)": 2.0954980850219727, "Pretrain/Step": 4641, "Pretrain/Step Time": 8.680892603471875} +{"Pretrain/Learning Rate": 2.7284828045398703e-05, "Pretrain/Loss": 1.9940048456192017, "Pretrain/Loss (Raw)": 1.969565510749817, "Pretrain/Step": 4642, "Pretrain/Step Time": 8.674215303733945} +{"Pretrain/Learning Rate": 2.7276373571724927e-05, "Pretrain/Loss": 1.9967052936553955, "Pretrain/Loss (Raw)": 2.099076509475708, "Pretrain/Step": 4643, "Pretrain/Step Time": 8.678453039377928} +{"Pretrain/Learning Rate": 2.7267918835529033e-05, "Pretrain/Loss": 1.9929499626159668, "Pretrain/Loss (Raw)": 1.6297402381896973, "Pretrain/Step": 4644, "Pretrain/Step Time": 8.68432211689651} +{"Pretrain/Learning Rate": 2.725946383778605e-05, "Pretrain/Loss": 1.9942620992660522, "Pretrain/Loss (Raw)": 1.951862096786499, "Pretrain/Step": 4645, "Pretrain/Step Time": 8.683600073680282} +{"Pretrain/Learning Rate": 2.7251008579471044e-05, "Pretrain/Loss": 1.9958441257476807, "Pretrain/Loss (Raw)": 2.1731834411621094, "Pretrain/Step": 4646, "Pretrain/Step Time": 8.683653915300965} +{"Pretrain/Learning Rate": 2.7242553061559123e-05, "Pretrain/Loss": 1.9959779977798462, "Pretrain/Loss (Raw)": 2.0622265338897705, "Pretrain/Step": 4647, "Pretrain/Step Time": 8.675809722393751} +{"Pretrain/Learning Rate": 2.7234097285025424e-05, "Pretrain/Loss": 1.9950897693634033, "Pretrain/Loss (Raw)": 1.9612929821014404, "Pretrain/Step": 4648, "Pretrain/Step Time": 8.681232154369354} +{"Pretrain/Learning Rate": 2.7225641250845085e-05, "Pretrain/Loss": 1.9911911487579346, "Pretrain/Loss (Raw)": 1.6460297107696533, "Pretrain/Step": 4649, "Pretrain/Step Time": 8.676969153806567} +{"Pretrain/Learning Rate": 2.7217184959993326e-05, "Pretrain/Loss": 1.9948683977127075, "Pretrain/Loss (Raw)": 2.2241806983947754, "Pretrain/Step": 4650, "Pretrain/Step Time": 8.672271756455302} +{"Pretrain/Learning Rate": 2.7208728413445332e-05, "Pretrain/Loss": 1.996577501296997, "Pretrain/Loss (Raw)": 2.0440165996551514, "Pretrain/Step": 4651, "Pretrain/Step Time": 8.672879330813885} +{"Pretrain/Learning Rate": 2.720027161217638e-05, "Pretrain/Loss": 1.9965251684188843, "Pretrain/Loss (Raw)": 1.968748927116394, "Pretrain/Step": 4652, "Pretrain/Step Time": 8.674975825473666} +{"Pretrain/Learning Rate": 2.7191814557161736e-05, "Pretrain/Loss": 1.9966180324554443, "Pretrain/Loss (Raw)": 2.102841377258301, "Pretrain/Step": 4653, "Pretrain/Step Time": 8.678339457139373} +{"Pretrain/Learning Rate": 2.7183357249376712e-05, "Pretrain/Loss": 1.9979066848754883, "Pretrain/Loss (Raw)": 2.281343698501587, "Pretrain/Step": 4654, "Pretrain/Step Time": 8.680136118084192} +{"Pretrain/Learning Rate": 2.7174899689796636e-05, "Pretrain/Loss": 1.9965283870697021, "Pretrain/Loss (Raw)": 1.9284735918045044, "Pretrain/Step": 4655, "Pretrain/Step Time": 8.68104549869895} +{"Pretrain/Learning Rate": 2.7166441879396887e-05, "Pretrain/Loss": 1.996960997581482, "Pretrain/Loss (Raw)": 2.1601531505584717, "Pretrain/Step": 4656, "Pretrain/Step Time": 8.68127029389143} +{"Pretrain/Learning Rate": 2.7157983819152848e-05, "Pretrain/Loss": 1.9956098794937134, "Pretrain/Loss (Raw)": 2.058741569519043, "Pretrain/Step": 4657, "Pretrain/Step Time": 8.692152881994843} +{"Pretrain/Learning Rate": 2.714952551003994e-05, "Pretrain/Loss": 1.9921153783798218, "Pretrain/Loss (Raw)": 1.7455846071243286, "Pretrain/Step": 4658, "Pretrain/Step Time": 8.682203594595194} +{"Pretrain/Learning Rate": 2.714106695303363e-05, "Pretrain/Loss": 1.9932656288146973, "Pretrain/Loss (Raw)": 2.0830821990966797, "Pretrain/Step": 4659, "Pretrain/Step Time": 8.68873325549066} +{"Pretrain/Learning Rate": 2.7132608149109383e-05, "Pretrain/Loss": 1.988990306854248, "Pretrain/Loss (Raw)": 2.130756139755249, "Pretrain/Step": 4660, "Pretrain/Step Time": 8.688876425847411} +{"Pretrain/Learning Rate": 2.7124149099242724e-05, "Pretrain/Loss": 1.9868710041046143, "Pretrain/Loss (Raw)": 1.8262851238250732, "Pretrain/Step": 4661, "Pretrain/Step Time": 8.686716819182038} +{"Pretrain/Learning Rate": 2.7115689804409174e-05, "Pretrain/Loss": 1.9862442016601562, "Pretrain/Loss (Raw)": 1.863279104232788, "Pretrain/Step": 4662, "Pretrain/Step Time": 8.68744022399187} +{"Pretrain/Learning Rate": 2.710723026558431e-05, "Pretrain/Loss": 1.9863853454589844, "Pretrain/Loss (Raw)": 2.1128387451171875, "Pretrain/Step": 4663, "Pretrain/Step Time": 8.692340150475502} +{"Pretrain/Learning Rate": 2.709877048374371e-05, "Pretrain/Loss": 1.9896159172058105, "Pretrain/Loss (Raw)": 2.0815281867980957, "Pretrain/Step": 4664, "Pretrain/Step Time": 8.695685379207134} +{"Pretrain/Learning Rate": 2.709031045986302e-05, "Pretrain/Loss": 1.9884448051452637, "Pretrain/Loss (Raw)": 1.8614563941955566, "Pretrain/Step": 4665, "Pretrain/Step Time": 8.699713306501508} +{"Pretrain/Learning Rate": 2.708185019491788e-05, "Pretrain/Loss": 1.9854865074157715, "Pretrain/Loss (Raw)": 1.740942120552063, "Pretrain/Step": 4666, "Pretrain/Step Time": 8.70158375799656} +{"Pretrain/Learning Rate": 2.707338968988396e-05, "Pretrain/Loss": 1.987098217010498, "Pretrain/Loss (Raw)": 2.1757845878601074, "Pretrain/Step": 4667, "Pretrain/Step Time": 8.699889255687594} +{"Pretrain/Learning Rate": 2.7064928945736974e-05, "Pretrain/Loss": 1.9866881370544434, "Pretrain/Loss (Raw)": 1.84083092212677, "Pretrain/Step": 4668, "Pretrain/Step Time": 8.705279856920242} +{"Pretrain/Learning Rate": 2.7056467963452646e-05, "Pretrain/Loss": 1.986633539199829, "Pretrain/Loss (Raw)": 2.075319766998291, "Pretrain/Step": 4669, "Pretrain/Step Time": 8.706226678565145} +{"Pretrain/Learning Rate": 2.704800674400675e-05, "Pretrain/Loss": 1.986494779586792, "Pretrain/Loss (Raw)": 1.9858405590057373, "Pretrain/Step": 4670, "Pretrain/Step Time": 8.708191119134426} +{"Pretrain/Learning Rate": 2.703954528837506e-05, "Pretrain/Loss": 1.985170602798462, "Pretrain/Loss (Raw)": 2.062976121902466, "Pretrain/Step": 4671, "Pretrain/Step Time": 8.706732247024775} +{"Pretrain/Learning Rate": 2.7031083597533402e-05, "Pretrain/Loss": 1.9856290817260742, "Pretrain/Loss (Raw)": 1.8378889560699463, "Pretrain/Step": 4672, "Pretrain/Step Time": 8.707123661413789} +{"Pretrain/Learning Rate": 2.702262167245761e-05, "Pretrain/Loss": 1.9861335754394531, "Pretrain/Loss (Raw)": 2.0198957920074463, "Pretrain/Step": 4673, "Pretrain/Step Time": 8.707054603844881} +{"Pretrain/Learning Rate": 2.7014159514123555e-05, "Pretrain/Loss": 1.986544132232666, "Pretrain/Loss (Raw)": 2.1415765285491943, "Pretrain/Step": 4674, "Pretrain/Step Time": 8.711056664586067} +{"Pretrain/Learning Rate": 2.7005697123507134e-05, "Pretrain/Loss": 1.987112045288086, "Pretrain/Loss (Raw)": 1.9934375286102295, "Pretrain/Step": 4675, "Pretrain/Step Time": 8.71869252808392} +{"Pretrain/Learning Rate": 2.6997234501584267e-05, "Pretrain/Loss": 1.9861321449279785, "Pretrain/Loss (Raw)": 1.878018856048584, "Pretrain/Step": 4676, "Pretrain/Step Time": 8.719710370525718} +{"Pretrain/Learning Rate": 2.6988771649330906e-05, "Pretrain/Loss": 1.9895570278167725, "Pretrain/Loss (Raw)": 2.174311637878418, "Pretrain/Step": 4677, "Pretrain/Step Time": 8.724236542358994} +{"Pretrain/Learning Rate": 2.6980308567723035e-05, "Pretrain/Loss": 1.9922630786895752, "Pretrain/Loss (Raw)": 2.1219568252563477, "Pretrain/Step": 4678, "Pretrain/Step Time": 8.726685320958495} +{"Pretrain/Learning Rate": 2.697184525773664e-05, "Pretrain/Loss": 1.9875504970550537, "Pretrain/Loss (Raw)": 1.8690142631530762, "Pretrain/Step": 4679, "Pretrain/Step Time": 8.727665666490793} +{"Pretrain/Learning Rate": 2.6963381720347764e-05, "Pretrain/Loss": 1.990392804145813, "Pretrain/Loss (Raw)": 2.1955223083496094, "Pretrain/Step": 4680, "Pretrain/Step Time": 8.734352871775627} +{"Pretrain/Learning Rate": 2.6954917956532455e-05, "Pretrain/Loss": 1.9898933172225952, "Pretrain/Loss (Raw)": 1.9667384624481201, "Pretrain/Step": 4681, "Pretrain/Step Time": 8.732313644140959} +{"Pretrain/Learning Rate": 2.6946453967266792e-05, "Pretrain/Loss": 1.985866904258728, "Pretrain/Loss (Raw)": 1.8174432516098022, "Pretrain/Step": 4682, "Pretrain/Step Time": 8.740438513457775} +{"Pretrain/Learning Rate": 2.693798975352689e-05, "Pretrain/Loss": 1.9856317043304443, "Pretrain/Loss (Raw)": 1.8791673183441162, "Pretrain/Step": 4683, "Pretrain/Step Time": 8.73864153958857} +{"Pretrain/Learning Rate": 2.6929525316288874e-05, "Pretrain/Loss": 1.9848480224609375, "Pretrain/Loss (Raw)": 1.9279545545578003, "Pretrain/Step": 4684, "Pretrain/Step Time": 8.737089790403843} +{"Pretrain/Learning Rate": 2.692106065652891e-05, "Pretrain/Loss": 1.9845025539398193, "Pretrain/Loss (Raw)": 1.9395594596862793, "Pretrain/Step": 4685, "Pretrain/Step Time": 8.737560000270605} +{"Pretrain/Learning Rate": 2.6912595775223175e-05, "Pretrain/Loss": 1.9841855764389038, "Pretrain/Loss (Raw)": 1.7556610107421875, "Pretrain/Step": 4686, "Pretrain/Step Time": 8.739798542112112} +{"Pretrain/Learning Rate": 2.6904130673347887e-05, "Pretrain/Loss": 1.9851229190826416, "Pretrain/Loss (Raw)": 2.168888568878174, "Pretrain/Step": 4687, "Pretrain/Step Time": 8.737133910879493} +{"Pretrain/Learning Rate": 2.6895665351879274e-05, "Pretrain/Loss": 1.9862279891967773, "Pretrain/Loss (Raw)": 2.0955779552459717, "Pretrain/Step": 4688, "Pretrain/Step Time": 8.730500357225537} +{"Pretrain/Learning Rate": 2.68871998117936e-05, "Pretrain/Loss": 1.9826626777648926, "Pretrain/Loss (Raw)": 1.4858976602554321, "Pretrain/Step": 4689, "Pretrain/Step Time": 8.73683275282383} +{"Pretrain/Learning Rate": 2.687873405406715e-05, "Pretrain/Loss": 1.984682559967041, "Pretrain/Loss (Raw)": 2.04217267036438, "Pretrain/Step": 4690, "Pretrain/Step Time": 8.737571265548468} +{"Pretrain/Learning Rate": 2.6870268079676237e-05, "Pretrain/Loss": 1.9841561317443848, "Pretrain/Loss (Raw)": 1.8166202306747437, "Pretrain/Step": 4691, "Pretrain/Step Time": 8.746301779523492} +{"Pretrain/Learning Rate": 2.6861801889597193e-05, "Pretrain/Loss": 1.9825994968414307, "Pretrain/Loss (Raw)": 1.9302566051483154, "Pretrain/Step": 4692, "Pretrain/Step Time": 8.741745088249445} +{"Pretrain/Learning Rate": 2.685333548480639e-05, "Pretrain/Loss": 1.9828333854675293, "Pretrain/Loss (Raw)": 1.982525110244751, "Pretrain/Step": 4693, "Pretrain/Step Time": 8.742378434166312} +{"Pretrain/Learning Rate": 2.68448688662802e-05, "Pretrain/Loss": 1.9841392040252686, "Pretrain/Loss (Raw)": 2.0742502212524414, "Pretrain/Step": 4694, "Pretrain/Step Time": 8.74152971059084} +{"Pretrain/Learning Rate": 2.683640203499504e-05, "Pretrain/Loss": 1.9861711263656616, "Pretrain/Loss (Raw)": 2.0146284103393555, "Pretrain/Step": 4695, "Pretrain/Step Time": 8.745577795431018} +{"Pretrain/Learning Rate": 2.682793499192734e-05, "Pretrain/Loss": 1.9893684387207031, "Pretrain/Loss (Raw)": 1.9342870712280273, "Pretrain/Step": 4696, "Pretrain/Step Time": 8.73961610160768} +{"Pretrain/Learning Rate": 2.6819467738053572e-05, "Pretrain/Loss": 1.9880279302597046, "Pretrain/Loss (Raw)": 2.0157642364501953, "Pretrain/Step": 4697, "Pretrain/Step Time": 8.746593348681927} +{"Pretrain/Learning Rate": 2.6811000274350205e-05, "Pretrain/Loss": 1.9872956275939941, "Pretrain/Loss (Raw)": 2.1469485759735107, "Pretrain/Step": 4698, "Pretrain/Step Time": 8.752631338313222} +{"Pretrain/Learning Rate": 2.680253260179375e-05, "Pretrain/Loss": 1.9863805770874023, "Pretrain/Loss (Raw)": 1.793592929840088, "Pretrain/Step": 4699, "Pretrain/Step Time": 8.754738485440612} +{"Pretrain/Learning Rate": 2.6794064721360752e-05, "Pretrain/Loss": 1.9839186668395996, "Pretrain/Loss (Raw)": 1.776739478111267, "Pretrain/Step": 4700, "Pretrain/Step Time": 8.754065163433552} +{"Pretrain/Learning Rate": 2.6785596634027745e-05, "Pretrain/Loss": 1.982871413230896, "Pretrain/Loss (Raw)": 1.5521353483200073, "Pretrain/Step": 4701, "Pretrain/Step Time": 8.756085069850087} +{"Pretrain/Learning Rate": 2.677712834077133e-05, "Pretrain/Loss": 1.9807374477386475, "Pretrain/Loss (Raw)": 1.7667908668518066, "Pretrain/Step": 4702, "Pretrain/Step Time": 8.755833726376295} +{"Pretrain/Learning Rate": 2.676865984256809e-05, "Pretrain/Loss": 1.9785888195037842, "Pretrain/Loss (Raw)": 1.7998719215393066, "Pretrain/Step": 4703, "Pretrain/Step Time": 8.759359765797853} +{"Pretrain/Learning Rate": 2.6760191140394668e-05, "Pretrain/Loss": 1.9807977676391602, "Pretrain/Loss (Raw)": 2.0475406646728516, "Pretrain/Step": 4704, "Pretrain/Step Time": 8.75816049054265} +{"Pretrain/Learning Rate": 2.675172223522771e-05, "Pretrain/Loss": 1.9799096584320068, "Pretrain/Loss (Raw)": 1.9354788064956665, "Pretrain/Step": 4705, "Pretrain/Step Time": 8.757794613018632} +{"Pretrain/Learning Rate": 2.6743253128043887e-05, "Pretrain/Loss": 1.9823004007339478, "Pretrain/Loss (Raw)": 2.0311896800994873, "Pretrain/Step": 4706, "Pretrain/Step Time": 8.758961541578174} +{"Pretrain/Learning Rate": 2.6734783819819903e-05, "Pretrain/Loss": 1.982170581817627, "Pretrain/Loss (Raw)": 1.9082735776901245, "Pretrain/Step": 4707, "Pretrain/Step Time": 8.760245058685541} +{"Pretrain/Learning Rate": 2.6726314311532467e-05, "Pretrain/Loss": 1.9810290336608887, "Pretrain/Loss (Raw)": 1.8206937313079834, "Pretrain/Step": 4708, "Pretrain/Step Time": 8.759159702807665} +{"Pretrain/Learning Rate": 2.671784460415834e-05, "Pretrain/Loss": 1.9803667068481445, "Pretrain/Loss (Raw)": 1.9673840999603271, "Pretrain/Step": 4709, "Pretrain/Step Time": 8.751362236216664} +{"Pretrain/Learning Rate": 2.6709374698674267e-05, "Pretrain/Loss": 1.9826042652130127, "Pretrain/Loss (Raw)": 2.019245147705078, "Pretrain/Step": 4710, "Pretrain/Step Time": 8.752697803080082} +{"Pretrain/Learning Rate": 2.670090459605706e-05, "Pretrain/Loss": 1.981931447982788, "Pretrain/Loss (Raw)": 1.9675849676132202, "Pretrain/Step": 4711, "Pretrain/Step Time": 8.753872921690345} +{"Pretrain/Learning Rate": 2.6692434297283514e-05, "Pretrain/Loss": 1.9802899360656738, "Pretrain/Loss (Raw)": 1.8620808124542236, "Pretrain/Step": 4712, "Pretrain/Step Time": 8.748121444135904} +{"Pretrain/Learning Rate": 2.6683963803330468e-05, "Pretrain/Loss": 1.9813382625579834, "Pretrain/Loss (Raw)": 2.1440694332122803, "Pretrain/Step": 4713, "Pretrain/Step Time": 8.748272636905313} +{"Pretrain/Learning Rate": 2.6675493115174786e-05, "Pretrain/Loss": 1.982985258102417, "Pretrain/Loss (Raw)": 1.9355131387710571, "Pretrain/Step": 4714, "Pretrain/Step Time": 8.752662267535925} +{"Pretrain/Learning Rate": 2.6667022233793342e-05, "Pretrain/Loss": 1.981238842010498, "Pretrain/Loss (Raw)": 1.8820170164108276, "Pretrain/Step": 4715, "Pretrain/Step Time": 8.749978495761752} +{"Pretrain/Learning Rate": 2.6658551160163036e-05, "Pretrain/Loss": 1.983227014541626, "Pretrain/Loss (Raw)": 2.010944366455078, "Pretrain/Step": 4716, "Pretrain/Step Time": 8.74956115707755} +{"Pretrain/Learning Rate": 2.6650079895260798e-05, "Pretrain/Loss": 1.9843153953552246, "Pretrain/Loss (Raw)": 1.9382884502410889, "Pretrain/Step": 4717, "Pretrain/Step Time": 8.75052378512919} +{"Pretrain/Learning Rate": 2.664160844006357e-05, "Pretrain/Loss": 1.983071208000183, "Pretrain/Loss (Raw)": 1.970198154449463, "Pretrain/Step": 4718, "Pretrain/Step Time": 8.748478062450886} +{"Pretrain/Learning Rate": 2.6633136795548326e-05, "Pretrain/Loss": 1.9840400218963623, "Pretrain/Loss (Raw)": 2.04494309425354, "Pretrain/Step": 4719, "Pretrain/Step Time": 8.74986849911511} +{"Pretrain/Learning Rate": 2.662466496269204e-05, "Pretrain/Loss": 1.9847609996795654, "Pretrain/Loss (Raw)": 1.9814786911010742, "Pretrain/Step": 4720, "Pretrain/Step Time": 8.754432875663042} +{"Pretrain/Learning Rate": 2.661619294247174e-05, "Pretrain/Loss": 1.9842774868011475, "Pretrain/Loss (Raw)": 2.0073318481445312, "Pretrain/Step": 4721, "Pretrain/Step Time": 8.75855872221291} +{"Pretrain/Learning Rate": 2.6607720735864454e-05, "Pretrain/Loss": 1.985637903213501, "Pretrain/Loss (Raw)": 2.194709539413452, "Pretrain/Step": 4722, "Pretrain/Step Time": 8.75812179595232} +{"Pretrain/Learning Rate": 2.6599248343847244e-05, "Pretrain/Loss": 1.9856691360473633, "Pretrain/Loss (Raw)": 1.9775104522705078, "Pretrain/Step": 4723, "Pretrain/Step Time": 8.757216058671474} +{"Pretrain/Learning Rate": 2.6590775767397174e-05, "Pretrain/Loss": 1.9837515354156494, "Pretrain/Loss (Raw)": 1.7909246683120728, "Pretrain/Step": 4724, "Pretrain/Step Time": 8.760837342590094} +{"Pretrain/Learning Rate": 2.6582303007491345e-05, "Pretrain/Loss": 1.9821467399597168, "Pretrain/Loss (Raw)": 1.941873550415039, "Pretrain/Step": 4725, "Pretrain/Step Time": 8.76154357008636} +{"Pretrain/Learning Rate": 2.6573830065106874e-05, "Pretrain/Loss": 1.9826524257659912, "Pretrain/Loss (Raw)": 2.008133888244629, "Pretrain/Step": 4726, "Pretrain/Step Time": 8.764777556061745} +{"Pretrain/Learning Rate": 2.6565356941220908e-05, "Pretrain/Loss": 1.9864780902862549, "Pretrain/Loss (Raw)": 2.0005786418914795, "Pretrain/Step": 4727, "Pretrain/Step Time": 8.76649503223598} +{"Pretrain/Learning Rate": 2.6556883636810605e-05, "Pretrain/Loss": 1.9874906539916992, "Pretrain/Loss (Raw)": 1.8987594842910767, "Pretrain/Step": 4728, "Pretrain/Step Time": 8.759862147271633} +{"Pretrain/Learning Rate": 2.6548410152853142e-05, "Pretrain/Loss": 1.9879379272460938, "Pretrain/Loss (Raw)": 2.0516347885131836, "Pretrain/Step": 4729, "Pretrain/Step Time": 8.76042084209621} +{"Pretrain/Learning Rate": 2.6539936490325725e-05, "Pretrain/Loss": 1.9854483604431152, "Pretrain/Loss (Raw)": 1.7710334062576294, "Pretrain/Step": 4730, "Pretrain/Step Time": 8.75757253728807} +{"Pretrain/Learning Rate": 2.6531462650205575e-05, "Pretrain/Loss": 1.9861916303634644, "Pretrain/Loss (Raw)": 2.0847604274749756, "Pretrain/Step": 4731, "Pretrain/Step Time": 8.758141668513417} +{"Pretrain/Learning Rate": 2.6522988633469938e-05, "Pretrain/Loss": 1.984879493713379, "Pretrain/Loss (Raw)": 1.8817722797393799, "Pretrain/Step": 4732, "Pretrain/Step Time": 8.756000325083733} +{"Pretrain/Learning Rate": 2.6514514441096066e-05, "Pretrain/Loss": 1.9867957830429077, "Pretrain/Loss (Raw)": 2.1410789489746094, "Pretrain/Step": 4733, "Pretrain/Step Time": 8.759003849700093} +{"Pretrain/Learning Rate": 2.650604007406126e-05, "Pretrain/Loss": 1.9829058647155762, "Pretrain/Loss (Raw)": 1.7426316738128662, "Pretrain/Step": 4734, "Pretrain/Step Time": 8.756027545779943} +{"Pretrain/Learning Rate": 2.6497565533342816e-05, "Pretrain/Loss": 1.9850165843963623, "Pretrain/Loss (Raw)": 2.105456829071045, "Pretrain/Step": 4735, "Pretrain/Step Time": 8.75647990964353} +{"Pretrain/Learning Rate": 2.6489090819918057e-05, "Pretrain/Loss": 1.9832994937896729, "Pretrain/Loss (Raw)": 1.863591194152832, "Pretrain/Step": 4736, "Pretrain/Step Time": 8.76263852789998} +{"Pretrain/Learning Rate": 2.6480615934764323e-05, "Pretrain/Loss": 1.9813973903656006, "Pretrain/Loss (Raw)": 1.86477530002594, "Pretrain/Step": 4737, "Pretrain/Step Time": 8.7674521189183} +{"Pretrain/Learning Rate": 2.6472140878858994e-05, "Pretrain/Loss": 1.981276512145996, "Pretrain/Loss (Raw)": 2.0196497440338135, "Pretrain/Step": 4738, "Pretrain/Step Time": 8.765905637294054} +{"Pretrain/Learning Rate": 2.646366565317943e-05, "Pretrain/Loss": 1.980421781539917, "Pretrain/Loss (Raw)": 1.8686586618423462, "Pretrain/Step": 4739, "Pretrain/Step Time": 8.760023230686784} +{"Pretrain/Learning Rate": 2.6455190258703056e-05, "Pretrain/Loss": 1.9810411930084229, "Pretrain/Loss (Raw)": 2.2269561290740967, "Pretrain/Step": 4740, "Pretrain/Step Time": 8.759220097213984} +{"Pretrain/Learning Rate": 2.644671469640728e-05, "Pretrain/Loss": 1.9792311191558838, "Pretrain/Loss (Raw)": 2.031942129135132, "Pretrain/Step": 4741, "Pretrain/Step Time": 8.764663379639387} +{"Pretrain/Learning Rate": 2.6438238967269546e-05, "Pretrain/Loss": 1.97925865650177, "Pretrain/Loss (Raw)": 2.0216214656829834, "Pretrain/Step": 4742, "Pretrain/Step Time": 8.76544369570911} +{"Pretrain/Learning Rate": 2.6429763072267317e-05, "Pretrain/Loss": 1.9781326055526733, "Pretrain/Loss (Raw)": 2.0806076526641846, "Pretrain/Step": 4743, "Pretrain/Step Time": 8.759749317541718} +{"Pretrain/Learning Rate": 2.642128701237807e-05, "Pretrain/Loss": 1.9774043560028076, "Pretrain/Loss (Raw)": 1.9376344680786133, "Pretrain/Step": 4744, "Pretrain/Step Time": 8.761774374172091} +{"Pretrain/Learning Rate": 2.641281078857932e-05, "Pretrain/Loss": 1.9709312915802002, "Pretrain/Loss (Raw)": 1.49728524684906, "Pretrain/Step": 4745, "Pretrain/Step Time": 8.760978300124407} +{"Pretrain/Learning Rate": 2.6404334401848558e-05, "Pretrain/Loss": 1.972428321838379, "Pretrain/Loss (Raw)": 2.0430314540863037, "Pretrain/Step": 4746, "Pretrain/Step Time": 8.759572444483638} +{"Pretrain/Learning Rate": 2.6395857853163346e-05, "Pretrain/Loss": 1.970045566558838, "Pretrain/Loss (Raw)": 1.6227048635482788, "Pretrain/Step": 4747, "Pretrain/Step Time": 8.760885125026107} +{"Pretrain/Learning Rate": 2.6387381143501217e-05, "Pretrain/Loss": 1.9724091291427612, "Pretrain/Loss (Raw)": 2.200336217880249, "Pretrain/Step": 4748, "Pretrain/Step Time": 8.756039593368769} +{"Pretrain/Learning Rate": 2.6378904273839765e-05, "Pretrain/Loss": 1.973654866218567, "Pretrain/Loss (Raw)": 2.1674118041992188, "Pretrain/Step": 4749, "Pretrain/Step Time": 8.751368617638946} +{"Pretrain/Learning Rate": 2.6370427245156574e-05, "Pretrain/Loss": 1.9747905731201172, "Pretrain/Loss (Raw)": 2.0360107421875, "Pretrain/Step": 4750, "Pretrain/Step Time": 8.752031236886978} +{"Pretrain/Learning Rate": 2.6361950058429257e-05, "Pretrain/Loss": 1.9761852025985718, "Pretrain/Loss (Raw)": 2.0396130084991455, "Pretrain/Step": 4751, "Pretrain/Step Time": 8.751086995005608} +{"Pretrain/Learning Rate": 2.635347271463544e-05, "Pretrain/Loss": 1.9782650470733643, "Pretrain/Loss (Raw)": 1.8877986669540405, "Pretrain/Step": 4752, "Pretrain/Step Time": 8.756384732201695} +{"Pretrain/Learning Rate": 2.6344995214752772e-05, "Pretrain/Loss": 1.9776849746704102, "Pretrain/Loss (Raw)": 2.021414279937744, "Pretrain/Step": 4753, "Pretrain/Step Time": 8.752917133271694} +{"Pretrain/Learning Rate": 2.6336517559758915e-05, "Pretrain/Loss": 1.9799723625183105, "Pretrain/Loss (Raw)": 2.2786548137664795, "Pretrain/Step": 4754, "Pretrain/Step Time": 8.747231939807534} +{"Pretrain/Learning Rate": 2.632803975063156e-05, "Pretrain/Loss": 1.9803510904312134, "Pretrain/Loss (Raw)": 1.9179511070251465, "Pretrain/Step": 4755, "Pretrain/Step Time": 8.745541950687766} +{"Pretrain/Learning Rate": 2.6319561788348402e-05, "Pretrain/Loss": 1.978751540184021, "Pretrain/Loss (Raw)": 2.0680127143859863, "Pretrain/Step": 4756, "Pretrain/Step Time": 8.742049157619476} +{"Pretrain/Learning Rate": 2.6311083673887154e-05, "Pretrain/Loss": 1.9789172410964966, "Pretrain/Loss (Raw)": 2.1361899375915527, "Pretrain/Step": 4757, "Pretrain/Step Time": 8.745131481438875} +{"Pretrain/Learning Rate": 2.6302605408225572e-05, "Pretrain/Loss": 1.9793956279754639, "Pretrain/Loss (Raw)": 2.0104799270629883, "Pretrain/Step": 4758, "Pretrain/Step Time": 8.744640737771988} +{"Pretrain/Learning Rate": 2.6294126992341382e-05, "Pretrain/Loss": 1.9803056716918945, "Pretrain/Loss (Raw)": 2.032205820083618, "Pretrain/Step": 4759, "Pretrain/Step Time": 8.739074353128672} +{"Pretrain/Learning Rate": 2.628564842721238e-05, "Pretrain/Loss": 1.9797446727752686, "Pretrain/Loss (Raw)": 2.151524543762207, "Pretrain/Step": 4760, "Pretrain/Step Time": 8.748591123148799} +{"Pretrain/Learning Rate": 2.6277169713816337e-05, "Pretrain/Loss": 1.9795823097229004, "Pretrain/Loss (Raw)": 1.8417863845825195, "Pretrain/Step": 4761, "Pretrain/Step Time": 8.748886631801724} +{"Pretrain/Learning Rate": 2.6268690853131067e-05, "Pretrain/Loss": 1.975777268409729, "Pretrain/Loss (Raw)": 1.706390380859375, "Pretrain/Step": 4762, "Pretrain/Step Time": 8.745748227462173} +{"Pretrain/Learning Rate": 2.6260211846134387e-05, "Pretrain/Loss": 1.9749755859375, "Pretrain/Loss (Raw)": 1.8296773433685303, "Pretrain/Step": 4763, "Pretrain/Step Time": 8.750091776251793} +{"Pretrain/Learning Rate": 2.6251732693804144e-05, "Pretrain/Loss": 1.9737560749053955, "Pretrain/Loss (Raw)": 1.9828623533248901, "Pretrain/Step": 4764, "Pretrain/Step Time": 8.740135937929153} +{"Pretrain/Learning Rate": 2.6243253397118178e-05, "Pretrain/Loss": 1.9716014862060547, "Pretrain/Loss (Raw)": 1.8491756916046143, "Pretrain/Step": 4765, "Pretrain/Step Time": 8.742886198684573} +{"Pretrain/Learning Rate": 2.6234773957054383e-05, "Pretrain/Loss": 1.9709440469741821, "Pretrain/Loss (Raw)": 1.9731101989746094, "Pretrain/Step": 4766, "Pretrain/Step Time": 8.743243642151356} +{"Pretrain/Learning Rate": 2.6226294374590638e-05, "Pretrain/Loss": 1.9709975719451904, "Pretrain/Loss (Raw)": 2.0520458221435547, "Pretrain/Step": 4767, "Pretrain/Step Time": 8.750375844538212} +{"Pretrain/Learning Rate": 2.6217814650704835e-05, "Pretrain/Loss": 1.9691890478134155, "Pretrain/Loss (Raw)": 1.8714030981063843, "Pretrain/Step": 4768, "Pretrain/Step Time": 8.749819807708263} +{"Pretrain/Learning Rate": 2.620933478637492e-05, "Pretrain/Loss": 1.9679431915283203, "Pretrain/Loss (Raw)": 1.9360097646713257, "Pretrain/Step": 4769, "Pretrain/Step Time": 8.751680994406343} +{"Pretrain/Learning Rate": 2.620085478257881e-05, "Pretrain/Loss": 1.967409610748291, "Pretrain/Loss (Raw)": 1.9012846946716309, "Pretrain/Step": 4770, "Pretrain/Step Time": 8.74946090951562} +{"Pretrain/Learning Rate": 2.6192374640294477e-05, "Pretrain/Loss": 1.9664900302886963, "Pretrain/Loss (Raw)": 1.9813669919967651, "Pretrain/Step": 4771, "Pretrain/Step Time": 8.745013702660799} +{"Pretrain/Learning Rate": 2.618389436049987e-05, "Pretrain/Loss": 1.9698708057403564, "Pretrain/Loss (Raw)": 2.062471628189087, "Pretrain/Step": 4772, "Pretrain/Step Time": 8.740330684930086} +{"Pretrain/Learning Rate": 2.6175413944172995e-05, "Pretrain/Loss": 1.9714453220367432, "Pretrain/Loss (Raw)": 2.153406858444214, "Pretrain/Step": 4773, "Pretrain/Step Time": 8.748297410085797} +{"Pretrain/Learning Rate": 2.6166933392291843e-05, "Pretrain/Loss": 1.9698970317840576, "Pretrain/Loss (Raw)": 1.9750111103057861, "Pretrain/Step": 4774, "Pretrain/Step Time": 8.750205516815186} +{"Pretrain/Learning Rate": 2.6158452705834434e-05, "Pretrain/Loss": 1.9669629335403442, "Pretrain/Loss (Raw)": 1.686657428741455, "Pretrain/Step": 4775, "Pretrain/Step Time": 8.752610336989164} +{"Pretrain/Learning Rate": 2.6149971885778795e-05, "Pretrain/Loss": 1.967002272605896, "Pretrain/Loss (Raw)": 1.9663184881210327, "Pretrain/Step": 4776, "Pretrain/Step Time": 8.748170550912619} +{"Pretrain/Learning Rate": 2.6141490933102987e-05, "Pretrain/Loss": 1.970245122909546, "Pretrain/Loss (Raw)": 2.0611212253570557, "Pretrain/Step": 4777, "Pretrain/Step Time": 8.748554166406393} +{"Pretrain/Learning Rate": 2.6133009848785062e-05, "Pretrain/Loss": 1.9680660963058472, "Pretrain/Loss (Raw)": 1.9452611207962036, "Pretrain/Step": 4778, "Pretrain/Step Time": 8.746755814179778} +{"Pretrain/Learning Rate": 2.6124528633803103e-05, "Pretrain/Loss": 1.9652857780456543, "Pretrain/Loss (Raw)": 1.688128113746643, "Pretrain/Step": 4779, "Pretrain/Step Time": 8.750232296064496} +{"Pretrain/Learning Rate": 2.61160472891352e-05, "Pretrain/Loss": 1.9651803970336914, "Pretrain/Loss (Raw)": 1.9552613496780396, "Pretrain/Step": 4780, "Pretrain/Step Time": 8.748514849692583} +{"Pretrain/Learning Rate": 2.6107565815759473e-05, "Pretrain/Loss": 1.964437484741211, "Pretrain/Loss (Raw)": 2.0077507495880127, "Pretrain/Step": 4781, "Pretrain/Step Time": 8.746997183188796} +{"Pretrain/Learning Rate": 2.6099084214654034e-05, "Pretrain/Loss": 1.9634004831314087, "Pretrain/Loss (Raw)": 2.148608446121216, "Pretrain/Step": 4782, "Pretrain/Step Time": 8.752465965226293} +{"Pretrain/Learning Rate": 2.6090602486797017e-05, "Pretrain/Loss": 1.9632446765899658, "Pretrain/Loss (Raw)": 1.9085502624511719, "Pretrain/Step": 4783, "Pretrain/Step Time": 8.753909396007657} +{"Pretrain/Learning Rate": 2.608212063316659e-05, "Pretrain/Loss": 1.9609272480010986, "Pretrain/Loss (Raw)": 1.8635097742080688, "Pretrain/Step": 4784, "Pretrain/Step Time": 8.753921657800674} +{"Pretrain/Learning Rate": 2.6073638654740908e-05, "Pretrain/Loss": 1.9615317583084106, "Pretrain/Loss (Raw)": 2.1361184120178223, "Pretrain/Step": 4785, "Pretrain/Step Time": 8.740393724292517} +{"Pretrain/Learning Rate": 2.606515655249816e-05, "Pretrain/Loss": 1.963686227798462, "Pretrain/Loss (Raw)": 2.021348237991333, "Pretrain/Step": 4786, "Pretrain/Step Time": 8.742294881492853} +{"Pretrain/Learning Rate": 2.6056674327416537e-05, "Pretrain/Loss": 1.963827133178711, "Pretrain/Loss (Raw)": 2.10113525390625, "Pretrain/Step": 4787, "Pretrain/Step Time": 8.743105210363865} +{"Pretrain/Learning Rate": 2.604819198047425e-05, "Pretrain/Loss": 1.9615097045898438, "Pretrain/Loss (Raw)": 1.834115743637085, "Pretrain/Step": 4788, "Pretrain/Step Time": 8.739311177283525} +{"Pretrain/Learning Rate": 2.6039709512649522e-05, "Pretrain/Loss": 1.9617124795913696, "Pretrain/Loss (Raw)": 1.8522439002990723, "Pretrain/Step": 4789, "Pretrain/Step Time": 8.747762978076935} +{"Pretrain/Learning Rate": 2.60312269249206e-05, "Pretrain/Loss": 1.9620614051818848, "Pretrain/Loss (Raw)": 1.907952070236206, "Pretrain/Step": 4790, "Pretrain/Step Time": 8.750314436852932} +{"Pretrain/Learning Rate": 2.602274421826573e-05, "Pretrain/Loss": 1.9608932733535767, "Pretrain/Loss (Raw)": 1.9633103609085083, "Pretrain/Step": 4791, "Pretrain/Step Time": 8.747112510725856} +{"Pretrain/Learning Rate": 2.6014261393663176e-05, "Pretrain/Loss": 1.9593507051467896, "Pretrain/Loss (Raw)": 1.8840665817260742, "Pretrain/Step": 4792, "Pretrain/Step Time": 8.748766202479601} +{"Pretrain/Learning Rate": 2.600577845209122e-05, "Pretrain/Loss": 1.9607226848602295, "Pretrain/Loss (Raw)": 2.0370757579803467, "Pretrain/Step": 4793, "Pretrain/Step Time": 8.739657551050186} +{"Pretrain/Learning Rate": 2.599729539452815e-05, "Pretrain/Loss": 1.9641778469085693, "Pretrain/Loss (Raw)": 2.1831977367401123, "Pretrain/Step": 4794, "Pretrain/Step Time": 8.740485010668635} +{"Pretrain/Learning Rate": 2.598881222195228e-05, "Pretrain/Loss": 1.9633525609970093, "Pretrain/Loss (Raw)": 2.0701494216918945, "Pretrain/Step": 4795, "Pretrain/Step Time": 8.744288224726915} +{"Pretrain/Learning Rate": 2.5980328935341918e-05, "Pretrain/Loss": 1.960951805114746, "Pretrain/Loss (Raw)": 1.5335345268249512, "Pretrain/Step": 4796, "Pretrain/Step Time": 8.740595748648047} +{"Pretrain/Learning Rate": 2.597184553567541e-05, "Pretrain/Loss": 1.9597022533416748, "Pretrain/Loss (Raw)": 1.9153767824172974, "Pretrain/Step": 4797, "Pretrain/Step Time": 8.74218631349504} +{"Pretrain/Learning Rate": 2.5963362023931092e-05, "Pretrain/Loss": 1.958230972290039, "Pretrain/Loss (Raw)": 1.7975099086761475, "Pretrain/Step": 4798, "Pretrain/Step Time": 8.747513093054295} +{"Pretrain/Learning Rate": 2.595487840108733e-05, "Pretrain/Loss": 1.9578756093978882, "Pretrain/Loss (Raw)": 2.0175063610076904, "Pretrain/Step": 4799, "Pretrain/Step Time": 8.746427228674293} +{"Pretrain/Learning Rate": 2.5946394668122485e-05, "Pretrain/Loss": 1.9590888023376465, "Pretrain/Loss (Raw)": 1.9931654930114746, "Pretrain/Step": 4800, "Pretrain/Step Time": 8.747115919366479} +{"Pretrain/Learning Rate": 2.5937910826014955e-05, "Pretrain/Loss": 1.9577664136886597, "Pretrain/Loss (Raw)": 1.8506394624710083, "Pretrain/Step": 4801, "Pretrain/Step Time": 8.74951278604567} +{"Pretrain/Learning Rate": 2.5929426875743123e-05, "Pretrain/Loss": 1.9553678035736084, "Pretrain/Loss (Raw)": 1.8345454931259155, "Pretrain/Step": 4802, "Pretrain/Step Time": 8.743754729628563} +{"Pretrain/Learning Rate": 2.592094281828541e-05, "Pretrain/Loss": 1.9569934606552124, "Pretrain/Loss (Raw)": 2.2015273571014404, "Pretrain/Step": 4803, "Pretrain/Step Time": 8.735415700823069} +{"Pretrain/Learning Rate": 2.5912458654620226e-05, "Pretrain/Loss": 1.958071231842041, "Pretrain/Loss (Raw)": 2.0159661769866943, "Pretrain/Step": 4804, "Pretrain/Step Time": 8.733980411663651} +{"Pretrain/Learning Rate": 2.5903974385726014e-05, "Pretrain/Loss": 1.9566879272460938, "Pretrain/Loss (Raw)": 1.9972611665725708, "Pretrain/Step": 4805, "Pretrain/Step Time": 8.730800667777658} +{"Pretrain/Learning Rate": 2.589549001258121e-05, "Pretrain/Loss": 1.9562102556228638, "Pretrain/Loss (Raw)": 2.0608129501342773, "Pretrain/Step": 4806, "Pretrain/Step Time": 8.724559959024191} +{"Pretrain/Learning Rate": 2.5887005536164288e-05, "Pretrain/Loss": 1.9562548398971558, "Pretrain/Loss (Raw)": 1.8747309446334839, "Pretrain/Step": 4807, "Pretrain/Step Time": 8.72629045881331} +{"Pretrain/Learning Rate": 2.58785209574537e-05, "Pretrain/Loss": 1.9552202224731445, "Pretrain/Loss (Raw)": 2.0630714893341064, "Pretrain/Step": 4808, "Pretrain/Step Time": 8.72961957193911} +{"Pretrain/Learning Rate": 2.587003627742794e-05, "Pretrain/Loss": 1.9557006359100342, "Pretrain/Loss (Raw)": 2.0282516479492188, "Pretrain/Step": 4809, "Pretrain/Step Time": 8.733279336243868} +{"Pretrain/Learning Rate": 2.5861551497065496e-05, "Pretrain/Loss": 1.957413911819458, "Pretrain/Loss (Raw)": 2.0367343425750732, "Pretrain/Step": 4810, "Pretrain/Step Time": 8.727359477430582} +{"Pretrain/Learning Rate": 2.5853066617344868e-05, "Pretrain/Loss": 1.959058165550232, "Pretrain/Loss (Raw)": 2.089632749557495, "Pretrain/Step": 4811, "Pretrain/Step Time": 8.727974742650986} +{"Pretrain/Learning Rate": 2.5844581639244586e-05, "Pretrain/Loss": 1.959999680519104, "Pretrain/Loss (Raw)": 2.0484559535980225, "Pretrain/Step": 4812, "Pretrain/Step Time": 8.729546669870615} +{"Pretrain/Learning Rate": 2.583609656374316e-05, "Pretrain/Loss": 1.9615652561187744, "Pretrain/Loss (Raw)": 2.1399621963500977, "Pretrain/Step": 4813, "Pretrain/Step Time": 8.733117323368788} +{"Pretrain/Learning Rate": 2.5827611391819152e-05, "Pretrain/Loss": 1.9633734226226807, "Pretrain/Loss (Raw)": 1.987096905708313, "Pretrain/Step": 4814, "Pretrain/Step Time": 8.728697199374437} +{"Pretrain/Learning Rate": 2.581912612445108e-05, "Pretrain/Loss": 1.9621717929840088, "Pretrain/Loss (Raw)": 2.0150909423828125, "Pretrain/Step": 4815, "Pretrain/Step Time": 8.730678310617805} +{"Pretrain/Learning Rate": 2.5810640762617538e-05, "Pretrain/Loss": 1.9612653255462646, "Pretrain/Loss (Raw)": 1.9795564413070679, "Pretrain/Step": 4816, "Pretrain/Step Time": 8.732515517622232} +{"Pretrain/Learning Rate": 2.5802155307297077e-05, "Pretrain/Loss": 1.9661626815795898, "Pretrain/Loss (Raw)": 2.1127383708953857, "Pretrain/Step": 4817, "Pretrain/Step Time": 8.724053218960762} +{"Pretrain/Learning Rate": 2.5793669759468292e-05, "Pretrain/Loss": 1.9672465324401855, "Pretrain/Loss (Raw)": 2.1809234619140625, "Pretrain/Step": 4818, "Pretrain/Step Time": 8.725111559033394} +{"Pretrain/Learning Rate": 2.578518412010976e-05, "Pretrain/Loss": 1.970628023147583, "Pretrain/Loss (Raw)": 2.249453067779541, "Pretrain/Step": 4819, "Pretrain/Step Time": 8.717671141028404} +{"Pretrain/Learning Rate": 2.577669839020011e-05, "Pretrain/Loss": 1.9709010124206543, "Pretrain/Loss (Raw)": 1.965185523033142, "Pretrain/Step": 4820, "Pretrain/Step Time": 8.7179009411484} +{"Pretrain/Learning Rate": 2.576821257071793e-05, "Pretrain/Loss": 1.9709261655807495, "Pretrain/Loss (Raw)": 1.9857515096664429, "Pretrain/Step": 4821, "Pretrain/Step Time": 8.72541026212275} +{"Pretrain/Learning Rate": 2.5759726662641865e-05, "Pretrain/Loss": 1.9710462093353271, "Pretrain/Loss (Raw)": 2.0896072387695312, "Pretrain/Step": 4822, "Pretrain/Step Time": 8.724147867411375} +{"Pretrain/Learning Rate": 2.5751240666950532e-05, "Pretrain/Loss": 1.9710185527801514, "Pretrain/Loss (Raw)": 2.011098623275757, "Pretrain/Step": 4823, "Pretrain/Step Time": 8.72151960991323} +{"Pretrain/Learning Rate": 2.5742754584622592e-05, "Pretrain/Loss": 1.9708739519119263, "Pretrain/Loss (Raw)": 1.9157650470733643, "Pretrain/Step": 4824, "Pretrain/Step Time": 8.725937968119979} +{"Pretrain/Learning Rate": 2.5734268416636697e-05, "Pretrain/Loss": 1.9715248346328735, "Pretrain/Loss (Raw)": 2.099100112915039, "Pretrain/Step": 4825, "Pretrain/Step Time": 8.7299142498523} +{"Pretrain/Learning Rate": 2.5725782163971495e-05, "Pretrain/Loss": 1.9709351062774658, "Pretrain/Loss (Raw)": 2.0714523792266846, "Pretrain/Step": 4826, "Pretrain/Step Time": 8.721669586375356} +{"Pretrain/Learning Rate": 2.5717295827605686e-05, "Pretrain/Loss": 1.9746205806732178, "Pretrain/Loss (Raw)": 2.2653515338897705, "Pretrain/Step": 4827, "Pretrain/Step Time": 8.72647225484252} +{"Pretrain/Learning Rate": 2.5708809408517937e-05, "Pretrain/Loss": 1.976762294769287, "Pretrain/Loss (Raw)": 2.050849199295044, "Pretrain/Step": 4828, "Pretrain/Step Time": 8.726650515571237} +{"Pretrain/Learning Rate": 2.5700322907686946e-05, "Pretrain/Loss": 1.9803670644760132, "Pretrain/Loss (Raw)": 2.0135533809661865, "Pretrain/Step": 4829, "Pretrain/Step Time": 8.72238445468247} +{"Pretrain/Learning Rate": 2.5691836326091414e-05, "Pretrain/Loss": 1.980958104133606, "Pretrain/Loss (Raw)": 1.8424428701400757, "Pretrain/Step": 4830, "Pretrain/Step Time": 8.725372640416026} +{"Pretrain/Learning Rate": 2.5683349664710067e-05, "Pretrain/Loss": 1.9805964231491089, "Pretrain/Loss (Raw)": 1.753587245941162, "Pretrain/Step": 4831, "Pretrain/Step Time": 8.729413019493222} +{"Pretrain/Learning Rate": 2.5674862924521605e-05, "Pretrain/Loss": 1.979567527770996, "Pretrain/Loss (Raw)": 1.9158259630203247, "Pretrain/Step": 4832, "Pretrain/Step Time": 8.72854195162654} +{"Pretrain/Learning Rate": 2.566637610650478e-05, "Pretrain/Loss": 1.9803963899612427, "Pretrain/Loss (Raw)": 2.0415825843811035, "Pretrain/Step": 4833, "Pretrain/Step Time": 8.72761208564043} +{"Pretrain/Learning Rate": 2.565788921163832e-05, "Pretrain/Loss": 1.9773486852645874, "Pretrain/Loss (Raw)": 1.6410865783691406, "Pretrain/Step": 4834, "Pretrain/Step Time": 8.728602483868599} +{"Pretrain/Learning Rate": 2.5649402240900972e-05, "Pretrain/Loss": 1.979274034500122, "Pretrain/Loss (Raw)": 2.1547210216522217, "Pretrain/Step": 4835, "Pretrain/Step Time": 8.738941963762045} +{"Pretrain/Learning Rate": 2.5640915195271504e-05, "Pretrain/Loss": 1.979241967201233, "Pretrain/Loss (Raw)": 1.8165841102600098, "Pretrain/Step": 4836, "Pretrain/Step Time": 8.735304167494178} +{"Pretrain/Learning Rate": 2.563242807572867e-05, "Pretrain/Loss": 1.9771960973739624, "Pretrain/Loss (Raw)": 1.705505132675171, "Pretrain/Step": 4837, "Pretrain/Step Time": 8.735635044053197} +{"Pretrain/Learning Rate": 2.5623940883251256e-05, "Pretrain/Loss": 1.9777531623840332, "Pretrain/Loss (Raw)": 2.0905470848083496, "Pretrain/Step": 4838, "Pretrain/Step Time": 8.73790543526411} +{"Pretrain/Learning Rate": 2.561545361881803e-05, "Pretrain/Loss": 1.977107286453247, "Pretrain/Loss (Raw)": 1.8849341869354248, "Pretrain/Step": 4839, "Pretrain/Step Time": 8.733755012974143} +{"Pretrain/Learning Rate": 2.5606966283407803e-05, "Pretrain/Loss": 1.9800759553909302, "Pretrain/Loss (Raw)": 2.2420568466186523, "Pretrain/Step": 4840, "Pretrain/Step Time": 8.736022206023335} +{"Pretrain/Learning Rate": 2.5598478877999356e-05, "Pretrain/Loss": 1.9792213439941406, "Pretrain/Loss (Raw)": 2.034689426422119, "Pretrain/Step": 4841, "Pretrain/Step Time": 8.74316100217402} +{"Pretrain/Learning Rate": 2.558999140357151e-05, "Pretrain/Loss": 1.9800597429275513, "Pretrain/Loss (Raw)": 2.0428130626678467, "Pretrain/Step": 4842, "Pretrain/Step Time": 8.747496288269758} +{"Pretrain/Learning Rate": 2.5581503861103073e-05, "Pretrain/Loss": 1.9809176921844482, "Pretrain/Loss (Raw)": 1.9918612241744995, "Pretrain/Step": 4843, "Pretrain/Step Time": 8.747814603149891} +{"Pretrain/Learning Rate": 2.5573016251572872e-05, "Pretrain/Loss": 1.9803663492202759, "Pretrain/Loss (Raw)": 1.940353274345398, "Pretrain/Step": 4844, "Pretrain/Step Time": 8.74654052220285} +{"Pretrain/Learning Rate": 2.5564528575959733e-05, "Pretrain/Loss": 1.9804130792617798, "Pretrain/Loss (Raw)": 1.9442667961120605, "Pretrain/Step": 4845, "Pretrain/Step Time": 8.750135283917189} +{"Pretrain/Learning Rate": 2.55560408352425e-05, "Pretrain/Loss": 1.9785149097442627, "Pretrain/Loss (Raw)": 1.7272288799285889, "Pretrain/Step": 4846, "Pretrain/Step Time": 8.756931569427252} +{"Pretrain/Learning Rate": 2.5547553030400016e-05, "Pretrain/Loss": 1.9784023761749268, "Pretrain/Loss (Raw)": 2.030539035797119, "Pretrain/Step": 4847, "Pretrain/Step Time": 8.75571370869875} +{"Pretrain/Learning Rate": 2.5539065162411143e-05, "Pretrain/Loss": 1.9794925451278687, "Pretrain/Loss (Raw)": 2.1210286617279053, "Pretrain/Step": 4848, "Pretrain/Step Time": 8.754176262766123} +{"Pretrain/Learning Rate": 2.5530577232254733e-05, "Pretrain/Loss": 1.9788854122161865, "Pretrain/Loss (Raw)": 1.929620385169983, "Pretrain/Step": 4849, "Pretrain/Step Time": 8.748022900894284} +{"Pretrain/Learning Rate": 2.5522089240909652e-05, "Pretrain/Loss": 1.9758729934692383, "Pretrain/Loss (Raw)": 1.8091187477111816, "Pretrain/Step": 4850, "Pretrain/Step Time": 8.753447914496064} +{"Pretrain/Learning Rate": 2.5513601189354786e-05, "Pretrain/Loss": 1.9770479202270508, "Pretrain/Loss (Raw)": 2.1279044151306152, "Pretrain/Step": 4851, "Pretrain/Step Time": 8.748969180509448} +{"Pretrain/Learning Rate": 2.5505113078569004e-05, "Pretrain/Loss": 1.9785832166671753, "Pretrain/Loss (Raw)": 1.9874368906021118, "Pretrain/Step": 4852, "Pretrain/Step Time": 8.750105196610093} +{"Pretrain/Learning Rate": 2.5496624909531207e-05, "Pretrain/Loss": 1.9783527851104736, "Pretrain/Loss (Raw)": 1.9123715162277222, "Pretrain/Step": 4853, "Pretrain/Step Time": 8.750268395990133} +{"Pretrain/Learning Rate": 2.548813668322028e-05, "Pretrain/Loss": 1.9784235954284668, "Pretrain/Loss (Raw)": 2.0171971321105957, "Pretrain/Step": 4854, "Pretrain/Step Time": 8.744292857125401} +{"Pretrain/Learning Rate": 2.5479648400615136e-05, "Pretrain/Loss": 1.9779839515686035, "Pretrain/Loss (Raw)": 1.9442988634109497, "Pretrain/Step": 4855, "Pretrain/Step Time": 8.740579448640347} +{"Pretrain/Learning Rate": 2.547116006269467e-05, "Pretrain/Loss": 1.9798305034637451, "Pretrain/Loss (Raw)": 2.1351382732391357, "Pretrain/Step": 4856, "Pretrain/Step Time": 8.74038890376687} +{"Pretrain/Learning Rate": 2.5462671670437816e-05, "Pretrain/Loss": 1.9786980152130127, "Pretrain/Loss (Raw)": 1.9066660404205322, "Pretrain/Step": 4857, "Pretrain/Step Time": 8.747636614367366} +{"Pretrain/Learning Rate": 2.545418322482348e-05, "Pretrain/Loss": 1.979364037513733, "Pretrain/Loss (Raw)": 1.8562871217727661, "Pretrain/Step": 4858, "Pretrain/Step Time": 8.752336401492357} +{"Pretrain/Learning Rate": 2.5445694726830593e-05, "Pretrain/Loss": 1.979071855545044, "Pretrain/Loss (Raw)": 2.047363042831421, "Pretrain/Step": 4859, "Pretrain/Step Time": 8.755475360900164} +{"Pretrain/Learning Rate": 2.543720617743809e-05, "Pretrain/Loss": 1.9803828001022339, "Pretrain/Loss (Raw)": 2.0495760440826416, "Pretrain/Step": 4860, "Pretrain/Step Time": 8.755116291344166} +{"Pretrain/Learning Rate": 2.5428717577624915e-05, "Pretrain/Loss": 1.9786649942398071, "Pretrain/Loss (Raw)": 1.9212067127227783, "Pretrain/Step": 4861, "Pretrain/Step Time": 8.752618415281177} +{"Pretrain/Learning Rate": 2.5420228928370005e-05, "Pretrain/Loss": 1.9809694290161133, "Pretrain/Loss (Raw)": 2.037597894668579, "Pretrain/Step": 4862, "Pretrain/Step Time": 8.756363032385707} +{"Pretrain/Learning Rate": 2.5411740230652315e-05, "Pretrain/Loss": 1.9803447723388672, "Pretrain/Loss (Raw)": 2.0254786014556885, "Pretrain/Step": 4863, "Pretrain/Step Time": 8.753452671691775} +{"Pretrain/Learning Rate": 2.5403251485450795e-05, "Pretrain/Loss": 1.9802987575531006, "Pretrain/Loss (Raw)": 1.857706904411316, "Pretrain/Step": 4864, "Pretrain/Step Time": 8.751432996243238} +{"Pretrain/Learning Rate": 2.5394762693744428e-05, "Pretrain/Loss": 1.9815634489059448, "Pretrain/Loss (Raw)": 2.0266621112823486, "Pretrain/Step": 4865, "Pretrain/Step Time": 8.751485832035542} +{"Pretrain/Learning Rate": 2.538627385651216e-05, "Pretrain/Loss": 1.9822722673416138, "Pretrain/Loss (Raw)": 2.110382080078125, "Pretrain/Step": 4866, "Pretrain/Step Time": 8.753254866227508} +{"Pretrain/Learning Rate": 2.5377784974732965e-05, "Pretrain/Loss": 1.9822667837142944, "Pretrain/Loss (Raw)": 1.8679478168487549, "Pretrain/Step": 4867, "Pretrain/Step Time": 8.751287134364247} +{"Pretrain/Learning Rate": 2.536929604938584e-05, "Pretrain/Loss": 1.979773998260498, "Pretrain/Loss (Raw)": 1.9078818559646606, "Pretrain/Step": 4868, "Pretrain/Step Time": 8.749048065394163} +{"Pretrain/Learning Rate": 2.5360807081449738e-05, "Pretrain/Loss": 1.9790678024291992, "Pretrain/Loss (Raw)": 1.941558599472046, "Pretrain/Step": 4869, "Pretrain/Step Time": 8.7384630497545} +{"Pretrain/Learning Rate": 2.5352318071903675e-05, "Pretrain/Loss": 1.9751685857772827, "Pretrain/Loss (Raw)": 1.5225131511688232, "Pretrain/Step": 4870, "Pretrain/Step Time": 8.741051895543933} +{"Pretrain/Learning Rate": 2.5343829021726618e-05, "Pretrain/Loss": 1.9713698625564575, "Pretrain/Loss (Raw)": 1.594355821609497, "Pretrain/Step": 4871, "Pretrain/Step Time": 8.743650628253818} +{"Pretrain/Learning Rate": 2.533533993189759e-05, "Pretrain/Loss": 1.9706366062164307, "Pretrain/Loss (Raw)": 1.8437926769256592, "Pretrain/Step": 4872, "Pretrain/Step Time": 8.742835091426969} +{"Pretrain/Learning Rate": 2.5326850803395575e-05, "Pretrain/Loss": 1.975515604019165, "Pretrain/Loss (Raw)": 2.121791124343872, "Pretrain/Step": 4873, "Pretrain/Step Time": 8.739279203116894} +{"Pretrain/Learning Rate": 2.5318361637199594e-05, "Pretrain/Loss": 1.9736549854278564, "Pretrain/Loss (Raw)": 1.8048911094665527, "Pretrain/Step": 4874, "Pretrain/Step Time": 8.74528850056231} +{"Pretrain/Learning Rate": 2.5309872434288645e-05, "Pretrain/Loss": 1.9742536544799805, "Pretrain/Loss (Raw)": 1.6993070840835571, "Pretrain/Step": 4875, "Pretrain/Step Time": 8.749246833845973} +{"Pretrain/Learning Rate": 2.5301383195641742e-05, "Pretrain/Loss": 1.9711182117462158, "Pretrain/Loss (Raw)": 1.7990169525146484, "Pretrain/Step": 4876, "Pretrain/Step Time": 8.747514240443707} +{"Pretrain/Learning Rate": 2.5292893922237913e-05, "Pretrain/Loss": 1.9697339534759521, "Pretrain/Loss (Raw)": 1.9902364015579224, "Pretrain/Step": 4877, "Pretrain/Step Time": 8.744406944140792} +{"Pretrain/Learning Rate": 2.5284404615056172e-05, "Pretrain/Loss": 1.96946382522583, "Pretrain/Loss (Raw)": 2.0014278888702393, "Pretrain/Step": 4878, "Pretrain/Step Time": 8.74889632128179} +{"Pretrain/Learning Rate": 2.5275915275075556e-05, "Pretrain/Loss": 1.969929814338684, "Pretrain/Loss (Raw)": 2.0992486476898193, "Pretrain/Step": 4879, "Pretrain/Step Time": 8.748046478256583} +{"Pretrain/Learning Rate": 2.5267425903275088e-05, "Pretrain/Loss": 1.9699875116348267, "Pretrain/Loss (Raw)": 1.8951842784881592, "Pretrain/Step": 4880, "Pretrain/Step Time": 8.743388028815389} +{"Pretrain/Learning Rate": 2.5258936500633807e-05, "Pretrain/Loss": 1.9707252979278564, "Pretrain/Loss (Raw)": 2.1158649921417236, "Pretrain/Step": 4881, "Pretrain/Step Time": 8.74637278355658} +{"Pretrain/Learning Rate": 2.5250447068130746e-05, "Pretrain/Loss": 1.9685454368591309, "Pretrain/Loss (Raw)": 1.999618411064148, "Pretrain/Step": 4882, "Pretrain/Step Time": 8.74942490272224} +{"Pretrain/Learning Rate": 2.5241957606744952e-05, "Pretrain/Loss": 1.9694159030914307, "Pretrain/Loss (Raw)": 2.029372453689575, "Pretrain/Step": 4883, "Pretrain/Step Time": 8.745597856119275} +{"Pretrain/Learning Rate": 2.523346811745546e-05, "Pretrain/Loss": 1.9695148468017578, "Pretrain/Loss (Raw)": 2.080674171447754, "Pretrain/Step": 4884, "Pretrain/Step Time": 8.744816610589623} +{"Pretrain/Learning Rate": 2.5224978601241333e-05, "Pretrain/Loss": 1.9668172597885132, "Pretrain/Loss (Raw)": 1.7909033298492432, "Pretrain/Step": 4885, "Pretrain/Step Time": 8.744065349921584} +{"Pretrain/Learning Rate": 2.5216489059081607e-05, "Pretrain/Loss": 1.9665207862854004, "Pretrain/Loss (Raw)": 1.9725229740142822, "Pretrain/Step": 4886, "Pretrain/Step Time": 8.744006361812353} +{"Pretrain/Learning Rate": 2.5207999491955347e-05, "Pretrain/Loss": 1.9675195217132568, "Pretrain/Loss (Raw)": 2.1600582599639893, "Pretrain/Step": 4887, "Pretrain/Step Time": 8.748188031837344} +{"Pretrain/Learning Rate": 2.51995099008416e-05, "Pretrain/Loss": 1.9654195308685303, "Pretrain/Loss (Raw)": 1.8827133178710938, "Pretrain/Step": 4888, "Pretrain/Step Time": 8.747520372271538} +{"Pretrain/Learning Rate": 2.519102028671944e-05, "Pretrain/Loss": 1.9665601253509521, "Pretrain/Loss (Raw)": 1.9877859354019165, "Pretrain/Step": 4889, "Pretrain/Step Time": 8.744853094220161} +{"Pretrain/Learning Rate": 2.518253065056791e-05, "Pretrain/Loss": 1.9680373668670654, "Pretrain/Loss (Raw)": 1.8954765796661377, "Pretrain/Step": 4890, "Pretrain/Step Time": 8.758729424327612} +{"Pretrain/Learning Rate": 2.5174040993366094e-05, "Pretrain/Loss": 1.9690628051757812, "Pretrain/Loss (Raw)": 1.9609276056289673, "Pretrain/Step": 4891, "Pretrain/Step Time": 8.755541760474443} +{"Pretrain/Learning Rate": 2.516555131609305e-05, "Pretrain/Loss": 1.9698550701141357, "Pretrain/Loss (Raw)": 2.084291696548462, "Pretrain/Step": 4892, "Pretrain/Step Time": 8.756261814385653} +{"Pretrain/Learning Rate": 2.5157061619727844e-05, "Pretrain/Loss": 1.9714075326919556, "Pretrain/Loss (Raw)": 2.047886848449707, "Pretrain/Step": 4893, "Pretrain/Step Time": 8.75380426645279} +{"Pretrain/Learning Rate": 2.514857190524955e-05, "Pretrain/Loss": 1.9716594219207764, "Pretrain/Loss (Raw)": 2.0053462982177734, "Pretrain/Step": 4894, "Pretrain/Step Time": 8.75998780503869} +{"Pretrain/Learning Rate": 2.514008217363725e-05, "Pretrain/Loss": 1.972476601600647, "Pretrain/Loss (Raw)": 2.1566412448883057, "Pretrain/Step": 4895, "Pretrain/Step Time": 8.75063525699079} +{"Pretrain/Learning Rate": 2.513159242587001e-05, "Pretrain/Loss": 1.9749271869659424, "Pretrain/Loss (Raw)": 2.18508243560791, "Pretrain/Step": 4896, "Pretrain/Step Time": 8.762542583048344} +{"Pretrain/Learning Rate": 2.5123102662926913e-05, "Pretrain/Loss": 1.9770994186401367, "Pretrain/Loss (Raw)": 2.2140579223632812, "Pretrain/Step": 4897, "Pretrain/Step Time": 8.758682608604431} +{"Pretrain/Learning Rate": 2.5114612885787037e-05, "Pretrain/Loss": 1.9778668880462646, "Pretrain/Loss (Raw)": 1.999513030052185, "Pretrain/Step": 4898, "Pretrain/Step Time": 8.761266510933638} +{"Pretrain/Learning Rate": 2.5106123095429456e-05, "Pretrain/Loss": 1.9792457818984985, "Pretrain/Loss (Raw)": 2.1578781604766846, "Pretrain/Step": 4899, "Pretrain/Step Time": 8.761359395459294} +{"Pretrain/Learning Rate": 2.5097633292833268e-05, "Pretrain/Loss": 1.9804867506027222, "Pretrain/Loss (Raw)": 2.2213003635406494, "Pretrain/Step": 4900, "Pretrain/Step Time": 8.763437021523714} +{"Pretrain/Learning Rate": 2.5089143478977546e-05, "Pretrain/Loss": 1.978585958480835, "Pretrain/Loss (Raw)": 1.910117745399475, "Pretrain/Step": 4901, "Pretrain/Step Time": 8.750562075525522} +{"Pretrain/Learning Rate": 2.5080653654841378e-05, "Pretrain/Loss": 1.9783565998077393, "Pretrain/Loss (Raw)": 1.9456416368484497, "Pretrain/Step": 4902, "Pretrain/Step Time": 8.750273996964097} +{"Pretrain/Learning Rate": 2.507216382140385e-05, "Pretrain/Loss": 1.9801535606384277, "Pretrain/Loss (Raw)": 1.9166635274887085, "Pretrain/Step": 4903, "Pretrain/Step Time": 8.748220298439264} +{"Pretrain/Learning Rate": 2.5063673979644054e-05, "Pretrain/Loss": 1.9813127517700195, "Pretrain/Loss (Raw)": 2.1147100925445557, "Pretrain/Step": 4904, "Pretrain/Step Time": 8.748227130621672} +{"Pretrain/Learning Rate": 2.5055184130541065e-05, "Pretrain/Loss": 1.981649398803711, "Pretrain/Loss (Raw)": 2.104212760925293, "Pretrain/Step": 4905, "Pretrain/Step Time": 8.757694298401475} +{"Pretrain/Learning Rate": 2.504669427507399e-05, "Pretrain/Loss": 1.9807442426681519, "Pretrain/Loss (Raw)": 1.8294014930725098, "Pretrain/Step": 4906, "Pretrain/Step Time": 8.763541284948587} +{"Pretrain/Learning Rate": 2.503820441422191e-05, "Pretrain/Loss": 1.9823763370513916, "Pretrain/Loss (Raw)": 1.8970320224761963, "Pretrain/Step": 4907, "Pretrain/Step Time": 8.763132764026523} +{"Pretrain/Learning Rate": 2.5029714548963917e-05, "Pretrain/Loss": 1.9841976165771484, "Pretrain/Loss (Raw)": 2.1883904933929443, "Pretrain/Step": 4908, "Pretrain/Step Time": 8.765078792348504} +{"Pretrain/Learning Rate": 2.5021224680279105e-05, "Pretrain/Loss": 1.9839190244674683, "Pretrain/Loss (Raw)": 1.9720878601074219, "Pretrain/Step": 4909, "Pretrain/Step Time": 8.761579275131226} +{"Pretrain/Learning Rate": 2.5012734809146554e-05, "Pretrain/Loss": 1.9799890518188477, "Pretrain/Loss (Raw)": 1.6455841064453125, "Pretrain/Step": 4910, "Pretrain/Step Time": 8.757384905591607} +{"Pretrain/Learning Rate": 2.5004244936545374e-05, "Pretrain/Loss": 1.9793007373809814, "Pretrain/Loss (Raw)": 1.8204368352890015, "Pretrain/Step": 4911, "Pretrain/Step Time": 8.757021084427834} +{"Pretrain/Learning Rate": 2.499575506345464e-05, "Pretrain/Loss": 1.9800119400024414, "Pretrain/Loss (Raw)": 1.9545453786849976, "Pretrain/Step": 4912, "Pretrain/Step Time": 8.76086825504899} +{"Pretrain/Learning Rate": 2.498726519085345e-05, "Pretrain/Loss": 1.978309154510498, "Pretrain/Loss (Raw)": 1.918150782585144, "Pretrain/Step": 4913, "Pretrain/Step Time": 8.764230521395802} +{"Pretrain/Learning Rate": 2.497877531972091e-05, "Pretrain/Loss": 1.9774696826934814, "Pretrain/Loss (Raw)": 1.91390860080719, "Pretrain/Step": 4914, "Pretrain/Step Time": 8.765220271423459} +{"Pretrain/Learning Rate": 2.497028545103609e-05, "Pretrain/Loss": 1.9758718013763428, "Pretrain/Loss (Raw)": 1.8966089487075806, "Pretrain/Step": 4915, "Pretrain/Step Time": 8.763128913939} +{"Pretrain/Learning Rate": 2.49617955857781e-05, "Pretrain/Loss": 1.979573369026184, "Pretrain/Loss (Raw)": 2.307901382446289, "Pretrain/Step": 4916, "Pretrain/Step Time": 8.763952726498246} +{"Pretrain/Learning Rate": 2.4953305724926017e-05, "Pretrain/Loss": 1.980886459350586, "Pretrain/Loss (Raw)": 2.02032208442688, "Pretrain/Step": 4917, "Pretrain/Step Time": 8.75400448590517} +{"Pretrain/Learning Rate": 2.494481586945894e-05, "Pretrain/Loss": 1.9846975803375244, "Pretrain/Loss (Raw)": 2.395782709121704, "Pretrain/Step": 4918, "Pretrain/Step Time": 8.750129409134388} +{"Pretrain/Learning Rate": 2.4936326020355955e-05, "Pretrain/Loss": 1.9860961437225342, "Pretrain/Loss (Raw)": 2.142326593399048, "Pretrain/Step": 4919, "Pretrain/Step Time": 8.749862985685468} +{"Pretrain/Learning Rate": 2.4927836178596156e-05, "Pretrain/Loss": 1.9888787269592285, "Pretrain/Loss (Raw)": 2.240229606628418, "Pretrain/Step": 4920, "Pretrain/Step Time": 8.7475705165416} +{"Pretrain/Learning Rate": 2.4919346345158624e-05, "Pretrain/Loss": 1.9882763624191284, "Pretrain/Loss (Raw)": 1.9599745273590088, "Pretrain/Step": 4921, "Pretrain/Step Time": 8.754093596711755} +{"Pretrain/Learning Rate": 2.491085652102246e-05, "Pretrain/Loss": 1.986916422843933, "Pretrain/Loss (Raw)": 2.009133815765381, "Pretrain/Step": 4922, "Pretrain/Step Time": 8.76518364623189} +{"Pretrain/Learning Rate": 2.4902366707166734e-05, "Pretrain/Loss": 1.9852055311203003, "Pretrain/Loss (Raw)": 1.8511462211608887, "Pretrain/Step": 4923, "Pretrain/Step Time": 8.763213030993938} +{"Pretrain/Learning Rate": 2.4893876904570554e-05, "Pretrain/Loss": 1.9882020950317383, "Pretrain/Loss (Raw)": 1.9170933961868286, "Pretrain/Step": 4924, "Pretrain/Step Time": 8.765704073011875} +{"Pretrain/Learning Rate": 2.488538711421297e-05, "Pretrain/Loss": 1.9850270748138428, "Pretrain/Loss (Raw)": 1.508976936340332, "Pretrain/Step": 4925, "Pretrain/Step Time": 8.766688181087375} +{"Pretrain/Learning Rate": 2.4876897337073103e-05, "Pretrain/Loss": 1.9858864545822144, "Pretrain/Loss (Raw)": 1.9075225591659546, "Pretrain/Step": 4926, "Pretrain/Step Time": 8.76237945817411} +{"Pretrain/Learning Rate": 2.4868407574129994e-05, "Pretrain/Loss": 1.982072353363037, "Pretrain/Loss (Raw)": 1.529305338859558, "Pretrain/Step": 4927, "Pretrain/Step Time": 8.765438675880432} +{"Pretrain/Learning Rate": 2.4859917826362764e-05, "Pretrain/Loss": 1.9828670024871826, "Pretrain/Loss (Raw)": 2.0948646068573, "Pretrain/Step": 4928, "Pretrain/Step Time": 8.764993611723185} +{"Pretrain/Learning Rate": 2.485142809475045e-05, "Pretrain/Loss": 1.984632134437561, "Pretrain/Loss (Raw)": 2.0765740871429443, "Pretrain/Step": 4929, "Pretrain/Step Time": 8.76293415389955} +{"Pretrain/Learning Rate": 2.4842938380272168e-05, "Pretrain/Loss": 1.9841463565826416, "Pretrain/Loss (Raw)": 1.7723714113235474, "Pretrain/Step": 4930, "Pretrain/Step Time": 8.761656830087304} +{"Pretrain/Learning Rate": 2.4834448683906957e-05, "Pretrain/Loss": 1.982391119003296, "Pretrain/Loss (Raw)": 1.976855993270874, "Pretrain/Step": 4931, "Pretrain/Step Time": 8.763742970302701} +{"Pretrain/Learning Rate": 2.482595900663392e-05, "Pretrain/Loss": 1.9833815097808838, "Pretrain/Loss (Raw)": 2.142730236053467, "Pretrain/Step": 4932, "Pretrain/Step Time": 8.766254970803857} +{"Pretrain/Learning Rate": 2.481746934943209e-05, "Pretrain/Loss": 1.9838061332702637, "Pretrain/Loss (Raw)": 2.0516178607940674, "Pretrain/Step": 4933, "Pretrain/Step Time": 8.765200067311525} +{"Pretrain/Learning Rate": 2.480897971328056e-05, "Pretrain/Loss": 1.9818451404571533, "Pretrain/Loss (Raw)": 1.809826374053955, "Pretrain/Step": 4934, "Pretrain/Step Time": 8.76919561251998} +{"Pretrain/Learning Rate": 2.4800490099158403e-05, "Pretrain/Loss": 1.982775330543518, "Pretrain/Loss (Raw)": 1.9937866926193237, "Pretrain/Step": 4935, "Pretrain/Step Time": 8.766612440347672} +{"Pretrain/Learning Rate": 2.4792000508044652e-05, "Pretrain/Loss": 1.9817545413970947, "Pretrain/Loss (Raw)": 1.9324207305908203, "Pretrain/Step": 4936, "Pretrain/Step Time": 8.758003856986761} +{"Pretrain/Learning Rate": 2.4783510940918396e-05, "Pretrain/Loss": 1.9828894138336182, "Pretrain/Loss (Raw)": 2.173494338989258, "Pretrain/Step": 4937, "Pretrain/Step Time": 8.759240524843335} +{"Pretrain/Learning Rate": 2.4775021398758666e-05, "Pretrain/Loss": 1.9804482460021973, "Pretrain/Loss (Raw)": 1.7242764234542847, "Pretrain/Step": 4938, "Pretrain/Step Time": 8.767715161666274} +{"Pretrain/Learning Rate": 2.4766531882544545e-05, "Pretrain/Loss": 1.980118989944458, "Pretrain/Loss (Raw)": 2.047480583190918, "Pretrain/Step": 4939, "Pretrain/Step Time": 8.76715524122119} +{"Pretrain/Learning Rate": 2.475804239325505e-05, "Pretrain/Loss": 1.9794654846191406, "Pretrain/Loss (Raw)": 1.9648118019104004, "Pretrain/Step": 4940, "Pretrain/Step Time": 8.770142203196883} +{"Pretrain/Learning Rate": 2.474955293186926e-05, "Pretrain/Loss": 1.9785419702529907, "Pretrain/Loss (Raw)": 2.0217394828796387, "Pretrain/Step": 4941, "Pretrain/Step Time": 8.76656642369926} +{"Pretrain/Learning Rate": 2.4741063499366195e-05, "Pretrain/Loss": 1.9800243377685547, "Pretrain/Loss (Raw)": 2.1768569946289062, "Pretrain/Step": 4942, "Pretrain/Step Time": 8.76712979376316} +{"Pretrain/Learning Rate": 2.4732574096724918e-05, "Pretrain/Loss": 1.980628252029419, "Pretrain/Loss (Raw)": 2.092390537261963, "Pretrain/Step": 4943, "Pretrain/Step Time": 8.766773177310824} +{"Pretrain/Learning Rate": 2.4724084724924446e-05, "Pretrain/Loss": 1.982689380645752, "Pretrain/Loss (Raw)": 2.2433736324310303, "Pretrain/Step": 4944, "Pretrain/Step Time": 8.768628720194101} +{"Pretrain/Learning Rate": 2.471559538494383e-05, "Pretrain/Loss": 1.9824397563934326, "Pretrain/Loss (Raw)": 2.0807766914367676, "Pretrain/Step": 4945, "Pretrain/Step Time": 8.772482516244054} +{"Pretrain/Learning Rate": 2.470710607776209e-05, "Pretrain/Loss": 1.9804186820983887, "Pretrain/Loss (Raw)": 1.9222222566604614, "Pretrain/Step": 4946, "Pretrain/Step Time": 8.771169409155846} +{"Pretrain/Learning Rate": 2.4698616804358263e-05, "Pretrain/Loss": 1.9796154499053955, "Pretrain/Loss (Raw)": 2.146634817123413, "Pretrain/Step": 4947, "Pretrain/Step Time": 8.771837813779712} +{"Pretrain/Learning Rate": 2.469012756571136e-05, "Pretrain/Loss": 1.980961561203003, "Pretrain/Loss (Raw)": 2.137502431869507, "Pretrain/Step": 4948, "Pretrain/Step Time": 8.771243145689368} +{"Pretrain/Learning Rate": 2.4681638362800415e-05, "Pretrain/Loss": 1.9828300476074219, "Pretrain/Loss (Raw)": 2.2249197959899902, "Pretrain/Step": 4949, "Pretrain/Step Time": 8.76314121671021} +{"Pretrain/Learning Rate": 2.4673149196604424e-05, "Pretrain/Loss": 1.9826470613479614, "Pretrain/Loss (Raw)": 2.066180944442749, "Pretrain/Step": 4950, "Pretrain/Step Time": 8.765431394800544} +{"Pretrain/Learning Rate": 2.4664660068102416e-05, "Pretrain/Loss": 1.9826117753982544, "Pretrain/Loss (Raw)": 2.0065839290618896, "Pretrain/Step": 4951, "Pretrain/Step Time": 8.763877023011446} +{"Pretrain/Learning Rate": 2.465617097827338e-05, "Pretrain/Loss": 1.9844655990600586, "Pretrain/Loss (Raw)": 2.15307354927063, "Pretrain/Step": 4952, "Pretrain/Step Time": 8.763790072873235} +{"Pretrain/Learning Rate": 2.4647681928096337e-05, "Pretrain/Loss": 1.9820537567138672, "Pretrain/Loss (Raw)": 1.7903741598129272, "Pretrain/Step": 4953, "Pretrain/Step Time": 8.755419498309493} +{"Pretrain/Learning Rate": 2.4639192918550268e-05, "Pretrain/Loss": 1.9807748794555664, "Pretrain/Loss (Raw)": 1.9077330827713013, "Pretrain/Step": 4954, "Pretrain/Step Time": 8.75907850265503} +{"Pretrain/Learning Rate": 2.4630703950614176e-05, "Pretrain/Loss": 1.9790167808532715, "Pretrain/Loss (Raw)": 2.0403311252593994, "Pretrain/Step": 4955, "Pretrain/Step Time": 8.753652814775705} +{"Pretrain/Learning Rate": 2.462221502526704e-05, "Pretrain/Loss": 1.9792108535766602, "Pretrain/Loss (Raw)": 2.075700283050537, "Pretrain/Step": 4956, "Pretrain/Step Time": 8.752111703157425} +{"Pretrain/Learning Rate": 2.461372614348785e-05, "Pretrain/Loss": 1.9793529510498047, "Pretrain/Loss (Raw)": 2.0317282676696777, "Pretrain/Step": 4957, "Pretrain/Step Time": 8.75333870202303} +{"Pretrain/Learning Rate": 2.460523730625558e-05, "Pretrain/Loss": 1.981602430343628, "Pretrain/Loss (Raw)": 2.130375623703003, "Pretrain/Step": 4958, "Pretrain/Step Time": 8.754246860742569} +{"Pretrain/Learning Rate": 2.4596748514549208e-05, "Pretrain/Loss": 1.985338807106018, "Pretrain/Loss (Raw)": 2.231841564178467, "Pretrain/Step": 4959, "Pretrain/Step Time": 8.746616223827004} +{"Pretrain/Learning Rate": 2.458825976934769e-05, "Pretrain/Loss": 1.982686996459961, "Pretrain/Loss (Raw)": 1.5763918161392212, "Pretrain/Step": 4960, "Pretrain/Step Time": 8.748085567727685} +{"Pretrain/Learning Rate": 2.4579771071630004e-05, "Pretrain/Loss": 1.980798363685608, "Pretrain/Loss (Raw)": 1.799843668937683, "Pretrain/Step": 4961, "Pretrain/Step Time": 8.757139332592487} +{"Pretrain/Learning Rate": 2.457128242237509e-05, "Pretrain/Loss": 1.9837771654129028, "Pretrain/Loss (Raw)": 2.022378921508789, "Pretrain/Step": 4962, "Pretrain/Step Time": 8.756375007331371} +{"Pretrain/Learning Rate": 2.4562793822561914e-05, "Pretrain/Loss": 1.9843969345092773, "Pretrain/Loss (Raw)": 2.234037160873413, "Pretrain/Step": 4963, "Pretrain/Step Time": 8.74596482515335} +{"Pretrain/Learning Rate": 2.455430527316941e-05, "Pretrain/Loss": 1.9844212532043457, "Pretrain/Loss (Raw)": 1.8197081089019775, "Pretrain/Step": 4964, "Pretrain/Step Time": 8.74828358925879} +{"Pretrain/Learning Rate": 2.4545816775176532e-05, "Pretrain/Loss": 1.987358808517456, "Pretrain/Loss (Raw)": 2.0814976692199707, "Pretrain/Step": 4965, "Pretrain/Step Time": 8.751136356964707} +{"Pretrain/Learning Rate": 2.4537328329562186e-05, "Pretrain/Loss": 1.9853205680847168, "Pretrain/Loss (Raw)": 1.8296728134155273, "Pretrain/Step": 4966, "Pretrain/Step Time": 8.746264843270183} +{"Pretrain/Learning Rate": 2.4528839937305336e-05, "Pretrain/Loss": 1.9829168319702148, "Pretrain/Loss (Raw)": 1.5772515535354614, "Pretrain/Step": 4967, "Pretrain/Step Time": 8.74788343347609} +{"Pretrain/Learning Rate": 2.452035159938487e-05, "Pretrain/Loss": 1.9806442260742188, "Pretrain/Loss (Raw)": 1.9511758089065552, "Pretrain/Step": 4968, "Pretrain/Step Time": 8.754034265875816} +{"Pretrain/Learning Rate": 2.4511863316779728e-05, "Pretrain/Loss": 1.981465220451355, "Pretrain/Loss (Raw)": 2.1397619247436523, "Pretrain/Step": 4969, "Pretrain/Step Time": 8.744947664439678} +{"Pretrain/Learning Rate": 2.4503375090468795e-05, "Pretrain/Loss": 1.9813292026519775, "Pretrain/Loss (Raw)": 2.025400400161743, "Pretrain/Step": 4970, "Pretrain/Step Time": 8.738724051043391} +{"Pretrain/Learning Rate": 2.4494886921431005e-05, "Pretrain/Loss": 1.9817285537719727, "Pretrain/Loss (Raw)": 2.0429656505584717, "Pretrain/Step": 4971, "Pretrain/Step Time": 8.743594305589795} +{"Pretrain/Learning Rate": 2.448639881064522e-05, "Pretrain/Loss": 1.9826149940490723, "Pretrain/Loss (Raw)": 2.0538251399993896, "Pretrain/Step": 4972, "Pretrain/Step Time": 8.741282073780894} +{"Pretrain/Learning Rate": 2.4477910759090357e-05, "Pretrain/Loss": 1.9836395978927612, "Pretrain/Loss (Raw)": 2.0754144191741943, "Pretrain/Step": 4973, "Pretrain/Step Time": 8.737778525799513} +{"Pretrain/Learning Rate": 2.446942276774527e-05, "Pretrain/Loss": 1.9885591268539429, "Pretrain/Loss (Raw)": 2.3569414615631104, "Pretrain/Step": 4974, "Pretrain/Step Time": 8.733884507790208} +{"Pretrain/Learning Rate": 2.4460934837588856e-05, "Pretrain/Loss": 1.9890741109848022, "Pretrain/Loss (Raw)": 2.0964407920837402, "Pretrain/Step": 4975, "Pretrain/Step Time": 8.743071615695953} +{"Pretrain/Learning Rate": 2.4452446969599986e-05, "Pretrain/Loss": 1.987784504890442, "Pretrain/Loss (Raw)": 1.9559719562530518, "Pretrain/Step": 4976, "Pretrain/Step Time": 8.746325846761465} +{"Pretrain/Learning Rate": 2.44439591647575e-05, "Pretrain/Loss": 1.9871594905853271, "Pretrain/Loss (Raw)": 1.849605679512024, "Pretrain/Step": 4977, "Pretrain/Step Time": 8.745910346508026} +{"Pretrain/Learning Rate": 2.4435471424040273e-05, "Pretrain/Loss": 1.988275170326233, "Pretrain/Loss (Raw)": 1.951949119567871, "Pretrain/Step": 4978, "Pretrain/Step Time": 8.747349191457033} +{"Pretrain/Learning Rate": 2.442698374842713e-05, "Pretrain/Loss": 1.9872288703918457, "Pretrain/Loss (Raw)": 1.9939744472503662, "Pretrain/Step": 4979, "Pretrain/Step Time": 8.747965026646852} +{"Pretrain/Learning Rate": 2.4418496138896936e-05, "Pretrain/Loss": 1.987858533859253, "Pretrain/Loss (Raw)": 2.0680294036865234, "Pretrain/Step": 4980, "Pretrain/Step Time": 8.740778725594282} +{"Pretrain/Learning Rate": 2.4410008596428492e-05, "Pretrain/Loss": 1.9885388612747192, "Pretrain/Loss (Raw)": 1.99942946434021, "Pretrain/Step": 4981, "Pretrain/Step Time": 8.740464825183153} +{"Pretrain/Learning Rate": 2.440152112200065e-05, "Pretrain/Loss": 1.9882349967956543, "Pretrain/Loss (Raw)": 1.9783300161361694, "Pretrain/Step": 4982, "Pretrain/Step Time": 8.745146384462714} +{"Pretrain/Learning Rate": 2.4393033716592196e-05, "Pretrain/Loss": 1.9880954027175903, "Pretrain/Loss (Raw)": 1.9264330863952637, "Pretrain/Step": 4983, "Pretrain/Step Time": 8.74656854942441} +{"Pretrain/Learning Rate": 2.4384546381181976e-05, "Pretrain/Loss": 1.9852452278137207, "Pretrain/Loss (Raw)": 1.7703012228012085, "Pretrain/Step": 4984, "Pretrain/Step Time": 8.748623579740524} +{"Pretrain/Learning Rate": 2.437605911674875e-05, "Pretrain/Loss": 1.984520435333252, "Pretrain/Loss (Raw)": 1.8138865232467651, "Pretrain/Step": 4985, "Pretrain/Step Time": 8.745967311784625} +{"Pretrain/Learning Rate": 2.4367571924271335e-05, "Pretrain/Loss": 1.9841029644012451, "Pretrain/Loss (Raw)": 1.8028619289398193, "Pretrain/Step": 4986, "Pretrain/Step Time": 8.74317822046578} +{"Pretrain/Learning Rate": 2.43590848047285e-05, "Pretrain/Loss": 1.9845120906829834, "Pretrain/Loss (Raw)": 2.099731206893921, "Pretrain/Step": 4987, "Pretrain/Step Time": 8.739595299586654} +{"Pretrain/Learning Rate": 2.4350597759099034e-05, "Pretrain/Loss": 1.9843316078186035, "Pretrain/Loss (Raw)": 2.0264623165130615, "Pretrain/Step": 4988, "Pretrain/Step Time": 8.738510888069868} +{"Pretrain/Learning Rate": 2.4342110788361685e-05, "Pretrain/Loss": 1.9846510887145996, "Pretrain/Loss (Raw)": 1.9620890617370605, "Pretrain/Step": 4989, "Pretrain/Step Time": 8.738583963364363} +{"Pretrain/Learning Rate": 2.433362389349523e-05, "Pretrain/Loss": 1.9850050210952759, "Pretrain/Loss (Raw)": 2.082919120788574, "Pretrain/Step": 4990, "Pretrain/Step Time": 8.740222066640854} +{"Pretrain/Learning Rate": 2.4325137075478398e-05, "Pretrain/Loss": 1.9855862855911255, "Pretrain/Loss (Raw)": 2.099893093109131, "Pretrain/Step": 4991, "Pretrain/Step Time": 8.74444955587387} +{"Pretrain/Learning Rate": 2.4316650335289942e-05, "Pretrain/Loss": 1.9851617813110352, "Pretrain/Loss (Raw)": 1.8033562898635864, "Pretrain/Step": 4992, "Pretrain/Step Time": 8.741108573973179} +{"Pretrain/Learning Rate": 2.430816367390859e-05, "Pretrain/Loss": 1.983874797821045, "Pretrain/Loss (Raw)": 1.86192786693573, "Pretrain/Step": 4993, "Pretrain/Step Time": 8.742498949170113} +{"Pretrain/Learning Rate": 2.429967709231306e-05, "Pretrain/Loss": 1.9832559823989868, "Pretrain/Loss (Raw)": 2.031177282333374, "Pretrain/Step": 4994, "Pretrain/Step Time": 8.74512473680079} +{"Pretrain/Learning Rate": 2.429119059148207e-05, "Pretrain/Loss": 1.9839212894439697, "Pretrain/Loss (Raw)": 1.9531077146530151, "Pretrain/Step": 4995, "Pretrain/Step Time": 8.742314232513309} +{"Pretrain/Learning Rate": 2.4282704172394323e-05, "Pretrain/Loss": 1.9806406497955322, "Pretrain/Loss (Raw)": 1.4879767894744873, "Pretrain/Step": 4996, "Pretrain/Step Time": 8.745791947469115} +{"Pretrain/Learning Rate": 2.4274217836028507e-05, "Pretrain/Loss": 1.9807357788085938, "Pretrain/Loss (Raw)": 1.9537068605422974, "Pretrain/Step": 4997, "Pretrain/Step Time": 8.746862469241023} +{"Pretrain/Learning Rate": 2.4265731583363316e-05, "Pretrain/Loss": 1.9839355945587158, "Pretrain/Loss (Raw)": 1.9321036338806152, "Pretrain/Step": 4998, "Pretrain/Step Time": 8.75114013440907} +{"Pretrain/Learning Rate": 2.425724541537741e-05, "Pretrain/Loss": 1.983766794204712, "Pretrain/Loss (Raw)": 1.572759747505188, "Pretrain/Step": 4999, "Pretrain/Step Time": 8.748245801776648} +{"Pretrain/Learning Rate": 2.4248759333049474e-05, "Pretrain/Loss": 1.983555555343628, "Pretrain/Loss (Raw)": 1.8167449235916138, "Pretrain/Step": 5000, "Pretrain/Step Time": 8.751551592722535} +{"Pretrain/Learning Rate": 2.424027333735814e-05, "Pretrain/Loss": 1.9801578521728516, "Pretrain/Loss (Raw)": 1.6868771314620972, "Pretrain/Step": 5001, "Pretrain/Step Time": 9.219243872910738} +{"Pretrain/Learning Rate": 2.4231787429282073e-05, "Pretrain/Loss": 1.982410192489624, "Pretrain/Loss (Raw)": 2.093191385269165, "Pretrain/Step": 5002, "Pretrain/Step Time": 9.21364163607359} +{"Pretrain/Learning Rate": 2.4223301609799895e-05, "Pretrain/Loss": 1.9838206768035889, "Pretrain/Loss (Raw)": 1.8798561096191406, "Pretrain/Step": 5003, "Pretrain/Step Time": 9.208990439772606} +{"Pretrain/Learning Rate": 2.421481587989024e-05, "Pretrain/Loss": 1.9855093955993652, "Pretrain/Loss (Raw)": 2.0151634216308594, "Pretrain/Step": 5004, "Pretrain/Step Time": 9.211191564798355} +{"Pretrain/Learning Rate": 2.4206330240531713e-05, "Pretrain/Loss": 1.9844739437103271, "Pretrain/Loss (Raw)": 1.8576993942260742, "Pretrain/Step": 5005, "Pretrain/Step Time": 9.214929986745119} +{"Pretrain/Learning Rate": 2.4197844692702925e-05, "Pretrain/Loss": 1.983222246170044, "Pretrain/Loss (Raw)": 1.841225028038025, "Pretrain/Step": 5006, "Pretrain/Step Time": 9.211895175278187} +{"Pretrain/Learning Rate": 2.4189359237382464e-05, "Pretrain/Loss": 1.983231544494629, "Pretrain/Loss (Raw)": 2.1004478931427, "Pretrain/Step": 5007, "Pretrain/Step Time": 9.211872298270464} +{"Pretrain/Learning Rate": 2.4180873875548925e-05, "Pretrain/Loss": 1.9836959838867188, "Pretrain/Loss (Raw)": 1.954601764678955, "Pretrain/Step": 5008, "Pretrain/Step Time": 9.212777534499764} +{"Pretrain/Learning Rate": 2.4172388608180857e-05, "Pretrain/Loss": 1.982325553894043, "Pretrain/Loss (Raw)": 1.9404582977294922, "Pretrain/Step": 5009, "Pretrain/Step Time": 9.208408173173666} +{"Pretrain/Learning Rate": 2.4163903436256848e-05, "Pretrain/Loss": 1.9824628829956055, "Pretrain/Loss (Raw)": 2.0172085762023926, "Pretrain/Step": 5010, "Pretrain/Step Time": 9.20790140144527} +{"Pretrain/Learning Rate": 2.4155418360755423e-05, "Pretrain/Loss": 1.9834623336791992, "Pretrain/Loss (Raw)": 2.15730357170105, "Pretrain/Step": 5011, "Pretrain/Step Time": 9.209164870902896} +{"Pretrain/Learning Rate": 2.4146933382655145e-05, "Pretrain/Loss": 1.9831936359405518, "Pretrain/Loss (Raw)": 2.046279191970825, "Pretrain/Step": 5012, "Pretrain/Step Time": 9.210718592628837} +{"Pretrain/Learning Rate": 2.413844850293451e-05, "Pretrain/Loss": 1.9862334728240967, "Pretrain/Loss (Raw)": 2.1799888610839844, "Pretrain/Step": 5013, "Pretrain/Step Time": 9.215952675789595} +{"Pretrain/Learning Rate": 2.4129963722572074e-05, "Pretrain/Loss": 1.986068606376648, "Pretrain/Loss (Raw)": 1.9514340162277222, "Pretrain/Step": 5014, "Pretrain/Step Time": 9.214164251461625} +{"Pretrain/Learning Rate": 2.41214790425463e-05, "Pretrain/Loss": 1.982946515083313, "Pretrain/Loss (Raw)": 1.76042902469635, "Pretrain/Step": 5015, "Pretrain/Step Time": 9.212633572518826} +{"Pretrain/Learning Rate": 2.4112994463835714e-05, "Pretrain/Loss": 1.9831746816635132, "Pretrain/Loss (Raw)": 1.911926507949829, "Pretrain/Step": 5016, "Pretrain/Step Time": 9.205482561141253} +{"Pretrain/Learning Rate": 2.4104509987418793e-05, "Pretrain/Loss": 1.9841692447662354, "Pretrain/Loss (Raw)": 2.115065574645996, "Pretrain/Step": 5017, "Pretrain/Step Time": 9.210262620821595} +{"Pretrain/Learning Rate": 2.4096025614273988e-05, "Pretrain/Loss": 1.9854516983032227, "Pretrain/Loss (Raw)": 2.0596399307250977, "Pretrain/Step": 5018, "Pretrain/Step Time": 9.197238618507981} +{"Pretrain/Learning Rate": 2.408754134537978e-05, "Pretrain/Loss": 1.9846956729888916, "Pretrain/Loss (Raw)": 1.8641761541366577, "Pretrain/Step": 5019, "Pretrain/Step Time": 9.197224147617817} +{"Pretrain/Learning Rate": 2.407905718171459e-05, "Pretrain/Loss": 1.9857494831085205, "Pretrain/Loss (Raw)": 2.219172239303589, "Pretrain/Step": 5020, "Pretrain/Step Time": 9.198649190366268} +{"Pretrain/Learning Rate": 2.4070573124256883e-05, "Pretrain/Loss": 1.9845569133758545, "Pretrain/Loss (Raw)": 1.8952230215072632, "Pretrain/Step": 5021, "Pretrain/Step Time": 9.199610911309719} +{"Pretrain/Learning Rate": 2.4062089173985044e-05, "Pretrain/Loss": 1.9847309589385986, "Pretrain/Loss (Raw)": 2.0276315212249756, "Pretrain/Step": 5022, "Pretrain/Step Time": 9.19238300062716} +{"Pretrain/Learning Rate": 2.4053605331877517e-05, "Pretrain/Loss": 1.9831011295318604, "Pretrain/Loss (Raw)": 1.9480311870574951, "Pretrain/Step": 5023, "Pretrain/Step Time": 9.194689394906163} +{"Pretrain/Learning Rate": 2.404512159891267e-05, "Pretrain/Loss": 1.980451226234436, "Pretrain/Loss (Raw)": 1.8458858728408813, "Pretrain/Step": 5024, "Pretrain/Step Time": 9.181337971240282} +{"Pretrain/Learning Rate": 2.4036637976068914e-05, "Pretrain/Loss": 1.9765372276306152, "Pretrain/Loss (Raw)": 1.7130573987960815, "Pretrain/Step": 5025, "Pretrain/Step Time": 9.181515542790294} +{"Pretrain/Learning Rate": 2.4028154464324592e-05, "Pretrain/Loss": 1.9758797883987427, "Pretrain/Loss (Raw)": 1.9153691530227661, "Pretrain/Step": 5026, "Pretrain/Step Time": 9.186075776815414} +{"Pretrain/Learning Rate": 2.4019671064658088e-05, "Pretrain/Loss": 1.9760648012161255, "Pretrain/Loss (Raw)": 2.181567430496216, "Pretrain/Step": 5027, "Pretrain/Step Time": 9.184516942128539} +{"Pretrain/Learning Rate": 2.4011187778047727e-05, "Pretrain/Loss": 1.9752521514892578, "Pretrain/Loss (Raw)": 2.1172664165496826, "Pretrain/Step": 5028, "Pretrain/Step Time": 9.18228456005454} +{"Pretrain/Learning Rate": 2.4002704605471857e-05, "Pretrain/Loss": 1.9752295017242432, "Pretrain/Loss (Raw)": 1.907228946685791, "Pretrain/Step": 5029, "Pretrain/Step Time": 9.187219889834523} +{"Pretrain/Learning Rate": 2.3994221547908783e-05, "Pretrain/Loss": 1.9771943092346191, "Pretrain/Loss (Raw)": 2.1971397399902344, "Pretrain/Step": 5030, "Pretrain/Step Time": 9.187249897047877} +{"Pretrain/Learning Rate": 2.398573860633683e-05, "Pretrain/Loss": 1.9787752628326416, "Pretrain/Loss (Raw)": 2.1190185546875, "Pretrain/Step": 5031, "Pretrain/Step Time": 9.188118198886514} +{"Pretrain/Learning Rate": 2.3977255781734275e-05, "Pretrain/Loss": 1.9800233840942383, "Pretrain/Loss (Raw)": 2.274477005004883, "Pretrain/Step": 5032, "Pretrain/Step Time": 9.187238292768598} +{"Pretrain/Learning Rate": 2.3968773075079404e-05, "Pretrain/Loss": 1.9779999256134033, "Pretrain/Loss (Raw)": 1.8452098369598389, "Pretrain/Step": 5033, "Pretrain/Step Time": 9.184535421431065} +{"Pretrain/Learning Rate": 2.396029048735048e-05, "Pretrain/Loss": 1.9784610271453857, "Pretrain/Loss (Raw)": 1.8884050846099854, "Pretrain/Step": 5034, "Pretrain/Step Time": 9.181072676554322} +{"Pretrain/Learning Rate": 2.3951808019525758e-05, "Pretrain/Loss": 1.9787402153015137, "Pretrain/Loss (Raw)": 1.9327819347381592, "Pretrain/Step": 5035, "Pretrain/Step Time": 9.180841663852334} +{"Pretrain/Learning Rate": 2.394332567258347e-05, "Pretrain/Loss": 1.9770570993423462, "Pretrain/Loss (Raw)": 1.9729558229446411, "Pretrain/Step": 5036, "Pretrain/Step Time": 9.181012615561485} +{"Pretrain/Learning Rate": 2.3934843447501852e-05, "Pretrain/Loss": 1.975993275642395, "Pretrain/Loss (Raw)": 1.8358964920043945, "Pretrain/Step": 5037, "Pretrain/Step Time": 9.180605556815863} +{"Pretrain/Learning Rate": 2.3926361345259098e-05, "Pretrain/Loss": 1.9779155254364014, "Pretrain/Loss (Raw)": 1.8916314840316772, "Pretrain/Step": 5038, "Pretrain/Step Time": 9.17995779775083} +{"Pretrain/Learning Rate": 2.391787936683342e-05, "Pretrain/Loss": 1.9805954694747925, "Pretrain/Loss (Raw)": 2.1634957790374756, "Pretrain/Step": 5039, "Pretrain/Step Time": 9.176046686246991} +{"Pretrain/Learning Rate": 2.390939751320299e-05, "Pretrain/Loss": 1.9815688133239746, "Pretrain/Loss (Raw)": 2.0791258811950684, "Pretrain/Step": 5040, "Pretrain/Step Time": 9.174215776845813} +{"Pretrain/Learning Rate": 2.390091578534598e-05, "Pretrain/Loss": 1.9801267385482788, "Pretrain/Loss (Raw)": 1.7335608005523682, "Pretrain/Step": 5041, "Pretrain/Step Time": 9.173070913180709} +{"Pretrain/Learning Rate": 2.3892434184240533e-05, "Pretrain/Loss": 1.9774599075317383, "Pretrain/Loss (Raw)": 1.5725475549697876, "Pretrain/Step": 5042, "Pretrain/Step Time": 9.172622349113226} +{"Pretrain/Learning Rate": 2.3883952710864804e-05, "Pretrain/Loss": 1.9796431064605713, "Pretrain/Loss (Raw)": 2.1760666370391846, "Pretrain/Step": 5043, "Pretrain/Step Time": 9.169226406142116} +{"Pretrain/Learning Rate": 2.3875471366196903e-05, "Pretrain/Loss": 1.9758089780807495, "Pretrain/Loss (Raw)": 1.8171266317367554, "Pretrain/Step": 5044, "Pretrain/Step Time": 9.168822729960084} +{"Pretrain/Learning Rate": 2.3866990151214947e-05, "Pretrain/Loss": 1.9754033088684082, "Pretrain/Loss (Raw)": 1.9684149026870728, "Pretrain/Step": 5045, "Pretrain/Step Time": 9.172014804556966} +{"Pretrain/Learning Rate": 2.3858509066897016e-05, "Pretrain/Loss": 1.9724936485290527, "Pretrain/Loss (Raw)": 2.0233349800109863, "Pretrain/Step": 5046, "Pretrain/Step Time": 9.16761538758874} +{"Pretrain/Learning Rate": 2.385002811422121e-05, "Pretrain/Loss": 1.9723725318908691, "Pretrain/Loss (Raw)": 2.1268320083618164, "Pretrain/Step": 5047, "Pretrain/Step Time": 9.171517543494701} +{"Pretrain/Learning Rate": 2.384154729416557e-05, "Pretrain/Loss": 1.9707043170928955, "Pretrain/Loss (Raw)": 2.026700735092163, "Pretrain/Step": 5048, "Pretrain/Step Time": 9.16988074593246} +{"Pretrain/Learning Rate": 2.383306660770817e-05, "Pretrain/Loss": 1.972110390663147, "Pretrain/Loss (Raw)": 2.1399426460266113, "Pretrain/Step": 5049, "Pretrain/Step Time": 9.166913956403732} +{"Pretrain/Learning Rate": 2.382458605582701e-05, "Pretrain/Loss": 1.9702832698822021, "Pretrain/Loss (Raw)": 1.7752588987350464, "Pretrain/Step": 5050, "Pretrain/Step Time": 9.155338352546096} +{"Pretrain/Learning Rate": 2.3816105639500142e-05, "Pretrain/Loss": 1.9729020595550537, "Pretrain/Loss (Raw)": 2.186349630355835, "Pretrain/Step": 5051, "Pretrain/Step Time": 9.154738511890173} +{"Pretrain/Learning Rate": 2.3807625359705532e-05, "Pretrain/Loss": 1.9746782779693604, "Pretrain/Loss (Raw)": 2.1444509029388428, "Pretrain/Step": 5052, "Pretrain/Step Time": 9.15185383707285} +{"Pretrain/Learning Rate": 2.37991452174212e-05, "Pretrain/Loss": 1.9784456491470337, "Pretrain/Loss (Raw)": 1.9911906719207764, "Pretrain/Step": 5053, "Pretrain/Step Time": 9.15271856635809} +{"Pretrain/Learning Rate": 2.3790665213625087e-05, "Pretrain/Loss": 1.9792277812957764, "Pretrain/Loss (Raw)": 2.007627010345459, "Pretrain/Step": 5054, "Pretrain/Step Time": 9.148384178057313} +{"Pretrain/Learning Rate": 2.3782185349295174e-05, "Pretrain/Loss": 1.9829577207565308, "Pretrain/Loss (Raw)": 2.006749391555786, "Pretrain/Step": 5055, "Pretrain/Step Time": 9.153315257281065} +{"Pretrain/Learning Rate": 2.377370562540937e-05, "Pretrain/Loss": 1.9829211235046387, "Pretrain/Loss (Raw)": 2.090191125869751, "Pretrain/Step": 5056, "Pretrain/Step Time": 9.15081681124866} +{"Pretrain/Learning Rate": 2.3765226042945616e-05, "Pretrain/Loss": 1.9828487634658813, "Pretrain/Loss (Raw)": 2.0673000812530518, "Pretrain/Step": 5057, "Pretrain/Step Time": 9.152465354651213} +{"Pretrain/Learning Rate": 2.3756746602881824e-05, "Pretrain/Loss": 1.9844532012939453, "Pretrain/Loss (Raw)": 1.9777467250823975, "Pretrain/Step": 5058, "Pretrain/Step Time": 9.156962329521775} +{"Pretrain/Learning Rate": 2.3748267306195855e-05, "Pretrain/Loss": 1.9825994968414307, "Pretrain/Loss (Raw)": 1.739577293395996, "Pretrain/Step": 5059, "Pretrain/Step Time": 9.153933545574546} +{"Pretrain/Learning Rate": 2.373978815386562e-05, "Pretrain/Loss": 1.98061203956604, "Pretrain/Loss (Raw)": 1.8883411884307861, "Pretrain/Step": 5060, "Pretrain/Step Time": 9.154981438070536} +{"Pretrain/Learning Rate": 2.3731309146868932e-05, "Pretrain/Loss": 1.979992389678955, "Pretrain/Loss (Raw)": 1.9723076820373535, "Pretrain/Step": 5061, "Pretrain/Step Time": 9.156448986381292} +{"Pretrain/Learning Rate": 2.372283028618367e-05, "Pretrain/Loss": 1.9783520698547363, "Pretrain/Loss (Raw)": 1.599853277206421, "Pretrain/Step": 5062, "Pretrain/Step Time": 9.157227855175734} +{"Pretrain/Learning Rate": 2.371435157278762e-05, "Pretrain/Loss": 1.9776630401611328, "Pretrain/Loss (Raw)": 1.9056055545806885, "Pretrain/Step": 5063, "Pretrain/Step Time": 9.157505732029676} +{"Pretrain/Learning Rate": 2.370587300765862e-05, "Pretrain/Loss": 1.9767811298370361, "Pretrain/Loss (Raw)": 1.8195337057113647, "Pretrain/Step": 5064, "Pretrain/Step Time": 9.1541953291744} +{"Pretrain/Learning Rate": 2.369739459177443e-05, "Pretrain/Loss": 1.977863073348999, "Pretrain/Loss (Raw)": 2.311985969543457, "Pretrain/Step": 5065, "Pretrain/Step Time": 9.151318056508899} +{"Pretrain/Learning Rate": 2.3688916326112848e-05, "Pretrain/Loss": 1.975755214691162, "Pretrain/Loss (Raw)": 1.454463243484497, "Pretrain/Step": 5066, "Pretrain/Step Time": 9.141059113666415} +{"Pretrain/Learning Rate": 2.3680438211651597e-05, "Pretrain/Loss": 1.9747378826141357, "Pretrain/Loss (Raw)": 1.9172700643539429, "Pretrain/Step": 5067, "Pretrain/Step Time": 9.142185140401125} +{"Pretrain/Learning Rate": 2.3671960249368448e-05, "Pretrain/Loss": 1.9754371643066406, "Pretrain/Loss (Raw)": 2.0543110370635986, "Pretrain/Step": 5068, "Pretrain/Step Time": 9.141992876306176} +{"Pretrain/Learning Rate": 2.3663482440241087e-05, "Pretrain/Loss": 1.9733012914657593, "Pretrain/Loss (Raw)": 1.7483428716659546, "Pretrain/Step": 5069, "Pretrain/Step Time": 9.144960891455412} +{"Pretrain/Learning Rate": 2.3655004785247234e-05, "Pretrain/Loss": 1.9738240242004395, "Pretrain/Loss (Raw)": 2.243767738342285, "Pretrain/Step": 5070, "Pretrain/Step Time": 9.143032813444734} +{"Pretrain/Learning Rate": 2.3646527285364565e-05, "Pretrain/Loss": 1.9728081226348877, "Pretrain/Loss (Raw)": 1.9623503684997559, "Pretrain/Step": 5071, "Pretrain/Step Time": 9.14048246666789} +{"Pretrain/Learning Rate": 2.363804994157075e-05, "Pretrain/Loss": 1.97072172164917, "Pretrain/Loss (Raw)": 1.9763343334197998, "Pretrain/Step": 5072, "Pretrain/Step Time": 9.139202930033207} +{"Pretrain/Learning Rate": 2.3629572754843428e-05, "Pretrain/Loss": 1.9678559303283691, "Pretrain/Loss (Raw)": 1.7139451503753662, "Pretrain/Step": 5073, "Pretrain/Step Time": 9.13790394552052} +{"Pretrain/Learning Rate": 2.3621095726160237e-05, "Pretrain/Loss": 1.9687941074371338, "Pretrain/Loss (Raw)": 2.0423073768615723, "Pretrain/Step": 5074, "Pretrain/Step Time": 9.139541963115335} +{"Pretrain/Learning Rate": 2.3612618856498785e-05, "Pretrain/Loss": 1.968044400215149, "Pretrain/Loss (Raw)": 2.0506672859191895, "Pretrain/Step": 5075, "Pretrain/Step Time": 9.144389662891626} +{"Pretrain/Learning Rate": 2.3604142146836666e-05, "Pretrain/Loss": 1.9676599502563477, "Pretrain/Loss (Raw)": 2.0883073806762695, "Pretrain/Step": 5076, "Pretrain/Step Time": 9.143494736403227} +{"Pretrain/Learning Rate": 2.3595665598151444e-05, "Pretrain/Loss": 1.9664185047149658, "Pretrain/Loss (Raw)": 2.0659966468811035, "Pretrain/Step": 5077, "Pretrain/Step Time": 9.148068306967616} +{"Pretrain/Learning Rate": 2.3587189211420694e-05, "Pretrain/Loss": 1.9660924673080444, "Pretrain/Loss (Raw)": 2.024451494216919, "Pretrain/Step": 5078, "Pretrain/Step Time": 9.147336050868034} +{"Pretrain/Learning Rate": 2.3578712987621932e-05, "Pretrain/Loss": 1.9654459953308105, "Pretrain/Loss (Raw)": 1.9238353967666626, "Pretrain/Step": 5079, "Pretrain/Step Time": 9.154955269768834} +{"Pretrain/Learning Rate": 2.3570236927732692e-05, "Pretrain/Loss": 1.9638845920562744, "Pretrain/Loss (Raw)": 1.9532209634780884, "Pretrain/Step": 5080, "Pretrain/Step Time": 9.154728777706623} +{"Pretrain/Learning Rate": 2.3561761032730463e-05, "Pretrain/Loss": 1.9666929244995117, "Pretrain/Loss (Raw)": 2.149832248687744, "Pretrain/Step": 5081, "Pretrain/Step Time": 9.163859622552991} +{"Pretrain/Learning Rate": 2.355328530359273e-05, "Pretrain/Loss": 1.968287467956543, "Pretrain/Loss (Raw)": 2.111849308013916, "Pretrain/Step": 5082, "Pretrain/Step Time": 9.162259517237544} +{"Pretrain/Learning Rate": 2.3544809741296954e-05, "Pretrain/Loss": 1.9656553268432617, "Pretrain/Loss (Raw)": 1.7034196853637695, "Pretrain/Step": 5083, "Pretrain/Step Time": 9.16176062822342} +{"Pretrain/Learning Rate": 2.3536334346820578e-05, "Pretrain/Loss": 1.9648499488830566, "Pretrain/Loss (Raw)": 1.9726027250289917, "Pretrain/Step": 5084, "Pretrain/Step Time": 9.164441078901291} +{"Pretrain/Learning Rate": 2.3527859121141012e-05, "Pretrain/Loss": 1.9630393981933594, "Pretrain/Loss (Raw)": 1.7999708652496338, "Pretrain/Step": 5085, "Pretrain/Step Time": 9.174723729491234} +{"Pretrain/Learning Rate": 2.351938406523568e-05, "Pretrain/Loss": 1.9626476764678955, "Pretrain/Loss (Raw)": 2.080231189727783, "Pretrain/Step": 5086, "Pretrain/Step Time": 9.167828230187297} +{"Pretrain/Learning Rate": 2.3510909180081946e-05, "Pretrain/Loss": 1.960502028465271, "Pretrain/Loss (Raw)": 1.9572137594223022, "Pretrain/Step": 5087, "Pretrain/Step Time": 9.169409438967705} +{"Pretrain/Learning Rate": 2.350243446665719e-05, "Pretrain/Loss": 1.9631882905960083, "Pretrain/Loss (Raw)": 1.9202353954315186, "Pretrain/Step": 5088, "Pretrain/Step Time": 9.169499721378088} +{"Pretrain/Learning Rate": 2.3493959925938746e-05, "Pretrain/Loss": 1.962463617324829, "Pretrain/Loss (Raw)": 1.7070773839950562, "Pretrain/Step": 5089, "Pretrain/Step Time": 9.161715907976031} +{"Pretrain/Learning Rate": 2.348548555890394e-05, "Pretrain/Loss": 1.9623761177062988, "Pretrain/Loss (Raw)": 2.0111889839172363, "Pretrain/Step": 5090, "Pretrain/Step Time": 9.16186941601336} +{"Pretrain/Learning Rate": 2.3477011366530068e-05, "Pretrain/Loss": 1.961976170539856, "Pretrain/Loss (Raw)": 2.182832956314087, "Pretrain/Step": 5091, "Pretrain/Step Time": 9.162007458508015} +{"Pretrain/Learning Rate": 2.3468537349794438e-05, "Pretrain/Loss": 1.9616166353225708, "Pretrain/Loss (Raw)": 1.773685336112976, "Pretrain/Step": 5092, "Pretrain/Step Time": 9.162559267133474} +{"Pretrain/Learning Rate": 2.3460063509674278e-05, "Pretrain/Loss": 1.9587963819503784, "Pretrain/Loss (Raw)": 1.7205010652542114, "Pretrain/Step": 5093, "Pretrain/Step Time": 9.164712980389595} +{"Pretrain/Learning Rate": 2.345158984714687e-05, "Pretrain/Loss": 1.9603404998779297, "Pretrain/Loss (Raw)": 2.0273191928863525, "Pretrain/Step": 5094, "Pretrain/Step Time": 9.166105583310127} +{"Pretrain/Learning Rate": 2.3443116363189398e-05, "Pretrain/Loss": 1.9624561071395874, "Pretrain/Loss (Raw)": 1.848054051399231, "Pretrain/Step": 5095, "Pretrain/Step Time": 9.170831380411983} +{"Pretrain/Learning Rate": 2.3434643058779104e-05, "Pretrain/Loss": 1.961366891860962, "Pretrain/Loss (Raw)": 1.811767578125, "Pretrain/Step": 5096, "Pretrain/Step Time": 9.164287822321057} +{"Pretrain/Learning Rate": 2.342616993489313e-05, "Pretrain/Loss": 1.9614893198013306, "Pretrain/Loss (Raw)": 2.1554198265075684, "Pretrain/Step": 5097, "Pretrain/Step Time": 9.167103553190827} +{"Pretrain/Learning Rate": 2.3417696992508657e-05, "Pretrain/Loss": 1.962274432182312, "Pretrain/Loss (Raw)": 2.1258938312530518, "Pretrain/Step": 5098, "Pretrain/Step Time": 9.167180420830846} +{"Pretrain/Learning Rate": 2.3409224232602832e-05, "Pretrain/Loss": 1.963252305984497, "Pretrain/Loss (Raw)": 2.1681485176086426, "Pretrain/Step": 5099, "Pretrain/Step Time": 9.161131829023361} +{"Pretrain/Learning Rate": 2.340075165615276e-05, "Pretrain/Loss": 1.9624526500701904, "Pretrain/Loss (Raw)": 1.951453685760498, "Pretrain/Step": 5100, "Pretrain/Step Time": 9.169965842738748} +{"Pretrain/Learning Rate": 2.339227926413555e-05, "Pretrain/Loss": 1.9621987342834473, "Pretrain/Loss (Raw)": 2.0429179668426514, "Pretrain/Step": 5101, "Pretrain/Step Time": 9.171296145766973} +{"Pretrain/Learning Rate": 2.3383807057528256e-05, "Pretrain/Loss": 1.9622567892074585, "Pretrain/Loss (Raw)": 2.3643667697906494, "Pretrain/Step": 5102, "Pretrain/Step Time": 9.17285568267107} +{"Pretrain/Learning Rate": 2.3375335037307965e-05, "Pretrain/Loss": 1.9597582817077637, "Pretrain/Loss (Raw)": 1.7766438722610474, "Pretrain/Step": 5103, "Pretrain/Step Time": 9.164985969662666} +{"Pretrain/Learning Rate": 2.3366863204451677e-05, "Pretrain/Loss": 1.9604874849319458, "Pretrain/Loss (Raw)": 2.049313545227051, "Pretrain/Step": 5104, "Pretrain/Step Time": 9.160255800932646} +{"Pretrain/Learning Rate": 2.3358391559936438e-05, "Pretrain/Loss": 1.9623279571533203, "Pretrain/Loss (Raw)": 2.08516526222229, "Pretrain/Step": 5105, "Pretrain/Step Time": 9.16081029176712} +{"Pretrain/Learning Rate": 2.33499201047392e-05, "Pretrain/Loss": 1.9618663787841797, "Pretrain/Loss (Raw)": 1.8928698301315308, "Pretrain/Step": 5106, "Pretrain/Step Time": 9.154905531555414} +{"Pretrain/Learning Rate": 2.334144883983697e-05, "Pretrain/Loss": 1.9598462581634521, "Pretrain/Loss (Raw)": 1.7354031801223755, "Pretrain/Step": 5107, "Pretrain/Step Time": 9.155960785225034} +{"Pretrain/Learning Rate": 2.3332977766206657e-05, "Pretrain/Loss": 1.9600341320037842, "Pretrain/Loss (Raw)": 2.0920727252960205, "Pretrain/Step": 5108, "Pretrain/Step Time": 9.160747528076172} +{"Pretrain/Learning Rate": 2.332450688482522e-05, "Pretrain/Loss": 1.9584726095199585, "Pretrain/Loss (Raw)": 1.7995688915252686, "Pretrain/Step": 5109, "Pretrain/Step Time": 9.16016443632543} +{"Pretrain/Learning Rate": 2.3316036196669534e-05, "Pretrain/Loss": 1.958939552307129, "Pretrain/Loss (Raw)": 2.0380895137786865, "Pretrain/Step": 5110, "Pretrain/Step Time": 9.15623034350574} +{"Pretrain/Learning Rate": 2.3307565702716495e-05, "Pretrain/Loss": 1.9576984643936157, "Pretrain/Loss (Raw)": 1.7675822973251343, "Pretrain/Step": 5111, "Pretrain/Step Time": 9.161375876516104} +{"Pretrain/Learning Rate": 2.3299095403942943e-05, "Pretrain/Loss": 1.9600095748901367, "Pretrain/Loss (Raw)": 2.066138982772827, "Pretrain/Step": 5112, "Pretrain/Step Time": 9.160970816388726} +{"Pretrain/Learning Rate": 2.3290625301325735e-05, "Pretrain/Loss": 1.9629287719726562, "Pretrain/Loss (Raw)": 2.187518835067749, "Pretrain/Step": 5113, "Pretrain/Step Time": 9.155566034838557} +{"Pretrain/Learning Rate": 2.3282155395841667e-05, "Pretrain/Loss": 1.9622470140457153, "Pretrain/Loss (Raw)": 1.715597152709961, "Pretrain/Step": 5114, "Pretrain/Step Time": 9.158294416964054} +{"Pretrain/Learning Rate": 2.327368568846754e-05, "Pretrain/Loss": 1.9627275466918945, "Pretrain/Loss (Raw)": 2.161240339279175, "Pretrain/Step": 5115, "Pretrain/Step Time": 9.159758925437927} +{"Pretrain/Learning Rate": 2.3265216180180106e-05, "Pretrain/Loss": 1.960239291191101, "Pretrain/Loss (Raw)": 1.7079766988754272, "Pretrain/Step": 5116, "Pretrain/Step Time": 9.15970721654594} +{"Pretrain/Learning Rate": 2.325674687195612e-05, "Pretrain/Loss": 1.9600961208343506, "Pretrain/Loss (Raw)": 1.9437732696533203, "Pretrain/Step": 5117, "Pretrain/Step Time": 9.159298811107874} +{"Pretrain/Learning Rate": 2.32482777647723e-05, "Pretrain/Loss": 1.960740566253662, "Pretrain/Loss (Raw)": 2.16538405418396, "Pretrain/Step": 5118, "Pretrain/Step Time": 9.155167182907462} +{"Pretrain/Learning Rate": 2.323980885960534e-05, "Pretrain/Loss": 1.9594132900238037, "Pretrain/Loss (Raw)": 1.9300196170806885, "Pretrain/Step": 5119, "Pretrain/Step Time": 9.156632520258427} +{"Pretrain/Learning Rate": 2.3231340157431917e-05, "Pretrain/Loss": 1.9597278833389282, "Pretrain/Loss (Raw)": 1.8436205387115479, "Pretrain/Step": 5120, "Pretrain/Step Time": 9.154693637043238} +{"Pretrain/Learning Rate": 2.3222871659228685e-05, "Pretrain/Loss": 1.9611990451812744, "Pretrain/Loss (Raw)": 2.0502281188964844, "Pretrain/Step": 5121, "Pretrain/Step Time": 9.153017209842801} +{"Pretrain/Learning Rate": 2.3214403365972258e-05, "Pretrain/Loss": 1.9608051776885986, "Pretrain/Loss (Raw)": 1.9807640314102173, "Pretrain/Step": 5122, "Pretrain/Step Time": 9.147772399708629} +{"Pretrain/Learning Rate": 2.320593527863926e-05, "Pretrain/Loss": 1.9624229669570923, "Pretrain/Loss (Raw)": 2.1601834297180176, "Pretrain/Step": 5123, "Pretrain/Step Time": 9.148845782503486} +{"Pretrain/Learning Rate": 2.319746739820625e-05, "Pretrain/Loss": 1.9667911529541016, "Pretrain/Loss (Raw)": 2.0471091270446777, "Pretrain/Step": 5124, "Pretrain/Step Time": 9.147935379296541} +{"Pretrain/Learning Rate": 2.3188999725649804e-05, "Pretrain/Loss": 1.9658924341201782, "Pretrain/Loss (Raw)": 1.838678002357483, "Pretrain/Step": 5125, "Pretrain/Step Time": 9.151529526337981} +{"Pretrain/Learning Rate": 2.3180532261946437e-05, "Pretrain/Loss": 1.9686111211776733, "Pretrain/Loss (Raw)": 2.2800936698913574, "Pretrain/Step": 5126, "Pretrain/Step Time": 9.145324625074863} +{"Pretrain/Learning Rate": 2.3172065008072663e-05, "Pretrain/Loss": 1.9734387397766113, "Pretrain/Loss (Raw)": 2.1906898021698, "Pretrain/Step": 5127, "Pretrain/Step Time": 9.148585870862007} +{"Pretrain/Learning Rate": 2.3163597965004967e-05, "Pretrain/Loss": 1.975040316581726, "Pretrain/Loss (Raw)": 2.021749496459961, "Pretrain/Step": 5128, "Pretrain/Step Time": 9.144577633589506} +{"Pretrain/Learning Rate": 2.315513113371981e-05, "Pretrain/Loss": 1.9761788845062256, "Pretrain/Loss (Raw)": 1.8326209783554077, "Pretrain/Step": 5129, "Pretrain/Step Time": 8.67593896202743} +{"Pretrain/Learning Rate": 2.3146664515193616e-05, "Pretrain/Loss": 1.9756056070327759, "Pretrain/Loss (Raw)": 2.0197956562042236, "Pretrain/Step": 5130, "Pretrain/Step Time": 8.676040867343545} +{"Pretrain/Learning Rate": 2.3138198110402812e-05, "Pretrain/Loss": 1.9756919145584106, "Pretrain/Loss (Raw)": 1.8909069299697876, "Pretrain/Step": 5131, "Pretrain/Step Time": 8.677196009084582} +{"Pretrain/Learning Rate": 2.3129731920323765e-05, "Pretrain/Loss": 1.975494384765625, "Pretrain/Loss (Raw)": 1.9898948669433594, "Pretrain/Step": 5132, "Pretrain/Step Time": 8.677988279610872} +{"Pretrain/Learning Rate": 2.3121265945932862e-05, "Pretrain/Loss": 1.9764375686645508, "Pretrain/Loss (Raw)": 1.9783997535705566, "Pretrain/Step": 5133, "Pretrain/Step Time": 8.67116946540773} +{"Pretrain/Learning Rate": 2.3112800188206404e-05, "Pretrain/Loss": 1.9766857624053955, "Pretrain/Loss (Raw)": 1.8730132579803467, "Pretrain/Step": 5134, "Pretrain/Step Time": 8.678522042930126} +{"Pretrain/Learning Rate": 2.310433464812074e-05, "Pretrain/Loss": 1.9758977890014648, "Pretrain/Loss (Raw)": 1.9995801448822021, "Pretrain/Step": 5135, "Pretrain/Step Time": 8.676345102488995} +{"Pretrain/Learning Rate": 2.309586932665212e-05, "Pretrain/Loss": 1.9778810739517212, "Pretrain/Loss (Raw)": 2.2084598541259766, "Pretrain/Step": 5136, "Pretrain/Step Time": 8.676526399329305} +{"Pretrain/Learning Rate": 2.3087404224776835e-05, "Pretrain/Loss": 1.9795293807983398, "Pretrain/Loss (Raw)": 2.151437997817993, "Pretrain/Step": 5137, "Pretrain/Step Time": 8.676678938791156} +{"Pretrain/Learning Rate": 2.307893934347109e-05, "Pretrain/Loss": 1.9797735214233398, "Pretrain/Loss (Raw)": 2.0484580993652344, "Pretrain/Step": 5138, "Pretrain/Step Time": 8.675063755363226} +{"Pretrain/Learning Rate": 2.3070474683711125e-05, "Pretrain/Loss": 1.9779143333435059, "Pretrain/Loss (Raw)": 1.9193379878997803, "Pretrain/Step": 5139, "Pretrain/Step Time": 8.676300479099154} +{"Pretrain/Learning Rate": 2.306201024647311e-05, "Pretrain/Loss": 1.9784157276153564, "Pretrain/Loss (Raw)": 2.110457420349121, "Pretrain/Step": 5140, "Pretrain/Step Time": 8.677537754178047} +{"Pretrain/Learning Rate": 2.3053546032733207e-05, "Pretrain/Loss": 1.9788291454315186, "Pretrain/Loss (Raw)": 2.2328927516937256, "Pretrain/Step": 5141, "Pretrain/Step Time": 8.67527269385755} +{"Pretrain/Learning Rate": 2.3045082043467554e-05, "Pretrain/Loss": 1.9780793190002441, "Pretrain/Loss (Raw)": 1.8554612398147583, "Pretrain/Step": 5142, "Pretrain/Step Time": 8.673833455890417} +{"Pretrain/Learning Rate": 2.3036618279652232e-05, "Pretrain/Loss": 1.980487585067749, "Pretrain/Loss (Raw)": 2.0686936378479004, "Pretrain/Step": 5143, "Pretrain/Step Time": 8.673345550894737} +{"Pretrain/Learning Rate": 2.3028154742263362e-05, "Pretrain/Loss": 1.9800333976745605, "Pretrain/Loss (Raw)": 1.8537882566452026, "Pretrain/Step": 5144, "Pretrain/Step Time": 8.67403475381434} +{"Pretrain/Learning Rate": 2.3019691432276964e-05, "Pretrain/Loss": 1.9789984226226807, "Pretrain/Loss (Raw)": 1.9825917482376099, "Pretrain/Step": 5145, "Pretrain/Step Time": 8.673808863386512} +{"Pretrain/Learning Rate": 2.3011228350669096e-05, "Pretrain/Loss": 1.9790024757385254, "Pretrain/Loss (Raw)": 2.0601491928100586, "Pretrain/Step": 5146, "Pretrain/Step Time": 8.673105554655194} +{"Pretrain/Learning Rate": 2.3002765498415728e-05, "Pretrain/Loss": 1.9797852039337158, "Pretrain/Loss (Raw)": 1.964361548423767, "Pretrain/Step": 5147, "Pretrain/Step Time": 8.674173526465893} +{"Pretrain/Learning Rate": 2.2994302876492875e-05, "Pretrain/Loss": 1.9781652688980103, "Pretrain/Loss (Raw)": 2.0118353366851807, "Pretrain/Step": 5148, "Pretrain/Step Time": 8.671809252351522} +{"Pretrain/Learning Rate": 2.2985840485876444e-05, "Pretrain/Loss": 1.9789299964904785, "Pretrain/Loss (Raw)": 1.993092656135559, "Pretrain/Step": 5149, "Pretrain/Step Time": 8.678406670689583} +{"Pretrain/Learning Rate": 2.2977378327542397e-05, "Pretrain/Loss": 1.9766466617584229, "Pretrain/Loss (Raw)": 1.7353721857070923, "Pretrain/Step": 5150, "Pretrain/Step Time": 8.679393913596869} +{"Pretrain/Learning Rate": 2.2968916402466604e-05, "Pretrain/Loss": 1.978344202041626, "Pretrain/Loss (Raw)": 2.165325880050659, "Pretrain/Step": 5151, "Pretrain/Step Time": 8.685753671452403} +{"Pretrain/Learning Rate": 2.2960454711624945e-05, "Pretrain/Loss": 1.9793260097503662, "Pretrain/Loss (Raw)": 1.9715543985366821, "Pretrain/Step": 5152, "Pretrain/Step Time": 8.685126010328531} +{"Pretrain/Learning Rate": 2.2951993255993252e-05, "Pretrain/Loss": 1.9828249216079712, "Pretrain/Loss (Raw)": 2.1609044075012207, "Pretrain/Step": 5153, "Pretrain/Step Time": 8.6876435931772} +{"Pretrain/Learning Rate": 2.2943532036547356e-05, "Pretrain/Loss": 1.984547734260559, "Pretrain/Loss (Raw)": 2.1358938217163086, "Pretrain/Step": 5154, "Pretrain/Step Time": 8.681527243927121} +{"Pretrain/Learning Rate": 2.293507105426303e-05, "Pretrain/Loss": 1.982908844947815, "Pretrain/Loss (Raw)": 1.9717884063720703, "Pretrain/Step": 5155, "Pretrain/Step Time": 8.683840204030275} +{"Pretrain/Learning Rate": 2.2926610310116047e-05, "Pretrain/Loss": 1.9804890155792236, "Pretrain/Loss (Raw)": 1.807531714439392, "Pretrain/Step": 5156, "Pretrain/Step Time": 8.687822142615914} +{"Pretrain/Learning Rate": 2.2918149805082127e-05, "Pretrain/Loss": 1.9815688133239746, "Pretrain/Loss (Raw)": 2.04542875289917, "Pretrain/Step": 5157, "Pretrain/Step Time": 8.684397073462605} +{"Pretrain/Learning Rate": 2.2909689540136985e-05, "Pretrain/Loss": 1.978834867477417, "Pretrain/Loss (Raw)": 1.8472177982330322, "Pretrain/Step": 5158, "Pretrain/Step Time": 8.687884652987123} +{"Pretrain/Learning Rate": 2.290122951625629e-05, "Pretrain/Loss": 1.9770454168319702, "Pretrain/Loss (Raw)": 1.8899705410003662, "Pretrain/Step": 5159, "Pretrain/Step Time": 8.687883622944355} +{"Pretrain/Learning Rate": 2.2892769734415703e-05, "Pretrain/Loss": 1.9750341176986694, "Pretrain/Loss (Raw)": 2.0170347690582275, "Pretrain/Step": 5160, "Pretrain/Step Time": 8.693152327090502} +{"Pretrain/Learning Rate": 2.2884310195590835e-05, "Pretrain/Loss": 1.9763319492340088, "Pretrain/Loss (Raw)": 2.011321783065796, "Pretrain/Step": 5161, "Pretrain/Step Time": 8.684724189341068} +{"Pretrain/Learning Rate": 2.2875850900757288e-05, "Pretrain/Loss": 1.97709321975708, "Pretrain/Loss (Raw)": 1.9858447313308716, "Pretrain/Step": 5162, "Pretrain/Step Time": 8.685602067038417} +{"Pretrain/Learning Rate": 2.2867391850890623e-05, "Pretrain/Loss": 1.9745795726776123, "Pretrain/Loss (Raw)": 1.6110398769378662, "Pretrain/Step": 5163, "Pretrain/Step Time": 8.681786553934216} +{"Pretrain/Learning Rate": 2.285893304696638e-05, "Pretrain/Loss": 1.9734102487564087, "Pretrain/Loss (Raw)": 1.8232783079147339, "Pretrain/Step": 5164, "Pretrain/Step Time": 8.679762601852417} +{"Pretrain/Learning Rate": 2.2850474489960065e-05, "Pretrain/Loss": 1.9756042957305908, "Pretrain/Loss (Raw)": 2.116731882095337, "Pretrain/Step": 5165, "Pretrain/Step Time": 8.68248431943357} +{"Pretrain/Learning Rate": 2.2842016180847165e-05, "Pretrain/Loss": 1.9765994548797607, "Pretrain/Loss (Raw)": 2.0190088748931885, "Pretrain/Step": 5166, "Pretrain/Step Time": 8.689669383689761} +{"Pretrain/Learning Rate": 2.2833558120603122e-05, "Pretrain/Loss": 1.972110629081726, "Pretrain/Loss (Raw)": 1.5889357328414917, "Pretrain/Step": 5167, "Pretrain/Step Time": 8.689373111352324} +{"Pretrain/Learning Rate": 2.282510031020337e-05, "Pretrain/Loss": 1.9701015949249268, "Pretrain/Loss (Raw)": 1.8219683170318604, "Pretrain/Step": 5168, "Pretrain/Step Time": 8.690641840919852} +{"Pretrain/Learning Rate": 2.2816642750623294e-05, "Pretrain/Loss": 1.9722561836242676, "Pretrain/Loss (Raw)": 2.0093536376953125, "Pretrain/Step": 5169, "Pretrain/Step Time": 8.69212001375854} +{"Pretrain/Learning Rate": 2.280818544283827e-05, "Pretrain/Loss": 1.9758539199829102, "Pretrain/Loss (Raw)": 2.0330538749694824, "Pretrain/Step": 5170, "Pretrain/Step Time": 8.689836962148547} +{"Pretrain/Learning Rate": 2.279972838782362e-05, "Pretrain/Loss": 1.975886344909668, "Pretrain/Loss (Raw)": 2.180203676223755, "Pretrain/Step": 5171, "Pretrain/Step Time": 8.69101039506495} +{"Pretrain/Learning Rate": 2.279127158655467e-05, "Pretrain/Loss": 1.9782652854919434, "Pretrain/Loss (Raw)": 2.121635675430298, "Pretrain/Step": 5172, "Pretrain/Step Time": 8.696173515170813} +{"Pretrain/Learning Rate": 2.2782815040006683e-05, "Pretrain/Loss": 1.9791637659072876, "Pretrain/Loss (Raw)": 2.0834286212921143, "Pretrain/Step": 5173, "Pretrain/Step Time": 8.694494016468525} +{"Pretrain/Learning Rate": 2.2774358749154917e-05, "Pretrain/Loss": 1.9779393672943115, "Pretrain/Loss (Raw)": 1.8666187524795532, "Pretrain/Step": 5174, "Pretrain/Step Time": 8.69587992504239} +{"Pretrain/Learning Rate": 2.2765902714974585e-05, "Pretrain/Loss": 1.978474497795105, "Pretrain/Loss (Raw)": 2.195319652557373, "Pretrain/Step": 5175, "Pretrain/Step Time": 8.693883910775185} +{"Pretrain/Learning Rate": 2.2757446938440886e-05, "Pretrain/Loss": 1.978956699371338, "Pretrain/Loss (Raw)": 2.0884387493133545, "Pretrain/Step": 5176, "Pretrain/Step Time": 8.699017833918333} +{"Pretrain/Learning Rate": 2.274899142052896e-05, "Pretrain/Loss": 1.9767932891845703, "Pretrain/Loss (Raw)": 1.8630162477493286, "Pretrain/Step": 5177, "Pretrain/Step Time": 8.696888225153089} +{"Pretrain/Learning Rate": 2.2740536162213967e-05, "Pretrain/Loss": 1.9724721908569336, "Pretrain/Loss (Raw)": 1.2221466302871704, "Pretrain/Step": 5178, "Pretrain/Step Time": 8.712543405592442} +{"Pretrain/Learning Rate": 2.2732081164470973e-05, "Pretrain/Loss": 1.9715957641601562, "Pretrain/Loss (Raw)": 2.0741827487945557, "Pretrain/Step": 5179, "Pretrain/Step Time": 8.711566669866443} +{"Pretrain/Learning Rate": 2.2723626428275072e-05, "Pretrain/Loss": 1.9687540531158447, "Pretrain/Loss (Raw)": 1.7807016372680664, "Pretrain/Step": 5180, "Pretrain/Step Time": 8.712816344574094} +{"Pretrain/Learning Rate": 2.2715171954601303e-05, "Pretrain/Loss": 1.9678016901016235, "Pretrain/Loss (Raw)": 1.8692951202392578, "Pretrain/Step": 5181, "Pretrain/Step Time": 8.712864261120558} +{"Pretrain/Learning Rate": 2.2706717744424664e-05, "Pretrain/Loss": 1.9655487537384033, "Pretrain/Loss (Raw)": 1.719238519668579, "Pretrain/Step": 5182, "Pretrain/Step Time": 8.71802137605846} +{"Pretrain/Learning Rate": 2.2698263798720148e-05, "Pretrain/Loss": 1.9640382528305054, "Pretrain/Loss (Raw)": 1.8134170770645142, "Pretrain/Step": 5183, "Pretrain/Step Time": 8.71489280462265} +{"Pretrain/Learning Rate": 2.268981011846269e-05, "Pretrain/Loss": 1.9630119800567627, "Pretrain/Loss (Raw)": 1.9588359594345093, "Pretrain/Step": 5184, "Pretrain/Step Time": 8.71659412048757} +{"Pretrain/Learning Rate": 2.2681356704627226e-05, "Pretrain/Loss": 1.9610575437545776, "Pretrain/Loss (Raw)": 1.8171181678771973, "Pretrain/Step": 5185, "Pretrain/Step Time": 8.712895343080163} +{"Pretrain/Learning Rate": 2.267290355818862e-05, "Pretrain/Loss": 1.9594721794128418, "Pretrain/Loss (Raw)": 1.7748252153396606, "Pretrain/Step": 5186, "Pretrain/Step Time": 8.71596990339458} +{"Pretrain/Learning Rate": 2.2664450680121754e-05, "Pretrain/Loss": 1.9602586030960083, "Pretrain/Loss (Raw)": 1.8402339220046997, "Pretrain/Step": 5187, "Pretrain/Step Time": 8.718749694526196} +{"Pretrain/Learning Rate": 2.2655998071401424e-05, "Pretrain/Loss": 1.9618215560913086, "Pretrain/Loss (Raw)": 2.088381767272949, "Pretrain/Step": 5188, "Pretrain/Step Time": 8.723484188318253} +{"Pretrain/Learning Rate": 2.264754573300246e-05, "Pretrain/Loss": 1.9621829986572266, "Pretrain/Loss (Raw)": 2.0186054706573486, "Pretrain/Step": 5189, "Pretrain/Step Time": 8.71945614553988} +{"Pretrain/Learning Rate": 2.2639093665899592e-05, "Pretrain/Loss": 1.9652962684631348, "Pretrain/Loss (Raw)": 1.9983361959457397, "Pretrain/Step": 5190, "Pretrain/Step Time": 8.71717599593103} +{"Pretrain/Learning Rate": 2.263064187106758e-05, "Pretrain/Loss": 1.9642047882080078, "Pretrain/Loss (Raw)": 1.7658796310424805, "Pretrain/Step": 5191, "Pretrain/Step Time": 8.718801552429795} +{"Pretrain/Learning Rate": 2.2622190349481102e-05, "Pretrain/Loss": 1.9649534225463867, "Pretrain/Loss (Raw)": 1.915379285812378, "Pretrain/Step": 5192, "Pretrain/Step Time": 8.717734714969993} +{"Pretrain/Learning Rate": 2.2613739102114846e-05, "Pretrain/Loss": 1.9592801332473755, "Pretrain/Loss (Raw)": 1.585806131362915, "Pretrain/Step": 5193, "Pretrain/Step Time": 8.722677048295736} +{"Pretrain/Learning Rate": 2.2605288129943435e-05, "Pretrain/Loss": 1.9637730121612549, "Pretrain/Loss (Raw)": 2.0295419692993164, "Pretrain/Step": 5194, "Pretrain/Step Time": 8.723150024190545} +{"Pretrain/Learning Rate": 2.2596837433941486e-05, "Pretrain/Loss": 1.9637384414672852, "Pretrain/Loss (Raw)": 1.9128472805023193, "Pretrain/Step": 5195, "Pretrain/Step Time": 8.727094557136297} +{"Pretrain/Learning Rate": 2.2588387015083566e-05, "Pretrain/Loss": 1.962310791015625, "Pretrain/Loss (Raw)": 1.8715769052505493, "Pretrain/Step": 5196, "Pretrain/Step Time": 8.722032316029072} +{"Pretrain/Learning Rate": 2.257993687434422e-05, "Pretrain/Loss": 1.9647738933563232, "Pretrain/Loss (Raw)": 2.0636274814605713, "Pretrain/Step": 5197, "Pretrain/Step Time": 8.720204472541809} +{"Pretrain/Learning Rate": 2.2571487012697952e-05, "Pretrain/Loss": 1.9632863998413086, "Pretrain/Loss (Raw)": 2.053354024887085, "Pretrain/Step": 5198, "Pretrain/Step Time": 8.720317443832755} +{"Pretrain/Learning Rate": 2.2563037431119254e-05, "Pretrain/Loss": 1.9642294645309448, "Pretrain/Loss (Raw)": 2.0830607414245605, "Pretrain/Step": 5199, "Pretrain/Step Time": 8.722976669669151} +{"Pretrain/Learning Rate": 2.2554588130582556e-05, "Pretrain/Loss": 1.9626176357269287, "Pretrain/Loss (Raw)": 1.7700345516204834, "Pretrain/Step": 5200, "Pretrain/Step Time": 8.72276060283184} +{"Pretrain/Learning Rate": 2.254613911206228e-05, "Pretrain/Loss": 1.9655570983886719, "Pretrain/Loss (Raw)": 2.0901846885681152, "Pretrain/Step": 5201, "Pretrain/Step Time": 8.723877090960741} +{"Pretrain/Learning Rate": 2.25376903765328e-05, "Pretrain/Loss": 1.963897705078125, "Pretrain/Loss (Raw)": 1.82991623878479, "Pretrain/Step": 5202, "Pretrain/Step Time": 8.724388705566525} +{"Pretrain/Learning Rate": 2.252924192496848e-05, "Pretrain/Loss": 1.9644775390625, "Pretrain/Loss (Raw)": 2.124876022338867, "Pretrain/Step": 5203, "Pretrain/Step Time": 8.716599080711603} +{"Pretrain/Learning Rate": 2.2520793758343614e-05, "Pretrain/Loss": 1.9652936458587646, "Pretrain/Loss (Raw)": 2.1927590370178223, "Pretrain/Step": 5204, "Pretrain/Step Time": 8.718804702162743} +{"Pretrain/Learning Rate": 2.2512345877632498e-05, "Pretrain/Loss": 1.964796781539917, "Pretrain/Loss (Raw)": 2.002406358718872, "Pretrain/Step": 5205, "Pretrain/Step Time": 8.718605019152164} +{"Pretrain/Learning Rate": 2.2503898283809374e-05, "Pretrain/Loss": 1.9624412059783936, "Pretrain/Loss (Raw)": 1.7229492664337158, "Pretrain/Step": 5206, "Pretrain/Step Time": 8.721978433430195} +{"Pretrain/Learning Rate": 2.2495450977848467e-05, "Pretrain/Loss": 1.960540533065796, "Pretrain/Loss (Raw)": 1.680532455444336, "Pretrain/Step": 5207, "Pretrain/Step Time": 8.714916994795203} +{"Pretrain/Learning Rate": 2.248700396072395e-05, "Pretrain/Loss": 1.960900068283081, "Pretrain/Loss (Raw)": 1.9992395639419556, "Pretrain/Step": 5208, "Pretrain/Step Time": 8.712050376459956} +{"Pretrain/Learning Rate": 2.2478557233409986e-05, "Pretrain/Loss": 1.9596333503723145, "Pretrain/Loss (Raw)": 1.987712025642395, "Pretrain/Step": 5209, "Pretrain/Step Time": 8.701974850147963} +{"Pretrain/Learning Rate": 2.2470110796880673e-05, "Pretrain/Loss": 1.960108995437622, "Pretrain/Loss (Raw)": 2.1727285385131836, "Pretrain/Step": 5210, "Pretrain/Step Time": 8.703098529949784} +{"Pretrain/Learning Rate": 2.246166465211011e-05, "Pretrain/Loss": 1.9616777896881104, "Pretrain/Loss (Raw)": 1.9042247533798218, "Pretrain/Step": 5211, "Pretrain/Step Time": 8.700945479795337} +{"Pretrain/Learning Rate": 2.245321880007234e-05, "Pretrain/Loss": 1.96029794216156, "Pretrain/Loss (Raw)": 1.7959742546081543, "Pretrain/Step": 5212, "Pretrain/Step Time": 8.702070523053408} +{"Pretrain/Learning Rate": 2.244477324174138e-05, "Pretrain/Loss": 1.9624226093292236, "Pretrain/Loss (Raw)": 2.071913003921509, "Pretrain/Step": 5213, "Pretrain/Step Time": 8.694358218461275} +{"Pretrain/Learning Rate": 2.2436327978091205e-05, "Pretrain/Loss": 1.9605774879455566, "Pretrain/Loss (Raw)": 1.8440567255020142, "Pretrain/Step": 5214, "Pretrain/Step Time": 8.694377107545733} +{"Pretrain/Learning Rate": 2.2427883010095775e-05, "Pretrain/Loss": 1.960272192955017, "Pretrain/Loss (Raw)": 1.9181458950042725, "Pretrain/Step": 5215, "Pretrain/Step Time": 8.69233924895525} +{"Pretrain/Learning Rate": 2.241943833872899e-05, "Pretrain/Loss": 1.9614847898483276, "Pretrain/Loss (Raw)": 2.0754494667053223, "Pretrain/Step": 5216, "Pretrain/Step Time": 8.696045173332095} +{"Pretrain/Learning Rate": 2.2410993964964745e-05, "Pretrain/Loss": 1.9647855758666992, "Pretrain/Loss (Raw)": 2.1295857429504395, "Pretrain/Step": 5217, "Pretrain/Step Time": 8.694585848599672} +{"Pretrain/Learning Rate": 2.2402549889776864e-05, "Pretrain/Loss": 1.964440107345581, "Pretrain/Loss (Raw)": 1.9669643640518188, "Pretrain/Step": 5218, "Pretrain/Step Time": 8.69340816885233} +{"Pretrain/Learning Rate": 2.2394106114139183e-05, "Pretrain/Loss": 1.9598262310028076, "Pretrain/Loss (Raw)": 1.592254400253296, "Pretrain/Step": 5219, "Pretrain/Step Time": 8.695838209241629} +{"Pretrain/Learning Rate": 2.2385662639025448e-05, "Pretrain/Loss": 1.9587268829345703, "Pretrain/Loss (Raw)": 1.6329623460769653, "Pretrain/Step": 5220, "Pretrain/Step Time": 8.696674292907119} +{"Pretrain/Learning Rate": 2.237721946540942e-05, "Pretrain/Loss": 1.9588065147399902, "Pretrain/Loss (Raw)": 1.7306944131851196, "Pretrain/Step": 5221, "Pretrain/Step Time": 8.692053321748972} +{"Pretrain/Learning Rate": 2.2368776594264813e-05, "Pretrain/Loss": 1.9594318866729736, "Pretrain/Loss (Raw)": 2.10737943649292, "Pretrain/Step": 5222, "Pretrain/Step Time": 8.700208395719528} +{"Pretrain/Learning Rate": 2.2360334026565277e-05, "Pretrain/Loss": 1.9608581066131592, "Pretrain/Loss (Raw)": 2.0306077003479004, "Pretrain/Step": 5223, "Pretrain/Step Time": 8.699720941483974} +{"Pretrain/Learning Rate": 2.2351891763284466e-05, "Pretrain/Loss": 1.964181661605835, "Pretrain/Loss (Raw)": 2.23717999458313, "Pretrain/Step": 5224, "Pretrain/Step Time": 8.70335360057652} +{"Pretrain/Learning Rate": 2.2343449805395973e-05, "Pretrain/Loss": 1.9616239070892334, "Pretrain/Loss (Raw)": 1.828026294708252, "Pretrain/Step": 5225, "Pretrain/Step Time": 8.705366536974907} +{"Pretrain/Learning Rate": 2.2335008153873375e-05, "Pretrain/Loss": 1.9604299068450928, "Pretrain/Loss (Raw)": 1.9730503559112549, "Pretrain/Step": 5226, "Pretrain/Step Time": 8.7078080996871} +{"Pretrain/Learning Rate": 2.2326566809690176e-05, "Pretrain/Loss": 1.957850456237793, "Pretrain/Loss (Raw)": 1.8379846811294556, "Pretrain/Step": 5227, "Pretrain/Step Time": 8.711328003555536} +{"Pretrain/Learning Rate": 2.2318125773819913e-05, "Pretrain/Loss": 1.9574772119522095, "Pretrain/Loss (Raw)": 1.903685450553894, "Pretrain/Step": 5228, "Pretrain/Step Time": 8.707873426377773} +{"Pretrain/Learning Rate": 2.2309685047236002e-05, "Pretrain/Loss": 1.9556622505187988, "Pretrain/Loss (Raw)": 1.810591697692871, "Pretrain/Step": 5229, "Pretrain/Step Time": 8.709592888131738} +{"Pretrain/Learning Rate": 2.2301244630911904e-05, "Pretrain/Loss": 1.9519810676574707, "Pretrain/Loss (Raw)": 1.8931878805160522, "Pretrain/Step": 5230, "Pretrain/Step Time": 8.710049126297235} +{"Pretrain/Learning Rate": 2.229280452582098e-05, "Pretrain/Loss": 1.9538038969039917, "Pretrain/Loss (Raw)": 2.0099685192108154, "Pretrain/Step": 5231, "Pretrain/Step Time": 8.711313515901566} +{"Pretrain/Learning Rate": 2.2284364732936608e-05, "Pretrain/Loss": 1.9533295631408691, "Pretrain/Loss (Raw)": 1.9886058568954468, "Pretrain/Step": 5232, "Pretrain/Step Time": 8.714579816907644} +{"Pretrain/Learning Rate": 2.2275925253232073e-05, "Pretrain/Loss": 1.9532933235168457, "Pretrain/Loss (Raw)": 2.080514907836914, "Pretrain/Step": 5233, "Pretrain/Step Time": 8.716772444546223} +{"Pretrain/Learning Rate": 2.2267486087680695e-05, "Pretrain/Loss": 1.9525548219680786, "Pretrain/Loss (Raw)": 1.7983458042144775, "Pretrain/Step": 5234, "Pretrain/Step Time": 8.718395909294486} +{"Pretrain/Learning Rate": 2.2259047237255684e-05, "Pretrain/Loss": 1.952914834022522, "Pretrain/Loss (Raw)": 1.7814794778823853, "Pretrain/Step": 5235, "Pretrain/Step Time": 8.721889743581414} +{"Pretrain/Learning Rate": 2.2250608702930266e-05, "Pretrain/Loss": 1.9519388675689697, "Pretrain/Loss (Raw)": 1.9671605825424194, "Pretrain/Step": 5236, "Pretrain/Step Time": 8.720486134290695} +{"Pretrain/Learning Rate": 2.2242170485677606e-05, "Pretrain/Loss": 1.9520416259765625, "Pretrain/Loss (Raw)": 1.8127163648605347, "Pretrain/Step": 5237, "Pretrain/Step Time": 8.718416003510356} +{"Pretrain/Learning Rate": 2.223373258647084e-05, "Pretrain/Loss": 1.953625202178955, "Pretrain/Loss (Raw)": 2.240780830383301, "Pretrain/Step": 5238, "Pretrain/Step Time": 8.719515144824982} +{"Pretrain/Learning Rate": 2.222529500628307e-05, "Pretrain/Loss": 1.9541518688201904, "Pretrain/Loss (Raw)": 1.835005283355713, "Pretrain/Step": 5239, "Pretrain/Step Time": 8.719290684908628} +{"Pretrain/Learning Rate": 2.2216857746087355e-05, "Pretrain/Loss": 1.9555275440216064, "Pretrain/Loss (Raw)": 2.2422358989715576, "Pretrain/Step": 5240, "Pretrain/Step Time": 8.718253059312701} +{"Pretrain/Learning Rate": 2.2208420806856718e-05, "Pretrain/Loss": 1.9545502662658691, "Pretrain/Loss (Raw)": 2.062410593032837, "Pretrain/Step": 5241, "Pretrain/Step Time": 8.719776859506965} +{"Pretrain/Learning Rate": 2.2199984189564148e-05, "Pretrain/Loss": 1.9560188055038452, "Pretrain/Loss (Raw)": 1.9035652875900269, "Pretrain/Step": 5242, "Pretrain/Step Time": 8.72102197445929} +{"Pretrain/Learning Rate": 2.2191547895182594e-05, "Pretrain/Loss": 1.956331729888916, "Pretrain/Loss (Raw)": 2.201301336288452, "Pretrain/Step": 5243, "Pretrain/Step Time": 8.717484179884195} +{"Pretrain/Learning Rate": 2.2183111924684975e-05, "Pretrain/Loss": 1.956488847732544, "Pretrain/Loss (Raw)": 1.7280874252319336, "Pretrain/Step": 5244, "Pretrain/Step Time": 8.717881632968783} +{"Pretrain/Learning Rate": 2.2174676279044153e-05, "Pretrain/Loss": 1.955411434173584, "Pretrain/Loss (Raw)": 1.8058547973632812, "Pretrain/Step": 5245, "Pretrain/Step Time": 8.720419123768806} +{"Pretrain/Learning Rate": 2.2166240959232985e-05, "Pretrain/Loss": 1.9543147087097168, "Pretrain/Loss (Raw)": 2.0250191688537598, "Pretrain/Step": 5246, "Pretrain/Step Time": 8.72455289401114} +{"Pretrain/Learning Rate": 2.215780596622426e-05, "Pretrain/Loss": 1.9545247554779053, "Pretrain/Loss (Raw)": 1.9569032192230225, "Pretrain/Step": 5247, "Pretrain/Step Time": 8.723013838753104} +{"Pretrain/Learning Rate": 2.2149371300990745e-05, "Pretrain/Loss": 1.9560636281967163, "Pretrain/Loss (Raw)": 2.0406007766723633, "Pretrain/Step": 5248, "Pretrain/Step Time": 8.727384189143777} +{"Pretrain/Learning Rate": 2.214093696450516e-05, "Pretrain/Loss": 1.954673171043396, "Pretrain/Loss (Raw)": 1.872240662574768, "Pretrain/Step": 5249, "Pretrain/Step Time": 8.726765690371394} +{"Pretrain/Learning Rate": 2.21325029577402e-05, "Pretrain/Loss": 1.9540165662765503, "Pretrain/Loss (Raw)": 1.896724820137024, "Pretrain/Step": 5250, "Pretrain/Step Time": 8.727518308907747} +{"Pretrain/Learning Rate": 2.2124069281668507e-05, "Pretrain/Loss": 1.9519456624984741, "Pretrain/Loss (Raw)": 1.895101547241211, "Pretrain/Step": 5251, "Pretrain/Step Time": 8.730280172079802} +{"Pretrain/Learning Rate": 2.2115635937262706e-05, "Pretrain/Loss": 1.952162504196167, "Pretrain/Loss (Raw)": 2.0748753547668457, "Pretrain/Step": 5252, "Pretrain/Step Time": 8.727640399709344} +{"Pretrain/Learning Rate": 2.210720292549535e-05, "Pretrain/Loss": 1.9528295993804932, "Pretrain/Loss (Raw)": 1.9240564107894897, "Pretrain/Step": 5253, "Pretrain/Step Time": 8.727224707603455} +{"Pretrain/Learning Rate": 2.209877024733899e-05, "Pretrain/Loss": 1.9502191543579102, "Pretrain/Loss (Raw)": 1.9459623098373413, "Pretrain/Step": 5254, "Pretrain/Step Time": 8.728745520114899} +{"Pretrain/Learning Rate": 2.209033790376611e-05, "Pretrain/Loss": 1.9500081539154053, "Pretrain/Loss (Raw)": 2.163662910461426, "Pretrain/Step": 5255, "Pretrain/Step Time": 8.728832622990012} +{"Pretrain/Learning Rate": 2.2081905895749183e-05, "Pretrain/Loss": 1.9500646591186523, "Pretrain/Loss (Raw)": 2.0289950370788574, "Pretrain/Step": 5256, "Pretrain/Step Time": 8.728225963190198} +{"Pretrain/Learning Rate": 2.207347422426061e-05, "Pretrain/Loss": 1.9519271850585938, "Pretrain/Loss (Raw)": 2.071035146713257, "Pretrain/Step": 5257, "Pretrain/Step Time": 8.730640342459083} +{"Pretrain/Learning Rate": 2.206504289027279e-05, "Pretrain/Loss": 1.9508198499679565, "Pretrain/Loss (Raw)": 1.8780477046966553, "Pretrain/Step": 5258, "Pretrain/Step Time": 8.734454357996583} +{"Pretrain/Learning Rate": 2.2056611894758038e-05, "Pretrain/Loss": 1.9502341747283936, "Pretrain/Loss (Raw)": 1.8159265518188477, "Pretrain/Step": 5259, "Pretrain/Step Time": 8.730752045288682} +{"Pretrain/Learning Rate": 2.204818123868869e-05, "Pretrain/Loss": 1.9521872997283936, "Pretrain/Loss (Raw)": 2.2399098873138428, "Pretrain/Step": 5260, "Pretrain/Step Time": 8.729699974879622} +{"Pretrain/Learning Rate": 2.203975092303697e-05, "Pretrain/Loss": 1.9522819519042969, "Pretrain/Loss (Raw)": 1.9905054569244385, "Pretrain/Step": 5261, "Pretrain/Step Time": 8.731471298262477} +{"Pretrain/Learning Rate": 2.2031320948775135e-05, "Pretrain/Loss": 1.9539507627487183, "Pretrain/Loss (Raw)": 2.086625099182129, "Pretrain/Step": 5262, "Pretrain/Step Time": 8.727115627378225} +{"Pretrain/Learning Rate": 2.2022891316875362e-05, "Pretrain/Loss": 1.9541261196136475, "Pretrain/Loss (Raw)": 2.0220160484313965, "Pretrain/Step": 5263, "Pretrain/Step Time": 8.725499855354428} +{"Pretrain/Learning Rate": 2.201446202830978e-05, "Pretrain/Loss": 1.9517961740493774, "Pretrain/Loss (Raw)": 1.9102492332458496, "Pretrain/Step": 5264, "Pretrain/Step Time": 8.72657135501504} +{"Pretrain/Learning Rate": 2.2006033084050516e-05, "Pretrain/Loss": 1.9505923986434937, "Pretrain/Loss (Raw)": 1.997349739074707, "Pretrain/Step": 5265, "Pretrain/Step Time": 8.72894261777401} +{"Pretrain/Learning Rate": 2.1997604485069614e-05, "Pretrain/Loss": 1.9499742984771729, "Pretrain/Loss (Raw)": 1.9693437814712524, "Pretrain/Step": 5266, "Pretrain/Step Time": 8.730253003537655} +{"Pretrain/Learning Rate": 2.1989176232339122e-05, "Pretrain/Loss": 1.9530372619628906, "Pretrain/Loss (Raw)": 2.3113973140716553, "Pretrain/Step": 5267, "Pretrain/Step Time": 8.72852741740644} +{"Pretrain/Learning Rate": 2.1980748326831002e-05, "Pretrain/Loss": 1.9520889520645142, "Pretrain/Loss (Raw)": 1.9890697002410889, "Pretrain/Step": 5268, "Pretrain/Step Time": 8.727654492482543} +{"Pretrain/Learning Rate": 2.1972320769517226e-05, "Pretrain/Loss": 1.9519362449645996, "Pretrain/Loss (Raw)": 2.2133495807647705, "Pretrain/Step": 5269, "Pretrain/Step Time": 8.724081305786967} +{"Pretrain/Learning Rate": 2.1963893561369672e-05, "Pretrain/Loss": 1.951082706451416, "Pretrain/Loss (Raw)": 1.7462069988250732, "Pretrain/Step": 5270, "Pretrain/Step Time": 8.727694034576416} +{"Pretrain/Learning Rate": 2.1955466703360232e-05, "Pretrain/Loss": 1.9503495693206787, "Pretrain/Loss (Raw)": 1.9748468399047852, "Pretrain/Step": 5271, "Pretrain/Step Time": 8.72483647428453} +{"Pretrain/Learning Rate": 2.1947040196460704e-05, "Pretrain/Loss": 1.949317216873169, "Pretrain/Loss (Raw)": 1.7216616868972778, "Pretrain/Step": 5272, "Pretrain/Step Time": 8.724483424797654} +{"Pretrain/Learning Rate": 2.1938614041642903e-05, "Pretrain/Loss": 1.9504857063293457, "Pretrain/Loss (Raw)": 2.132153272628784, "Pretrain/Step": 5273, "Pretrain/Step Time": 8.725124195218086} +{"Pretrain/Learning Rate": 2.1930188239878537e-05, "Pretrain/Loss": 1.9476852416992188, "Pretrain/Loss (Raw)": 1.7016959190368652, "Pretrain/Step": 5274, "Pretrain/Step Time": 8.739093955606222} +{"Pretrain/Learning Rate": 2.192176279213935e-05, "Pretrain/Loss": 1.9466660022735596, "Pretrain/Loss (Raw)": 1.8338829278945923, "Pretrain/Step": 5275, "Pretrain/Step Time": 8.73659436777234} +{"Pretrain/Learning Rate": 2.191333769939696e-05, "Pretrain/Loss": 1.9465665817260742, "Pretrain/Loss (Raw)": 1.9991216659545898, "Pretrain/Step": 5276, "Pretrain/Step Time": 8.737248383462429} +{"Pretrain/Learning Rate": 2.1904912962623035e-05, "Pretrain/Loss": 1.946326732635498, "Pretrain/Loss (Raw)": 1.9623936414718628, "Pretrain/Step": 5277, "Pretrain/Step Time": 8.739355748519301} +{"Pretrain/Learning Rate": 2.1896488582789117e-05, "Pretrain/Loss": 1.9506182670593262, "Pretrain/Loss (Raw)": 2.284681558609009, "Pretrain/Step": 5278, "Pretrain/Step Time": 8.736922401934862} +{"Pretrain/Learning Rate": 2.1888064560866765e-05, "Pretrain/Loss": 1.9490257501602173, "Pretrain/Loss (Raw)": 1.9614793062210083, "Pretrain/Step": 5279, "Pretrain/Step Time": 8.731797581538558} +{"Pretrain/Learning Rate": 2.187964089782747e-05, "Pretrain/Loss": 1.950380802154541, "Pretrain/Loss (Raw)": 2.145010471343994, "Pretrain/Step": 5280, "Pretrain/Step Time": 8.732888845726848} +{"Pretrain/Learning Rate": 2.187121759464269e-05, "Pretrain/Loss": 1.950392484664917, "Pretrain/Loss (Raw)": 2.1623897552490234, "Pretrain/Step": 5281, "Pretrain/Step Time": 8.732652066275477} +{"Pretrain/Learning Rate": 2.1862794652283837e-05, "Pretrain/Loss": 1.9501163959503174, "Pretrain/Loss (Raw)": 2.100567102432251, "Pretrain/Step": 5282, "Pretrain/Step Time": 8.734310645610094} +{"Pretrain/Learning Rate": 2.1854372071722297e-05, "Pretrain/Loss": 1.9504833221435547, "Pretrain/Loss (Raw)": 2.0187458992004395, "Pretrain/Step": 5283, "Pretrain/Step Time": 8.736753396689892} +{"Pretrain/Learning Rate": 2.1845949853929382e-05, "Pretrain/Loss": 1.951935887336731, "Pretrain/Loss (Raw)": 1.9934643507003784, "Pretrain/Step": 5284, "Pretrain/Step Time": 8.732988644391298} +{"Pretrain/Learning Rate": 2.1837527999876396e-05, "Pretrain/Loss": 1.95101797580719, "Pretrain/Loss (Raw)": 1.9279327392578125, "Pretrain/Step": 5285, "Pretrain/Step Time": 8.734396431595087} +{"Pretrain/Learning Rate": 2.1829106510534585e-05, "Pretrain/Loss": 1.9537789821624756, "Pretrain/Loss (Raw)": 2.2006173133850098, "Pretrain/Step": 5286, "Pretrain/Step Time": 8.729220118373632} +{"Pretrain/Learning Rate": 2.1820685386875155e-05, "Pretrain/Loss": 1.9542536735534668, "Pretrain/Loss (Raw)": 1.9507414102554321, "Pretrain/Step": 5287, "Pretrain/Step Time": 8.733024226501584} +{"Pretrain/Learning Rate": 2.1812264629869257e-05, "Pretrain/Loss": 1.953307032585144, "Pretrain/Loss (Raw)": 1.8958678245544434, "Pretrain/Step": 5288, "Pretrain/Step Time": 8.727455088868737} +{"Pretrain/Learning Rate": 2.1803844240488036e-05, "Pretrain/Loss": 1.951744556427002, "Pretrain/Loss (Raw)": 1.8113154172897339, "Pretrain/Step": 5289, "Pretrain/Step Time": 8.73247211240232} +{"Pretrain/Learning Rate": 2.179542421970255e-05, "Pretrain/Loss": 1.9524822235107422, "Pretrain/Loss (Raw)": 2.0802676677703857, "Pretrain/Step": 5290, "Pretrain/Step Time": 8.730245752260089} +{"Pretrain/Learning Rate": 2.1787004568483846e-05, "Pretrain/Loss": 1.95570969581604, "Pretrain/Loss (Raw)": 2.0241587162017822, "Pretrain/Step": 5291, "Pretrain/Step Time": 8.732709679752588} +{"Pretrain/Learning Rate": 2.1778585287802914e-05, "Pretrain/Loss": 1.95856511592865, "Pretrain/Loss (Raw)": 2.1887636184692383, "Pretrain/Step": 5292, "Pretrain/Step Time": 8.73302990756929} +{"Pretrain/Learning Rate": 2.1770166378630708e-05, "Pretrain/Loss": 1.9586265087127686, "Pretrain/Loss (Raw)": 2.124587297439575, "Pretrain/Step": 5293, "Pretrain/Step Time": 8.73207158781588} +{"Pretrain/Learning Rate": 2.1761747841938133e-05, "Pretrain/Loss": 1.9598667621612549, "Pretrain/Loss (Raw)": 2.1777782440185547, "Pretrain/Step": 5294, "Pretrain/Step Time": 8.72431824542582} +{"Pretrain/Learning Rate": 2.175332967869606e-05, "Pretrain/Loss": 1.9616773128509521, "Pretrain/Loss (Raw)": 1.8206897974014282, "Pretrain/Step": 5295, "Pretrain/Step Time": 8.726488852873445} +{"Pretrain/Learning Rate": 2.17449118898753e-05, "Pretrain/Loss": 1.9642047882080078, "Pretrain/Loss (Raw)": 2.1454854011535645, "Pretrain/Step": 5296, "Pretrain/Step Time": 8.72529836371541} +{"Pretrain/Learning Rate": 2.1736494476446646e-05, "Pretrain/Loss": 1.9635463953018188, "Pretrain/Loss (Raw)": 1.9250627756118774, "Pretrain/Step": 5297, "Pretrain/Step Time": 8.726736698299646} +{"Pretrain/Learning Rate": 2.172807743938082e-05, "Pretrain/Loss": 1.9639205932617188, "Pretrain/Loss (Raw)": 2.0809528827667236, "Pretrain/Step": 5298, "Pretrain/Step Time": 8.72836423292756} +{"Pretrain/Learning Rate": 2.171966077964853e-05, "Pretrain/Loss": 1.9651434421539307, "Pretrain/Loss (Raw)": 2.3367273807525635, "Pretrain/Step": 5299, "Pretrain/Step Time": 8.729067791253328} +{"Pretrain/Learning Rate": 2.1711244498220412e-05, "Pretrain/Loss": 1.9641835689544678, "Pretrain/Loss (Raw)": 1.9987752437591553, "Pretrain/Step": 5300, "Pretrain/Step Time": 8.72447968274355} +{"Pretrain/Learning Rate": 2.170282859606708e-05, "Pretrain/Loss": 1.9622251987457275, "Pretrain/Loss (Raw)": 1.8327423334121704, "Pretrain/Step": 5301, "Pretrain/Step Time": 8.729284059256315} +{"Pretrain/Learning Rate": 2.1694413074159082e-05, "Pretrain/Loss": 1.962951421737671, "Pretrain/Loss (Raw)": 1.959587574005127, "Pretrain/Step": 5302, "Pretrain/Step Time": 8.727406196296215} +{"Pretrain/Learning Rate": 2.1685997933466948e-05, "Pretrain/Loss": 1.9601951837539673, "Pretrain/Loss (Raw)": 1.8425289392471313, "Pretrain/Step": 5303, "Pretrain/Step Time": 8.728559026494622} +{"Pretrain/Learning Rate": 2.167758317496115e-05, "Pretrain/Loss": 1.9592211246490479, "Pretrain/Loss (Raw)": 1.9637507200241089, "Pretrain/Step": 5304, "Pretrain/Step Time": 8.727940153330564} +{"Pretrain/Learning Rate": 2.1669168799612118e-05, "Pretrain/Loss": 1.960562825202942, "Pretrain/Loss (Raw)": 2.034749984741211, "Pretrain/Step": 5305, "Pretrain/Step Time": 8.730913896113634} +{"Pretrain/Learning Rate": 2.1660754808390235e-05, "Pretrain/Loss": 1.9675111770629883, "Pretrain/Loss (Raw)": 2.1115431785583496, "Pretrain/Step": 5306, "Pretrain/Step Time": 8.713943969458342} +{"Pretrain/Learning Rate": 2.1652341202265838e-05, "Pretrain/Loss": 1.9666154384613037, "Pretrain/Loss (Raw)": 1.9595223665237427, "Pretrain/Step": 5307, "Pretrain/Step Time": 8.719955664128065} +{"Pretrain/Learning Rate": 2.1643927982209233e-05, "Pretrain/Loss": 1.9670886993408203, "Pretrain/Loss (Raw)": 1.8412761688232422, "Pretrain/Step": 5308, "Pretrain/Step Time": 8.717603657394648} +{"Pretrain/Learning Rate": 2.1635515149190665e-05, "Pretrain/Loss": 1.9681017398834229, "Pretrain/Loss (Raw)": 1.9989620447158813, "Pretrain/Step": 5309, "Pretrain/Step Time": 8.714477838948369} +{"Pretrain/Learning Rate": 2.1627102704180353e-05, "Pretrain/Loss": 1.9706027507781982, "Pretrain/Loss (Raw)": 2.0393896102905273, "Pretrain/Step": 5310, "Pretrain/Step Time": 8.713751653209329} +{"Pretrain/Learning Rate": 2.1618690648148435e-05, "Pretrain/Loss": 1.971990942955017, "Pretrain/Loss (Raw)": 1.9910979270935059, "Pretrain/Step": 5311, "Pretrain/Step Time": 8.707844026386738} +{"Pretrain/Learning Rate": 2.161027898206506e-05, "Pretrain/Loss": 1.9723844528198242, "Pretrain/Loss (Raw)": 2.009199380874634, "Pretrain/Step": 5312, "Pretrain/Step Time": 8.711880002170801} +{"Pretrain/Learning Rate": 2.160186770690027e-05, "Pretrain/Loss": 1.9733749628067017, "Pretrain/Loss (Raw)": 1.9439033269882202, "Pretrain/Step": 5313, "Pretrain/Step Time": 8.719146920368075} +{"Pretrain/Learning Rate": 2.1593456823624127e-05, "Pretrain/Loss": 1.9701757431030273, "Pretrain/Loss (Raw)": 1.3653277158737183, "Pretrain/Step": 5314, "Pretrain/Step Time": 8.715114014223218} +{"Pretrain/Learning Rate": 2.1585046333206573e-05, "Pretrain/Loss": 1.9712398052215576, "Pretrain/Loss (Raw)": 1.9764249324798584, "Pretrain/Step": 5315, "Pretrain/Step Time": 8.712218618020415} +{"Pretrain/Learning Rate": 2.157663623661759e-05, "Pretrain/Loss": 1.9688292741775513, "Pretrain/Loss (Raw)": 1.7798385620117188, "Pretrain/Step": 5316, "Pretrain/Step Time": 8.703933415934443} +{"Pretrain/Learning Rate": 2.156822653482703e-05, "Pretrain/Loss": 1.9669983386993408, "Pretrain/Loss (Raw)": 1.784256100654602, "Pretrain/Step": 5317, "Pretrain/Step Time": 8.70137119665742} +{"Pretrain/Learning Rate": 2.155981722880477e-05, "Pretrain/Loss": 1.9665515422821045, "Pretrain/Loss (Raw)": 1.9411392211914062, "Pretrain/Step": 5318, "Pretrain/Step Time": 8.70491797849536} +{"Pretrain/Learning Rate": 2.1551408319520588e-05, "Pretrain/Loss": 1.9683924913406372, "Pretrain/Loss (Raw)": 2.001530885696411, "Pretrain/Step": 5319, "Pretrain/Step Time": 8.704045087099075} +{"Pretrain/Learning Rate": 2.1542999807944258e-05, "Pretrain/Loss": 1.96913743019104, "Pretrain/Loss (Raw)": 2.0107192993164062, "Pretrain/Step": 5320, "Pretrain/Step Time": 8.704516854137182} +{"Pretrain/Learning Rate": 2.1534591695045473e-05, "Pretrain/Loss": 1.9722265005111694, "Pretrain/Loss (Raw)": 1.981204628944397, "Pretrain/Step": 5321, "Pretrain/Step Time": 8.696511195972562} +{"Pretrain/Learning Rate": 2.1526183981793908e-05, "Pretrain/Loss": 1.9714076519012451, "Pretrain/Loss (Raw)": 1.9247303009033203, "Pretrain/Step": 5322, "Pretrain/Step Time": 8.700151031836867} +{"Pretrain/Learning Rate": 2.1517776669159166e-05, "Pretrain/Loss": 1.9733929634094238, "Pretrain/Loss (Raw)": 2.1669673919677734, "Pretrain/Step": 5323, "Pretrain/Step Time": 8.70068628527224} +{"Pretrain/Learning Rate": 2.150936975811084e-05, "Pretrain/Loss": 1.976965308189392, "Pretrain/Loss (Raw)": 2.328834056854248, "Pretrain/Step": 5324, "Pretrain/Step Time": 8.70145308598876} +{"Pretrain/Learning Rate": 2.1500963249618433e-05, "Pretrain/Loss": 1.9759687185287476, "Pretrain/Loss (Raw)": 1.936071753501892, "Pretrain/Step": 5325, "Pretrain/Step Time": 8.7025037817657} +{"Pretrain/Learning Rate": 2.149255714465144e-05, "Pretrain/Loss": 1.974541425704956, "Pretrain/Loss (Raw)": 1.8706547021865845, "Pretrain/Step": 5326, "Pretrain/Step Time": 8.708206063136458} +{"Pretrain/Learning Rate": 2.1484151444179273e-05, "Pretrain/Loss": 1.974977970123291, "Pretrain/Loss (Raw)": 2.13893461227417, "Pretrain/Step": 5327, "Pretrain/Step Time": 8.709687577560544} +{"Pretrain/Learning Rate": 2.147574614917134e-05, "Pretrain/Loss": 1.9776649475097656, "Pretrain/Loss (Raw)": 2.1139731407165527, "Pretrain/Step": 5328, "Pretrain/Step Time": 8.707495471462607} +{"Pretrain/Learning Rate": 2.146734126059696e-05, "Pretrain/Loss": 1.977475881576538, "Pretrain/Loss (Raw)": 2.065988540649414, "Pretrain/Step": 5329, "Pretrain/Step Time": 8.708285486325622} +{"Pretrain/Learning Rate": 2.1458936779425438e-05, "Pretrain/Loss": 1.9780077934265137, "Pretrain/Loss (Raw)": 1.8980000019073486, "Pretrain/Step": 5330, "Pretrain/Step Time": 8.708412582054734} +{"Pretrain/Learning Rate": 2.145053270662601e-05, "Pretrain/Loss": 1.9776241779327393, "Pretrain/Loss (Raw)": 2.0757648944854736, "Pretrain/Step": 5331, "Pretrain/Step Time": 8.71099109761417} +{"Pretrain/Learning Rate": 2.1442129043167874e-05, "Pretrain/Loss": 1.97675621509552, "Pretrain/Loss (Raw)": 2.0816609859466553, "Pretrain/Step": 5332, "Pretrain/Step Time": 8.709443561732769} +{"Pretrain/Learning Rate": 2.1433725790020186e-05, "Pretrain/Loss": 1.9753366708755493, "Pretrain/Loss (Raw)": 1.8207166194915771, "Pretrain/Step": 5333, "Pretrain/Step Time": 8.704408045858145} +{"Pretrain/Learning Rate": 2.1425322948152042e-05, "Pretrain/Loss": 1.976730227470398, "Pretrain/Loss (Raw)": 1.9013140201568604, "Pretrain/Step": 5334, "Pretrain/Step Time": 8.701762467622757} +{"Pretrain/Learning Rate": 2.14169205185325e-05, "Pretrain/Loss": 1.978664517402649, "Pretrain/Loss (Raw)": 1.9281277656555176, "Pretrain/Step": 5335, "Pretrain/Step Time": 8.700984990224242} +{"Pretrain/Learning Rate": 2.140851850213057e-05, "Pretrain/Loss": 1.9789587259292603, "Pretrain/Loss (Raw)": 2.0368878841400146, "Pretrain/Step": 5336, "Pretrain/Step Time": 8.703097054734826} +{"Pretrain/Learning Rate": 2.1400116899915205e-05, "Pretrain/Loss": 1.9775965213775635, "Pretrain/Loss (Raw)": 1.8133456707000732, "Pretrain/Step": 5337, "Pretrain/Step Time": 8.702078005298972} +{"Pretrain/Learning Rate": 2.1391715712855327e-05, "Pretrain/Loss": 1.9767818450927734, "Pretrain/Loss (Raw)": 2.0684688091278076, "Pretrain/Step": 5338, "Pretrain/Step Time": 8.706600585952401} +{"Pretrain/Learning Rate": 2.1383314941919795e-05, "Pretrain/Loss": 1.978223204612732, "Pretrain/Loss (Raw)": 2.0887084007263184, "Pretrain/Step": 5339, "Pretrain/Step Time": 8.716260723769665} +{"Pretrain/Learning Rate": 2.1374914588077427e-05, "Pretrain/Loss": 1.9782919883728027, "Pretrain/Loss (Raw)": 1.8047716617584229, "Pretrain/Step": 5340, "Pretrain/Step Time": 8.712927350774407} +{"Pretrain/Learning Rate": 2.1366514652296987e-05, "Pretrain/Loss": 1.9780007600784302, "Pretrain/Loss (Raw)": 2.03464674949646, "Pretrain/Step": 5341, "Pretrain/Step Time": 8.713087510317564} +{"Pretrain/Learning Rate": 2.135811513554721e-05, "Pretrain/Loss": 1.979126214981079, "Pretrain/Loss (Raw)": 1.988107681274414, "Pretrain/Step": 5342, "Pretrain/Step Time": 8.722943738102913} +{"Pretrain/Learning Rate": 2.1349716038796742e-05, "Pretrain/Loss": 1.9805312156677246, "Pretrain/Loss (Raw)": 2.097992181777954, "Pretrain/Step": 5343, "Pretrain/Step Time": 8.72336401231587} +{"Pretrain/Learning Rate": 2.1341317363014223e-05, "Pretrain/Loss": 1.9804134368896484, "Pretrain/Loss (Raw)": 2.0603652000427246, "Pretrain/Step": 5344, "Pretrain/Step Time": 8.722711941227317} +{"Pretrain/Learning Rate": 2.133291910916823e-05, "Pretrain/Loss": 1.978851556777954, "Pretrain/Loss (Raw)": 1.9296809434890747, "Pretrain/Step": 5345, "Pretrain/Step Time": 8.724311275407672} +{"Pretrain/Learning Rate": 2.1324521278227287e-05, "Pretrain/Loss": 1.978618860244751, "Pretrain/Loss (Raw)": 1.9371623992919922, "Pretrain/Step": 5346, "Pretrain/Step Time": 8.720923978835344} +{"Pretrain/Learning Rate": 2.131612387115987e-05, "Pretrain/Loss": 1.9824872016906738, "Pretrain/Loss (Raw)": 2.0874135494232178, "Pretrain/Step": 5347, "Pretrain/Step Time": 8.72157246246934} +{"Pretrain/Learning Rate": 2.13077268889344e-05, "Pretrain/Loss": 1.985435962677002, "Pretrain/Loss (Raw)": 2.0104053020477295, "Pretrain/Step": 5348, "Pretrain/Step Time": 8.717604333534837} +{"Pretrain/Learning Rate": 2.1299330332519273e-05, "Pretrain/Loss": 1.9870002269744873, "Pretrain/Loss (Raw)": 1.9309213161468506, "Pretrain/Step": 5349, "Pretrain/Step Time": 8.717757610604167} +{"Pretrain/Learning Rate": 2.1290934202882805e-05, "Pretrain/Loss": 1.9872254133224487, "Pretrain/Loss (Raw)": 2.1361947059631348, "Pretrain/Step": 5350, "Pretrain/Step Time": 8.712877731770277} +{"Pretrain/Learning Rate": 2.128253850099329e-05, "Pretrain/Loss": 1.9852163791656494, "Pretrain/Loss (Raw)": 1.7734607458114624, "Pretrain/Step": 5351, "Pretrain/Step Time": 8.706435605883598} +{"Pretrain/Learning Rate": 2.1274143227818938e-05, "Pretrain/Loss": 1.9832308292388916, "Pretrain/Loss (Raw)": 1.9830149412155151, "Pretrain/Step": 5352, "Pretrain/Step Time": 8.707943331450224} +{"Pretrain/Learning Rate": 2.126574838432796e-05, "Pretrain/Loss": 1.984365701675415, "Pretrain/Loss (Raw)": 1.9733085632324219, "Pretrain/Step": 5353, "Pretrain/Step Time": 8.713181730359793} +{"Pretrain/Learning Rate": 2.1257353971488463e-05, "Pretrain/Loss": 1.9844112396240234, "Pretrain/Loss (Raw)": 1.9788687229156494, "Pretrain/Step": 5354, "Pretrain/Step Time": 8.709187377244234} +{"Pretrain/Learning Rate": 2.1248959990268554e-05, "Pretrain/Loss": 1.985813021659851, "Pretrain/Loss (Raw)": 2.0174105167388916, "Pretrain/Step": 5355, "Pretrain/Step Time": 8.70929948426783} +{"Pretrain/Learning Rate": 2.1240566441636238e-05, "Pretrain/Loss": 1.9860069751739502, "Pretrain/Loss (Raw)": 1.9285283088684082, "Pretrain/Step": 5356, "Pretrain/Step Time": 8.707201145589352} +{"Pretrain/Learning Rate": 2.1232173326559535e-05, "Pretrain/Loss": 1.9867918491363525, "Pretrain/Loss (Raw)": 1.91105055809021, "Pretrain/Step": 5357, "Pretrain/Step Time": 8.70567699894309} +{"Pretrain/Learning Rate": 2.122378064600634e-05, "Pretrain/Loss": 1.9880144596099854, "Pretrain/Loss (Raw)": 2.0496609210968018, "Pretrain/Step": 5358, "Pretrain/Step Time": 8.704189090058208} +{"Pretrain/Learning Rate": 2.121538840094457e-05, "Pretrain/Loss": 1.9885647296905518, "Pretrain/Loss (Raw)": 2.0804080963134766, "Pretrain/Step": 5359, "Pretrain/Step Time": 8.705909995362163} +{"Pretrain/Learning Rate": 2.120699659234203e-05, "Pretrain/Loss": 1.9877992868423462, "Pretrain/Loss (Raw)": 1.8906371593475342, "Pretrain/Step": 5360, "Pretrain/Step Time": 8.707416456192732} +{"Pretrain/Learning Rate": 2.1198605221166528e-05, "Pretrain/Loss": 1.9846296310424805, "Pretrain/Loss (Raw)": 1.6747922897338867, "Pretrain/Step": 5361, "Pretrain/Step Time": 8.708065390586853} +{"Pretrain/Learning Rate": 2.1190214288385778e-05, "Pretrain/Loss": 1.9863795042037964, "Pretrain/Loss (Raw)": 2.0223376750946045, "Pretrain/Step": 5362, "Pretrain/Step Time": 8.707730101421475} +{"Pretrain/Learning Rate": 2.1181823794967472e-05, "Pretrain/Loss": 1.9885821342468262, "Pretrain/Loss (Raw)": 2.063415050506592, "Pretrain/Step": 5363, "Pretrain/Step Time": 8.702431095764041} +{"Pretrain/Learning Rate": 2.1173433741879234e-05, "Pretrain/Loss": 1.9866554737091064, "Pretrain/Loss (Raw)": 1.7205541133880615, "Pretrain/Step": 5364, "Pretrain/Step Time": 8.705668365582824} +{"Pretrain/Learning Rate": 2.116504413008865e-05, "Pretrain/Loss": 1.9876248836517334, "Pretrain/Loss (Raw)": 1.9368019104003906, "Pretrain/Step": 5365, "Pretrain/Step Time": 8.709591176360846} +{"Pretrain/Learning Rate": 2.1156654960563248e-05, "Pretrain/Loss": 1.9855122566223145, "Pretrain/Loss (Raw)": 1.9703623056411743, "Pretrain/Step": 5366, "Pretrain/Step Time": 8.713347766548395} +{"Pretrain/Learning Rate": 2.1148266234270508e-05, "Pretrain/Loss": 1.9866664409637451, "Pretrain/Loss (Raw)": 1.9827375411987305, "Pretrain/Step": 5367, "Pretrain/Step Time": 8.710382893681526} +{"Pretrain/Learning Rate": 2.1139877952177852e-05, "Pretrain/Loss": 1.985518455505371, "Pretrain/Loss (Raw)": 2.095292091369629, "Pretrain/Step": 5368, "Pretrain/Step Time": 8.711762646213174} +{"Pretrain/Learning Rate": 2.1131490115252668e-05, "Pretrain/Loss": 1.9849846363067627, "Pretrain/Loss (Raw)": 1.994099736213684, "Pretrain/Step": 5369, "Pretrain/Step Time": 8.709695931524038} +{"Pretrain/Learning Rate": 2.1123102724462262e-05, "Pretrain/Loss": 1.9845832586288452, "Pretrain/Loss (Raw)": 1.8521714210510254, "Pretrain/Step": 5370, "Pretrain/Step Time": 8.706715483218431} +{"Pretrain/Learning Rate": 2.1114715780773924e-05, "Pretrain/Loss": 1.981879472732544, "Pretrain/Loss (Raw)": 1.8552191257476807, "Pretrain/Step": 5371, "Pretrain/Step Time": 8.709910042583942} +{"Pretrain/Learning Rate": 2.110632928515487e-05, "Pretrain/Loss": 1.984797477722168, "Pretrain/Loss (Raw)": 2.1016016006469727, "Pretrain/Step": 5372, "Pretrain/Step Time": 8.71253852918744} +{"Pretrain/Learning Rate": 2.1097943238572272e-05, "Pretrain/Loss": 1.984619140625, "Pretrain/Loss (Raw)": 1.7830075025558472, "Pretrain/Step": 5373, "Pretrain/Step Time": 8.716787464916706} +{"Pretrain/Learning Rate": 2.108955764199324e-05, "Pretrain/Loss": 1.9840277433395386, "Pretrain/Loss (Raw)": 1.949324607849121, "Pretrain/Step": 5374, "Pretrain/Step Time": 8.714499333873391} +{"Pretrain/Learning Rate": 2.1081172496384855e-05, "Pretrain/Loss": 1.9846587181091309, "Pretrain/Loss (Raw)": 2.0376737117767334, "Pretrain/Step": 5375, "Pretrain/Step Time": 8.71504607051611} +{"Pretrain/Learning Rate": 2.107278780271412e-05, "Pretrain/Loss": 1.9837749004364014, "Pretrain/Loss (Raw)": 1.9274804592132568, "Pretrain/Step": 5376, "Pretrain/Step Time": 8.718920547515154} +{"Pretrain/Learning Rate": 2.1064403561948003e-05, "Pretrain/Loss": 1.9859930276870728, "Pretrain/Loss (Raw)": 2.156153917312622, "Pretrain/Step": 5377, "Pretrain/Step Time": 8.718677915632725} +{"Pretrain/Learning Rate": 2.105601977505341e-05, "Pretrain/Loss": 1.9862478971481323, "Pretrain/Loss (Raw)": 1.9293490648269653, "Pretrain/Step": 5378, "Pretrain/Step Time": 8.716383500024676} +{"Pretrain/Learning Rate": 2.1047636442997205e-05, "Pretrain/Loss": 1.986558198928833, "Pretrain/Loss (Raw)": 1.9348264932632446, "Pretrain/Step": 5379, "Pretrain/Step Time": 8.714200189337134} +{"Pretrain/Learning Rate": 2.1039253566746182e-05, "Pretrain/Loss": 1.98665452003479, "Pretrain/Loss (Raw)": 2.087214708328247, "Pretrain/Step": 5380, "Pretrain/Step Time": 8.718987561762333} +{"Pretrain/Learning Rate": 2.1030871147267113e-05, "Pretrain/Loss": 1.9844034910202026, "Pretrain/Loss (Raw)": 1.635908842086792, "Pretrain/Step": 5381, "Pretrain/Step Time": 8.714686743915081} +{"Pretrain/Learning Rate": 2.1022489185526674e-05, "Pretrain/Loss": 1.9853688478469849, "Pretrain/Loss (Raw)": 2.0695221424102783, "Pretrain/Step": 5382, "Pretrain/Step Time": 8.717324912548065} +{"Pretrain/Learning Rate": 2.1014107682491534e-05, "Pretrain/Loss": 1.9851408004760742, "Pretrain/Loss (Raw)": 2.1344797611236572, "Pretrain/Step": 5383, "Pretrain/Step Time": 8.717578995972872} +{"Pretrain/Learning Rate": 2.1005726639128276e-05, "Pretrain/Loss": 1.9846110343933105, "Pretrain/Loss (Raw)": 1.9611860513687134, "Pretrain/Step": 5384, "Pretrain/Step Time": 8.72184981405735} +{"Pretrain/Learning Rate": 2.0997346056403438e-05, "Pretrain/Loss": 1.984349012374878, "Pretrain/Loss (Raw)": 2.037501573562622, "Pretrain/Step": 5385, "Pretrain/Step Time": 8.720521671697497} +{"Pretrain/Learning Rate": 2.0988965935283524e-05, "Pretrain/Loss": 1.9884719848632812, "Pretrain/Loss (Raw)": 2.4057822227478027, "Pretrain/Step": 5386, "Pretrain/Step Time": 8.719017568975687} +{"Pretrain/Learning Rate": 2.098058627673495e-05, "Pretrain/Loss": 1.9889575242996216, "Pretrain/Loss (Raw)": 1.878074288368225, "Pretrain/Step": 5387, "Pretrain/Step Time": 8.722028210759163} +{"Pretrain/Learning Rate": 2.097220708172411e-05, "Pretrain/Loss": 1.987691879272461, "Pretrain/Loss (Raw)": 2.0779175758361816, "Pretrain/Step": 5388, "Pretrain/Step Time": 8.722646560519934} +{"Pretrain/Learning Rate": 2.0963828351217327e-05, "Pretrain/Loss": 1.9889880418777466, "Pretrain/Loss (Raw)": 2.1563990116119385, "Pretrain/Step": 5389, "Pretrain/Step Time": 8.725907465443015} +{"Pretrain/Learning Rate": 2.0955450086180882e-05, "Pretrain/Loss": 1.9871371984481812, "Pretrain/Loss (Raw)": 1.849717140197754, "Pretrain/Step": 5390, "Pretrain/Step Time": 8.72131105326116} +{"Pretrain/Learning Rate": 2.094707228758099e-05, "Pretrain/Loss": 1.9857004880905151, "Pretrain/Loss (Raw)": 1.838120460510254, "Pretrain/Step": 5391, "Pretrain/Step Time": 8.724452467635274} +{"Pretrain/Learning Rate": 2.093869495638382e-05, "Pretrain/Loss": 1.9879684448242188, "Pretrain/Loss (Raw)": 2.200547218322754, "Pretrain/Step": 5392, "Pretrain/Step Time": 8.725199837237597} +{"Pretrain/Learning Rate": 2.093031809355548e-05, "Pretrain/Loss": 1.9871182441711426, "Pretrain/Loss (Raw)": 1.888511300086975, "Pretrain/Step": 5393, "Pretrain/Step Time": 8.72312930598855} +{"Pretrain/Learning Rate": 2.0921941700062047e-05, "Pretrain/Loss": 1.9867278337478638, "Pretrain/Loss (Raw)": 1.9193856716156006, "Pretrain/Step": 5394, "Pretrain/Step Time": 8.72131697833538} +{"Pretrain/Learning Rate": 2.0913565776869498e-05, "Pretrain/Loss": 1.9830554723739624, "Pretrain/Loss (Raw)": 1.8413342237472534, "Pretrain/Step": 5395, "Pretrain/Step Time": 8.72234152816236} +{"Pretrain/Learning Rate": 2.0905190324943814e-05, "Pretrain/Loss": 1.9827556610107422, "Pretrain/Loss (Raw)": 1.9506783485412598, "Pretrain/Step": 5396, "Pretrain/Step Time": 8.723484750837088} +{"Pretrain/Learning Rate": 2.089681534525086e-05, "Pretrain/Loss": 1.982399821281433, "Pretrain/Loss (Raw)": 2.1678099632263184, "Pretrain/Step": 5397, "Pretrain/Step Time": 8.72405045479536} +{"Pretrain/Learning Rate": 2.0888440838756515e-05, "Pretrain/Loss": 1.9841628074645996, "Pretrain/Loss (Raw)": 1.9718656539916992, "Pretrain/Step": 5398, "Pretrain/Step Time": 8.722880830988288} +{"Pretrain/Learning Rate": 2.088006680642653e-05, "Pretrain/Loss": 1.9846012592315674, "Pretrain/Loss (Raw)": 2.0309810638427734, "Pretrain/Step": 5399, "Pretrain/Step Time": 8.721419790759683} +{"Pretrain/Learning Rate": 2.087169324922667e-05, "Pretrain/Loss": 1.9862775802612305, "Pretrain/Loss (Raw)": 1.9362317323684692, "Pretrain/Step": 5400, "Pretrain/Step Time": 8.723847202956676} +{"Pretrain/Learning Rate": 2.086332016812258e-05, "Pretrain/Loss": 1.986583948135376, "Pretrain/Loss (Raw)": 2.1713669300079346, "Pretrain/Step": 5401, "Pretrain/Step Time": 8.724730763584375} +{"Pretrain/Learning Rate": 2.085494756407992e-05, "Pretrain/Loss": 1.9876716136932373, "Pretrain/Loss (Raw)": 1.8409109115600586, "Pretrain/Step": 5402, "Pretrain/Step Time": 8.712717467918992} +{"Pretrain/Learning Rate": 2.0846575438064227e-05, "Pretrain/Loss": 1.989652395248413, "Pretrain/Loss (Raw)": 2.087437868118286, "Pretrain/Step": 5403, "Pretrain/Step Time": 8.712580753490329} +{"Pretrain/Learning Rate": 2.0838203791041028e-05, "Pretrain/Loss": 1.9894187450408936, "Pretrain/Loss (Raw)": 1.9691917896270752, "Pretrain/Step": 5404, "Pretrain/Step Time": 8.713909067213535} +{"Pretrain/Learning Rate": 2.0829832623975775e-05, "Pretrain/Loss": 1.9897775650024414, "Pretrain/Loss (Raw)": 2.0083305835723877, "Pretrain/Step": 5405, "Pretrain/Step Time": 8.70875827781856} +{"Pretrain/Learning Rate": 2.0821461937833884e-05, "Pretrain/Loss": 1.988290548324585, "Pretrain/Loss (Raw)": 2.094341516494751, "Pretrain/Step": 5406, "Pretrain/Step Time": 8.711472762748599} +{"Pretrain/Learning Rate": 2.0813091733580685e-05, "Pretrain/Loss": 1.9885189533233643, "Pretrain/Loss (Raw)": 1.9907186031341553, "Pretrain/Step": 5407, "Pretrain/Step Time": 8.711241280660033} +{"Pretrain/Learning Rate": 2.080472201218148e-05, "Pretrain/Loss": 1.9871490001678467, "Pretrain/Loss (Raw)": 1.969657301902771, "Pretrain/Step": 5408, "Pretrain/Step Time": 8.710875766351819} +{"Pretrain/Learning Rate": 2.0796352774601495e-05, "Pretrain/Loss": 1.9856853485107422, "Pretrain/Loss (Raw)": 1.975036382675171, "Pretrain/Step": 5409, "Pretrain/Step Time": 8.710122099146247} +{"Pretrain/Learning Rate": 2.0787984021805922e-05, "Pretrain/Loss": 1.9856760501861572, "Pretrain/Loss (Raw)": 2.099395751953125, "Pretrain/Step": 5410, "Pretrain/Step Time": 8.708989847451448} +{"Pretrain/Learning Rate": 2.077961575475988e-05, "Pretrain/Loss": 1.9836283922195435, "Pretrain/Loss (Raw)": 1.75663423538208, "Pretrain/Step": 5411, "Pretrain/Step Time": 8.708623975515366} +{"Pretrain/Learning Rate": 2.0771247974428434e-05, "Pretrain/Loss": 1.9848847389221191, "Pretrain/Loss (Raw)": 2.1542646884918213, "Pretrain/Step": 5412, "Pretrain/Step Time": 8.708653036504984} +{"Pretrain/Learning Rate": 2.07628806817766e-05, "Pretrain/Loss": 1.985481858253479, "Pretrain/Loss (Raw)": 2.004366874694824, "Pretrain/Step": 5413, "Pretrain/Step Time": 8.705503823235631} +{"Pretrain/Learning Rate": 2.0754513877769328e-05, "Pretrain/Loss": 1.9845285415649414, "Pretrain/Loss (Raw)": 2.0785984992980957, "Pretrain/Step": 5414, "Pretrain/Step Time": 8.708329427987337} +{"Pretrain/Learning Rate": 2.074614756337152e-05, "Pretrain/Loss": 1.9844112396240234, "Pretrain/Loss (Raw)": 1.935716152191162, "Pretrain/Step": 5415, "Pretrain/Step Time": 8.705738067626953} +{"Pretrain/Learning Rate": 2.073778173954803e-05, "Pretrain/Loss": 1.981353759765625, "Pretrain/Loss (Raw)": 1.5045225620269775, "Pretrain/Step": 5416, "Pretrain/Step Time": 8.710583271458745} +{"Pretrain/Learning Rate": 2.072941640726362e-05, "Pretrain/Loss": 1.9821960926055908, "Pretrain/Loss (Raw)": 1.9191348552703857, "Pretrain/Step": 5417, "Pretrain/Step Time": 8.708982974290848} +{"Pretrain/Learning Rate": 2.0721051567483045e-05, "Pretrain/Loss": 1.9808446168899536, "Pretrain/Loss (Raw)": 1.9072803258895874, "Pretrain/Step": 5418, "Pretrain/Step Time": 8.708297604694963} +{"Pretrain/Learning Rate": 2.071268722117096e-05, "Pretrain/Loss": 1.979504108428955, "Pretrain/Loss (Raw)": 1.8525804281234741, "Pretrain/Step": 5419, "Pretrain/Step Time": 8.709379523992538} +{"Pretrain/Learning Rate": 2.0704323369291993e-05, "Pretrain/Loss": 1.9773173332214355, "Pretrain/Loss (Raw)": 1.9088362455368042, "Pretrain/Step": 5420, "Pretrain/Step Time": 8.708897856995463} +{"Pretrain/Learning Rate": 2.069596001281069e-05, "Pretrain/Loss": 1.9760615825653076, "Pretrain/Loss (Raw)": 1.9638590812683105, "Pretrain/Step": 5421, "Pretrain/Step Time": 8.708711478859186} +{"Pretrain/Learning Rate": 2.0687597152691567e-05, "Pretrain/Loss": 1.9746034145355225, "Pretrain/Loss (Raw)": 1.991128921508789, "Pretrain/Step": 5422, "Pretrain/Step Time": 8.70840441994369} +{"Pretrain/Learning Rate": 2.0679234789899054e-05, "Pretrain/Loss": 1.9758118391036987, "Pretrain/Loss (Raw)": 1.9753717184066772, "Pretrain/Step": 5423, "Pretrain/Step Time": 8.704581581056118} +{"Pretrain/Learning Rate": 2.067087292539755e-05, "Pretrain/Loss": 1.9739184379577637, "Pretrain/Loss (Raw)": 1.9031352996826172, "Pretrain/Step": 5424, "Pretrain/Step Time": 8.704079857096076} +{"Pretrain/Learning Rate": 2.0662511560151373e-05, "Pretrain/Loss": 1.9736967086791992, "Pretrain/Loss (Raw)": 1.8966864347457886, "Pretrain/Step": 5425, "Pretrain/Step Time": 8.700479157269001} +{"Pretrain/Learning Rate": 2.0654150695124804e-05, "Pretrain/Loss": 1.973585844039917, "Pretrain/Loss (Raw)": 2.066744565963745, "Pretrain/Step": 5426, "Pretrain/Step Time": 8.700686857104301} +{"Pretrain/Learning Rate": 2.064579033128206e-05, "Pretrain/Loss": 1.9708114862442017, "Pretrain/Loss (Raw)": 1.9816241264343262, "Pretrain/Step": 5427, "Pretrain/Step Time": 8.70008590258658} +{"Pretrain/Learning Rate": 2.063743046958729e-05, "Pretrain/Loss": 1.9701178073883057, "Pretrain/Loss (Raw)": 1.9099655151367188, "Pretrain/Step": 5428, "Pretrain/Step Time": 8.69802501052618} +{"Pretrain/Learning Rate": 2.0629071111004595e-05, "Pretrain/Loss": 1.9725408554077148, "Pretrain/Loss (Raw)": 2.142904281616211, "Pretrain/Step": 5429, "Pretrain/Step Time": 8.692495550960302} +{"Pretrain/Learning Rate": 2.0620712256498016e-05, "Pretrain/Loss": 1.9724617004394531, "Pretrain/Loss (Raw)": 1.9494738578796387, "Pretrain/Step": 5430, "Pretrain/Step Time": 8.698106011375785} +{"Pretrain/Learning Rate": 2.061235390703154e-05, "Pretrain/Loss": 1.9717210531234741, "Pretrain/Loss (Raw)": 1.7477079629898071, "Pretrain/Step": 5431, "Pretrain/Step Time": 8.69873284175992} +{"Pretrain/Learning Rate": 2.0603996063569078e-05, "Pretrain/Loss": 1.967766523361206, "Pretrain/Loss (Raw)": 1.4575762748718262, "Pretrain/Step": 5432, "Pretrain/Step Time": 8.694275338202715} +{"Pretrain/Learning Rate": 2.0595638727074512e-05, "Pretrain/Loss": 1.968034029006958, "Pretrain/Loss (Raw)": 2.0689852237701416, "Pretrain/Step": 5433, "Pretrain/Step Time": 8.692211106419563} +{"Pretrain/Learning Rate": 2.058728189851164e-05, "Pretrain/Loss": 1.9668058156967163, "Pretrain/Loss (Raw)": 1.9543371200561523, "Pretrain/Step": 5434, "Pretrain/Step Time": 8.691503752022982} +{"Pretrain/Learning Rate": 2.0578925578844216e-05, "Pretrain/Loss": 1.9663879871368408, "Pretrain/Loss (Raw)": 1.9060434103012085, "Pretrain/Step": 5435, "Pretrain/Step Time": 8.684458501636982} +{"Pretrain/Learning Rate": 2.0570569769035915e-05, "Pretrain/Loss": 1.9692553281784058, "Pretrain/Loss (Raw)": 2.20828914642334, "Pretrain/Step": 5436, "Pretrain/Step Time": 8.696966130286455} +{"Pretrain/Learning Rate": 2.0562214470050396e-05, "Pretrain/Loss": 1.9700441360473633, "Pretrain/Loss (Raw)": 2.099932909011841, "Pretrain/Step": 5437, "Pretrain/Step Time": 8.698965962976217} +{"Pretrain/Learning Rate": 2.0553859682851204e-05, "Pretrain/Loss": 1.9688769578933716, "Pretrain/Loss (Raw)": 1.8899940252304077, "Pretrain/Step": 5438, "Pretrain/Step Time": 8.697250759229064} +{"Pretrain/Learning Rate": 2.0545505408401878e-05, "Pretrain/Loss": 1.967095136642456, "Pretrain/Loss (Raw)": 1.7630070447921753, "Pretrain/Step": 5439, "Pretrain/Step Time": 8.699526324868202} +{"Pretrain/Learning Rate": 2.053715164766584e-05, "Pretrain/Loss": 1.9670854806900024, "Pretrain/Loss (Raw)": 2.0079805850982666, "Pretrain/Step": 5440, "Pretrain/Step Time": 8.697604367509484} +{"Pretrain/Learning Rate": 2.052879840160652e-05, "Pretrain/Loss": 1.9659311771392822, "Pretrain/Loss (Raw)": 1.7961571216583252, "Pretrain/Step": 5441, "Pretrain/Step Time": 8.694652797654271} +{"Pretrain/Learning Rate": 2.052044567118722e-05, "Pretrain/Loss": 1.9710462093353271, "Pretrain/Loss (Raw)": 2.0200467109680176, "Pretrain/Step": 5442, "Pretrain/Step Time": 8.695909244939685} +{"Pretrain/Learning Rate": 2.0512093457371253e-05, "Pretrain/Loss": 1.9711413383483887, "Pretrain/Loss (Raw)": 1.9885979890823364, "Pretrain/Step": 5443, "Pretrain/Step Time": 8.696844285354018} +{"Pretrain/Learning Rate": 2.0503741761121804e-05, "Pretrain/Loss": 1.9730300903320312, "Pretrain/Loss (Raw)": 2.021606206893921, "Pretrain/Step": 5444, "Pretrain/Step Time": 8.694512911140919} +{"Pretrain/Learning Rate": 2.049539058340205e-05, "Pretrain/Loss": 1.9746407270431519, "Pretrain/Loss (Raw)": 1.9904069900512695, "Pretrain/Step": 5445, "Pretrain/Step Time": 8.714953355491161} +{"Pretrain/Learning Rate": 2.0487039925175073e-05, "Pretrain/Loss": 1.9751765727996826, "Pretrain/Loss (Raw)": 2.0097389221191406, "Pretrain/Step": 5446, "Pretrain/Step Time": 8.71154166571796} +{"Pretrain/Learning Rate": 2.0478689787403923e-05, "Pretrain/Loss": 1.9751567840576172, "Pretrain/Loss (Raw)": 1.9989851713180542, "Pretrain/Step": 5447, "Pretrain/Step Time": 8.710172664374113} +{"Pretrain/Learning Rate": 2.0470340171051567e-05, "Pretrain/Loss": 1.9748389720916748, "Pretrain/Loss (Raw)": 1.9700500965118408, "Pretrain/Step": 5448, "Pretrain/Step Time": 8.71351726539433} +{"Pretrain/Learning Rate": 2.046199107708093e-05, "Pretrain/Loss": 1.9743454456329346, "Pretrain/Loss (Raw)": 1.918028712272644, "Pretrain/Step": 5449, "Pretrain/Step Time": 8.712673287838697} +{"Pretrain/Learning Rate": 2.0453642506454862e-05, "Pretrain/Loss": 1.9759745597839355, "Pretrain/Loss (Raw)": 2.133261203765869, "Pretrain/Step": 5450, "Pretrain/Step Time": 8.715145478025079} +{"Pretrain/Learning Rate": 2.044529446013617e-05, "Pretrain/Loss": 1.9750416278839111, "Pretrain/Loss (Raw)": 2.047555923461914, "Pretrain/Step": 5451, "Pretrain/Step Time": 8.711600529029965} +{"Pretrain/Learning Rate": 2.0436946939087576e-05, "Pretrain/Loss": 1.9732906818389893, "Pretrain/Loss (Raw)": 2.1047067642211914, "Pretrain/Step": 5452, "Pretrain/Step Time": 8.710428984835744} +{"Pretrain/Learning Rate": 2.042859994427177e-05, "Pretrain/Loss": 1.9750640392303467, "Pretrain/Loss (Raw)": 2.163057804107666, "Pretrain/Step": 5453, "Pretrain/Step Time": 8.715703222900629} +{"Pretrain/Learning Rate": 2.042025347665135e-05, "Pretrain/Loss": 1.97517991065979, "Pretrain/Loss (Raw)": 1.8855032920837402, "Pretrain/Step": 5454, "Pretrain/Step Time": 8.71028164960444} +{"Pretrain/Learning Rate": 2.041190753718889e-05, "Pretrain/Loss": 1.9744571447372437, "Pretrain/Loss (Raw)": 2.0464048385620117, "Pretrain/Step": 5455, "Pretrain/Step Time": 8.712338795885444} +{"Pretrain/Learning Rate": 2.0403562126846865e-05, "Pretrain/Loss": 1.9712111949920654, "Pretrain/Loss (Raw)": 1.69850492477417, "Pretrain/Step": 5456, "Pretrain/Step Time": 8.71712128072977} +{"Pretrain/Learning Rate": 2.039521724658772e-05, "Pretrain/Loss": 1.970365285873413, "Pretrain/Loss (Raw)": 1.9576972723007202, "Pretrain/Step": 5457, "Pretrain/Step Time": 8.71518473699689} +{"Pretrain/Learning Rate": 2.0386872897373816e-05, "Pretrain/Loss": 1.9710683822631836, "Pretrain/Loss (Raw)": 1.9880120754241943, "Pretrain/Step": 5458, "Pretrain/Step Time": 8.714357484132051} +{"Pretrain/Learning Rate": 2.037852908016747e-05, "Pretrain/Loss": 1.9701396226882935, "Pretrain/Loss (Raw)": 1.9568649530410767, "Pretrain/Step": 5459, "Pretrain/Step Time": 8.712858060374856} +{"Pretrain/Learning Rate": 2.0370185795930927e-05, "Pretrain/Loss": 1.9696400165557861, "Pretrain/Loss (Raw)": 2.017730236053467, "Pretrain/Step": 5460, "Pretrain/Step Time": 8.713350171223283} +{"Pretrain/Learning Rate": 2.0361843045626378e-05, "Pretrain/Loss": 1.9717613458633423, "Pretrain/Loss (Raw)": 2.0922324657440186, "Pretrain/Step": 5461, "Pretrain/Step Time": 8.716769617050886} +{"Pretrain/Learning Rate": 2.035350083021594e-05, "Pretrain/Loss": 1.9739704132080078, "Pretrain/Loss (Raw)": 2.1840670108795166, "Pretrain/Step": 5462, "Pretrain/Step Time": 8.715740030631423} +{"Pretrain/Learning Rate": 2.0345159150661683e-05, "Pretrain/Loss": 1.975602626800537, "Pretrain/Loss (Raw)": 2.1370489597320557, "Pretrain/Step": 5463, "Pretrain/Step Time": 8.717119384557009} +{"Pretrain/Learning Rate": 2.0336818007925603e-05, "Pretrain/Loss": 1.975851058959961, "Pretrain/Loss (Raw)": 2.0687108039855957, "Pretrain/Step": 5464, "Pretrain/Step Time": 8.721188321709633} +{"Pretrain/Learning Rate": 2.032847740296965e-05, "Pretrain/Loss": 1.977428674697876, "Pretrain/Loss (Raw)": 2.0152788162231445, "Pretrain/Step": 5465, "Pretrain/Step Time": 8.719762338325381} +{"Pretrain/Learning Rate": 2.0320137336755692e-05, "Pretrain/Loss": 1.9772169589996338, "Pretrain/Loss (Raw)": 2.0413613319396973, "Pretrain/Step": 5466, "Pretrain/Step Time": 8.718367505818605} +{"Pretrain/Learning Rate": 2.0311797810245543e-05, "Pretrain/Loss": 1.9752246141433716, "Pretrain/Loss (Raw)": 1.8336888551712036, "Pretrain/Step": 5467, "Pretrain/Step Time": 8.715892814099789} +{"Pretrain/Learning Rate": 2.0303458824400974e-05, "Pretrain/Loss": 1.9769105911254883, "Pretrain/Loss (Raw)": 2.0205681324005127, "Pretrain/Step": 5468, "Pretrain/Step Time": 8.718130979686975} +{"Pretrain/Learning Rate": 2.0295120380183657e-05, "Pretrain/Loss": 1.976461410522461, "Pretrain/Loss (Raw)": 1.9771536588668823, "Pretrain/Step": 5469, "Pretrain/Step Time": 8.71544893272221} +{"Pretrain/Learning Rate": 2.0286782478555232e-05, "Pretrain/Loss": 1.976020097732544, "Pretrain/Loss (Raw)": 1.9316251277923584, "Pretrain/Step": 5470, "Pretrain/Step Time": 8.706384742632508} +{"Pretrain/Learning Rate": 2.027844512047726e-05, "Pretrain/Loss": 1.9736703634262085, "Pretrain/Loss (Raw)": 1.797228217124939, "Pretrain/Step": 5471, "Pretrain/Step Time": 8.709407748654485} +{"Pretrain/Learning Rate": 2.027010830691124e-05, "Pretrain/Loss": 1.973711371421814, "Pretrain/Loss (Raw)": 2.0656187534332275, "Pretrain/Step": 5472, "Pretrain/Step Time": 8.701951920986176} +{"Pretrain/Learning Rate": 2.0261772038818622e-05, "Pretrain/Loss": 1.9746577739715576, "Pretrain/Loss (Raw)": 2.050804853439331, "Pretrain/Step": 5473, "Pretrain/Step Time": 8.711724633350968} +{"Pretrain/Learning Rate": 2.0253436317160784e-05, "Pretrain/Loss": 1.9741981029510498, "Pretrain/Loss (Raw)": 1.8783329725265503, "Pretrain/Step": 5474, "Pretrain/Step Time": 8.712193889543414} +{"Pretrain/Learning Rate": 2.0245101142899032e-05, "Pretrain/Loss": 1.975616455078125, "Pretrain/Loss (Raw)": 2.2689647674560547, "Pretrain/Step": 5475, "Pretrain/Step Time": 8.710538864135742} +{"Pretrain/Learning Rate": 2.0236766516994623e-05, "Pretrain/Loss": 1.9754550457000732, "Pretrain/Loss (Raw)": 1.9897414445877075, "Pretrain/Step": 5476, "Pretrain/Step Time": 8.710908381268382} +{"Pretrain/Learning Rate": 2.022843244040874e-05, "Pretrain/Loss": 1.9771664142608643, "Pretrain/Loss (Raw)": 2.1499810218811035, "Pretrain/Step": 5477, "Pretrain/Step Time": 8.714609157294035} +{"Pretrain/Learning Rate": 2.0220098914102525e-05, "Pretrain/Loss": 1.97492253780365, "Pretrain/Loss (Raw)": 1.8489683866500854, "Pretrain/Step": 5478, "Pretrain/Step Time": 8.71152769215405} +{"Pretrain/Learning Rate": 2.021176593903701e-05, "Pretrain/Loss": 1.97584867477417, "Pretrain/Loss (Raw)": 1.8920018672943115, "Pretrain/Step": 5479, "Pretrain/Step Time": 8.716282155364752} +{"Pretrain/Learning Rate": 2.0203433516173225e-05, "Pretrain/Loss": 1.9767000675201416, "Pretrain/Loss (Raw)": 2.092010974884033, "Pretrain/Step": 5480, "Pretrain/Step Time": 8.70928287692368} +{"Pretrain/Learning Rate": 2.0195101646472075e-05, "Pretrain/Loss": 1.9768757820129395, "Pretrain/Loss (Raw)": 1.9958045482635498, "Pretrain/Step": 5481, "Pretrain/Step Time": 8.700570845976472} +{"Pretrain/Learning Rate": 2.018677033089446e-05, "Pretrain/Loss": 1.9768844842910767, "Pretrain/Loss (Raw)": 1.979974627494812, "Pretrain/Step": 5482, "Pretrain/Step Time": 8.705210534855723} +{"Pretrain/Learning Rate": 2.017843957040115e-05, "Pretrain/Loss": 1.976436734199524, "Pretrain/Loss (Raw)": 1.960094928741455, "Pretrain/Step": 5483, "Pretrain/Step Time": 8.70525236800313} +{"Pretrain/Learning Rate": 2.0170109365952934e-05, "Pretrain/Loss": 1.9791204929351807, "Pretrain/Loss (Raw)": 2.2720556259155273, "Pretrain/Step": 5484, "Pretrain/Step Time": 8.705568978562951} +{"Pretrain/Learning Rate": 2.0161779718510443e-05, "Pretrain/Loss": 1.9801502227783203, "Pretrain/Loss (Raw)": 2.0428483486175537, "Pretrain/Step": 5485, "Pretrain/Step Time": 8.710366506129503} +{"Pretrain/Learning Rate": 2.015345062903433e-05, "Pretrain/Loss": 1.9785006046295166, "Pretrain/Loss (Raw)": 1.838504433631897, "Pretrain/Step": 5486, "Pretrain/Step Time": 8.708639223128557} +{"Pretrain/Learning Rate": 2.014512209848512e-05, "Pretrain/Loss": 1.9792122840881348, "Pretrain/Loss (Raw)": 2.1715052127838135, "Pretrain/Step": 5487, "Pretrain/Step Time": 8.70449928380549} +{"Pretrain/Learning Rate": 2.013679412782331e-05, "Pretrain/Loss": 1.9810279607772827, "Pretrain/Loss (Raw)": 2.1230499744415283, "Pretrain/Step": 5488, "Pretrain/Step Time": 8.701905958354473} +{"Pretrain/Learning Rate": 2.0128466718009313e-05, "Pretrain/Loss": 1.9847924709320068, "Pretrain/Loss (Raw)": 2.1566452980041504, "Pretrain/Step": 5489, "Pretrain/Step Time": 8.701694123446941} +{"Pretrain/Learning Rate": 2.0120139870003492e-05, "Pretrain/Loss": 1.9831132888793945, "Pretrain/Loss (Raw)": 1.8073993921279907, "Pretrain/Step": 5490, "Pretrain/Step Time": 8.702269183471799} +{"Pretrain/Learning Rate": 2.0111813584766134e-05, "Pretrain/Loss": 1.9803664684295654, "Pretrain/Loss (Raw)": 1.7118464708328247, "Pretrain/Step": 5491, "Pretrain/Step Time": 8.70862645842135} +{"Pretrain/Learning Rate": 2.010348786325747e-05, "Pretrain/Loss": 1.9836372137069702, "Pretrain/Loss (Raw)": 2.1391994953155518, "Pretrain/Step": 5492, "Pretrain/Step Time": 8.706906627863646} +{"Pretrain/Learning Rate": 2.0095162706437655e-05, "Pretrain/Loss": 1.9839181900024414, "Pretrain/Loss (Raw)": 1.9727493524551392, "Pretrain/Step": 5493, "Pretrain/Step Time": 8.705713113769889} +{"Pretrain/Learning Rate": 2.0086838115266794e-05, "Pretrain/Loss": 1.984795093536377, "Pretrain/Loss (Raw)": 2.082606792449951, "Pretrain/Step": 5494, "Pretrain/Step Time": 8.703144785016775} +{"Pretrain/Learning Rate": 2.007851409070491e-05, "Pretrain/Loss": 1.9853320121765137, "Pretrain/Loss (Raw)": 2.0514798164367676, "Pretrain/Step": 5495, "Pretrain/Step Time": 8.707902073860168} +{"Pretrain/Learning Rate": 2.007019063371197e-05, "Pretrain/Loss": 1.9841252565383911, "Pretrain/Loss (Raw)": 1.940818190574646, "Pretrain/Step": 5496, "Pretrain/Step Time": 8.70829469896853} +{"Pretrain/Learning Rate": 2.006186774524788e-05, "Pretrain/Loss": 1.9854280948638916, "Pretrain/Loss (Raw)": 2.1608636379241943, "Pretrain/Step": 5497, "Pretrain/Step Time": 8.708238253369927} +{"Pretrain/Learning Rate": 2.005354542627247e-05, "Pretrain/Loss": 1.987276315689087, "Pretrain/Loss (Raw)": 2.088742733001709, "Pretrain/Step": 5498, "Pretrain/Step Time": 8.709487050771713} +{"Pretrain/Learning Rate": 2.0045223677745507e-05, "Pretrain/Loss": 1.9879035949707031, "Pretrain/Loss (Raw)": 1.9355157613754272, "Pretrain/Step": 5499, "Pretrain/Step Time": 8.707452865317464} +{"Pretrain/Learning Rate": 2.0036902500626704e-05, "Pretrain/Loss": 1.9867279529571533, "Pretrain/Loss (Raw)": 1.9511213302612305, "Pretrain/Step": 5500, "Pretrain/Step Time": 8.706465506926179} +{"Pretrain/Learning Rate": 2.002858189587568e-05, "Pretrain/Loss": 1.989319086074829, "Pretrain/Loss (Raw)": 2.1146767139434814, "Pretrain/Step": 5501, "Pretrain/Step Time": 8.702855696901679} +{"Pretrain/Learning Rate": 2.002026186445203e-05, "Pretrain/Loss": 1.9883177280426025, "Pretrain/Loss (Raw)": 1.821144461631775, "Pretrain/Step": 5502, "Pretrain/Step Time": 8.70393743738532} +{"Pretrain/Learning Rate": 2.0011942407315236e-05, "Pretrain/Loss": 1.9880561828613281, "Pretrain/Loss (Raw)": 2.0041911602020264, "Pretrain/Step": 5503, "Pretrain/Step Time": 8.704198155552149} +{"Pretrain/Learning Rate": 2.0003623525424758e-05, "Pretrain/Loss": 1.987821340560913, "Pretrain/Loss (Raw)": 1.8974206447601318, "Pretrain/Step": 5504, "Pretrain/Step Time": 8.702372282743454} +{"Pretrain/Learning Rate": 1.9995305219739952e-05, "Pretrain/Loss": 1.9859731197357178, "Pretrain/Loss (Raw)": 1.9195741415023804, "Pretrain/Step": 5505, "Pretrain/Step Time": 8.702615359798074} +{"Pretrain/Learning Rate": 1.9986987491220137e-05, "Pretrain/Loss": 1.9824943542480469, "Pretrain/Loss (Raw)": 1.4840761423110962, "Pretrain/Step": 5506, "Pretrain/Step Time": 8.702835112810135} +{"Pretrain/Learning Rate": 1.997867034082454e-05, "Pretrain/Loss": 1.9830251932144165, "Pretrain/Loss (Raw)": 2.0027809143066406, "Pretrain/Step": 5507, "Pretrain/Step Time": 8.706793125718832} +{"Pretrain/Learning Rate": 1.997035376951234e-05, "Pretrain/Loss": 1.9824938774108887, "Pretrain/Loss (Raw)": 2.019212007522583, "Pretrain/Step": 5508, "Pretrain/Step Time": 8.702272664755583} +{"Pretrain/Learning Rate": 1.996203777824265e-05, "Pretrain/Loss": 1.9867908954620361, "Pretrain/Loss (Raw)": 2.185908079147339, "Pretrain/Step": 5509, "Pretrain/Step Time": 8.71120249480009} +{"Pretrain/Learning Rate": 1.99537223679745e-05, "Pretrain/Loss": 1.9856021404266357, "Pretrain/Loss (Raw)": 1.9173730611801147, "Pretrain/Step": 5510, "Pretrain/Step Time": 8.713062850758433} +{"Pretrain/Learning Rate": 1.994540753966687e-05, "Pretrain/Loss": 1.983726978302002, "Pretrain/Loss (Raw)": 1.894450068473816, "Pretrain/Step": 5511, "Pretrain/Step Time": 8.70935677178204} +{"Pretrain/Learning Rate": 1.9937093294278653e-05, "Pretrain/Loss": 1.9838703870773315, "Pretrain/Loss (Raw)": 1.9795492887496948, "Pretrain/Step": 5512, "Pretrain/Step Time": 8.711286894977093} +{"Pretrain/Learning Rate": 1.99287796327687e-05, "Pretrain/Loss": 1.9798986911773682, "Pretrain/Loss (Raw)": 1.529117465019226, "Pretrain/Step": 5513, "Pretrain/Step Time": 8.711190050467849} +{"Pretrain/Learning Rate": 1.9920466556095772e-05, "Pretrain/Loss": 1.9772422313690186, "Pretrain/Loss (Raw)": 2.065762996673584, "Pretrain/Step": 5514, "Pretrain/Step Time": 8.714688090607524} +{"Pretrain/Learning Rate": 1.991215406521858e-05, "Pretrain/Loss": 1.9763009548187256, "Pretrain/Loss (Raw)": 1.757577657699585, "Pretrain/Step": 5515, "Pretrain/Step Time": 8.713202262297273} +{"Pretrain/Learning Rate": 1.9903842161095752e-05, "Pretrain/Loss": 1.9763214588165283, "Pretrain/Loss (Raw)": 2.0805444717407227, "Pretrain/Step": 5516, "Pretrain/Step Time": 8.714826703071594} +{"Pretrain/Learning Rate": 1.9895530844685865e-05, "Pretrain/Loss": 1.973914623260498, "Pretrain/Loss (Raw)": 1.8483474254608154, "Pretrain/Step": 5517, "Pretrain/Step Time": 8.710902599617839} +{"Pretrain/Learning Rate": 1.988722011694741e-05, "Pretrain/Loss": 1.976110577583313, "Pretrain/Loss (Raw)": 2.1307859420776367, "Pretrain/Step": 5518, "Pretrain/Step Time": 8.713616378605366} +{"Pretrain/Learning Rate": 1.987890997883883e-05, "Pretrain/Loss": 1.97662353515625, "Pretrain/Loss (Raw)": 1.9037704467773438, "Pretrain/Step": 5519, "Pretrain/Step Time": 8.71506691351533} +{"Pretrain/Learning Rate": 1.987060043131847e-05, "Pretrain/Loss": 1.9736014604568481, "Pretrain/Loss (Raw)": 1.813727855682373, "Pretrain/Step": 5520, "Pretrain/Step Time": 8.714149525389075} +{"Pretrain/Learning Rate": 1.9862291475344654e-05, "Pretrain/Loss": 1.971805214881897, "Pretrain/Loss (Raw)": 1.6585971117019653, "Pretrain/Step": 5521, "Pretrain/Step Time": 8.712830929085612} +{"Pretrain/Learning Rate": 1.985398311187558e-05, "Pretrain/Loss": 1.970559000968933, "Pretrain/Loss (Raw)": 1.759863257408142, "Pretrain/Step": 5522, "Pretrain/Step Time": 8.716274404898286} +{"Pretrain/Learning Rate": 1.9845675341869437e-05, "Pretrain/Loss": 1.9717929363250732, "Pretrain/Loss (Raw)": 1.9992717504501343, "Pretrain/Step": 5523, "Pretrain/Step Time": 8.715806046500802} +{"Pretrain/Learning Rate": 1.9837368166284284e-05, "Pretrain/Loss": 1.9739513397216797, "Pretrain/Loss (Raw)": 2.2269561290740967, "Pretrain/Step": 5524, "Pretrain/Step Time": 8.713085046038032} +{"Pretrain/Learning Rate": 1.982906158607818e-05, "Pretrain/Loss": 1.9711709022521973, "Pretrain/Loss (Raw)": 1.8119266033172607, "Pretrain/Step": 5525, "Pretrain/Step Time": 8.715613886713982} +{"Pretrain/Learning Rate": 1.982075560220904e-05, "Pretrain/Loss": 1.9730350971221924, "Pretrain/Loss (Raw)": 2.2104640007019043, "Pretrain/Step": 5526, "Pretrain/Step Time": 8.716219874098897} +{"Pretrain/Learning Rate": 1.981245021563479e-05, "Pretrain/Loss": 1.9732028245925903, "Pretrain/Loss (Raw)": 2.0524611473083496, "Pretrain/Step": 5527, "Pretrain/Step Time": 8.717359628528357} +{"Pretrain/Learning Rate": 1.9804145427313213e-05, "Pretrain/Loss": 1.9755098819732666, "Pretrain/Loss (Raw)": 2.231546640396118, "Pretrain/Step": 5528, "Pretrain/Step Time": 8.713880212977529} +{"Pretrain/Learning Rate": 1.9795841238202077e-05, "Pretrain/Loss": 1.9733998775482178, "Pretrain/Loss (Raw)": 1.901288628578186, "Pretrain/Step": 5529, "Pretrain/Step Time": 8.71949877589941} +{"Pretrain/Learning Rate": 1.9787537649259043e-05, "Pretrain/Loss": 1.9730079174041748, "Pretrain/Loss (Raw)": 1.790728211402893, "Pretrain/Step": 5530, "Pretrain/Step Time": 8.718964584171772} +{"Pretrain/Learning Rate": 1.977923466144174e-05, "Pretrain/Loss": 1.9742603302001953, "Pretrain/Loss (Raw)": 2.247730255126953, "Pretrain/Step": 5531, "Pretrain/Step Time": 8.723255043849349} +{"Pretrain/Learning Rate": 1.977093227570768e-05, "Pretrain/Loss": 1.9743403196334839, "Pretrain/Loss (Raw)": 1.9794481992721558, "Pretrain/Step": 5532, "Pretrain/Step Time": 8.731430508196354} +{"Pretrain/Learning Rate": 1.9762630493014366e-05, "Pretrain/Loss": 1.9753786325454712, "Pretrain/Loss (Raw)": 2.1412453651428223, "Pretrain/Step": 5533, "Pretrain/Step Time": 8.726589584723115} +{"Pretrain/Learning Rate": 1.9754329314319176e-05, "Pretrain/Loss": 1.9748629331588745, "Pretrain/Loss (Raw)": 2.028310775756836, "Pretrain/Step": 5534, "Pretrain/Step Time": 8.728490557521582} +{"Pretrain/Learning Rate": 1.974602874057945e-05, "Pretrain/Loss": 1.974578857421875, "Pretrain/Loss (Raw)": 1.9543719291687012, "Pretrain/Step": 5535, "Pretrain/Step Time": 8.728953622281551} +{"Pretrain/Learning Rate": 1.9737728772752446e-05, "Pretrain/Loss": 1.9758819341659546, "Pretrain/Loss (Raw)": 2.1364357471466064, "Pretrain/Step": 5536, "Pretrain/Step Time": 8.738146748393774} +{"Pretrain/Learning Rate": 1.9729429411795358e-05, "Pretrain/Loss": 1.975494146347046, "Pretrain/Loss (Raw)": 1.9254199266433716, "Pretrain/Step": 5537, "Pretrain/Step Time": 8.739932743832469} +{"Pretrain/Learning Rate": 1.97211306586653e-05, "Pretrain/Loss": 1.9751830101013184, "Pretrain/Loss (Raw)": 2.0595600605010986, "Pretrain/Step": 5538, "Pretrain/Step Time": 8.74057112634182} +{"Pretrain/Learning Rate": 1.971283251431934e-05, "Pretrain/Loss": 1.9765751361846924, "Pretrain/Loss (Raw)": 1.9348245859146118, "Pretrain/Step": 5539, "Pretrain/Step Time": 8.738758759573102} +{"Pretrain/Learning Rate": 1.970453497971444e-05, "Pretrain/Loss": 1.970197081565857, "Pretrain/Loss (Raw)": 1.3378748893737793, "Pretrain/Step": 5540, "Pretrain/Step Time": 8.741552878171206} +{"Pretrain/Learning Rate": 1.969623805580752e-05, "Pretrain/Loss": 1.9695338010787964, "Pretrain/Loss (Raw)": 1.919467568397522, "Pretrain/Step": 5541, "Pretrain/Step Time": 8.744439728558064} +{"Pretrain/Learning Rate": 1.9687941743555422e-05, "Pretrain/Loss": 1.9668607711791992, "Pretrain/Loss (Raw)": 1.7364368438720703, "Pretrain/Step": 5542, "Pretrain/Step Time": 8.741795312613249} +{"Pretrain/Learning Rate": 1.9679646043914914e-05, "Pretrain/Loss": 1.966670274734497, "Pretrain/Loss (Raw)": 1.9113408327102661, "Pretrain/Step": 5543, "Pretrain/Step Time": 8.75071033462882} +{"Pretrain/Learning Rate": 1.967135095784269e-05, "Pretrain/Loss": 1.9713531732559204, "Pretrain/Loss (Raw)": 2.103936195373535, "Pretrain/Step": 5544, "Pretrain/Step Time": 8.74450564570725} +{"Pretrain/Learning Rate": 1.966305648629539e-05, "Pretrain/Loss": 1.9721570014953613, "Pretrain/Loss (Raw)": 2.0220389366149902, "Pretrain/Step": 5545, "Pretrain/Step Time": 8.745045647025108} +{"Pretrain/Learning Rate": 1.9654762630229558e-05, "Pretrain/Loss": 1.972291111946106, "Pretrain/Loss (Raw)": 1.9244410991668701, "Pretrain/Step": 5546, "Pretrain/Step Time": 8.75061235204339} +{"Pretrain/Learning Rate": 1.9646469390601692e-05, "Pretrain/Loss": 1.972896933555603, "Pretrain/Loss (Raw)": 1.9301135540008545, "Pretrain/Step": 5547, "Pretrain/Step Time": 8.748611411079764} +{"Pretrain/Learning Rate": 1.96381767683682e-05, "Pretrain/Loss": 1.973738193511963, "Pretrain/Loss (Raw)": 2.0165257453918457, "Pretrain/Step": 5548, "Pretrain/Step Time": 8.749200396239758} +{"Pretrain/Learning Rate": 1.9629884764485422e-05, "Pretrain/Loss": 1.9746553897857666, "Pretrain/Loss (Raw)": 2.0812535285949707, "Pretrain/Step": 5549, "Pretrain/Step Time": 8.751821104437113} +{"Pretrain/Learning Rate": 1.962159337990965e-05, "Pretrain/Loss": 1.9754360914230347, "Pretrain/Loss (Raw)": 2.0910532474517822, "Pretrain/Step": 5550, "Pretrain/Step Time": 8.752500185742974} +{"Pretrain/Learning Rate": 1.9613302615597064e-05, "Pretrain/Loss": 1.9769597053527832, "Pretrain/Loss (Raw)": 2.170408010482788, "Pretrain/Step": 5551, "Pretrain/Step Time": 8.75812890380621} +{"Pretrain/Learning Rate": 1.960501247250381e-05, "Pretrain/Loss": 1.977501630783081, "Pretrain/Loss (Raw)": 1.9724931716918945, "Pretrain/Step": 5552, "Pretrain/Step Time": 8.75976461544633} +{"Pretrain/Learning Rate": 1.9596722951585936e-05, "Pretrain/Loss": 1.9775943756103516, "Pretrain/Loss (Raw)": 1.9085590839385986, "Pretrain/Step": 5553, "Pretrain/Step Time": 8.761406999081373} +{"Pretrain/Learning Rate": 1.9588434053799437e-05, "Pretrain/Loss": 1.97737455368042, "Pretrain/Loss (Raw)": 2.0386085510253906, "Pretrain/Step": 5554, "Pretrain/Step Time": 8.759343389421701} +{"Pretrain/Learning Rate": 1.9580145780100216e-05, "Pretrain/Loss": 1.9783446788787842, "Pretrain/Loss (Raw)": 2.1058075428009033, "Pretrain/Step": 5555, "Pretrain/Step Time": 8.756750043481588} +{"Pretrain/Learning Rate": 1.9571858131444128e-05, "Pretrain/Loss": 1.9786213636398315, "Pretrain/Loss (Raw)": 1.9453721046447754, "Pretrain/Step": 5556, "Pretrain/Step Time": 8.763868022710085} +{"Pretrain/Learning Rate": 1.9563571108786936e-05, "Pretrain/Loss": 1.9762098789215088, "Pretrain/Loss (Raw)": 1.834234595298767, "Pretrain/Step": 5557, "Pretrain/Step Time": 8.766019776463509} +{"Pretrain/Learning Rate": 1.9555284713084345e-05, "Pretrain/Loss": 1.9772608280181885, "Pretrain/Loss (Raw)": 2.0839955806732178, "Pretrain/Step": 5558, "Pretrain/Step Time": 8.762087877839804} +{"Pretrain/Learning Rate": 1.954699894529197e-05, "Pretrain/Loss": 1.976724624633789, "Pretrain/Loss (Raw)": 1.6790690422058105, "Pretrain/Step": 5559, "Pretrain/Step Time": 8.760418202728033} +{"Pretrain/Learning Rate": 1.953871380636538e-05, "Pretrain/Loss": 1.9830840826034546, "Pretrain/Loss (Raw)": 2.2715961933135986, "Pretrain/Step": 5560, "Pretrain/Step Time": 8.762526165693998} +{"Pretrain/Learning Rate": 1.953042929726004e-05, "Pretrain/Loss": 1.9816653728485107, "Pretrain/Loss (Raw)": 1.8873907327651978, "Pretrain/Step": 5561, "Pretrain/Step Time": 8.762129247188568} +{"Pretrain/Learning Rate": 1.952214541893138e-05, "Pretrain/Loss": 1.9805171489715576, "Pretrain/Loss (Raw)": 1.8073545694351196, "Pretrain/Step": 5562, "Pretrain/Step Time": 8.766769794747233} +{"Pretrain/Learning Rate": 1.9513862172334707e-05, "Pretrain/Loss": 1.981740951538086, "Pretrain/Loss (Raw)": 2.062688112258911, "Pretrain/Step": 5563, "Pretrain/Step Time": 8.774127406999469} +{"Pretrain/Learning Rate": 1.9505579558425313e-05, "Pretrain/Loss": 1.9811128377914429, "Pretrain/Loss (Raw)": 2.1278958320617676, "Pretrain/Step": 5564, "Pretrain/Step Time": 8.760963594540954} +{"Pretrain/Learning Rate": 1.9497297578158363e-05, "Pretrain/Loss": 1.9807422161102295, "Pretrain/Loss (Raw)": 2.052476644515991, "Pretrain/Step": 5565, "Pretrain/Step Time": 8.763504536822438} +{"Pretrain/Learning Rate": 1.9489016232489e-05, "Pretrain/Loss": 1.9820556640625, "Pretrain/Loss (Raw)": 2.058135509490967, "Pretrain/Step": 5566, "Pretrain/Step Time": 8.761096253991127} +{"Pretrain/Learning Rate": 1.9480735522372236e-05, "Pretrain/Loss": 1.9815115928649902, "Pretrain/Loss (Raw)": 1.6933728456497192, "Pretrain/Step": 5567, "Pretrain/Step Time": 8.768524218350649} +{"Pretrain/Learning Rate": 1.9472455448763077e-05, "Pretrain/Loss": 1.9810142517089844, "Pretrain/Loss (Raw)": 1.944329023361206, "Pretrain/Step": 5568, "Pretrain/Step Time": 8.764391131699085} +{"Pretrain/Learning Rate": 1.9464176012616386e-05, "Pretrain/Loss": 1.9836336374282837, "Pretrain/Loss (Raw)": 2.1314170360565186, "Pretrain/Step": 5569, "Pretrain/Step Time": 8.766010228544474} +{"Pretrain/Learning Rate": 1.945589721488702e-05, "Pretrain/Loss": 1.983597993850708, "Pretrain/Loss (Raw)": 2.015495538711548, "Pretrain/Step": 5570, "Pretrain/Step Time": 8.767864527180791} +{"Pretrain/Learning Rate": 1.9447619056529697e-05, "Pretrain/Loss": 1.9815011024475098, "Pretrain/Loss (Raw)": 1.7201955318450928, "Pretrain/Step": 5571, "Pretrain/Step Time": 8.768301432952285} +{"Pretrain/Learning Rate": 1.9439341538499117e-05, "Pretrain/Loss": 1.9794795513153076, "Pretrain/Loss (Raw)": 1.7628358602523804, "Pretrain/Step": 5572, "Pretrain/Step Time": 8.772698570042849} +{"Pretrain/Learning Rate": 1.9431064661749866e-05, "Pretrain/Loss": 1.9806785583496094, "Pretrain/Loss (Raw)": 2.1438820362091064, "Pretrain/Step": 5573, "Pretrain/Step Time": 8.755262734368443} +{"Pretrain/Learning Rate": 1.9422788427236487e-05, "Pretrain/Loss": 1.9803721904754639, "Pretrain/Loss (Raw)": 1.9705227613449097, "Pretrain/Step": 5574, "Pretrain/Step Time": 8.755886631086469} +{"Pretrain/Learning Rate": 1.9414512835913422e-05, "Pretrain/Loss": 1.9804985523223877, "Pretrain/Loss (Raw)": 2.0151665210723877, "Pretrain/Step": 5575, "Pretrain/Step Time": 8.755163261666894} +{"Pretrain/Learning Rate": 1.940623788873506e-05, "Pretrain/Loss": 1.9802874326705933, "Pretrain/Loss (Raw)": 1.943033218383789, "Pretrain/Step": 5576, "Pretrain/Step Time": 8.752330528572202} +{"Pretrain/Learning Rate": 1.9397963586655702e-05, "Pretrain/Loss": 1.9813525676727295, "Pretrain/Loss (Raw)": 2.054356813430786, "Pretrain/Step": 5577, "Pretrain/Step Time": 8.755936032161117} +{"Pretrain/Learning Rate": 1.9389689930629585e-05, "Pretrain/Loss": 1.9798048734664917, "Pretrain/Loss (Raw)": 1.935152292251587, "Pretrain/Step": 5578, "Pretrain/Step Time": 8.758437912911177} +{"Pretrain/Learning Rate": 1.9381416921610855e-05, "Pretrain/Loss": 1.9788219928741455, "Pretrain/Loss (Raw)": 1.9217379093170166, "Pretrain/Step": 5579, "Pretrain/Step Time": 8.75973828881979} +{"Pretrain/Learning Rate": 1.9373144560553604e-05, "Pretrain/Loss": 1.9745041131973267, "Pretrain/Loss (Raw)": 1.5520299673080444, "Pretrain/Step": 5580, "Pretrain/Step Time": 8.758323257789016} +{"Pretrain/Learning Rate": 1.9364872848411837e-05, "Pretrain/Loss": 1.9723634719848633, "Pretrain/Loss (Raw)": 1.8890480995178223, "Pretrain/Step": 5581, "Pretrain/Step Time": 8.74995861388743} +{"Pretrain/Learning Rate": 1.9356601786139487e-05, "Pretrain/Loss": 1.9738457202911377, "Pretrain/Loss (Raw)": 2.075240135192871, "Pretrain/Step": 5582, "Pretrain/Step Time": 8.749095788225532} +{"Pretrain/Learning Rate": 1.934833137469041e-05, "Pretrain/Loss": 1.9724102020263672, "Pretrain/Loss (Raw)": 1.8626701831817627, "Pretrain/Step": 5583, "Pretrain/Step Time": 8.74765807390213} +{"Pretrain/Learning Rate": 1.9340061615018393e-05, "Pretrain/Loss": 1.9757778644561768, "Pretrain/Loss (Raw)": 2.1295669078826904, "Pretrain/Step": 5584, "Pretrain/Step Time": 8.744934413582087} +{"Pretrain/Learning Rate": 1.9331792508077136e-05, "Pretrain/Loss": 1.975510597229004, "Pretrain/Loss (Raw)": 1.9234627485275269, "Pretrain/Step": 5585, "Pretrain/Step Time": 8.743244472891092} +{"Pretrain/Learning Rate": 1.9323524054820285e-05, "Pretrain/Loss": 1.9775891304016113, "Pretrain/Loss (Raw)": 2.254070997238159, "Pretrain/Step": 5586, "Pretrain/Step Time": 8.742352830246091} +{"Pretrain/Learning Rate": 1.9315256256201382e-05, "Pretrain/Loss": 1.9771329164505005, "Pretrain/Loss (Raw)": 1.8984777927398682, "Pretrain/Step": 5587, "Pretrain/Step Time": 8.743163004517555} +{"Pretrain/Learning Rate": 1.930698911317392e-05, "Pretrain/Loss": 1.9784005880355835, "Pretrain/Loss (Raw)": 2.1799864768981934, "Pretrain/Step": 5588, "Pretrain/Step Time": 8.741684349253774} +{"Pretrain/Learning Rate": 1.929872262669129e-05, "Pretrain/Loss": 1.9757503271102905, "Pretrain/Loss (Raw)": 1.753002643585205, "Pretrain/Step": 5589, "Pretrain/Step Time": 8.737421745434403} +{"Pretrain/Learning Rate": 1.9290456797706835e-05, "Pretrain/Loss": 1.978164553642273, "Pretrain/Loss (Raw)": 2.49308443069458, "Pretrain/Step": 5590, "Pretrain/Step Time": 8.738590942695737} +{"Pretrain/Learning Rate": 1.928219162717381e-05, "Pretrain/Loss": 1.9756381511688232, "Pretrain/Loss (Raw)": 1.813667893409729, "Pretrain/Step": 5591, "Pretrain/Step Time": 8.739815780892968} +{"Pretrain/Learning Rate": 1.927392711604539e-05, "Pretrain/Loss": 1.9745514392852783, "Pretrain/Loss (Raw)": 1.929619312286377, "Pretrain/Step": 5592, "Pretrain/Step Time": 8.734101835638285} +{"Pretrain/Learning Rate": 1.926566326527468e-05, "Pretrain/Loss": 1.97358238697052, "Pretrain/Loss (Raw)": 1.891238808631897, "Pretrain/Step": 5593, "Pretrain/Step Time": 8.742628928273916} +{"Pretrain/Learning Rate": 1.9257400075814697e-05, "Pretrain/Loss": 1.9734597206115723, "Pretrain/Loss (Raw)": 2.0256433486938477, "Pretrain/Step": 5594, "Pretrain/Step Time": 8.739399978891015} +{"Pretrain/Learning Rate": 1.92491375486184e-05, "Pretrain/Loss": 1.9739866256713867, "Pretrain/Loss (Raw)": 1.9011479616165161, "Pretrain/Step": 5595, "Pretrain/Step Time": 8.73579584993422} +{"Pretrain/Learning Rate": 1.9240875684638658e-05, "Pretrain/Loss": 1.974450945854187, "Pretrain/Loss (Raw)": 2.0799951553344727, "Pretrain/Step": 5596, "Pretrain/Step Time": 8.736333036795259} +{"Pretrain/Learning Rate": 1.9232614484828277e-05, "Pretrain/Loss": 1.971800446510315, "Pretrain/Loss (Raw)": 1.6378954648971558, "Pretrain/Step": 5597, "Pretrain/Step Time": 8.741032667458057} +{"Pretrain/Learning Rate": 1.922435395013996e-05, "Pretrain/Loss": 1.97274911403656, "Pretrain/Loss (Raw)": 2.0530507564544678, "Pretrain/Step": 5598, "Pretrain/Step Time": 8.738761894404888} +{"Pretrain/Learning Rate": 1.921609408152637e-05, "Pretrain/Loss": 1.9739580154418945, "Pretrain/Loss (Raw)": 1.951984167098999, "Pretrain/Step": 5599, "Pretrain/Step Time": 8.739731950685382} +{"Pretrain/Learning Rate": 1.9207834879940058e-05, "Pretrain/Loss": 1.9713480472564697, "Pretrain/Loss (Raw)": 1.7315205335617065, "Pretrain/Step": 5600, "Pretrain/Step Time": 8.740802243351936} +{"Pretrain/Learning Rate": 1.919957634633353e-05, "Pretrain/Loss": 1.9710371494293213, "Pretrain/Loss (Raw)": 2.011007308959961, "Pretrain/Step": 5601, "Pretrain/Step Time": 8.732529439032078} +{"Pretrain/Learning Rate": 1.9191318481659183e-05, "Pretrain/Loss": 1.9729326963424683, "Pretrain/Loss (Raw)": 2.1209752559661865, "Pretrain/Step": 5602, "Pretrain/Step Time": 8.733716739341617} +{"Pretrain/Learning Rate": 1.918306128686937e-05, "Pretrain/Loss": 1.9714832305908203, "Pretrain/Loss (Raw)": 2.0834333896636963, "Pretrain/Step": 5603, "Pretrain/Step Time": 8.735163850709796} +{"Pretrain/Learning Rate": 1.9174804762916324e-05, "Pretrain/Loss": 1.9727613925933838, "Pretrain/Loss (Raw)": 2.1533524990081787, "Pretrain/Step": 5604, "Pretrain/Step Time": 8.73650081641972} +{"Pretrain/Learning Rate": 1.916654891075226e-05, "Pretrain/Loss": 1.9694700241088867, "Pretrain/Loss (Raw)": 1.7286840677261353, "Pretrain/Step": 5605, "Pretrain/Step Time": 8.731508070603013} +{"Pretrain/Learning Rate": 1.915829373132924e-05, "Pretrain/Loss": 1.9709765911102295, "Pretrain/Loss (Raw)": 2.041802167892456, "Pretrain/Step": 5606, "Pretrain/Step Time": 8.732119590044022} +{"Pretrain/Learning Rate": 1.9150039225599336e-05, "Pretrain/Loss": 1.9710958003997803, "Pretrain/Loss (Raw)": 1.9072762727737427, "Pretrain/Step": 5607, "Pretrain/Step Time": 8.730073627084494} +{"Pretrain/Learning Rate": 1.914178539451446e-05, "Pretrain/Loss": 1.9693129062652588, "Pretrain/Loss (Raw)": 1.8637747764587402, "Pretrain/Step": 5608, "Pretrain/Step Time": 8.729753525927663} +{"Pretrain/Learning Rate": 1.913353223902651e-05, "Pretrain/Loss": 1.9691294431686401, "Pretrain/Loss (Raw)": 1.9723305702209473, "Pretrain/Step": 5609, "Pretrain/Step Time": 8.735517118126154} +{"Pretrain/Learning Rate": 1.912527976008725e-05, "Pretrain/Loss": 1.9718596935272217, "Pretrain/Loss (Raw)": 2.329439163208008, "Pretrain/Step": 5610, "Pretrain/Step Time": 8.733269756659865} +{"Pretrain/Learning Rate": 1.911702795864843e-05, "Pretrain/Loss": 1.9731724262237549, "Pretrain/Loss (Raw)": 2.128122568130493, "Pretrain/Step": 5611, "Pretrain/Step Time": 8.732010258361697} +{"Pretrain/Learning Rate": 1.9108776835661655e-05, "Pretrain/Loss": 1.97097647190094, "Pretrain/Loss (Raw)": 1.9909783601760864, "Pretrain/Step": 5612, "Pretrain/Step Time": 8.73256953805685} +{"Pretrain/Learning Rate": 1.91005263920785e-05, "Pretrain/Loss": 1.9706650972366333, "Pretrain/Loss (Raw)": 2.0029990673065186, "Pretrain/Step": 5613, "Pretrain/Step Time": 8.72397924400866} +{"Pretrain/Learning Rate": 1.9092276628850438e-05, "Pretrain/Loss": 1.9706707000732422, "Pretrain/Loss (Raw)": 1.8392218351364136, "Pretrain/Step": 5614, "Pretrain/Step Time": 8.726176148280501} +{"Pretrain/Learning Rate": 1.9084027546928872e-05, "Pretrain/Loss": 1.9714804887771606, "Pretrain/Loss (Raw)": 2.2751715183258057, "Pretrain/Step": 5615, "Pretrain/Step Time": 8.736760647967458} +{"Pretrain/Learning Rate": 1.907577914726513e-05, "Pretrain/Loss": 1.9700229167938232, "Pretrain/Loss (Raw)": 1.9364547729492188, "Pretrain/Step": 5616, "Pretrain/Step Time": 8.732501884922385} +{"Pretrain/Learning Rate": 1.906753143081045e-05, "Pretrain/Loss": 1.9671906232833862, "Pretrain/Loss (Raw)": 1.794120192527771, "Pretrain/Step": 5617, "Pretrain/Step Time": 8.732627546414733} +{"Pretrain/Learning Rate": 1.9059284398515997e-05, "Pretrain/Loss": 1.9682505130767822, "Pretrain/Loss (Raw)": 1.9430739879608154, "Pretrain/Step": 5618, "Pretrain/Step Time": 8.732043555006385} +{"Pretrain/Learning Rate": 1.9051038051332868e-05, "Pretrain/Loss": 1.9708235263824463, "Pretrain/Loss (Raw)": 2.041194438934326, "Pretrain/Step": 5619, "Pretrain/Step Time": 8.726662235334516} +{"Pretrain/Learning Rate": 1.9042792390212054e-05, "Pretrain/Loss": 1.9689536094665527, "Pretrain/Loss (Raw)": 1.899839162826538, "Pretrain/Step": 5620, "Pretrain/Step Time": 8.728617025539279} +{"Pretrain/Learning Rate": 1.9034547416104502e-05, "Pretrain/Loss": 1.9703691005706787, "Pretrain/Loss (Raw)": 2.1539382934570312, "Pretrain/Step": 5621, "Pretrain/Step Time": 8.729079224169254} +{"Pretrain/Learning Rate": 1.9026303129961047e-05, "Pretrain/Loss": 1.963878870010376, "Pretrain/Loss (Raw)": 1.2518528699874878, "Pretrain/Step": 5622, "Pretrain/Step Time": 8.725581912323833} +{"Pretrain/Learning Rate": 1.901805953273247e-05, "Pretrain/Loss": 1.9646011590957642, "Pretrain/Loss (Raw)": 2.1439406871795654, "Pretrain/Step": 5623, "Pretrain/Step Time": 8.721192706376314} +{"Pretrain/Learning Rate": 1.900981662536945e-05, "Pretrain/Loss": 1.9629193544387817, "Pretrain/Loss (Raw)": 1.725540280342102, "Pretrain/Step": 5624, "Pretrain/Step Time": 8.724090220406651} +{"Pretrain/Learning Rate": 1.9001574408822603e-05, "Pretrain/Loss": 1.960957646369934, "Pretrain/Loss (Raw)": 1.9097626209259033, "Pretrain/Step": 5625, "Pretrain/Step Time": 8.72432536445558} +{"Pretrain/Learning Rate": 1.899333288404246e-05, "Pretrain/Loss": 1.9601811170578003, "Pretrain/Loss (Raw)": 1.989349126815796, "Pretrain/Step": 5626, "Pretrain/Step Time": 8.722045646980405} +{"Pretrain/Learning Rate": 1.8985092051979478e-05, "Pretrain/Loss": 1.9601609706878662, "Pretrain/Loss (Raw)": 1.9329296350479126, "Pretrain/Step": 5627, "Pretrain/Step Time": 8.720581602305174} +{"Pretrain/Learning Rate": 1.897685191358402e-05, "Pretrain/Loss": 1.9626027345657349, "Pretrain/Loss (Raw)": 2.263671636581421, "Pretrain/Step": 5628, "Pretrain/Step Time": 8.719443997368217} +{"Pretrain/Learning Rate": 1.8968612469806387e-05, "Pretrain/Loss": 1.9602079391479492, "Pretrain/Loss (Raw)": 1.8081532716751099, "Pretrain/Step": 5629, "Pretrain/Step Time": 8.720429547131062} +{"Pretrain/Learning Rate": 1.8960373721596775e-05, "Pretrain/Loss": 1.9600207805633545, "Pretrain/Loss (Raw)": 1.7971733808517456, "Pretrain/Step": 5630, "Pretrain/Step Time": 8.720083624124527} +{"Pretrain/Learning Rate": 1.8952135669905334e-05, "Pretrain/Loss": 1.959053874015808, "Pretrain/Loss (Raw)": 1.8804436922073364, "Pretrain/Step": 5631, "Pretrain/Step Time": 8.719377541914582} +{"Pretrain/Learning Rate": 1.89438983156821e-05, "Pretrain/Loss": 1.9590485095977783, "Pretrain/Loss (Raw)": 1.8967214822769165, "Pretrain/Step": 5632, "Pretrain/Step Time": 8.715412057936192} +{"Pretrain/Learning Rate": 1.8935661659877046e-05, "Pretrain/Loss": 1.9599153995513916, "Pretrain/Loss (Raw)": 2.0305473804473877, "Pretrain/Step": 5633, "Pretrain/Step Time": 8.715034699067473} +{"Pretrain/Learning Rate": 1.8927425703440076e-05, "Pretrain/Loss": 1.963669776916504, "Pretrain/Loss (Raw)": 1.9646275043487549, "Pretrain/Step": 5634, "Pretrain/Step Time": 8.717366078868508} +{"Pretrain/Learning Rate": 1.8919190447320982e-05, "Pretrain/Loss": 1.963571548461914, "Pretrain/Loss (Raw)": 1.9902172088623047, "Pretrain/Step": 5635, "Pretrain/Step Time": 8.71529757976532} +{"Pretrain/Learning Rate": 1.8910955892469505e-05, "Pretrain/Loss": 1.9638874530792236, "Pretrain/Loss (Raw)": 2.059638023376465, "Pretrain/Step": 5636, "Pretrain/Step Time": 8.717805314809084} +{"Pretrain/Learning Rate": 1.890272203983528e-05, "Pretrain/Loss": 1.9583451747894287, "Pretrain/Loss (Raw)": 1.4764915704727173, "Pretrain/Step": 5637, "Pretrain/Step Time": 8.709255088120699} +{"Pretrain/Learning Rate": 1.8894488890367885e-05, "Pretrain/Loss": 1.9601316452026367, "Pretrain/Loss (Raw)": 2.146047592163086, "Pretrain/Step": 5638, "Pretrain/Step Time": 8.704709108918905} +{"Pretrain/Learning Rate": 1.8886256445016798e-05, "Pretrain/Loss": 1.9619855880737305, "Pretrain/Loss (Raw)": 2.131755828857422, "Pretrain/Step": 5639, "Pretrain/Step Time": 8.710980407893658} +{"Pretrain/Learning Rate": 1.8878024704731433e-05, "Pretrain/Loss": 1.962834119796753, "Pretrain/Loss (Raw)": 2.0881569385528564, "Pretrain/Step": 5640, "Pretrain/Step Time": 8.707708088681102} +{"Pretrain/Learning Rate": 1.88697936704611e-05, "Pretrain/Loss": 1.9647903442382812, "Pretrain/Loss (Raw)": 1.7795168161392212, "Pretrain/Step": 5641, "Pretrain/Step Time": 8.708428051322699} +{"Pretrain/Learning Rate": 1.8861563343155054e-05, "Pretrain/Loss": 1.9620893001556396, "Pretrain/Loss (Raw)": 1.720030665397644, "Pretrain/Step": 5642, "Pretrain/Step Time": 8.701833628118038} +{"Pretrain/Learning Rate": 1.8853333723762438e-05, "Pretrain/Loss": 1.9650214910507202, "Pretrain/Loss (Raw)": 2.132899284362793, "Pretrain/Step": 5643, "Pretrain/Step Time": 8.701889438554645} +{"Pretrain/Learning Rate": 1.884510481323236e-05, "Pretrain/Loss": 1.9632233381271362, "Pretrain/Loss (Raw)": 1.85038423538208, "Pretrain/Step": 5644, "Pretrain/Step Time": 8.698877442628145} +{"Pretrain/Learning Rate": 1.8836876612513777e-05, "Pretrain/Loss": 1.9650362730026245, "Pretrain/Loss (Raw)": 2.0804073810577393, "Pretrain/Step": 5645, "Pretrain/Step Time": 8.698577215895057} +{"Pretrain/Learning Rate": 1.882864912255564e-05, "Pretrain/Loss": 1.9637906551361084, "Pretrain/Loss (Raw)": 1.9713433980941772, "Pretrain/Step": 5646, "Pretrain/Step Time": 8.701330723240972} +{"Pretrain/Learning Rate": 1.882042234430675e-05, "Pretrain/Loss": 1.9651954174041748, "Pretrain/Loss (Raw)": 2.0835773944854736, "Pretrain/Step": 5647, "Pretrain/Step Time": 8.700346894562244} +{"Pretrain/Learning Rate": 1.8812196278715895e-05, "Pretrain/Loss": 1.9659581184387207, "Pretrain/Loss (Raw)": 1.9113515615463257, "Pretrain/Step": 5648, "Pretrain/Step Time": 8.700119022279978} +{"Pretrain/Learning Rate": 1.8803970926731703e-05, "Pretrain/Loss": 1.9684207439422607, "Pretrain/Loss (Raw)": 1.973809838294983, "Pretrain/Step": 5649, "Pretrain/Step Time": 8.69919053837657} +{"Pretrain/Learning Rate": 1.8795746289302798e-05, "Pretrain/Loss": 1.9706668853759766, "Pretrain/Loss (Raw)": 2.0473625659942627, "Pretrain/Step": 5650, "Pretrain/Step Time": 8.702016051858664} +{"Pretrain/Learning Rate": 1.878752236737765e-05, "Pretrain/Loss": 1.970214605331421, "Pretrain/Loss (Raw)": 1.9413846731185913, "Pretrain/Step": 5651, "Pretrain/Step Time": 8.703359389677644} +{"Pretrain/Learning Rate": 1.8779299161904712e-05, "Pretrain/Loss": 1.9688750505447388, "Pretrain/Loss (Raw)": 2.055492877960205, "Pretrain/Step": 5652, "Pretrain/Step Time": 8.709492191672325} +{"Pretrain/Learning Rate": 1.87710766738323e-05, "Pretrain/Loss": 1.969825029373169, "Pretrain/Loss (Raw)": 1.933531403541565, "Pretrain/Step": 5653, "Pretrain/Step Time": 8.703563390299678} +{"Pretrain/Learning Rate": 1.8762854904108677e-05, "Pretrain/Loss": 1.9674897193908691, "Pretrain/Loss (Raw)": 1.9115307331085205, "Pretrain/Step": 5654, "Pretrain/Step Time": 8.706111866980791} +{"Pretrain/Learning Rate": 1.8754633853682016e-05, "Pretrain/Loss": 1.966705322265625, "Pretrain/Loss (Raw)": 1.9520652294158936, "Pretrain/Step": 5655, "Pretrain/Step Time": 8.708440955728292} +{"Pretrain/Learning Rate": 1.874641352350041e-05, "Pretrain/Loss": 1.966029167175293, "Pretrain/Loss (Raw)": 2.1450157165527344, "Pretrain/Step": 5656, "Pretrain/Step Time": 8.71311349235475} +{"Pretrain/Learning Rate": 1.8738193914511865e-05, "Pretrain/Loss": 1.9690685272216797, "Pretrain/Loss (Raw)": 2.2903172969818115, "Pretrain/Step": 5657, "Pretrain/Step Time": 8.7045982144773} +{"Pretrain/Learning Rate": 1.8729975027664303e-05, "Pretrain/Loss": 1.9712152481079102, "Pretrain/Loss (Raw)": 2.0654971599578857, "Pretrain/Step": 5658, "Pretrain/Step Time": 8.704513417556882} +{"Pretrain/Learning Rate": 1.8721756863905566e-05, "Pretrain/Loss": 1.9686517715454102, "Pretrain/Loss (Raw)": 1.9196176528930664, "Pretrain/Step": 5659, "Pretrain/Step Time": 8.701469568535686} +{"Pretrain/Learning Rate": 1.8713539424183417e-05, "Pretrain/Loss": 1.9688940048217773, "Pretrain/Loss (Raw)": 2.0104503631591797, "Pretrain/Step": 5660, "Pretrain/Step Time": 8.69235429726541} +{"Pretrain/Learning Rate": 1.8705322709445515e-05, "Pretrain/Loss": 1.9681800603866577, "Pretrain/Loss (Raw)": 2.0498604774475098, "Pretrain/Step": 5661, "Pretrain/Step Time": 8.692852606996894} +{"Pretrain/Learning Rate": 1.8697106720639467e-05, "Pretrain/Loss": 1.966049075126648, "Pretrain/Loss (Raw)": 1.755537509918213, "Pretrain/Step": 5662, "Pretrain/Step Time": 8.695089807733893} +{"Pretrain/Learning Rate": 1.8688891458712765e-05, "Pretrain/Loss": 1.9656784534454346, "Pretrain/Loss (Raw)": 1.9069408178329468, "Pretrain/Step": 5663, "Pretrain/Step Time": 8.694768462330103} +{"Pretrain/Learning Rate": 1.8680676924612847e-05, "Pretrain/Loss": 1.9655985832214355, "Pretrain/Loss (Raw)": 2.126220226287842, "Pretrain/Step": 5664, "Pretrain/Step Time": 8.68880538083613} +{"Pretrain/Learning Rate": 1.8672463119287037e-05, "Pretrain/Loss": 1.9641101360321045, "Pretrain/Loss (Raw)": 1.7348788976669312, "Pretrain/Step": 5665, "Pretrain/Step Time": 8.686813823878765} +{"Pretrain/Learning Rate": 1.86642500436826e-05, "Pretrain/Loss": 1.9617817401885986, "Pretrain/Loss (Raw)": 1.7615211009979248, "Pretrain/Step": 5666, "Pretrain/Step Time": 8.687120091170073} +{"Pretrain/Learning Rate": 1.8656037698746704e-05, "Pretrain/Loss": 1.9608923196792603, "Pretrain/Loss (Raw)": 1.8209835290908813, "Pretrain/Step": 5667, "Pretrain/Step Time": 8.683535493910313} +{"Pretrain/Learning Rate": 1.8647826085426433e-05, "Pretrain/Loss": 1.965466856956482, "Pretrain/Loss (Raw)": 1.9234256744384766, "Pretrain/Step": 5668, "Pretrain/Step Time": 8.681398138403893} +{"Pretrain/Learning Rate": 1.8639615204668786e-05, "Pretrain/Loss": 1.9665229320526123, "Pretrain/Loss (Raw)": 2.054638624191284, "Pretrain/Step": 5669, "Pretrain/Step Time": 8.678390022367239} +{"Pretrain/Learning Rate": 1.863140505742069e-05, "Pretrain/Loss": 1.9687178134918213, "Pretrain/Loss (Raw)": 2.0173773765563965, "Pretrain/Step": 5670, "Pretrain/Step Time": 8.679114073514938} +{"Pretrain/Learning Rate": 1.862319564462897e-05, "Pretrain/Loss": 1.9688963890075684, "Pretrain/Loss (Raw)": 1.9342050552368164, "Pretrain/Step": 5671, "Pretrain/Step Time": 8.670525826513767} +{"Pretrain/Learning Rate": 1.8614986967240382e-05, "Pretrain/Loss": 1.9682493209838867, "Pretrain/Loss (Raw)": 2.0211119651794434, "Pretrain/Step": 5672, "Pretrain/Step Time": 8.673080399632454} +{"Pretrain/Learning Rate": 1.8606779026201577e-05, "Pretrain/Loss": 1.9678723812103271, "Pretrain/Loss (Raw)": 1.9737913608551025, "Pretrain/Step": 5673, "Pretrain/Step Time": 8.674847779795527} +{"Pretrain/Learning Rate": 1.859857182245914e-05, "Pretrain/Loss": 1.9668457508087158, "Pretrain/Loss (Raw)": 1.7930238246917725, "Pretrain/Step": 5674, "Pretrain/Step Time": 8.670146705582738} +{"Pretrain/Learning Rate": 1.859036535695957e-05, "Pretrain/Loss": 1.9676179885864258, "Pretrain/Loss (Raw)": 2.028977394104004, "Pretrain/Step": 5675, "Pretrain/Step Time": 8.673253359273076} +{"Pretrain/Learning Rate": 1.858215963064927e-05, "Pretrain/Loss": 1.96822988986969, "Pretrain/Loss (Raw)": 2.0948381423950195, "Pretrain/Step": 5676, "Pretrain/Step Time": 8.671470787376165} +{"Pretrain/Learning Rate": 1.8573954644474562e-05, "Pretrain/Loss": 1.9695017337799072, "Pretrain/Loss (Raw)": 2.244053840637207, "Pretrain/Step": 5677, "Pretrain/Step Time": 8.66711669228971} +{"Pretrain/Learning Rate": 1.8565750399381684e-05, "Pretrain/Loss": 1.9670907258987427, "Pretrain/Loss (Raw)": 1.7824392318725586, "Pretrain/Step": 5678, "Pretrain/Step Time": 8.673439407721162} +{"Pretrain/Learning Rate": 1.8557546896316793e-05, "Pretrain/Loss": 1.966349482536316, "Pretrain/Loss (Raw)": 2.0755276679992676, "Pretrain/Step": 5679, "Pretrain/Step Time": 8.670820772647858} +{"Pretrain/Learning Rate": 1.8549344136225946e-05, "Pretrain/Loss": 1.9653782844543457, "Pretrain/Loss (Raw)": 1.8481922149658203, "Pretrain/Step": 5680, "Pretrain/Step Time": 8.670341443270445} +{"Pretrain/Learning Rate": 1.8541142120055136e-05, "Pretrain/Loss": 1.965796947479248, "Pretrain/Loss (Raw)": 1.9621334075927734, "Pretrain/Step": 5681, "Pretrain/Step Time": 8.66878355666995} +{"Pretrain/Learning Rate": 1.8532940848750245e-05, "Pretrain/Loss": 1.9662306308746338, "Pretrain/Loss (Raw)": 2.094119071960449, "Pretrain/Step": 5682, "Pretrain/Step Time": 8.684314142912626} +{"Pretrain/Learning Rate": 1.8524740323257095e-05, "Pretrain/Loss": 1.9656040668487549, "Pretrain/Loss (Raw)": 2.025606632232666, "Pretrain/Step": 5683, "Pretrain/Step Time": 8.685731707140803} +{"Pretrain/Learning Rate": 1.85165405445214e-05, "Pretrain/Loss": 1.9654275178909302, "Pretrain/Loss (Raw)": 1.9227819442749023, "Pretrain/Step": 5684, "Pretrain/Step Time": 8.681195694953203} +{"Pretrain/Learning Rate": 1.8508341513488804e-05, "Pretrain/Loss": 1.9649358987808228, "Pretrain/Loss (Raw)": 1.771304726600647, "Pretrain/Step": 5685, "Pretrain/Step Time": 8.677857726812363} +{"Pretrain/Learning Rate": 1.8500143231104846e-05, "Pretrain/Loss": 1.9634157419204712, "Pretrain/Loss (Raw)": 1.8894201517105103, "Pretrain/Step": 5686, "Pretrain/Step Time": 8.679162438958883} +{"Pretrain/Learning Rate": 1.8491945698315014e-05, "Pretrain/Loss": 1.9660215377807617, "Pretrain/Loss (Raw)": 2.0126028060913086, "Pretrain/Step": 5687, "Pretrain/Step Time": 8.684676652774215} +{"Pretrain/Learning Rate": 1.8483748916064654e-05, "Pretrain/Loss": 1.9610979557037354, "Pretrain/Loss (Raw)": 1.6413757801055908, "Pretrain/Step": 5688, "Pretrain/Step Time": 8.68419735133648} +{"Pretrain/Learning Rate": 1.8475552885299092e-05, "Pretrain/Loss": 1.962523341178894, "Pretrain/Loss (Raw)": 2.0698463916778564, "Pretrain/Step": 5689, "Pretrain/Step Time": 8.687363443896174} +{"Pretrain/Learning Rate": 1.8467357606963496e-05, "Pretrain/Loss": 1.9615964889526367, "Pretrain/Loss (Raw)": 1.6887333393096924, "Pretrain/Step": 5690, "Pretrain/Step Time": 8.68377766944468} +{"Pretrain/Learning Rate": 1.845916308200302e-05, "Pretrain/Loss": 1.9612014293670654, "Pretrain/Loss (Raw)": 2.012099027633667, "Pretrain/Step": 5691, "Pretrain/Step Time": 8.680978156626225} +{"Pretrain/Learning Rate": 1.8450969311362666e-05, "Pretrain/Loss": 1.9613410234451294, "Pretrain/Loss (Raw)": 2.1457717418670654, "Pretrain/Step": 5692, "Pretrain/Step Time": 8.680335532873869} +{"Pretrain/Learning Rate": 1.8442776295987403e-05, "Pretrain/Loss": 1.9595052003860474, "Pretrain/Loss (Raw)": 1.8174901008605957, "Pretrain/Step": 5693, "Pretrain/Step Time": 8.682127702981234} +{"Pretrain/Learning Rate": 1.843458403682206e-05, "Pretrain/Loss": 1.958146333694458, "Pretrain/Loss (Raw)": 1.8842004537582397, "Pretrain/Step": 5694, "Pretrain/Step Time": 8.684254618361592} +{"Pretrain/Learning Rate": 1.8426392534811445e-05, "Pretrain/Loss": 1.9611788988113403, "Pretrain/Loss (Raw)": 2.0815296173095703, "Pretrain/Step": 5695, "Pretrain/Step Time": 8.68054774031043} +{"Pretrain/Learning Rate": 1.84182017909002e-05, "Pretrain/Loss": 1.9597598314285278, "Pretrain/Loss (Raw)": 1.7627006769180298, "Pretrain/Step": 5696, "Pretrain/Step Time": 8.682294469326735} +{"Pretrain/Learning Rate": 1.841001180603295e-05, "Pretrain/Loss": 1.9552702903747559, "Pretrain/Loss (Raw)": 1.556765079498291, "Pretrain/Step": 5697, "Pretrain/Step Time": 8.684781236574054} +{"Pretrain/Learning Rate": 1.8401822581154188e-05, "Pretrain/Loss": 1.9557359218597412, "Pretrain/Loss (Raw)": 2.0750930309295654, "Pretrain/Step": 5698, "Pretrain/Step Time": 8.67878969758749} +{"Pretrain/Learning Rate": 1.8393634117208343e-05, "Pretrain/Loss": 1.9579929113388062, "Pretrain/Loss (Raw)": 2.00907826423645, "Pretrain/Step": 5699, "Pretrain/Step Time": 8.687321299687028} +{"Pretrain/Learning Rate": 1.838544641513973e-05, "Pretrain/Loss": 1.9596481323242188, "Pretrain/Loss (Raw)": 1.9747092723846436, "Pretrain/Step": 5700, "Pretrain/Step Time": 8.683380383998156} +{"Pretrain/Learning Rate": 1.8377259475892612e-05, "Pretrain/Loss": 1.9587717056274414, "Pretrain/Loss (Raw)": 2.031703233718872, "Pretrain/Step": 5701, "Pretrain/Step Time": 8.683939324691892} +{"Pretrain/Learning Rate": 1.8369073300411137e-05, "Pretrain/Loss": 1.9581167697906494, "Pretrain/Loss (Raw)": 1.8866866827011108, "Pretrain/Step": 5702, "Pretrain/Step Time": 8.68430526740849} +{"Pretrain/Learning Rate": 1.836088788963938e-05, "Pretrain/Loss": 1.9574315547943115, "Pretrain/Loss (Raw)": 1.927446722984314, "Pretrain/Step": 5703, "Pretrain/Step Time": 8.689312955364585} +{"Pretrain/Learning Rate": 1.8352703244521308e-05, "Pretrain/Loss": 1.9583921432495117, "Pretrain/Loss (Raw)": 2.0659940242767334, "Pretrain/Step": 5704, "Pretrain/Step Time": 8.689144445583224} +{"Pretrain/Learning Rate": 1.8344519366000828e-05, "Pretrain/Loss": 1.9553205966949463, "Pretrain/Loss (Raw)": 1.6612093448638916, "Pretrain/Step": 5705, "Pretrain/Step Time": 8.689640961587429} +{"Pretrain/Learning Rate": 1.833633625502173e-05, "Pretrain/Loss": 1.955788254737854, "Pretrain/Loss (Raw)": 1.9950147867202759, "Pretrain/Step": 5706, "Pretrain/Step Time": 8.678835287690163} +{"Pretrain/Learning Rate": 1.832815391252774e-05, "Pretrain/Loss": 1.956106424331665, "Pretrain/Loss (Raw)": 1.9624484777450562, "Pretrain/Step": 5707, "Pretrain/Step Time": 8.676166988909245} +{"Pretrain/Learning Rate": 1.8319972339462478e-05, "Pretrain/Loss": 1.960719108581543, "Pretrain/Loss (Raw)": 2.142476797103882, "Pretrain/Step": 5708, "Pretrain/Step Time": 8.679918019101024} +{"Pretrain/Learning Rate": 1.8311791536769483e-05, "Pretrain/Loss": 1.959798812866211, "Pretrain/Loss (Raw)": 1.7712339162826538, "Pretrain/Step": 5709, "Pretrain/Step Time": 8.684308419004083} +{"Pretrain/Learning Rate": 1.8303611505392205e-05, "Pretrain/Loss": 1.9582432508468628, "Pretrain/Loss (Raw)": 1.8761358261108398, "Pretrain/Step": 5710, "Pretrain/Step Time": 8.684685917571187} +{"Pretrain/Learning Rate": 1.8295432246274e-05, "Pretrain/Loss": 1.9578564167022705, "Pretrain/Loss (Raw)": 1.813132405281067, "Pretrain/Step": 5711, "Pretrain/Step Time": 8.685902697965503} +{"Pretrain/Learning Rate": 1.828725376035814e-05, "Pretrain/Loss": 1.9575939178466797, "Pretrain/Loss (Raw)": 2.095982789993286, "Pretrain/Step": 5712, "Pretrain/Step Time": 8.6841208525002} +{"Pretrain/Learning Rate": 1.827907604858782e-05, "Pretrain/Loss": 1.9577285051345825, "Pretrain/Loss (Raw)": 1.9406969547271729, "Pretrain/Step": 5713, "Pretrain/Step Time": 8.687434613704681} +{"Pretrain/Learning Rate": 1.8270899111906102e-05, "Pretrain/Loss": 1.9560768604278564, "Pretrain/Loss (Raw)": 2.042656421661377, "Pretrain/Step": 5714, "Pretrain/Step Time": 8.68846802227199} +{"Pretrain/Learning Rate": 1.826272295125602e-05, "Pretrain/Loss": 1.955788016319275, "Pretrain/Loss (Raw)": 1.861503005027771, "Pretrain/Step": 5715, "Pretrain/Step Time": 8.686671456322074} +{"Pretrain/Learning Rate": 1.8254547567580472e-05, "Pretrain/Loss": 1.952046275138855, "Pretrain/Loss (Raw)": 1.7010482549667358, "Pretrain/Step": 5716, "Pretrain/Step Time": 8.689978186041117} +{"Pretrain/Learning Rate": 1.824637296182228e-05, "Pretrain/Loss": 1.9535812139511108, "Pretrain/Loss (Raw)": 1.9494739770889282, "Pretrain/Step": 5717, "Pretrain/Step Time": 8.689203564077616} +{"Pretrain/Learning Rate": 1.8238199134924185e-05, "Pretrain/Loss": 1.9489558935165405, "Pretrain/Loss (Raw)": 1.9010329246520996, "Pretrain/Step": 5718, "Pretrain/Step Time": 8.686729226261377} +{"Pretrain/Learning Rate": 1.8230026087828824e-05, "Pretrain/Loss": 1.9504787921905518, "Pretrain/Loss (Raw)": 2.008601427078247, "Pretrain/Step": 5719, "Pretrain/Step Time": 8.688207510858774} +{"Pretrain/Learning Rate": 1.8221853821478763e-05, "Pretrain/Loss": 1.9488980770111084, "Pretrain/Loss (Raw)": 1.7272920608520508, "Pretrain/Step": 5720, "Pretrain/Step Time": 8.690544582903385} +{"Pretrain/Learning Rate": 1.821368233681645e-05, "Pretrain/Loss": 1.9494540691375732, "Pretrain/Loss (Raw)": 1.9624146223068237, "Pretrain/Step": 5721, "Pretrain/Step Time": 8.684329964220524} +{"Pretrain/Learning Rate": 1.820551163478428e-05, "Pretrain/Loss": 1.948089361190796, "Pretrain/Loss (Raw)": 1.8509581089019775, "Pretrain/Step": 5722, "Pretrain/Step Time": 8.68312095105648} +{"Pretrain/Learning Rate": 1.8197341716324516e-05, "Pretrain/Loss": 1.9494655132293701, "Pretrain/Loss (Raw)": 2.0772929191589355, "Pretrain/Step": 5723, "Pretrain/Step Time": 8.684514921158552} +{"Pretrain/Learning Rate": 1.8189172582379365e-05, "Pretrain/Loss": 1.948148488998413, "Pretrain/Loss (Raw)": 1.9114243984222412, "Pretrain/Step": 5724, "Pretrain/Step Time": 8.68222038820386} +{"Pretrain/Learning Rate": 1.818100423389092e-05, "Pretrain/Loss": 1.9505854845046997, "Pretrain/Loss (Raw)": 1.9498143196105957, "Pretrain/Step": 5725, "Pretrain/Step Time": 8.678674964234233} +{"Pretrain/Learning Rate": 1.817283667180121e-05, "Pretrain/Loss": 1.9517838954925537, "Pretrain/Loss (Raw)": 2.206460475921631, "Pretrain/Step": 5726, "Pretrain/Step Time": 8.684410916641355} +{"Pretrain/Learning Rate": 1.8164669897052134e-05, "Pretrain/Loss": 1.9515609741210938, "Pretrain/Loss (Raw)": 1.9234309196472168, "Pretrain/Step": 5727, "Pretrain/Step Time": 8.682054409757257} +{"Pretrain/Learning Rate": 1.8156503910585544e-05, "Pretrain/Loss": 1.9518916606903076, "Pretrain/Loss (Raw)": 1.7738734483718872, "Pretrain/Step": 5728, "Pretrain/Step Time": 8.685324437916279} +{"Pretrain/Learning Rate": 1.814833871334316e-05, "Pretrain/Loss": 1.9514082670211792, "Pretrain/Loss (Raw)": 1.9491255283355713, "Pretrain/Step": 5729, "Pretrain/Step Time": 8.687310403212905} +{"Pretrain/Learning Rate": 1.8140174306266655e-05, "Pretrain/Loss": 1.9490950107574463, "Pretrain/Loss (Raw)": 1.8248705863952637, "Pretrain/Step": 5730, "Pretrain/Step Time": 8.687575107440352} +{"Pretrain/Learning Rate": 1.8132010690297557e-05, "Pretrain/Loss": 1.9471145868301392, "Pretrain/Loss (Raw)": 1.8299446105957031, "Pretrain/Step": 5731, "Pretrain/Step Time": 8.68464651145041} +{"Pretrain/Learning Rate": 1.8123847866377367e-05, "Pretrain/Loss": 1.946432113647461, "Pretrain/Loss (Raw)": 2.0659966468811035, "Pretrain/Step": 5732, "Pretrain/Step Time": 8.686164576560259} +{"Pretrain/Learning Rate": 1.8115685835447423e-05, "Pretrain/Loss": 1.946324348449707, "Pretrain/Loss (Raw)": 1.7148739099502563, "Pretrain/Step": 5733, "Pretrain/Step Time": 8.691529909148812} +{"Pretrain/Learning Rate": 1.810752459844905e-05, "Pretrain/Loss": 1.9468467235565186, "Pretrain/Loss (Raw)": 2.10868501663208, "Pretrain/Step": 5734, "Pretrain/Step Time": 8.693404879420996} +{"Pretrain/Learning Rate": 1.8099364156323396e-05, "Pretrain/Loss": 1.949446439743042, "Pretrain/Loss (Raw)": 2.2400388717651367, "Pretrain/Step": 5735, "Pretrain/Step Time": 8.69128249771893} +{"Pretrain/Learning Rate": 1.8091204510011607e-05, "Pretrain/Loss": 1.9468543529510498, "Pretrain/Loss (Raw)": 1.5319970846176147, "Pretrain/Step": 5736, "Pretrain/Step Time": 8.695190912112594} +{"Pretrain/Learning Rate": 1.8083045660454655e-05, "Pretrain/Loss": 1.9466629028320312, "Pretrain/Loss (Raw)": 1.9478033781051636, "Pretrain/Step": 5737, "Pretrain/Step Time": 8.688313242048025} +{"Pretrain/Learning Rate": 1.8074887608593477e-05, "Pretrain/Loss": 1.9459142684936523, "Pretrain/Loss (Raw)": 2.233630895614624, "Pretrain/Step": 5738, "Pretrain/Step Time": 8.691759493201971} +{"Pretrain/Learning Rate": 1.8066730355368888e-05, "Pretrain/Loss": 1.944455623626709, "Pretrain/Loss (Raw)": 1.941399335861206, "Pretrain/Step": 5739, "Pretrain/Step Time": 8.690711362287402} +{"Pretrain/Learning Rate": 1.805857390172163e-05, "Pretrain/Loss": 1.9436805248260498, "Pretrain/Loss (Raw)": 1.8917639255523682, "Pretrain/Step": 5740, "Pretrain/Step Time": 8.692150907590985} +{"Pretrain/Learning Rate": 1.8050418248592334e-05, "Pretrain/Loss": 1.943770408630371, "Pretrain/Loss (Raw)": 2.014521837234497, "Pretrain/Step": 5741, "Pretrain/Step Time": 8.69299396686256} +{"Pretrain/Learning Rate": 1.8042263396921554e-05, "Pretrain/Loss": 1.9426686763763428, "Pretrain/Loss (Raw)": 1.6981953382492065, "Pretrain/Step": 5742, "Pretrain/Step Time": 8.6932015363127} +{"Pretrain/Learning Rate": 1.803410934764974e-05, "Pretrain/Loss": 1.9416468143463135, "Pretrain/Loss (Raw)": 2.144373893737793, "Pretrain/Step": 5743, "Pretrain/Step Time": 8.685294611379504} +{"Pretrain/Learning Rate": 1.8025956101717272e-05, "Pretrain/Loss": 1.9408982992172241, "Pretrain/Loss (Raw)": 1.8406505584716797, "Pretrain/Step": 5744, "Pretrain/Step Time": 8.694185841828585} +{"Pretrain/Learning Rate": 1.80178036600644e-05, "Pretrain/Loss": 1.9436068534851074, "Pretrain/Loss (Raw)": 2.1408040523529053, "Pretrain/Step": 5745, "Pretrain/Step Time": 8.692006209865212} +{"Pretrain/Learning Rate": 1.8009652023631318e-05, "Pretrain/Loss": 1.9443426132202148, "Pretrain/Loss (Raw)": 2.0372531414031982, "Pretrain/Step": 5746, "Pretrain/Step Time": 8.689128037542105} +{"Pretrain/Learning Rate": 1.8001501193358096e-05, "Pretrain/Loss": 1.9445263147354126, "Pretrain/Loss (Raw)": 2.064711570739746, "Pretrain/Step": 5747, "Pretrain/Step Time": 8.694146744906902} +{"Pretrain/Learning Rate": 1.799335117018474e-05, "Pretrain/Loss": 1.9425064325332642, "Pretrain/Loss (Raw)": 1.6412893533706665, "Pretrain/Step": 5748, "Pretrain/Step Time": 8.6878899987787} +{"Pretrain/Learning Rate": 1.798520195505114e-05, "Pretrain/Loss": 1.9403846263885498, "Pretrain/Loss (Raw)": 1.882346510887146, "Pretrain/Step": 5749, "Pretrain/Step Time": 8.687914548441768} +{"Pretrain/Learning Rate": 1.7977053548897112e-05, "Pretrain/Loss": 1.9446523189544678, "Pretrain/Loss (Raw)": 1.7981263399124146, "Pretrain/Step": 5750, "Pretrain/Step Time": 8.692331423982978} +{"Pretrain/Learning Rate": 1.7968905952662354e-05, "Pretrain/Loss": 1.942696213722229, "Pretrain/Loss (Raw)": 1.893551230430603, "Pretrain/Step": 5751, "Pretrain/Step Time": 8.689178539440036} +{"Pretrain/Learning Rate": 1.79607591672865e-05, "Pretrain/Loss": 1.9454448223114014, "Pretrain/Loss (Raw)": 2.077373743057251, "Pretrain/Step": 5752, "Pretrain/Step Time": 8.685451237484813} +{"Pretrain/Learning Rate": 1.7952613193709063e-05, "Pretrain/Loss": 1.9497854709625244, "Pretrain/Loss (Raw)": 2.4653542041778564, "Pretrain/Step": 5753, "Pretrain/Step Time": 8.688775600865483} +{"Pretrain/Learning Rate": 1.7944468032869486e-05, "Pretrain/Loss": 1.9498664140701294, "Pretrain/Loss (Raw)": 1.9997178316116333, "Pretrain/Step": 5754, "Pretrain/Step Time": 8.689594060182571} +{"Pretrain/Learning Rate": 1.7936323685707095e-05, "Pretrain/Loss": 1.9490357637405396, "Pretrain/Loss (Raw)": 1.8266005516052246, "Pretrain/Step": 5755, "Pretrain/Step Time": 8.69057689793408} +{"Pretrain/Learning Rate": 1.7928180153161146e-05, "Pretrain/Loss": 1.9464049339294434, "Pretrain/Loss (Raw)": 1.9269229173660278, "Pretrain/Step": 5756, "Pretrain/Step Time": 8.692269690334797} +{"Pretrain/Learning Rate": 1.792003743617079e-05, "Pretrain/Loss": 1.9499987363815308, "Pretrain/Loss (Raw)": 2.268167734146118, "Pretrain/Step": 5757, "Pretrain/Step Time": 8.68719464354217} +{"Pretrain/Learning Rate": 1.7911895535675067e-05, "Pretrain/Loss": 1.9508702754974365, "Pretrain/Loss (Raw)": 1.908737301826477, "Pretrain/Step": 5758, "Pretrain/Step Time": 8.687081202864647} +{"Pretrain/Learning Rate": 1.7903754452612964e-05, "Pretrain/Loss": 1.9510411024093628, "Pretrain/Loss (Raw)": 1.9022941589355469, "Pretrain/Step": 5759, "Pretrain/Step Time": 8.686110133305192} +{"Pretrain/Learning Rate": 1.7895614187923326e-05, "Pretrain/Loss": 1.9524431228637695, "Pretrain/Loss (Raw)": 2.076185464859009, "Pretrain/Step": 5760, "Pretrain/Step Time": 8.687050817534328} +{"Pretrain/Learning Rate": 1.7887474742544945e-05, "Pretrain/Loss": 1.9518917798995972, "Pretrain/Loss (Raw)": 1.9599716663360596, "Pretrain/Step": 5761, "Pretrain/Step Time": 8.684205701574683} +{"Pretrain/Learning Rate": 1.7879336117416485e-05, "Pretrain/Loss": 1.9542794227600098, "Pretrain/Loss (Raw)": 2.270250082015991, "Pretrain/Step": 5762, "Pretrain/Step Time": 8.68544221110642} +{"Pretrain/Learning Rate": 1.7871198313476544e-05, "Pretrain/Loss": 1.954261302947998, "Pretrain/Loss (Raw)": 1.9878854751586914, "Pretrain/Step": 5763, "Pretrain/Step Time": 8.683340286836028} +{"Pretrain/Learning Rate": 1.78630613316636e-05, "Pretrain/Loss": 1.951979637145996, "Pretrain/Loss (Raw)": 1.7675938606262207, "Pretrain/Step": 5764, "Pretrain/Step Time": 8.681266844272614} +{"Pretrain/Learning Rate": 1.785492517291606e-05, "Pretrain/Loss": 1.9540412425994873, "Pretrain/Loss (Raw)": 1.7403720617294312, "Pretrain/Step": 5765, "Pretrain/Step Time": 8.679956493899226} +{"Pretrain/Learning Rate": 1.784678983817221e-05, "Pretrain/Loss": 1.9523875713348389, "Pretrain/Loss (Raw)": 1.9343934059143066, "Pretrain/Step": 5766, "Pretrain/Step Time": 8.681469405069947} +{"Pretrain/Learning Rate": 1.783865532837027e-05, "Pretrain/Loss": 1.9522628784179688, "Pretrain/Loss (Raw)": 2.1157643795013428, "Pretrain/Step": 5767, "Pretrain/Step Time": 8.678284766152501} +{"Pretrain/Learning Rate": 1.7830521644448334e-05, "Pretrain/Loss": 1.9501978158950806, "Pretrain/Loss (Raw)": 1.8238518238067627, "Pretrain/Step": 5768, "Pretrain/Step Time": 8.680619437247515} +{"Pretrain/Learning Rate": 1.7822388787344434e-05, "Pretrain/Loss": 1.9524040222167969, "Pretrain/Loss (Raw)": 2.0618972778320312, "Pretrain/Step": 5769, "Pretrain/Step Time": 8.681022131815553} +{"Pretrain/Learning Rate": 1.781425675799648e-05, "Pretrain/Loss": 1.9537012577056885, "Pretrain/Loss (Raw)": 1.886085867881775, "Pretrain/Step": 5770, "Pretrain/Step Time": 8.685023820027709} +{"Pretrain/Learning Rate": 1.7806125557342303e-05, "Pretrain/Loss": 1.9524978399276733, "Pretrain/Loss (Raw)": 1.9788612127304077, "Pretrain/Step": 5771, "Pretrain/Step Time": 8.684743506833911} +{"Pretrain/Learning Rate": 1.7797995186319606e-05, "Pretrain/Loss": 1.953716516494751, "Pretrain/Loss (Raw)": 2.0063869953155518, "Pretrain/Step": 5772, "Pretrain/Step Time": 8.686588181182742} +{"Pretrain/Learning Rate": 1.778986564586606e-05, "Pretrain/Loss": 1.9549201726913452, "Pretrain/Loss (Raw)": 2.234464645385742, "Pretrain/Step": 5773, "Pretrain/Step Time": 8.68813706934452} +{"Pretrain/Learning Rate": 1.778173693691917e-05, "Pretrain/Loss": 1.954416275024414, "Pretrain/Loss (Raw)": 1.9068403244018555, "Pretrain/Step": 5774, "Pretrain/Step Time": 8.685349751263857} +{"Pretrain/Learning Rate": 1.77736090604164e-05, "Pretrain/Loss": 1.9539196491241455, "Pretrain/Loss (Raw)": 2.0200142860412598, "Pretrain/Step": 5775, "Pretrain/Step Time": 8.683048006147146} +{"Pretrain/Learning Rate": 1.7765482017295077e-05, "Pretrain/Loss": 1.9560233354568481, "Pretrain/Loss (Raw)": 2.180629253387451, "Pretrain/Step": 5776, "Pretrain/Step Time": 8.681033860892057} +{"Pretrain/Learning Rate": 1.7757355808492468e-05, "Pretrain/Loss": 1.9571614265441895, "Pretrain/Loss (Raw)": 2.1194846630096436, "Pretrain/Step": 5777, "Pretrain/Step Time": 8.68309891410172} +{"Pretrain/Learning Rate": 1.77492304349457e-05, "Pretrain/Loss": 1.9562510251998901, "Pretrain/Loss (Raw)": 1.9308327436447144, "Pretrain/Step": 5778, "Pretrain/Step Time": 8.6799108479172} +{"Pretrain/Learning Rate": 1.7741105897591865e-05, "Pretrain/Loss": 1.954675316810608, "Pretrain/Loss (Raw)": 1.7396860122680664, "Pretrain/Step": 5779, "Pretrain/Step Time": 8.681199619546533} +{"Pretrain/Learning Rate": 1.7732982197367888e-05, "Pretrain/Loss": 1.9499932527542114, "Pretrain/Loss (Raw)": 1.4561880826950073, "Pretrain/Step": 5780, "Pretrain/Step Time": 8.676183557137847} +{"Pretrain/Learning Rate": 1.7724859335210654e-05, "Pretrain/Loss": 1.9501444101333618, "Pretrain/Loss (Raw)": 1.952877402305603, "Pretrain/Step": 5781, "Pretrain/Step Time": 8.676262920722365} +{"Pretrain/Learning Rate": 1.771673731205692e-05, "Pretrain/Loss": 1.9517557621002197, "Pretrain/Loss (Raw)": 2.11779522895813, "Pretrain/Step": 5782, "Pretrain/Step Time": 8.67122027464211} +{"Pretrain/Learning Rate": 1.770861612884336e-05, "Pretrain/Loss": 1.951210856437683, "Pretrain/Loss (Raw)": 1.882301688194275, "Pretrain/Step": 5783, "Pretrain/Step Time": 8.671179408207536} +{"Pretrain/Learning Rate": 1.7700495786506545e-05, "Pretrain/Loss": 1.95103120803833, "Pretrain/Loss (Raw)": 2.1220316886901855, "Pretrain/Step": 5784, "Pretrain/Step Time": 8.669863419607282} +{"Pretrain/Learning Rate": 1.7692376285982953e-05, "Pretrain/Loss": 1.9493772983551025, "Pretrain/Loss (Raw)": 2.0786020755767822, "Pretrain/Step": 5785, "Pretrain/Step Time": 8.669718144461513} +{"Pretrain/Learning Rate": 1.768425762820896e-05, "Pretrain/Loss": 1.9496628046035767, "Pretrain/Loss (Raw)": 2.102055788040161, "Pretrain/Step": 5786, "Pretrain/Step Time": 8.668579708784819} +{"Pretrain/Learning Rate": 1.7676139814120857e-05, "Pretrain/Loss": 1.9500892162322998, "Pretrain/Loss (Raw)": 1.9741864204406738, "Pretrain/Step": 5787, "Pretrain/Step Time": 8.675778234377503} +{"Pretrain/Learning Rate": 1.7668022844654812e-05, "Pretrain/Loss": 1.9486644268035889, "Pretrain/Loss (Raw)": 1.8280946016311646, "Pretrain/Step": 5788, "Pretrain/Step Time": 8.67737216874957} +{"Pretrain/Learning Rate": 1.765990672074693e-05, "Pretrain/Loss": 1.9473958015441895, "Pretrain/Loss (Raw)": 1.8874614238739014, "Pretrain/Step": 5789, "Pretrain/Step Time": 8.678907440975308} +{"Pretrain/Learning Rate": 1.7651791443333187e-05, "Pretrain/Loss": 1.9497522115707397, "Pretrain/Loss (Raw)": 2.0571656227111816, "Pretrain/Step": 5790, "Pretrain/Step Time": 8.677157185971737} +{"Pretrain/Learning Rate": 1.764367701334949e-05, "Pretrain/Loss": 1.9497839212417603, "Pretrain/Loss (Raw)": 1.910996913909912, "Pretrain/Step": 5791, "Pretrain/Step Time": 8.678368475288153} +{"Pretrain/Learning Rate": 1.7635563431731612e-05, "Pretrain/Loss": 1.9478623867034912, "Pretrain/Loss (Raw)": 1.8802686929702759, "Pretrain/Step": 5792, "Pretrain/Step Time": 8.67560855858028} +{"Pretrain/Learning Rate": 1.762745069941527e-05, "Pretrain/Loss": 1.9513822793960571, "Pretrain/Loss (Raw)": 2.1854166984558105, "Pretrain/Step": 5793, "Pretrain/Step Time": 8.675369827076793} +{"Pretrain/Learning Rate": 1.7619338817336046e-05, "Pretrain/Loss": 1.9533214569091797, "Pretrain/Loss (Raw)": 2.0097458362579346, "Pretrain/Step": 5794, "Pretrain/Step Time": 8.67436702363193} +{"Pretrain/Learning Rate": 1.7611227786429457e-05, "Pretrain/Loss": 1.9544862508773804, "Pretrain/Loss (Raw)": 1.9700732231140137, "Pretrain/Step": 5795, "Pretrain/Step Time": 8.677252817898989} +{"Pretrain/Learning Rate": 1.7603117607630893e-05, "Pretrain/Loss": 1.9554744958877563, "Pretrain/Loss (Raw)": 2.049917697906494, "Pretrain/Step": 5796, "Pretrain/Step Time": 8.679285211488605} +{"Pretrain/Learning Rate": 1.7595008281875657e-05, "Pretrain/Loss": 1.9547330141067505, "Pretrain/Loss (Raw)": 1.9597315788269043, "Pretrain/Step": 5797, "Pretrain/Step Time": 8.680272975936532} +{"Pretrain/Learning Rate": 1.7586899810098967e-05, "Pretrain/Loss": 1.954027771949768, "Pretrain/Loss (Raw)": 1.9271080493927002, "Pretrain/Step": 5798, "Pretrain/Step Time": 8.678295489400625} +{"Pretrain/Learning Rate": 1.757879219323592e-05, "Pretrain/Loss": 1.9543789625167847, "Pretrain/Loss (Raw)": 1.9791553020477295, "Pretrain/Step": 5799, "Pretrain/Step Time": 8.68231675773859} +{"Pretrain/Learning Rate": 1.757068543222153e-05, "Pretrain/Loss": 1.9541921615600586, "Pretrain/Loss (Raw)": 1.997206211090088, "Pretrain/Step": 5800, "Pretrain/Step Time": 8.685205399990082} +{"Pretrain/Learning Rate": 1.7562579527990696e-05, "Pretrain/Loss": 1.9532634019851685, "Pretrain/Loss (Raw)": 1.85490083694458, "Pretrain/Step": 5801, "Pretrain/Step Time": 8.684628613293171} +{"Pretrain/Learning Rate": 1.7554474481478245e-05, "Pretrain/Loss": 1.9554649591445923, "Pretrain/Loss (Raw)": 2.07483172416687, "Pretrain/Step": 5802, "Pretrain/Step Time": 8.684953296557069} +{"Pretrain/Learning Rate": 1.7546370293618875e-05, "Pretrain/Loss": 1.9537171125411987, "Pretrain/Loss (Raw)": 1.8052512407302856, "Pretrain/Step": 5803, "Pretrain/Step Time": 8.684397798031569} +{"Pretrain/Learning Rate": 1.7538266965347212e-05, "Pretrain/Loss": 1.9543390274047852, "Pretrain/Loss (Raw)": 2.174431324005127, "Pretrain/Step": 5804, "Pretrain/Step Time": 8.683220503851771} +{"Pretrain/Learning Rate": 1.7530164497597757e-05, "Pretrain/Loss": 1.9532760381698608, "Pretrain/Loss (Raw)": 2.1079983711242676, "Pretrain/Step": 5805, "Pretrain/Step Time": 8.687688432633877} +{"Pretrain/Learning Rate": 1.7522062891304936e-05, "Pretrain/Loss": 1.9542086124420166, "Pretrain/Loss (Raw)": 1.9018139839172363, "Pretrain/Step": 5806, "Pretrain/Step Time": 8.68010032363236} +{"Pretrain/Learning Rate": 1.7513962147403057e-05, "Pretrain/Loss": 1.9538565874099731, "Pretrain/Loss (Raw)": 2.030466318130493, "Pretrain/Step": 5807, "Pretrain/Step Time": 8.680903336033225} +{"Pretrain/Learning Rate": 1.750586226682634e-05, "Pretrain/Loss": 1.9542877674102783, "Pretrain/Loss (Raw)": 1.9033803939819336, "Pretrain/Step": 5808, "Pretrain/Step Time": 8.685211712494493} +{"Pretrain/Learning Rate": 1.74977632505089e-05, "Pretrain/Loss": 1.9534398317337036, "Pretrain/Loss (Raw)": 1.8535935878753662, "Pretrain/Step": 5809, "Pretrain/Step Time": 8.684903386980295} +{"Pretrain/Learning Rate": 1.7489665099384755e-05, "Pretrain/Loss": 1.952993392944336, "Pretrain/Loss (Raw)": 2.0369834899902344, "Pretrain/Step": 5810, "Pretrain/Step Time": 8.670904690399766} +{"Pretrain/Learning Rate": 1.7481567814387815e-05, "Pretrain/Loss": 1.9521188735961914, "Pretrain/Loss (Raw)": 1.9136701822280884, "Pretrain/Step": 5811, "Pretrain/Step Time": 8.672401206567883} +{"Pretrain/Learning Rate": 1.7473471396451913e-05, "Pretrain/Loss": 1.9517513513565063, "Pretrain/Loss (Raw)": 1.8757399320602417, "Pretrain/Step": 5812, "Pretrain/Step Time": 8.67393864504993} +{"Pretrain/Learning Rate": 1.746537584651074e-05, "Pretrain/Loss": 1.9532501697540283, "Pretrain/Loss (Raw)": 1.9631578922271729, "Pretrain/Step": 5813, "Pretrain/Step Time": 8.675809698179364} +{"Pretrain/Learning Rate": 1.7457281165497947e-05, "Pretrain/Loss": 1.9537489414215088, "Pretrain/Loss (Raw)": 1.9532384872436523, "Pretrain/Step": 5814, "Pretrain/Step Time": 8.675760742276907} +{"Pretrain/Learning Rate": 1.7449187354347014e-05, "Pretrain/Loss": 1.951953649520874, "Pretrain/Loss (Raw)": 1.7828290462493896, "Pretrain/Step": 5815, "Pretrain/Step Time": 8.670634621754289} +{"Pretrain/Learning Rate": 1.7441094413991393e-05, "Pretrain/Loss": 1.9518848657608032, "Pretrain/Loss (Raw)": 1.6325640678405762, "Pretrain/Step": 5816, "Pretrain/Step Time": 8.668941285461187} +{"Pretrain/Learning Rate": 1.7433002345364368e-05, "Pretrain/Loss": 1.9520924091339111, "Pretrain/Loss (Raw)": 2.0963997840881348, "Pretrain/Step": 5817, "Pretrain/Step Time": 8.669922715052962} +{"Pretrain/Learning Rate": 1.7424911149399183e-05, "Pretrain/Loss": 1.95460844039917, "Pretrain/Loss (Raw)": 2.0107951164245605, "Pretrain/Step": 5818, "Pretrain/Step Time": 8.666415825486183} +{"Pretrain/Learning Rate": 1.7416820827028926e-05, "Pretrain/Loss": 1.9534918069839478, "Pretrain/Loss (Raw)": 1.8691768646240234, "Pretrain/Step": 5819, "Pretrain/Step Time": 8.667441502213478} +{"Pretrain/Learning Rate": 1.7408731379186638e-05, "Pretrain/Loss": 1.9523452520370483, "Pretrain/Loss (Raw)": 1.9990111589431763, "Pretrain/Step": 5820, "Pretrain/Step Time": 8.668795920908451} +{"Pretrain/Learning Rate": 1.740064280680521e-05, "Pretrain/Loss": 1.9540021419525146, "Pretrain/Loss (Raw)": 2.029557943344116, "Pretrain/Step": 5821, "Pretrain/Step Time": 8.662715595215559} +{"Pretrain/Learning Rate": 1.7392555110817467e-05, "Pretrain/Loss": 1.9542388916015625, "Pretrain/Loss (Raw)": 1.9145209789276123, "Pretrain/Step": 5822, "Pretrain/Step Time": 8.661145772784948} +{"Pretrain/Learning Rate": 1.738446829215611e-05, "Pretrain/Loss": 1.9528865814208984, "Pretrain/Loss (Raw)": 1.9084440469741821, "Pretrain/Step": 5823, "Pretrain/Step Time": 8.654594853520393} +{"Pretrain/Learning Rate": 1.737638235175376e-05, "Pretrain/Loss": 1.9542827606201172, "Pretrain/Loss (Raw)": 1.9414029121398926, "Pretrain/Step": 5824, "Pretrain/Step Time": 8.65919648297131} +{"Pretrain/Learning Rate": 1.736829729054292e-05, "Pretrain/Loss": 1.9588630199432373, "Pretrain/Loss (Raw)": 2.1430230140686035, "Pretrain/Step": 5825, "Pretrain/Step Time": 8.650845635682344} +{"Pretrain/Learning Rate": 1.7360213109456e-05, "Pretrain/Loss": 1.9604564905166626, "Pretrain/Loss (Raw)": 2.279062032699585, "Pretrain/Step": 5826, "Pretrain/Step Time": 8.65488382987678} +{"Pretrain/Learning Rate": 1.73521298094253e-05, "Pretrain/Loss": 1.9609601497650146, "Pretrain/Loss (Raw)": 2.073559045791626, "Pretrain/Step": 5827, "Pretrain/Step Time": 8.647255968302488} +{"Pretrain/Learning Rate": 1.734404739138303e-05, "Pretrain/Loss": 1.9612822532653809, "Pretrain/Loss (Raw)": 2.015937089920044, "Pretrain/Step": 5828, "Pretrain/Step Time": 8.64858803898096} +{"Pretrain/Learning Rate": 1.733596585626129e-05, "Pretrain/Loss": 1.9601187705993652, "Pretrain/Loss (Raw)": 1.8827680349349976, "Pretrain/Step": 5829, "Pretrain/Step Time": 8.65014273300767} +{"Pretrain/Learning Rate": 1.7327885204992083e-05, "Pretrain/Loss": 1.9614595174789429, "Pretrain/Loss (Raw)": 2.058291435241699, "Pretrain/Step": 5830, "Pretrain/Step Time": 8.650197178125381} +{"Pretrain/Learning Rate": 1.7319805438507303e-05, "Pretrain/Loss": 1.959826111793518, "Pretrain/Loss (Raw)": 1.7183822393417358, "Pretrain/Step": 5831, "Pretrain/Step Time": 8.651290277019143} +{"Pretrain/Learning Rate": 1.7311726557738754e-05, "Pretrain/Loss": 1.9581496715545654, "Pretrain/Loss (Raw)": 1.85141122341156, "Pretrain/Step": 5832, "Pretrain/Step Time": 8.65387362241745} +{"Pretrain/Learning Rate": 1.7303648563618125e-05, "Pretrain/Loss": 1.9590508937835693, "Pretrain/Loss (Raw)": 1.7765634059906006, "Pretrain/Step": 5833, "Pretrain/Step Time": 8.654266709461808} +{"Pretrain/Learning Rate": 1.7295571457077015e-05, "Pretrain/Loss": 1.9591670036315918, "Pretrain/Loss (Raw)": 2.009873867034912, "Pretrain/Step": 5834, "Pretrain/Step Time": 8.657414119690657} +{"Pretrain/Learning Rate": 1.72874952390469e-05, "Pretrain/Loss": 1.959730863571167, "Pretrain/Loss (Raw)": 2.0346298217773438, "Pretrain/Step": 5835, "Pretrain/Step Time": 8.659844107925892} +{"Pretrain/Learning Rate": 1.7279419910459182e-05, "Pretrain/Loss": 1.9594786167144775, "Pretrain/Loss (Raw)": 2.110182762145996, "Pretrain/Step": 5836, "Pretrain/Step Time": 8.656661465764046} +{"Pretrain/Learning Rate": 1.727134547224514e-05, "Pretrain/Loss": 1.9607776403427124, "Pretrain/Loss (Raw)": 1.9375150203704834, "Pretrain/Step": 5837, "Pretrain/Step Time": 8.654458526521921} +{"Pretrain/Learning Rate": 1.726327192533595e-05, "Pretrain/Loss": 1.962147831916809, "Pretrain/Loss (Raw)": 2.0515241622924805, "Pretrain/Step": 5838, "Pretrain/Step Time": 8.654860185459256} +{"Pretrain/Learning Rate": 1.7255199270662708e-05, "Pretrain/Loss": 1.963515281677246, "Pretrain/Loss (Raw)": 1.9881771802902222, "Pretrain/Step": 5839, "Pretrain/Step Time": 8.649214277043939} +{"Pretrain/Learning Rate": 1.7247127509156377e-05, "Pretrain/Loss": 1.9656362533569336, "Pretrain/Loss (Raw)": 2.367457151412964, "Pretrain/Step": 5840, "Pretrain/Step Time": 8.652069177478552} +{"Pretrain/Learning Rate": 1.7239056641747836e-05, "Pretrain/Loss": 1.9653635025024414, "Pretrain/Loss (Raw)": 1.9057743549346924, "Pretrain/Step": 5841, "Pretrain/Step Time": 8.646888764575124} +{"Pretrain/Learning Rate": 1.723098666936785e-05, "Pretrain/Loss": 1.965580701828003, "Pretrain/Loss (Raw)": 2.070457935333252, "Pretrain/Step": 5842, "Pretrain/Step Time": 8.648817216977477} +{"Pretrain/Learning Rate": 1.7222917592947096e-05, "Pretrain/Loss": 1.9665511846542358, "Pretrain/Loss (Raw)": 1.9857231378555298, "Pretrain/Step": 5843, "Pretrain/Step Time": 8.651980156078935} +{"Pretrain/Learning Rate": 1.7214849413416128e-05, "Pretrain/Loss": 1.9684760570526123, "Pretrain/Loss (Raw)": 1.9474469423294067, "Pretrain/Step": 5844, "Pretrain/Step Time": 8.647148605436087} +{"Pretrain/Learning Rate": 1.7206782131705414e-05, "Pretrain/Loss": 1.967186450958252, "Pretrain/Loss (Raw)": 1.7843917608261108, "Pretrain/Step": 5845, "Pretrain/Step Time": 8.651668198406696} +{"Pretrain/Learning Rate": 1.7198715748745304e-05, "Pretrain/Loss": 1.9682064056396484, "Pretrain/Loss (Raw)": 2.03157901763916, "Pretrain/Step": 5846, "Pretrain/Step Time": 8.656404370442033} +{"Pretrain/Learning Rate": 1.7190650265466056e-05, "Pretrain/Loss": 1.9683843851089478, "Pretrain/Loss (Raw)": 2.0313947200775146, "Pretrain/Step": 5847, "Pretrain/Step Time": 8.653956267982721} +{"Pretrain/Learning Rate": 1.7182585682797815e-05, "Pretrain/Loss": 1.9686534404754639, "Pretrain/Loss (Raw)": 1.7617359161376953, "Pretrain/Step": 5848, "Pretrain/Step Time": 8.65582930482924} +{"Pretrain/Learning Rate": 1.7174522001670633e-05, "Pretrain/Loss": 1.9702279567718506, "Pretrain/Loss (Raw)": 2.163950204849243, "Pretrain/Step": 5849, "Pretrain/Step Time": 8.654392508789897} +{"Pretrain/Learning Rate": 1.7166459223014448e-05, "Pretrain/Loss": 1.9688385725021362, "Pretrain/Loss (Raw)": 1.6731077432632446, "Pretrain/Step": 5850, "Pretrain/Step Time": 8.65915447473526} +{"Pretrain/Learning Rate": 1.71583973477591e-05, "Pretrain/Loss": 1.969066858291626, "Pretrain/Loss (Raw)": 2.106527805328369, "Pretrain/Step": 5851, "Pretrain/Step Time": 8.653598040342331} +{"Pretrain/Learning Rate": 1.7150336376834315e-05, "Pretrain/Loss": 1.968770980834961, "Pretrain/Loss (Raw)": 1.8735504150390625, "Pretrain/Step": 5852, "Pretrain/Step Time": 8.654823960736394} +{"Pretrain/Learning Rate": 1.714227631116974e-05, "Pretrain/Loss": 1.9700186252593994, "Pretrain/Loss (Raw)": 2.109503746032715, "Pretrain/Step": 5853, "Pretrain/Step Time": 8.654269756749272} +{"Pretrain/Learning Rate": 1.7134217151694872e-05, "Pretrain/Loss": 1.967986822128296, "Pretrain/Loss (Raw)": 1.946386456489563, "Pretrain/Step": 5854, "Pretrain/Step Time": 8.65215653553605} +{"Pretrain/Learning Rate": 1.7126158899339164e-05, "Pretrain/Loss": 1.9691357612609863, "Pretrain/Loss (Raw)": 2.0705111026763916, "Pretrain/Step": 5855, "Pretrain/Step Time": 8.650911785662174} +{"Pretrain/Learning Rate": 1.7118101555031895e-05, "Pretrain/Loss": 1.9698917865753174, "Pretrain/Loss (Raw)": 1.8706344366073608, "Pretrain/Step": 5856, "Pretrain/Step Time": 8.64837626926601} +{"Pretrain/Learning Rate": 1.7110045119702314e-05, "Pretrain/Loss": 1.9721465110778809, "Pretrain/Loss (Raw)": 2.237743377685547, "Pretrain/Step": 5857, "Pretrain/Step Time": 8.649721652269363} +{"Pretrain/Learning Rate": 1.7101989594279495e-05, "Pretrain/Loss": 1.97321617603302, "Pretrain/Loss (Raw)": 1.9617713689804077, "Pretrain/Step": 5858, "Pretrain/Step Time": 8.648860601708293} +{"Pretrain/Learning Rate": 1.7093934979692465e-05, "Pretrain/Loss": 1.9758515357971191, "Pretrain/Loss (Raw)": 2.167271375656128, "Pretrain/Step": 5859, "Pretrain/Step Time": 8.64990077726543} +{"Pretrain/Learning Rate": 1.7085881276870093e-05, "Pretrain/Loss": 1.975709319114685, "Pretrain/Loss (Raw)": 2.047806978225708, "Pretrain/Step": 5860, "Pretrain/Step Time": 8.647358344867826} +{"Pretrain/Learning Rate": 1.70778284867412e-05, "Pretrain/Loss": 1.977150797843933, "Pretrain/Loss (Raw)": 1.8993747234344482, "Pretrain/Step": 5861, "Pretrain/Step Time": 8.646286629140377} +{"Pretrain/Learning Rate": 1.706977661023444e-05, "Pretrain/Loss": 1.9777625799179077, "Pretrain/Loss (Raw)": 2.186988115310669, "Pretrain/Step": 5862, "Pretrain/Step Time": 8.643982782959938} +{"Pretrain/Learning Rate": 1.7061725648278423e-05, "Pretrain/Loss": 1.9748198986053467, "Pretrain/Loss (Raw)": 1.8633815050125122, "Pretrain/Step": 5863, "Pretrain/Step Time": 8.648252293467522} +{"Pretrain/Learning Rate": 1.7053675601801606e-05, "Pretrain/Loss": 1.9769017696380615, "Pretrain/Loss (Raw)": 1.7984795570373535, "Pretrain/Step": 5864, "Pretrain/Step Time": 8.646281844004989} +{"Pretrain/Learning Rate": 1.7045626471732363e-05, "Pretrain/Loss": 1.9784170389175415, "Pretrain/Loss (Raw)": 2.1417558193206787, "Pretrain/Step": 5865, "Pretrain/Step Time": 8.651193771511316} +{"Pretrain/Learning Rate": 1.7037578258998956e-05, "Pretrain/Loss": 1.9746507406234741, "Pretrain/Loss (Raw)": 1.7515391111373901, "Pretrain/Step": 5866, "Pretrain/Step Time": 8.644333584234118} +{"Pretrain/Learning Rate": 1.702953096452955e-05, "Pretrain/Loss": 1.9720444679260254, "Pretrain/Loss (Raw)": 1.607784628868103, "Pretrain/Step": 5867, "Pretrain/Step Time": 8.650057259947062} +{"Pretrain/Learning Rate": 1.702148458925218e-05, "Pretrain/Loss": 1.9725466966629028, "Pretrain/Loss (Raw)": 1.956071376800537, "Pretrain/Step": 5868, "Pretrain/Step Time": 8.645589550957084} +{"Pretrain/Learning Rate": 1.7013439134094815e-05, "Pretrain/Loss": 1.9707201719284058, "Pretrain/Loss (Raw)": 1.7807183265686035, "Pretrain/Step": 5869, "Pretrain/Step Time": 8.649099038913846} +{"Pretrain/Learning Rate": 1.7005394599985273e-05, "Pretrain/Loss": 1.9737473726272583, "Pretrain/Loss (Raw)": 2.0856778621673584, "Pretrain/Step": 5870, "Pretrain/Step Time": 8.646584928035736} +{"Pretrain/Learning Rate": 1.6997350987851308e-05, "Pretrain/Loss": 1.9722508192062378, "Pretrain/Loss (Raw)": 1.9528106451034546, "Pretrain/Step": 5871, "Pretrain/Step Time": 8.644868006929755} +{"Pretrain/Learning Rate": 1.6989308298620526e-05, "Pretrain/Loss": 1.9737143516540527, "Pretrain/Loss (Raw)": 2.0279757976531982, "Pretrain/Step": 5872, "Pretrain/Step Time": 8.638272911310196} +{"Pretrain/Learning Rate": 1.6981266533220467e-05, "Pretrain/Loss": 1.9723454713821411, "Pretrain/Loss (Raw)": 1.9656078815460205, "Pretrain/Step": 5873, "Pretrain/Step Time": 8.637796210125089} +{"Pretrain/Learning Rate": 1.6973225692578533e-05, "Pretrain/Loss": 1.9742437601089478, "Pretrain/Loss (Raw)": 2.2802224159240723, "Pretrain/Step": 5874, "Pretrain/Step Time": 8.640350352972746} +{"Pretrain/Learning Rate": 1.6965185777622037e-05, "Pretrain/Loss": 1.9745516777038574, "Pretrain/Loss (Raw)": 2.104125738143921, "Pretrain/Step": 5875, "Pretrain/Step Time": 8.64033286087215} +{"Pretrain/Learning Rate": 1.6957146789278175e-05, "Pretrain/Loss": 1.975691795349121, "Pretrain/Loss (Raw)": 1.7872270345687866, "Pretrain/Step": 5876, "Pretrain/Step Time": 8.64097360149026} +{"Pretrain/Learning Rate": 1.694910872847405e-05, "Pretrain/Loss": 1.9772157669067383, "Pretrain/Loss (Raw)": 2.077425003051758, "Pretrain/Step": 5877, "Pretrain/Step Time": 8.640591438859701} +{"Pretrain/Learning Rate": 1.694107159613664e-05, "Pretrain/Loss": 1.9786231517791748, "Pretrain/Loss (Raw)": 1.9782723188400269, "Pretrain/Step": 5878, "Pretrain/Step Time": 8.640827655792236} +{"Pretrain/Learning Rate": 1.6933035393192824e-05, "Pretrain/Loss": 1.9798223972320557, "Pretrain/Loss (Raw)": 2.047039031982422, "Pretrain/Step": 5879, "Pretrain/Step Time": 8.646790564060211} +{"Pretrain/Learning Rate": 1.6925000120569385e-05, "Pretrain/Loss": 1.9796559810638428, "Pretrain/Loss (Raw)": 2.056074619293213, "Pretrain/Step": 5880, "Pretrain/Step Time": 8.643146367743611} +{"Pretrain/Learning Rate": 1.6916965779192983e-05, "Pretrain/Loss": 1.9763541221618652, "Pretrain/Loss (Raw)": 2.042710542678833, "Pretrain/Step": 5881, "Pretrain/Step Time": 8.64716007374227} +{"Pretrain/Learning Rate": 1.6908932369990176e-05, "Pretrain/Loss": 1.9762375354766846, "Pretrain/Loss (Raw)": 1.984810471534729, "Pretrain/Step": 5882, "Pretrain/Step Time": 8.644237458705902} +{"Pretrain/Learning Rate": 1.6900899893887408e-05, "Pretrain/Loss": 1.9776116609573364, "Pretrain/Loss (Raw)": 2.002473831176758, "Pretrain/Step": 5883, "Pretrain/Step Time": 8.648558434098959} +{"Pretrain/Learning Rate": 1.6892868351811036e-05, "Pretrain/Loss": 1.9767184257507324, "Pretrain/Loss (Raw)": 1.8126085996627808, "Pretrain/Step": 5884, "Pretrain/Step Time": 8.651426503434777} +{"Pretrain/Learning Rate": 1.6884837744687284e-05, "Pretrain/Loss": 1.9724559783935547, "Pretrain/Loss (Raw)": 1.7225559949874878, "Pretrain/Step": 5885, "Pretrain/Step Time": 8.652721583843231} +{"Pretrain/Learning Rate": 1.687680807344229e-05, "Pretrain/Loss": 1.9730801582336426, "Pretrain/Loss (Raw)": 1.9886326789855957, "Pretrain/Step": 5886, "Pretrain/Step Time": 8.651027312502265} +{"Pretrain/Learning Rate": 1.6868779339002056e-05, "Pretrain/Loss": 1.9736835956573486, "Pretrain/Loss (Raw)": 1.9795328378677368, "Pretrain/Step": 5887, "Pretrain/Step Time": 8.648570615798235} +{"Pretrain/Learning Rate": 1.6860751542292515e-05, "Pretrain/Loss": 1.972456932067871, "Pretrain/Loss (Raw)": 1.919167160987854, "Pretrain/Step": 5888, "Pretrain/Step Time": 8.65486865118146} +{"Pretrain/Learning Rate": 1.685272468423945e-05, "Pretrain/Loss": 1.9710712432861328, "Pretrain/Loss (Raw)": 1.7826194763183594, "Pretrain/Step": 5889, "Pretrain/Step Time": 8.654621565714478} +{"Pretrain/Learning Rate": 1.6844698765768575e-05, "Pretrain/Loss": 1.9684855937957764, "Pretrain/Loss (Raw)": 1.93929123878479, "Pretrain/Step": 5890, "Pretrain/Step Time": 8.65342971868813} +{"Pretrain/Learning Rate": 1.6836673787805456e-05, "Pretrain/Loss": 1.9673385620117188, "Pretrain/Loss (Raw)": 1.841045618057251, "Pretrain/Step": 5891, "Pretrain/Step Time": 8.660608572885394} +{"Pretrain/Learning Rate": 1.6828649751275592e-05, "Pretrain/Loss": 1.9690148830413818, "Pretrain/Loss (Raw)": 1.98218834400177, "Pretrain/Step": 5892, "Pretrain/Step Time": 8.663651837036014} +{"Pretrain/Learning Rate": 1.682062665710434e-05, "Pretrain/Loss": 1.9704227447509766, "Pretrain/Loss (Raw)": 1.9205691814422607, "Pretrain/Step": 5893, "Pretrain/Step Time": 8.6680675316602} +{"Pretrain/Learning Rate": 1.6812604506216966e-05, "Pretrain/Loss": 1.971034288406372, "Pretrain/Loss (Raw)": 2.0126760005950928, "Pretrain/Step": 5894, "Pretrain/Step Time": 8.666017333045602} +{"Pretrain/Learning Rate": 1.6804583299538614e-05, "Pretrain/Loss": 1.971558928489685, "Pretrain/Loss (Raw)": 2.182903528213501, "Pretrain/Step": 5895, "Pretrain/Step Time": 8.66898206435144} +{"Pretrain/Learning Rate": 1.6796563037994347e-05, "Pretrain/Loss": 1.9707493782043457, "Pretrain/Loss (Raw)": 1.7202404737472534, "Pretrain/Step": 5896, "Pretrain/Step Time": 8.665870361030102} +{"Pretrain/Learning Rate": 1.678854372250907e-05, "Pretrain/Loss": 1.9662598371505737, "Pretrain/Loss (Raw)": 1.4872329235076904, "Pretrain/Step": 5897, "Pretrain/Step Time": 8.664375308901072} +{"Pretrain/Learning Rate": 1.6780525354007644e-05, "Pretrain/Loss": 1.966480016708374, "Pretrain/Loss (Raw)": 1.9142580032348633, "Pretrain/Step": 5898, "Pretrain/Step Time": 8.661623077467084} +{"Pretrain/Learning Rate": 1.6772507933414744e-05, "Pretrain/Loss": 1.9661154747009277, "Pretrain/Loss (Raw)": 1.9322103261947632, "Pretrain/Step": 5899, "Pretrain/Step Time": 8.6665414031595} +{"Pretrain/Learning Rate": 1.6764491461655017e-05, "Pretrain/Loss": 1.9658762216567993, "Pretrain/Loss (Raw)": 1.9757581949234009, "Pretrain/Step": 5900, "Pretrain/Step Time": 8.66368542984128} +{"Pretrain/Learning Rate": 1.6756475939652927e-05, "Pretrain/Loss": 1.9634838104248047, "Pretrain/Loss (Raw)": 1.9282292127609253, "Pretrain/Step": 5901, "Pretrain/Step Time": 8.66236656345427} +{"Pretrain/Learning Rate": 1.674846136833289e-05, "Pretrain/Loss": 1.963062047958374, "Pretrain/Loss (Raw)": 1.8528605699539185, "Pretrain/Step": 5902, "Pretrain/Step Time": 8.659860890358686} +{"Pretrain/Learning Rate": 1.6740447748619156e-05, "Pretrain/Loss": 1.9613354206085205, "Pretrain/Loss (Raw)": 1.7990033626556396, "Pretrain/Step": 5903, "Pretrain/Step Time": 8.661016315221786} +{"Pretrain/Learning Rate": 1.6732435081435924e-05, "Pretrain/Loss": 1.9592986106872559, "Pretrain/Loss (Raw)": 1.919916033744812, "Pretrain/Step": 5904, "Pretrain/Step Time": 8.667450273409486} +{"Pretrain/Learning Rate": 1.6724423367707226e-05, "Pretrain/Loss": 1.959071159362793, "Pretrain/Loss (Raw)": 2.090376138687134, "Pretrain/Step": 5905, "Pretrain/Step Time": 8.667322697117925} +{"Pretrain/Learning Rate": 1.6716412608357024e-05, "Pretrain/Loss": 1.9582552909851074, "Pretrain/Loss (Raw)": 1.8264037370681763, "Pretrain/Step": 5906, "Pretrain/Step Time": 8.670489402487874} +{"Pretrain/Learning Rate": 1.670840280430915e-05, "Pretrain/Loss": 1.9585602283477783, "Pretrain/Loss (Raw)": 1.7787144184112549, "Pretrain/Step": 5907, "Pretrain/Step Time": 8.66948682256043} +{"Pretrain/Learning Rate": 1.6700393956487342e-05, "Pretrain/Loss": 1.9633255004882812, "Pretrain/Loss (Raw)": 2.066147565841675, "Pretrain/Step": 5908, "Pretrain/Step Time": 8.66990383900702} +{"Pretrain/Learning Rate": 1.6692386065815203e-05, "Pretrain/Loss": 1.9655431509017944, "Pretrain/Loss (Raw)": 2.236729383468628, "Pretrain/Step": 5909, "Pretrain/Step Time": 8.673036359250546} +{"Pretrain/Learning Rate": 1.668437913321626e-05, "Pretrain/Loss": 1.9657963514328003, "Pretrain/Loss (Raw)": 2.1502108573913574, "Pretrain/Step": 5910, "Pretrain/Step Time": 8.67248484864831} +{"Pretrain/Learning Rate": 1.667637315961389e-05, "Pretrain/Loss": 1.9676315784454346, "Pretrain/Loss (Raw)": 2.117216110229492, "Pretrain/Step": 5911, "Pretrain/Step Time": 8.673220502212644} +{"Pretrain/Learning Rate": 1.6668368145931397e-05, "Pretrain/Loss": 1.9662044048309326, "Pretrain/Loss (Raw)": 1.9393547773361206, "Pretrain/Step": 5912, "Pretrain/Step Time": 8.678235640749335} +{"Pretrain/Learning Rate": 1.6660364093091945e-05, "Pretrain/Loss": 1.9643783569335938, "Pretrain/Loss (Raw)": 1.8448554277420044, "Pretrain/Step": 5913, "Pretrain/Step Time": 8.676630951464176} +{"Pretrain/Learning Rate": 1.6652361002018608e-05, "Pretrain/Loss": 1.9634933471679688, "Pretrain/Loss (Raw)": 1.988783836364746, "Pretrain/Step": 5914, "Pretrain/Step Time": 8.678347459062934} +{"Pretrain/Learning Rate": 1.664435887363433e-05, "Pretrain/Loss": 1.9636276960372925, "Pretrain/Loss (Raw)": 1.9913759231567383, "Pretrain/Step": 5915, "Pretrain/Step Time": 8.669006306678057} +{"Pretrain/Learning Rate": 1.6636357708861966e-05, "Pretrain/Loss": 1.964980959892273, "Pretrain/Loss (Raw)": 2.0013058185577393, "Pretrain/Step": 5916, "Pretrain/Step Time": 8.670617258176208} +{"Pretrain/Learning Rate": 1.6628357508624234e-05, "Pretrain/Loss": 1.96397066116333, "Pretrain/Loss (Raw)": 1.7581541538238525, "Pretrain/Step": 5917, "Pretrain/Step Time": 8.667910331860185} +{"Pretrain/Learning Rate": 1.662035827384377e-05, "Pretrain/Loss": 1.9644520282745361, "Pretrain/Loss (Raw)": 2.1187732219696045, "Pretrain/Step": 5918, "Pretrain/Step Time": 8.66603404097259} +{"Pretrain/Learning Rate": 1.661236000544307e-05, "Pretrain/Loss": 1.9649367332458496, "Pretrain/Loss (Raw)": 1.9730393886566162, "Pretrain/Step": 5919, "Pretrain/Step Time": 8.666683327406645} +{"Pretrain/Learning Rate": 1.660436270434454e-05, "Pretrain/Loss": 1.9671614170074463, "Pretrain/Loss (Raw)": 2.165036916732788, "Pretrain/Step": 5920, "Pretrain/Step Time": 8.667113101109862} +{"Pretrain/Learning Rate": 1.6596366371470466e-05, "Pretrain/Loss": 1.96694016456604, "Pretrain/Loss (Raw)": 2.1570937633514404, "Pretrain/Step": 5921, "Pretrain/Step Time": 8.667300650849938} +{"Pretrain/Learning Rate": 1.658837100774302e-05, "Pretrain/Loss": 1.969759225845337, "Pretrain/Loss (Raw)": 2.3705790042877197, "Pretrain/Step": 5922, "Pretrain/Step Time": 8.665745537728071} +{"Pretrain/Learning Rate": 1.658037661408427e-05, "Pretrain/Loss": 1.9705173969268799, "Pretrain/Loss (Raw)": 2.067131519317627, "Pretrain/Step": 5923, "Pretrain/Step Time": 8.668481776490808} +{"Pretrain/Learning Rate": 1.657238319141616e-05, "Pretrain/Loss": 1.970674753189087, "Pretrain/Loss (Raw)": 2.0700466632843018, "Pretrain/Step": 5924, "Pretrain/Step Time": 8.669487124308944} +{"Pretrain/Learning Rate": 1.656439074066053e-05, "Pretrain/Loss": 1.9704705476760864, "Pretrain/Loss (Raw)": 1.933603286743164, "Pretrain/Step": 5925, "Pretrain/Step Time": 8.66845920868218} +{"Pretrain/Learning Rate": 1.655639926273911e-05, "Pretrain/Loss": 1.9722840785980225, "Pretrain/Loss (Raw)": 2.1592347621917725, "Pretrain/Step": 5926, "Pretrain/Step Time": 8.671910734847188} +{"Pretrain/Learning Rate": 1.654840875857352e-05, "Pretrain/Loss": 1.9726229906082153, "Pretrain/Loss (Raw)": 2.0225396156311035, "Pretrain/Step": 5927, "Pretrain/Step Time": 8.665672067552805} +{"Pretrain/Learning Rate": 1.654041922908525e-05, "Pretrain/Loss": 1.972253680229187, "Pretrain/Loss (Raw)": 1.9499297142028809, "Pretrain/Step": 5928, "Pretrain/Step Time": 8.667911559343338} +{"Pretrain/Learning Rate": 1.6532430675195705e-05, "Pretrain/Loss": 1.9732413291931152, "Pretrain/Loss (Raw)": 1.9813326597213745, "Pretrain/Step": 5929, "Pretrain/Step Time": 8.664388628676534} +{"Pretrain/Learning Rate": 1.652444309782615e-05, "Pretrain/Loss": 1.97030770778656, "Pretrain/Loss (Raw)": 1.6993237733840942, "Pretrain/Step": 5930, "Pretrain/Step Time": 8.665378261357546} +{"Pretrain/Learning Rate": 1.651645649789776e-05, "Pretrain/Loss": 1.9714417457580566, "Pretrain/Loss (Raw)": 1.9504008293151855, "Pretrain/Step": 5931, "Pretrain/Step Time": 8.66402635537088} +{"Pretrain/Learning Rate": 1.6508470876331577e-05, "Pretrain/Loss": 1.9699122905731201, "Pretrain/Loss (Raw)": 1.978661060333252, "Pretrain/Step": 5932, "Pretrain/Step Time": 8.6626210026443} +{"Pretrain/Learning Rate": 1.650048623404855e-05, "Pretrain/Loss": 1.969260334968567, "Pretrain/Loss (Raw)": 2.0245521068573, "Pretrain/Step": 5933, "Pretrain/Step Time": 8.661817882210016} +{"Pretrain/Learning Rate": 1.6492502571969498e-05, "Pretrain/Loss": 1.9700188636779785, "Pretrain/Loss (Raw)": 1.9989060163497925, "Pretrain/Step": 5934, "Pretrain/Step Time": 8.6622483599931} +{"Pretrain/Learning Rate": 1.6484519891015143e-05, "Pretrain/Loss": 1.9691303968429565, "Pretrain/Loss (Raw)": 1.9167381525039673, "Pretrain/Step": 5935, "Pretrain/Step Time": 8.662793152034283} +{"Pretrain/Learning Rate": 1.647653819210607e-05, "Pretrain/Loss": 1.9707908630371094, "Pretrain/Loss (Raw)": 2.11592698097229, "Pretrain/Step": 5936, "Pretrain/Step Time": 8.656031291931868} +{"Pretrain/Learning Rate": 1.6468557476162793e-05, "Pretrain/Loss": 1.9697139263153076, "Pretrain/Loss (Raw)": 1.7157388925552368, "Pretrain/Step": 5937, "Pretrain/Step Time": 8.659111022949219} +{"Pretrain/Learning Rate": 1.6460577744105654e-05, "Pretrain/Loss": 1.968742847442627, "Pretrain/Loss (Raw)": 1.912684679031372, "Pretrain/Step": 5938, "Pretrain/Step Time": 8.66578477434814} +{"Pretrain/Learning Rate": 1.6452598996854943e-05, "Pretrain/Loss": 1.9687976837158203, "Pretrain/Loss (Raw)": 1.9206790924072266, "Pretrain/Step": 5939, "Pretrain/Step Time": 8.66352117061615} +{"Pretrain/Learning Rate": 1.6444621235330777e-05, "Pretrain/Loss": 1.9699043035507202, "Pretrain/Loss (Raw)": 2.0173933506011963, "Pretrain/Step": 5940, "Pretrain/Step Time": 8.667289873585105} +{"Pretrain/Learning Rate": 1.6436644460453217e-05, "Pretrain/Loss": 1.969327688217163, "Pretrain/Loss (Raw)": 1.8893641233444214, "Pretrain/Step": 5941, "Pretrain/Step Time": 8.670348301529884} +{"Pretrain/Learning Rate": 1.642866867314216e-05, "Pretrain/Loss": 1.9688076972961426, "Pretrain/Loss (Raw)": 1.886668086051941, "Pretrain/Step": 5942, "Pretrain/Step Time": 8.678151052445173} +{"Pretrain/Learning Rate": 1.642069387431743e-05, "Pretrain/Loss": 1.9696727991104126, "Pretrain/Loss (Raw)": 1.8935643434524536, "Pretrain/Step": 5943, "Pretrain/Step Time": 8.678904250264168} +{"Pretrain/Learning Rate": 1.64127200648987e-05, "Pretrain/Loss": 1.973522424697876, "Pretrain/Loss (Raw)": 2.125312089920044, "Pretrain/Step": 5944, "Pretrain/Step Time": 8.683366667479277} +{"Pretrain/Learning Rate": 1.6404747245805567e-05, "Pretrain/Loss": 1.9725828170776367, "Pretrain/Loss (Raw)": 1.9761440753936768, "Pretrain/Step": 5945, "Pretrain/Step Time": 8.681543782353401} +{"Pretrain/Learning Rate": 1.6396775417957478e-05, "Pretrain/Loss": 1.9748201370239258, "Pretrain/Loss (Raw)": 2.2971625328063965, "Pretrain/Step": 5946, "Pretrain/Step Time": 8.682076629251242} +{"Pretrain/Learning Rate": 1.6388804582273788e-05, "Pretrain/Loss": 1.9753310680389404, "Pretrain/Loss (Raw)": 1.9345749616622925, "Pretrain/Step": 5947, "Pretrain/Step Time": 8.678150363266468} +{"Pretrain/Learning Rate": 1.6380834739673727e-05, "Pretrain/Loss": 1.974808692932129, "Pretrain/Loss (Raw)": 1.9321486949920654, "Pretrain/Step": 5948, "Pretrain/Step Time": 8.67709207907319} +{"Pretrain/Learning Rate": 1.6372865891076426e-05, "Pretrain/Loss": 1.9730541706085205, "Pretrain/Loss (Raw)": 1.8049767017364502, "Pretrain/Step": 5949, "Pretrain/Step Time": 8.676473328843713} +{"Pretrain/Learning Rate": 1.6364898037400876e-05, "Pretrain/Loss": 1.9746685028076172, "Pretrain/Loss (Raw)": 2.121166944503784, "Pretrain/Step": 5950, "Pretrain/Step Time": 8.67718324251473} +{"Pretrain/Learning Rate": 1.6356931179565978e-05, "Pretrain/Loss": 1.9761888980865479, "Pretrain/Loss (Raw)": 2.1030540466308594, "Pretrain/Step": 5951, "Pretrain/Step Time": 8.68022639118135} +{"Pretrain/Learning Rate": 1.63489653184905e-05, "Pretrain/Loss": 1.9762674570083618, "Pretrain/Loss (Raw)": 1.9514522552490234, "Pretrain/Step": 5952, "Pretrain/Step Time": 8.67663537338376} +{"Pretrain/Learning Rate": 1.6341000455093115e-05, "Pretrain/Loss": 1.974083423614502, "Pretrain/Loss (Raw)": 1.8634740114212036, "Pretrain/Step": 5953, "Pretrain/Step Time": 8.684167874976993} +{"Pretrain/Learning Rate": 1.633303659029235e-05, "Pretrain/Loss": 1.9735223054885864, "Pretrain/Loss (Raw)": 2.2072246074676514, "Pretrain/Step": 5954, "Pretrain/Step Time": 8.684760060161352} +{"Pretrain/Learning Rate": 1.6325073725006654e-05, "Pretrain/Loss": 1.9732105731964111, "Pretrain/Loss (Raw)": 2.0336508750915527, "Pretrain/Step": 5955, "Pretrain/Step Time": 8.682665238156915} +{"Pretrain/Learning Rate": 1.6317111860154328e-05, "Pretrain/Loss": 1.9743068218231201, "Pretrain/Loss (Raw)": 2.1562559604644775, "Pretrain/Step": 5956, "Pretrain/Step Time": 8.682611059397459} +{"Pretrain/Learning Rate": 1.6309150996653582e-05, "Pretrain/Loss": 1.9753395318984985, "Pretrain/Loss (Raw)": 2.0149714946746826, "Pretrain/Step": 5957, "Pretrain/Step Time": 8.685864312574267} +{"Pretrain/Learning Rate": 1.630119113542249e-05, "Pretrain/Loss": 1.971089243888855, "Pretrain/Loss (Raw)": 1.5142470598220825, "Pretrain/Step": 5958, "Pretrain/Step Time": 8.685636645182967} +{"Pretrain/Learning Rate": 1.629323227737903e-05, "Pretrain/Loss": 1.9702540636062622, "Pretrain/Loss (Raw)": 1.6114935874938965, "Pretrain/Step": 5959, "Pretrain/Step Time": 8.681395579129457} +{"Pretrain/Learning Rate": 1.628527442344105e-05, "Pretrain/Loss": 1.9732335805892944, "Pretrain/Loss (Raw)": 2.2327778339385986, "Pretrain/Step": 5960, "Pretrain/Step Time": 8.68031764216721} +{"Pretrain/Learning Rate": 1.6277317574526284e-05, "Pretrain/Loss": 1.9746005535125732, "Pretrain/Loss (Raw)": 1.9515281915664673, "Pretrain/Step": 5961, "Pretrain/Step Time": 8.67669309861958} +{"Pretrain/Learning Rate": 1.626936173155237e-05, "Pretrain/Loss": 1.9754900932312012, "Pretrain/Loss (Raw)": 2.1237494945526123, "Pretrain/Step": 5962, "Pretrain/Step Time": 8.67798475548625} +{"Pretrain/Learning Rate": 1.626140689543679e-05, "Pretrain/Loss": 1.973337173461914, "Pretrain/Loss (Raw)": 1.759042501449585, "Pretrain/Step": 5963, "Pretrain/Step Time": 8.677150432020426} +{"Pretrain/Learning Rate": 1.6253453067096954e-05, "Pretrain/Loss": 1.9713099002838135, "Pretrain/Loss (Raw)": 1.8506946563720703, "Pretrain/Step": 5964, "Pretrain/Step Time": 8.679736603051424} +{"Pretrain/Learning Rate": 1.6245500247450114e-05, "Pretrain/Loss": 1.9716243743896484, "Pretrain/Loss (Raw)": 1.9777802228927612, "Pretrain/Step": 5965, "Pretrain/Step Time": 8.677339090034366} +{"Pretrain/Learning Rate": 1.6237548437413448e-05, "Pretrain/Loss": 1.9704861640930176, "Pretrain/Loss (Raw)": 1.9058185815811157, "Pretrain/Step": 5966, "Pretrain/Step Time": 8.67822433821857} +{"Pretrain/Learning Rate": 1.622959763790398e-05, "Pretrain/Loss": 1.9717636108398438, "Pretrain/Loss (Raw)": 2.151704788208008, "Pretrain/Step": 5967, "Pretrain/Step Time": 8.679281286895275} +{"Pretrain/Learning Rate": 1.6221647849838645e-05, "Pretrain/Loss": 1.968492031097412, "Pretrain/Loss (Raw)": 1.9486737251281738, "Pretrain/Step": 5968, "Pretrain/Step Time": 8.677162332460284} +{"Pretrain/Learning Rate": 1.621369907413424e-05, "Pretrain/Loss": 1.9694428443908691, "Pretrain/Loss (Raw)": 2.0274858474731445, "Pretrain/Step": 5969, "Pretrain/Step Time": 8.682171568274498} +{"Pretrain/Learning Rate": 1.6205751311707463e-05, "Pretrain/Loss": 1.9699803590774536, "Pretrain/Loss (Raw)": 2.139265537261963, "Pretrain/Step": 5970, "Pretrain/Step Time": 8.679389774799347} +{"Pretrain/Learning Rate": 1.6197804563474882e-05, "Pretrain/Loss": 1.9691734313964844, "Pretrain/Loss (Raw)": 1.882423758506775, "Pretrain/Step": 5971, "Pretrain/Step Time": 8.678215188905597} +{"Pretrain/Learning Rate": 1.6189858830352962e-05, "Pretrain/Loss": 1.966235637664795, "Pretrain/Loss (Raw)": 1.5714120864868164, "Pretrain/Step": 5972, "Pretrain/Step Time": 8.678748842328787} +{"Pretrain/Learning Rate": 1.618191411325803e-05, "Pretrain/Loss": 1.9622248411178589, "Pretrain/Loss (Raw)": 1.2710237503051758, "Pretrain/Step": 5973, "Pretrain/Step Time": 8.67954353056848} +{"Pretrain/Learning Rate": 1.617397041310632e-05, "Pretrain/Loss": 1.9613726139068604, "Pretrain/Loss (Raw)": 1.9224882125854492, "Pretrain/Step": 5974, "Pretrain/Step Time": 8.677963616326451} +{"Pretrain/Learning Rate": 1.6166027730813926e-05, "Pretrain/Loss": 1.9589970111846924, "Pretrain/Loss (Raw)": 1.7273294925689697, "Pretrain/Step": 5975, "Pretrain/Step Time": 8.67777405679226} +{"Pretrain/Learning Rate": 1.6158086067296844e-05, "Pretrain/Loss": 1.9592862129211426, "Pretrain/Loss (Raw)": 1.798740267753601, "Pretrain/Step": 5976, "Pretrain/Step Time": 8.674813525751233} +{"Pretrain/Learning Rate": 1.615014542347094e-05, "Pretrain/Loss": 1.9573404788970947, "Pretrain/Loss (Raw)": 1.9148951768875122, "Pretrain/Step": 5977, "Pretrain/Step Time": 8.679874312132597} +{"Pretrain/Learning Rate": 1.6142205800251968e-05, "Pretrain/Loss": 1.9590041637420654, "Pretrain/Loss (Raw)": 1.8860793113708496, "Pretrain/Step": 5978, "Pretrain/Step Time": 8.67763714119792} +{"Pretrain/Learning Rate": 1.6134267198555563e-05, "Pretrain/Loss": 1.9560898542404175, "Pretrain/Loss (Raw)": 1.7334775924682617, "Pretrain/Step": 5979, "Pretrain/Step Time": 8.682571256533265} +{"Pretrain/Learning Rate": 1.612632961929725e-05, "Pretrain/Loss": 1.956571102142334, "Pretrain/Loss (Raw)": 1.935142993927002, "Pretrain/Step": 5980, "Pretrain/Step Time": 8.67891425639391} +{"Pretrain/Learning Rate": 1.6118393063392402e-05, "Pretrain/Loss": 1.953361988067627, "Pretrain/Loss (Raw)": 1.6987485885620117, "Pretrain/Step": 5981, "Pretrain/Step Time": 8.680674102157354} +{"Pretrain/Learning Rate": 1.6110457531756334e-05, "Pretrain/Loss": 1.9533392190933228, "Pretrain/Loss (Raw)": 1.9434716701507568, "Pretrain/Step": 5982, "Pretrain/Step Time": 8.682830614969134} +{"Pretrain/Learning Rate": 1.6102523025304178e-05, "Pretrain/Loss": 1.954740285873413, "Pretrain/Loss (Raw)": 2.2498526573181152, "Pretrain/Step": 5983, "Pretrain/Step Time": 8.683222621679306} +{"Pretrain/Learning Rate": 1.6094589544951006e-05, "Pretrain/Loss": 1.9554407596588135, "Pretrain/Loss (Raw)": 1.9602781534194946, "Pretrain/Step": 5984, "Pretrain/Step Time": 8.686240868642926} +{"Pretrain/Learning Rate": 1.6086657091611718e-05, "Pretrain/Loss": 1.9530820846557617, "Pretrain/Loss (Raw)": 1.9358359575271606, "Pretrain/Step": 5985, "Pretrain/Step Time": 8.68122911080718} +{"Pretrain/Learning Rate": 1.607872566620115e-05, "Pretrain/Loss": 1.95304536819458, "Pretrain/Loss (Raw)": 1.9570765495300293, "Pretrain/Step": 5986, "Pretrain/Step Time": 8.682307353243232} +{"Pretrain/Learning Rate": 1.6070795269633964e-05, "Pretrain/Loss": 1.9520008563995361, "Pretrain/Loss (Raw)": 2.0335826873779297, "Pretrain/Step": 5987, "Pretrain/Step Time": 8.680342473089695} +{"Pretrain/Learning Rate": 1.6062865902824754e-05, "Pretrain/Loss": 1.9512152671813965, "Pretrain/Loss (Raw)": 1.9472419023513794, "Pretrain/Step": 5988, "Pretrain/Step Time": 8.683222325518727} +{"Pretrain/Learning Rate": 1.605493756668795e-05, "Pretrain/Loss": 1.9514175653457642, "Pretrain/Loss (Raw)": 1.9252740144729614, "Pretrain/Step": 5989, "Pretrain/Step Time": 8.681678745895624} +{"Pretrain/Learning Rate": 1.6047010262137908e-05, "Pretrain/Loss": 1.9495375156402588, "Pretrain/Loss (Raw)": 1.9463412761688232, "Pretrain/Step": 5990, "Pretrain/Step Time": 8.683587411418557} +{"Pretrain/Learning Rate": 1.603908399008882e-05, "Pretrain/Loss": 1.9519020318984985, "Pretrain/Loss (Raw)": 2.16603684425354, "Pretrain/Step": 5991, "Pretrain/Step Time": 8.68049594387412} +{"Pretrain/Learning Rate": 1.60311587514548e-05, "Pretrain/Loss": 1.953047275543213, "Pretrain/Loss (Raw)": 1.9450831413269043, "Pretrain/Step": 5992, "Pretrain/Step Time": 8.680715221911669} +{"Pretrain/Learning Rate": 1.6023234547149808e-05, "Pretrain/Loss": 1.9528931379318237, "Pretrain/Loss (Raw)": 2.1220083236694336, "Pretrain/Step": 5993, "Pretrain/Step Time": 8.676418293267488} +{"Pretrain/Learning Rate": 1.6015311378087714e-05, "Pretrain/Loss": 1.9548449516296387, "Pretrain/Loss (Raw)": 2.0013930797576904, "Pretrain/Step": 5994, "Pretrain/Step Time": 8.68034902215004} +{"Pretrain/Learning Rate": 1.600738924518224e-05, "Pretrain/Loss": 1.9574790000915527, "Pretrain/Loss (Raw)": 1.9449164867401123, "Pretrain/Step": 5995, "Pretrain/Step Time": 8.676585733890533} +{"Pretrain/Learning Rate": 1.5999468149347024e-05, "Pretrain/Loss": 1.9570355415344238, "Pretrain/Loss (Raw)": 1.8993288278579712, "Pretrain/Step": 5996, "Pretrain/Step Time": 8.677747167646885} +{"Pretrain/Learning Rate": 1.5991548091495546e-05, "Pretrain/Loss": 1.9584949016571045, "Pretrain/Loss (Raw)": 1.967513084411621, "Pretrain/Step": 5997, "Pretrain/Step Time": 8.675260750576854} +{"Pretrain/Learning Rate": 1.5983629072541196e-05, "Pretrain/Loss": 1.9581748247146606, "Pretrain/Loss (Raw)": 2.0447030067443848, "Pretrain/Step": 5998, "Pretrain/Step Time": 8.677076691761613} +{"Pretrain/Learning Rate": 1.597571109339722e-05, "Pretrain/Loss": 1.9612739086151123, "Pretrain/Loss (Raw)": 2.3494908809661865, "Pretrain/Step": 5999, "Pretrain/Step Time": 8.677570343017578} +{"Pretrain/Learning Rate": 1.5967794154976773e-05, "Pretrain/Loss": 1.9617186784744263, "Pretrain/Loss (Raw)": 2.084909439086914, "Pretrain/Step": 6000, "Pretrain/Step Time": 8.677925646305084} +{"Pretrain/Learning Rate": 1.5959878258192863e-05, "Pretrain/Loss": 1.9626879692077637, "Pretrain/Loss (Raw)": 2.0896682739257812, "Pretrain/Step": 6001, "Pretrain/Step Time": 8.681038478389382} +{"Pretrain/Learning Rate": 1.5951963403958382e-05, "Pretrain/Loss": 1.9608876705169678, "Pretrain/Loss (Raw)": 2.049785852432251, "Pretrain/Step": 6002, "Pretrain/Step Time": 8.679059544578195} +{"Pretrain/Learning Rate": 1.5944049593186127e-05, "Pretrain/Loss": 1.960031270980835, "Pretrain/Loss (Raw)": 1.994513988494873, "Pretrain/Step": 6003, "Pretrain/Step Time": 8.674887558445334} +{"Pretrain/Learning Rate": 1.5936136826788745e-05, "Pretrain/Loss": 1.9615479707717896, "Pretrain/Loss (Raw)": 1.9813672304153442, "Pretrain/Step": 6004, "Pretrain/Step Time": 8.674977468326688} +{"Pretrain/Learning Rate": 1.5928225105678774e-05, "Pretrain/Loss": 1.96249258518219, "Pretrain/Loss (Raw)": 2.19832706451416, "Pretrain/Step": 6005, "Pretrain/Step Time": 8.672138066962361} +{"Pretrain/Learning Rate": 1.592031443076863e-05, "Pretrain/Loss": 1.9615185260772705, "Pretrain/Loss (Raw)": 1.8536020517349243, "Pretrain/Step": 6006, "Pretrain/Step Time": 8.671695606783032} +{"Pretrain/Learning Rate": 1.591240480297061e-05, "Pretrain/Loss": 1.9593182802200317, "Pretrain/Loss (Raw)": 1.765398383140564, "Pretrain/Step": 6007, "Pretrain/Step Time": 8.669412732124329} +{"Pretrain/Learning Rate": 1.590449622319689e-05, "Pretrain/Loss": 1.9578324556350708, "Pretrain/Loss (Raw)": 1.8658994436264038, "Pretrain/Step": 6008, "Pretrain/Step Time": 8.6730537135154} +{"Pretrain/Learning Rate": 1.589658869235953e-05, "Pretrain/Loss": 1.9578962326049805, "Pretrain/Loss (Raw)": 2.05086612701416, "Pretrain/Step": 6009, "Pretrain/Step Time": 8.667910307645798} +{"Pretrain/Learning Rate": 1.588868221137045e-05, "Pretrain/Loss": 1.958439826965332, "Pretrain/Loss (Raw)": 2.0543928146362305, "Pretrain/Step": 6010, "Pretrain/Step Time": 8.668442575260997} +{"Pretrain/Learning Rate": 1.588077678114148e-05, "Pretrain/Loss": 1.9597198963165283, "Pretrain/Loss (Raw)": 2.1663308143615723, "Pretrain/Step": 6011, "Pretrain/Step Time": 8.669164463877678} +{"Pretrain/Learning Rate": 1.5872872402584296e-05, "Pretrain/Loss": 1.9629722833633423, "Pretrain/Loss (Raw)": 2.2289133071899414, "Pretrain/Step": 6012, "Pretrain/Step Time": 8.66554855927825} +{"Pretrain/Learning Rate": 1.586496907661048e-05, "Pretrain/Loss": 1.9655730724334717, "Pretrain/Loss (Raw)": 2.055459976196289, "Pretrain/Step": 6013, "Pretrain/Step Time": 8.665823563933372} +{"Pretrain/Learning Rate": 1.5857066804131472e-05, "Pretrain/Loss": 1.9660484790802002, "Pretrain/Loss (Raw)": 2.049487829208374, "Pretrain/Step": 6014, "Pretrain/Step Time": 8.665863811969757} +{"Pretrain/Learning Rate": 1.5849165586058608e-05, "Pretrain/Loss": 1.9669203758239746, "Pretrain/Loss (Raw)": 2.091118574142456, "Pretrain/Step": 6015, "Pretrain/Step Time": 8.668377110734582} +{"Pretrain/Learning Rate": 1.5841265423303084e-05, "Pretrain/Loss": 1.967987060546875, "Pretrain/Loss (Raw)": 2.055704355239868, "Pretrain/Step": 6016, "Pretrain/Step Time": 8.659564416855574} +{"Pretrain/Learning Rate": 1.5833366316775994e-05, "Pretrain/Loss": 1.9699965715408325, "Pretrain/Loss (Raw)": 2.0398387908935547, "Pretrain/Step": 6017, "Pretrain/Step Time": 8.664920967072248} +{"Pretrain/Learning Rate": 1.582546826738829e-05, "Pretrain/Loss": 1.971268892288208, "Pretrain/Loss (Raw)": 2.102156400680542, "Pretrain/Step": 6018, "Pretrain/Step Time": 8.666617704555392} +{"Pretrain/Learning Rate": 1.581757127605082e-05, "Pretrain/Loss": 1.9713990688323975, "Pretrain/Loss (Raw)": 1.8577113151550293, "Pretrain/Step": 6019, "Pretrain/Step Time": 8.663168299943209} +{"Pretrain/Learning Rate": 1.5809675343674295e-05, "Pretrain/Loss": 1.9727914333343506, "Pretrain/Loss (Raw)": 2.160395860671997, "Pretrain/Step": 6020, "Pretrain/Step Time": 8.66122874058783} +{"Pretrain/Learning Rate": 1.5801780471169324e-05, "Pretrain/Loss": 1.9732446670532227, "Pretrain/Loss (Raw)": 1.9785761833190918, "Pretrain/Step": 6021, "Pretrain/Step Time": 8.662108043208718} +{"Pretrain/Learning Rate": 1.579388665944636e-05, "Pretrain/Loss": 1.9726474285125732, "Pretrain/Loss (Raw)": 1.93623685836792, "Pretrain/Step": 6022, "Pretrain/Step Time": 8.663482068106532} +{"Pretrain/Learning Rate": 1.578599390941578e-05, "Pretrain/Loss": 1.9722355604171753, "Pretrain/Loss (Raw)": 2.1301968097686768, "Pretrain/Step": 6023, "Pretrain/Step Time": 8.657936053350568} +{"Pretrain/Learning Rate": 1.577810222198779e-05, "Pretrain/Loss": 1.9746744632720947, "Pretrain/Loss (Raw)": 2.0324177742004395, "Pretrain/Step": 6024, "Pretrain/Step Time": 8.659277260303497} +{"Pretrain/Learning Rate": 1.577021159807252e-05, "Pretrain/Loss": 1.9791308641433716, "Pretrain/Loss (Raw)": 2.0576446056365967, "Pretrain/Step": 6025, "Pretrain/Step Time": 8.661049330607057} +{"Pretrain/Learning Rate": 1.5762322038579925e-05, "Pretrain/Loss": 1.9766426086425781, "Pretrain/Loss (Raw)": 1.595765471458435, "Pretrain/Step": 6026, "Pretrain/Step Time": 8.664979299530387} +{"Pretrain/Learning Rate": 1.5754433544419893e-05, "Pretrain/Loss": 1.9777421951293945, "Pretrain/Loss (Raw)": 2.0729620456695557, "Pretrain/Step": 6027, "Pretrain/Step Time": 8.658584566786885} +{"Pretrain/Learning Rate": 1.574654611650214e-05, "Pretrain/Loss": 1.978540062904358, "Pretrain/Loss (Raw)": 2.0778753757476807, "Pretrain/Step": 6028, "Pretrain/Step Time": 8.658011673018336} +{"Pretrain/Learning Rate": 1.5738659755736308e-05, "Pretrain/Loss": 1.9787886142730713, "Pretrain/Loss (Raw)": 1.9600332975387573, "Pretrain/Step": 6029, "Pretrain/Step Time": 8.661094455048442} +{"Pretrain/Learning Rate": 1.5730774463031862e-05, "Pretrain/Loss": 1.979831337928772, "Pretrain/Loss (Raw)": 1.9863488674163818, "Pretrain/Step": 6030, "Pretrain/Step Time": 8.663708040490746} +{"Pretrain/Learning Rate": 1.572289023929819e-05, "Pretrain/Loss": 1.9823349714279175, "Pretrain/Loss (Raw)": 2.119459390640259, "Pretrain/Step": 6031, "Pretrain/Step Time": 8.664575992152095} +{"Pretrain/Learning Rate": 1.5715007085444523e-05, "Pretrain/Loss": 1.9817780256271362, "Pretrain/Loss (Raw)": 1.8486287593841553, "Pretrain/Step": 6032, "Pretrain/Step Time": 8.659760106354952} +{"Pretrain/Learning Rate": 1.5707125002379996e-05, "Pretrain/Loss": 1.9812066555023193, "Pretrain/Loss (Raw)": 2.0172486305236816, "Pretrain/Step": 6033, "Pretrain/Step Time": 8.659306667745113} +{"Pretrain/Learning Rate": 1.56992439910136e-05, "Pretrain/Loss": 1.9822700023651123, "Pretrain/Loss (Raw)": 1.9625024795532227, "Pretrain/Step": 6034, "Pretrain/Step Time": 8.654179356992245} +{"Pretrain/Learning Rate": 1.569136405225422e-05, "Pretrain/Loss": 1.9841668605804443, "Pretrain/Loss (Raw)": 2.0215201377868652, "Pretrain/Step": 6035, "Pretrain/Step Time": 8.651308281347156} +{"Pretrain/Learning Rate": 1.5683485187010593e-05, "Pretrain/Loss": 1.983379602432251, "Pretrain/Loss (Raw)": 1.965378999710083, "Pretrain/Step": 6036, "Pretrain/Step Time": 8.653427004814148} +{"Pretrain/Learning Rate": 1.5675607396191366e-05, "Pretrain/Loss": 1.9814579486846924, "Pretrain/Loss (Raw)": 1.9907344579696655, "Pretrain/Step": 6037, "Pretrain/Step Time": 8.65347364731133} +{"Pretrain/Learning Rate": 1.5667730680705022e-05, "Pretrain/Loss": 1.977663278579712, "Pretrain/Loss (Raw)": 1.664511799812317, "Pretrain/Step": 6038, "Pretrain/Step Time": 8.653946785256267} +{"Pretrain/Learning Rate": 1.5659855041459955e-05, "Pretrain/Loss": 1.9782236814498901, "Pretrain/Loss (Raw)": 2.1889519691467285, "Pretrain/Step": 6039, "Pretrain/Step Time": 8.653406528756022} +{"Pretrain/Learning Rate": 1.5651980479364416e-05, "Pretrain/Loss": 1.9811278581619263, "Pretrain/Loss (Raw)": 2.311094045639038, "Pretrain/Step": 6040, "Pretrain/Step Time": 8.64684266410768} +{"Pretrain/Learning Rate": 1.564410699532654e-05, "Pretrain/Loss": 1.9819340705871582, "Pretrain/Loss (Raw)": 1.9480397701263428, "Pretrain/Step": 6041, "Pretrain/Step Time": 8.653204565867782} +{"Pretrain/Learning Rate": 1.5636234590254324e-05, "Pretrain/Loss": 1.983083963394165, "Pretrain/Loss (Raw)": 2.135969877243042, "Pretrain/Step": 6042, "Pretrain/Step Time": 8.651280958205462} +{"Pretrain/Learning Rate": 1.5628363265055664e-05, "Pretrain/Loss": 1.983374834060669, "Pretrain/Loss (Raw)": 2.0286178588867188, "Pretrain/Step": 6043, "Pretrain/Step Time": 8.65755806863308} +{"Pretrain/Learning Rate": 1.5620493020638315e-05, "Pretrain/Loss": 1.9847015142440796, "Pretrain/Loss (Raw)": 2.171112060546875, "Pretrain/Step": 6044, "Pretrain/Step Time": 8.653003042563796} +{"Pretrain/Learning Rate": 1.5612623857909904e-05, "Pretrain/Loss": 1.98563814163208, "Pretrain/Loss (Raw)": 1.8780322074890137, "Pretrain/Step": 6045, "Pretrain/Step Time": 8.65447716228664} +{"Pretrain/Learning Rate": 1.5604755777777948e-05, "Pretrain/Loss": 1.9847049713134766, "Pretrain/Loss (Raw)": 1.9993314743041992, "Pretrain/Step": 6046, "Pretrain/Step Time": 8.655836472287774} +{"Pretrain/Learning Rate": 1.5596888781149827e-05, "Pretrain/Loss": 1.9861018657684326, "Pretrain/Loss (Raw)": 2.15183162689209, "Pretrain/Step": 6047, "Pretrain/Step Time": 8.652122193947434} +{"Pretrain/Learning Rate": 1.55890228689328e-05, "Pretrain/Loss": 1.9854044914245605, "Pretrain/Loss (Raw)": 2.0757904052734375, "Pretrain/Step": 6048, "Pretrain/Step Time": 8.653607454150915} +{"Pretrain/Learning Rate": 1.5581158042034e-05, "Pretrain/Loss": 1.9857159852981567, "Pretrain/Loss (Raw)": 2.196969509124756, "Pretrain/Step": 6049, "Pretrain/Step Time": 8.662236295640469} +{"Pretrain/Learning Rate": 1.557329430136044e-05, "Pretrain/Loss": 1.9812238216400146, "Pretrain/Loss (Raw)": 1.795575499534607, "Pretrain/Step": 6050, "Pretrain/Step Time": 8.663599519059062} +{"Pretrain/Learning Rate": 1.5565431647819e-05, "Pretrain/Loss": 1.980299949645996, "Pretrain/Loss (Raw)": 1.9488791227340698, "Pretrain/Step": 6051, "Pretrain/Step Time": 8.660240853205323} +{"Pretrain/Learning Rate": 1.555757008231644e-05, "Pretrain/Loss": 1.9795730113983154, "Pretrain/Loss (Raw)": 1.976995587348938, "Pretrain/Step": 6052, "Pretrain/Step Time": 8.663166925311089} +{"Pretrain/Learning Rate": 1.5549709605759393e-05, "Pretrain/Loss": 1.9799423217773438, "Pretrain/Loss (Raw)": 1.9808621406555176, "Pretrain/Step": 6053, "Pretrain/Step Time": 8.663686506450176} +{"Pretrain/Learning Rate": 1.5541850219054366e-05, "Pretrain/Loss": 1.9791414737701416, "Pretrain/Loss (Raw)": 2.0567352771759033, "Pretrain/Step": 6054, "Pretrain/Step Time": 8.661719316616654} +{"Pretrain/Learning Rate": 1.5533991923107737e-05, "Pretrain/Loss": 1.9789655208587646, "Pretrain/Loss (Raw)": 2.0000109672546387, "Pretrain/Step": 6055, "Pretrain/Step Time": 8.663849875330925} +{"Pretrain/Learning Rate": 1.552613471882577e-05, "Pretrain/Loss": 1.977315902709961, "Pretrain/Loss (Raw)": 1.7387970685958862, "Pretrain/Step": 6056, "Pretrain/Step Time": 8.65818196721375} +{"Pretrain/Learning Rate": 1.5518278607114585e-05, "Pretrain/Loss": 1.977329134941101, "Pretrain/Loss (Raw)": 1.9830093383789062, "Pretrain/Step": 6057, "Pretrain/Step Time": 8.656745225191116} +{"Pretrain/Learning Rate": 1.5510423588880194e-05, "Pretrain/Loss": 1.9800543785095215, "Pretrain/Loss (Raw)": 2.048175811767578, "Pretrain/Step": 6058, "Pretrain/Step Time": 8.656825235113502} +{"Pretrain/Learning Rate": 1.5502569665028465e-05, "Pretrain/Loss": 1.9807446002960205, "Pretrain/Loss (Raw)": 2.038738489151001, "Pretrain/Step": 6059, "Pretrain/Step Time": 8.659524742513895} +{"Pretrain/Learning Rate": 1.549471683646516e-05, "Pretrain/Loss": 1.9826399087905884, "Pretrain/Loss (Raw)": 2.2212700843811035, "Pretrain/Step": 6060, "Pretrain/Step Time": 8.661518467590213} +{"Pretrain/Learning Rate": 1.54868651040959e-05, "Pretrain/Loss": 1.9818439483642578, "Pretrain/Loss (Raw)": 1.9226619005203247, "Pretrain/Step": 6061, "Pretrain/Step Time": 8.659597106277943} +{"Pretrain/Learning Rate": 1.5479014468826184e-05, "Pretrain/Loss": 1.9817695617675781, "Pretrain/Loss (Raw)": 1.9893741607666016, "Pretrain/Step": 6062, "Pretrain/Step Time": 8.661234999075532} +{"Pretrain/Learning Rate": 1.547116493156138e-05, "Pretrain/Loss": 1.9827799797058105, "Pretrain/Loss (Raw)": 2.046088933944702, "Pretrain/Step": 6063, "Pretrain/Step Time": 8.661967473104596} +{"Pretrain/Learning Rate": 1.5463316493206748e-05, "Pretrain/Loss": 1.9838694334030151, "Pretrain/Loss (Raw)": 2.25536847114563, "Pretrain/Step": 6064, "Pretrain/Step Time": 8.661964133381844} +{"Pretrain/Learning Rate": 1.545546915466738e-05, "Pretrain/Loss": 1.9849920272827148, "Pretrain/Loss (Raw)": 1.859430193901062, "Pretrain/Step": 6065, "Pretrain/Step Time": 8.667993718758225} +{"Pretrain/Learning Rate": 1.54476229168483e-05, "Pretrain/Loss": 1.9827154874801636, "Pretrain/Loss (Raw)": 1.6212880611419678, "Pretrain/Step": 6066, "Pretrain/Step Time": 8.662266364321113} +{"Pretrain/Learning Rate": 1.543977778065434e-05, "Pretrain/Loss": 1.9834904670715332, "Pretrain/Loss (Raw)": 2.0198726654052734, "Pretrain/Step": 6067, "Pretrain/Step Time": 8.663765728473663} +{"Pretrain/Learning Rate": 1.5431933746990276e-05, "Pretrain/Loss": 1.983076810836792, "Pretrain/Loss (Raw)": 1.964451789855957, "Pretrain/Step": 6068, "Pretrain/Step Time": 8.65845463424921} +{"Pretrain/Learning Rate": 1.542409081676068e-05, "Pretrain/Loss": 1.983534812927246, "Pretrain/Loss (Raw)": 1.9479825496673584, "Pretrain/Step": 6069, "Pretrain/Step Time": 8.65604443475604} +{"Pretrain/Learning Rate": 1.541624899087007e-05, "Pretrain/Loss": 1.9835492372512817, "Pretrain/Loss (Raw)": 1.8885211944580078, "Pretrain/Step": 6070, "Pretrain/Step Time": 8.647763537243009} +{"Pretrain/Learning Rate": 1.5408408270222773e-05, "Pretrain/Loss": 1.983006477355957, "Pretrain/Loss (Raw)": 1.8240766525268555, "Pretrain/Step": 6071, "Pretrain/Step Time": 8.645527981221676} +{"Pretrain/Learning Rate": 1.5400568655723043e-05, "Pretrain/Loss": 1.9804210662841797, "Pretrain/Loss (Raw)": 1.7943823337554932, "Pretrain/Step": 6072, "Pretrain/Step Time": 8.6414226423949} +{"Pretrain/Learning Rate": 1.5392730148274965e-05, "Pretrain/Loss": 1.9801504611968994, "Pretrain/Loss (Raw)": 1.9415067434310913, "Pretrain/Step": 6073, "Pretrain/Step Time": 8.64425304532051} +{"Pretrain/Learning Rate": 1.5384892748782513e-05, "Pretrain/Loss": 1.9782679080963135, "Pretrain/Loss (Raw)": 2.0562071800231934, "Pretrain/Step": 6074, "Pretrain/Step Time": 8.64611148275435} +{"Pretrain/Learning Rate": 1.5377056458149542e-05, "Pretrain/Loss": 1.9796066284179688, "Pretrain/Loss (Raw)": 2.1059210300445557, "Pretrain/Step": 6075, "Pretrain/Step Time": 8.650470847263932} +{"Pretrain/Learning Rate": 1.5369221277279765e-05, "Pretrain/Loss": 1.980149269104004, "Pretrain/Loss (Raw)": 2.001619338989258, "Pretrain/Step": 6076, "Pretrain/Step Time": 8.650541020557284} +{"Pretrain/Learning Rate": 1.5361387207076766e-05, "Pretrain/Loss": 1.9829238653182983, "Pretrain/Loss (Raw)": 2.1601202487945557, "Pretrain/Step": 6077, "Pretrain/Step Time": 8.656417656689882} +{"Pretrain/Learning Rate": 1.5353554248444022e-05, "Pretrain/Loss": 1.982947826385498, "Pretrain/Loss (Raw)": 2.1242306232452393, "Pretrain/Step": 6078, "Pretrain/Step Time": 8.656939871609211} +{"Pretrain/Learning Rate": 1.5345722402284852e-05, "Pretrain/Loss": 1.9812034368515015, "Pretrain/Loss (Raw)": 1.8797845840454102, "Pretrain/Step": 6079, "Pretrain/Step Time": 8.657773638144135} +{"Pretrain/Learning Rate": 1.5337891669502468e-05, "Pretrain/Loss": 1.982088327407837, "Pretrain/Loss (Raw)": 2.0647037029266357, "Pretrain/Step": 6080, "Pretrain/Step Time": 8.662265656515956} +{"Pretrain/Learning Rate": 1.5330062050999945e-05, "Pretrain/Loss": 1.9838390350341797, "Pretrain/Loss (Raw)": 2.0875768661499023, "Pretrain/Step": 6081, "Pretrain/Step Time": 8.658051691949368} +{"Pretrain/Learning Rate": 1.5322233547680235e-05, "Pretrain/Loss": 1.9814589023590088, "Pretrain/Loss (Raw)": 1.9025474786758423, "Pretrain/Step": 6082, "Pretrain/Step Time": 8.659090556204319} +{"Pretrain/Learning Rate": 1.531440616044615e-05, "Pretrain/Loss": 1.981429100036621, "Pretrain/Loss (Raw)": 2.029849052429199, "Pretrain/Step": 6083, "Pretrain/Step Time": 8.659345595166087} +{"Pretrain/Learning Rate": 1.530657989020039e-05, "Pretrain/Loss": 1.9810607433319092, "Pretrain/Loss (Raw)": 2.1090989112854004, "Pretrain/Step": 6084, "Pretrain/Step Time": 8.65792285837233} +{"Pretrain/Learning Rate": 1.5298754737845515e-05, "Pretrain/Loss": 1.9821128845214844, "Pretrain/Loss (Raw)": 2.1496644020080566, "Pretrain/Step": 6085, "Pretrain/Step Time": 8.655908504500985} +{"Pretrain/Learning Rate": 1.5290930704283953e-05, "Pretrain/Loss": 1.9858258962631226, "Pretrain/Loss (Raw)": 1.9895097017288208, "Pretrain/Step": 6086, "Pretrain/Step Time": 8.657605422660708} +{"Pretrain/Learning Rate": 1.5283107790418023e-05, "Pretrain/Loss": 1.9885611534118652, "Pretrain/Loss (Raw)": 1.9616178274154663, "Pretrain/Step": 6087, "Pretrain/Step Time": 8.657451760023832} +{"Pretrain/Learning Rate": 1.527528599714988e-05, "Pretrain/Loss": 1.9871976375579834, "Pretrain/Loss (Raw)": 2.058210849761963, "Pretrain/Step": 6088, "Pretrain/Step Time": 8.65960387699306} +{"Pretrain/Learning Rate": 1.5267465325381584e-05, "Pretrain/Loss": 1.9881582260131836, "Pretrain/Loss (Raw)": 2.074516534805298, "Pretrain/Step": 6089, "Pretrain/Step Time": 8.659605590626597} +{"Pretrain/Learning Rate": 1.5259645776015047e-05, "Pretrain/Loss": 1.9855393171310425, "Pretrain/Loss (Raw)": 1.788510799407959, "Pretrain/Step": 6090, "Pretrain/Step Time": 8.660618165507913} +{"Pretrain/Learning Rate": 1.5251827349952058e-05, "Pretrain/Loss": 1.9876582622528076, "Pretrain/Loss (Raw)": 2.030280113220215, "Pretrain/Step": 6091, "Pretrain/Step Time": 8.672446498647332} +{"Pretrain/Learning Rate": 1.524401004809427e-05, "Pretrain/Loss": 1.9878312349319458, "Pretrain/Loss (Raw)": 1.8728272914886475, "Pretrain/Step": 6092, "Pretrain/Step Time": 8.671845776960254} +{"Pretrain/Learning Rate": 1.5236193871343224e-05, "Pretrain/Loss": 1.9881261587142944, "Pretrain/Loss (Raw)": 2.01554012298584, "Pretrain/Step": 6093, "Pretrain/Step Time": 8.671647656708956} +{"Pretrain/Learning Rate": 1.5228378820600303e-05, "Pretrain/Loss": 1.9874778985977173, "Pretrain/Loss (Raw)": 1.8228392601013184, "Pretrain/Step": 6094, "Pretrain/Step Time": 8.671994470059872} +{"Pretrain/Learning Rate": 1.5220564896766784e-05, "Pretrain/Loss": 1.9856956005096436, "Pretrain/Loss (Raw)": 1.9235628843307495, "Pretrain/Step": 6095, "Pretrain/Step Time": 8.671591751277447} +{"Pretrain/Learning Rate": 1.52127521007438e-05, "Pretrain/Loss": 1.9860823154449463, "Pretrain/Loss (Raw)": 1.9981662034988403, "Pretrain/Step": 6096, "Pretrain/Step Time": 8.672100258991122} +{"Pretrain/Learning Rate": 1.5204940433432368e-05, "Pretrain/Loss": 1.9817606210708618, "Pretrain/Loss (Raw)": 1.4743188619613647, "Pretrain/Step": 6097, "Pretrain/Step Time": 8.675150567665696} +{"Pretrain/Learning Rate": 1.5197129895733354e-05, "Pretrain/Loss": 1.9803661108016968, "Pretrain/Loss (Raw)": 1.9607595205307007, "Pretrain/Step": 6098, "Pretrain/Step Time": 8.67676916718483} +{"Pretrain/Learning Rate": 1.518932048854752e-05, "Pretrain/Loss": 1.9786489009857178, "Pretrain/Loss (Raw)": 1.6626334190368652, "Pretrain/Step": 6099, "Pretrain/Step Time": 8.677878694608808} +{"Pretrain/Learning Rate": 1.5181512212775472e-05, "Pretrain/Loss": 1.9799014329910278, "Pretrain/Loss (Raw)": 1.7317286729812622, "Pretrain/Step": 6100, "Pretrain/Step Time": 8.678595684468746} +{"Pretrain/Learning Rate": 1.5173705069317706e-05, "Pretrain/Loss": 1.9868618249893188, "Pretrain/Loss (Raw)": 2.161956548690796, "Pretrain/Step": 6101, "Pretrain/Step Time": 8.673297334462404} +{"Pretrain/Learning Rate": 1.5165899059074567e-05, "Pretrain/Loss": 1.9872649908065796, "Pretrain/Loss (Raw)": 1.9740947484970093, "Pretrain/Step": 6102, "Pretrain/Step Time": 8.672404842451215} +{"Pretrain/Learning Rate": 1.5158094182946298e-05, "Pretrain/Loss": 1.9903454780578613, "Pretrain/Loss (Raw)": 2.12162446975708, "Pretrain/Step": 6103, "Pretrain/Step Time": 8.673853566870093} +{"Pretrain/Learning Rate": 1.5150290441832976e-05, "Pretrain/Loss": 1.9928034543991089, "Pretrain/Loss (Raw)": 2.113358736038208, "Pretrain/Step": 6104, "Pretrain/Step Time": 8.670652620494366} +{"Pretrain/Learning Rate": 1.5142487836634587e-05, "Pretrain/Loss": 1.9929759502410889, "Pretrain/Loss (Raw)": 1.936998963356018, "Pretrain/Step": 6105, "Pretrain/Step Time": 8.670663263648748} +{"Pretrain/Learning Rate": 1.5134686368250932e-05, "Pretrain/Loss": 1.9937896728515625, "Pretrain/Loss (Raw)": 1.9902162551879883, "Pretrain/Step": 6106, "Pretrain/Step Time": 8.670912766829133} +{"Pretrain/Learning Rate": 1.512688603758175e-05, "Pretrain/Loss": 1.995924711227417, "Pretrain/Loss (Raw)": 2.0067548751831055, "Pretrain/Step": 6107, "Pretrain/Step Time": 8.667939895763993} +{"Pretrain/Learning Rate": 1.5119086845526576e-05, "Pretrain/Loss": 1.9964399337768555, "Pretrain/Loss (Raw)": 2.001107692718506, "Pretrain/Step": 6108, "Pretrain/Step Time": 8.671045079827309} +{"Pretrain/Learning Rate": 1.5111288792984884e-05, "Pretrain/Loss": 1.999414324760437, "Pretrain/Loss (Raw)": 2.0794765949249268, "Pretrain/Step": 6109, "Pretrain/Step Time": 8.669756215065718} +{"Pretrain/Learning Rate": 1.5103491880855953e-05, "Pretrain/Loss": 1.9992125034332275, "Pretrain/Loss (Raw)": 1.9176292419433594, "Pretrain/Step": 6110, "Pretrain/Step Time": 8.668036244809628} +{"Pretrain/Learning Rate": 1.5095696110038981e-05, "Pretrain/Loss": 1.9963841438293457, "Pretrain/Loss (Raw)": 1.887816071510315, "Pretrain/Step": 6111, "Pretrain/Step Time": 8.67087746039033} +{"Pretrain/Learning Rate": 1.5087901481432993e-05, "Pretrain/Loss": 1.9951748847961426, "Pretrain/Loss (Raw)": 1.8054989576339722, "Pretrain/Step": 6112, "Pretrain/Step Time": 8.667411325499415} +{"Pretrain/Learning Rate": 1.5080107995936929e-05, "Pretrain/Loss": 1.9951320886611938, "Pretrain/Loss (Raw)": 1.9303563833236694, "Pretrain/Step": 6113, "Pretrain/Step Time": 8.669544707983732} +{"Pretrain/Learning Rate": 1.5072315654449543e-05, "Pretrain/Loss": 1.9951090812683105, "Pretrain/Loss (Raw)": 1.9541219472885132, "Pretrain/Step": 6114, "Pretrain/Step Time": 8.670168116688728} +{"Pretrain/Learning Rate": 1.5064524457869506e-05, "Pretrain/Loss": 1.993713617324829, "Pretrain/Loss (Raw)": 1.8549610376358032, "Pretrain/Step": 6115, "Pretrain/Step Time": 8.669982368126512} +{"Pretrain/Learning Rate": 1.5056734407095316e-05, "Pretrain/Loss": 1.9915096759796143, "Pretrain/Loss (Raw)": 1.6651424169540405, "Pretrain/Step": 6116, "Pretrain/Step Time": 8.669917033985257} +{"Pretrain/Learning Rate": 1.5048945503025375e-05, "Pretrain/Loss": 1.9932200908660889, "Pretrain/Loss (Raw)": 2.1442198753356934, "Pretrain/Step": 6117, "Pretrain/Step Time": 8.669425323605537} +{"Pretrain/Learning Rate": 1.5041157746557924e-05, "Pretrain/Loss": 1.9937480688095093, "Pretrain/Loss (Raw)": 2.013909101486206, "Pretrain/Step": 6118, "Pretrain/Step Time": 8.669456264004111} +{"Pretrain/Learning Rate": 1.5033371138591095e-05, "Pretrain/Loss": 1.9918467998504639, "Pretrain/Loss (Raw)": 1.922682762145996, "Pretrain/Step": 6119, "Pretrain/Step Time": 8.671253629028797} +{"Pretrain/Learning Rate": 1.5025585680022866e-05, "Pretrain/Loss": 1.9918837547302246, "Pretrain/Loss (Raw)": 1.9498096704483032, "Pretrain/Step": 6120, "Pretrain/Step Time": 8.67039730772376} +{"Pretrain/Learning Rate": 1.50178013717511e-05, "Pretrain/Loss": 1.9912617206573486, "Pretrain/Loss (Raw)": 2.0424036979675293, "Pretrain/Step": 6121, "Pretrain/Step Time": 8.67873908393085} +{"Pretrain/Learning Rate": 1.5010018214673515e-05, "Pretrain/Loss": 1.99155592918396, "Pretrain/Loss (Raw)": 2.039025068283081, "Pretrain/Step": 6122, "Pretrain/Step Time": 8.67472175695002} +{"Pretrain/Learning Rate": 1.5002236209687709e-05, "Pretrain/Loss": 1.992527723312378, "Pretrain/Loss (Raw)": 2.069305658340454, "Pretrain/Step": 6123, "Pretrain/Step Time": 8.674518898129463} +{"Pretrain/Learning Rate": 1.4994455357691128e-05, "Pretrain/Loss": 1.9923224449157715, "Pretrain/Loss (Raw)": 1.8730652332305908, "Pretrain/Step": 6124, "Pretrain/Step Time": 8.675086420029402} +{"Pretrain/Learning Rate": 1.4986675659581103e-05, "Pretrain/Loss": 1.9933134317398071, "Pretrain/Loss (Raw)": 2.094362735748291, "Pretrain/Step": 6125, "Pretrain/Step Time": 8.674576930701733} +{"Pretrain/Learning Rate": 1.4978897116254832e-05, "Pretrain/Loss": 1.9922003746032715, "Pretrain/Loss (Raw)": 1.9022281169891357, "Pretrain/Step": 6126, "Pretrain/Step Time": 8.672312323004007} +{"Pretrain/Learning Rate": 1.4971119728609359e-05, "Pretrain/Loss": 1.9902398586273193, "Pretrain/Loss (Raw)": 2.098543405532837, "Pretrain/Step": 6127, "Pretrain/Step Time": 8.674788584932685} +{"Pretrain/Learning Rate": 1.4963343497541621e-05, "Pretrain/Loss": 1.9891529083251953, "Pretrain/Loss (Raw)": 1.9457865953445435, "Pretrain/Step": 6128, "Pretrain/Step Time": 8.678055735304952} +{"Pretrain/Learning Rate": 1.4955568423948402e-05, "Pretrain/Loss": 1.9887452125549316, "Pretrain/Loss (Raw)": 2.0374755859375, "Pretrain/Step": 6129, "Pretrain/Step Time": 8.675910696387291} +{"Pretrain/Learning Rate": 1.494779450872637e-05, "Pretrain/Loss": 1.9874558448791504, "Pretrain/Loss (Raw)": 1.8847343921661377, "Pretrain/Step": 6130, "Pretrain/Step Time": 8.677511358633637} +{"Pretrain/Learning Rate": 1.4940021752772034e-05, "Pretrain/Loss": 1.9883086681365967, "Pretrain/Loss (Raw)": 2.103682279586792, "Pretrain/Step": 6131, "Pretrain/Step Time": 8.676432773470879} +{"Pretrain/Learning Rate": 1.4932250156981803e-05, "Pretrain/Loss": 1.9884639978408813, "Pretrain/Loss (Raw)": 2.0012447834014893, "Pretrain/Step": 6132, "Pretrain/Step Time": 8.67783397436142} +{"Pretrain/Learning Rate": 1.4924479722251916e-05, "Pretrain/Loss": 1.9874814748764038, "Pretrain/Loss (Raw)": 2.0725789070129395, "Pretrain/Step": 6133, "Pretrain/Step Time": 8.681491887196898} +{"Pretrain/Learning Rate": 1.4916710449478511e-05, "Pretrain/Loss": 1.987510323524475, "Pretrain/Loss (Raw)": 1.857292890548706, "Pretrain/Step": 6134, "Pretrain/Step Time": 8.677267108112574} +{"Pretrain/Learning Rate": 1.4908942339557564e-05, "Pretrain/Loss": 1.9904887676239014, "Pretrain/Loss (Raw)": 2.1466455459594727, "Pretrain/Step": 6135, "Pretrain/Step Time": 8.67802377231419} +{"Pretrain/Learning Rate": 1.4901175393384944e-05, "Pretrain/Loss": 1.992052435874939, "Pretrain/Loss (Raw)": 2.0660438537597656, "Pretrain/Step": 6136, "Pretrain/Step Time": 8.680504776537418} +{"Pretrain/Learning Rate": 1.4893409611856362e-05, "Pretrain/Loss": 1.9910800457000732, "Pretrain/Loss (Raw)": 1.9263988733291626, "Pretrain/Step": 6137, "Pretrain/Step Time": 8.678614854812622} +{"Pretrain/Learning Rate": 1.488564499586741e-05, "Pretrain/Loss": 1.9892756938934326, "Pretrain/Loss (Raw)": 1.823419451713562, "Pretrain/Step": 6138, "Pretrain/Step Time": 8.68683772534132} +{"Pretrain/Learning Rate": 1.4877881546313532e-05, "Pretrain/Loss": 1.9890286922454834, "Pretrain/Loss (Raw)": 2.1347200870513916, "Pretrain/Step": 6139, "Pretrain/Step Time": 8.682999685406685} +{"Pretrain/Learning Rate": 1.4870119264090057e-05, "Pretrain/Loss": 1.9856810569763184, "Pretrain/Loss (Raw)": 1.8004142045974731, "Pretrain/Step": 6140, "Pretrain/Step Time": 8.680857034400105} +{"Pretrain/Learning Rate": 1.4862358150092157e-05, "Pretrain/Loss": 1.9855921268463135, "Pretrain/Loss (Raw)": 2.044085741043091, "Pretrain/Step": 6141, "Pretrain/Step Time": 8.685658123344183} +{"Pretrain/Learning Rate": 1.485459820521489e-05, "Pretrain/Loss": 1.9852039813995361, "Pretrain/Loss (Raw)": 1.9997985363006592, "Pretrain/Step": 6142, "Pretrain/Step Time": 8.683889504522085} +{"Pretrain/Learning Rate": 1.484683943035316e-05, "Pretrain/Loss": 1.9852432012557983, "Pretrain/Loss (Raw)": 2.0961475372314453, "Pretrain/Step": 6143, "Pretrain/Step Time": 8.68403603695333} +{"Pretrain/Learning Rate": 1.4839081826401755e-05, "Pretrain/Loss": 1.984332799911499, "Pretrain/Loss (Raw)": 1.939168930053711, "Pretrain/Step": 6144, "Pretrain/Step Time": 8.68640410900116} +{"Pretrain/Learning Rate": 1.4831325394255307e-05, "Pretrain/Loss": 1.9834258556365967, "Pretrain/Loss (Raw)": 1.9237571954727173, "Pretrain/Step": 6145, "Pretrain/Step Time": 8.683648446574807} +{"Pretrain/Learning Rate": 1.4823570134808342e-05, "Pretrain/Loss": 1.982621192932129, "Pretrain/Loss (Raw)": 1.9991428852081299, "Pretrain/Step": 6146, "Pretrain/Step Time": 8.680335370823741} +{"Pretrain/Learning Rate": 1.4815816048955208e-05, "Pretrain/Loss": 1.984480857849121, "Pretrain/Loss (Raw)": 2.0957634449005127, "Pretrain/Step": 6147, "Pretrain/Step Time": 8.677516737952828} +{"Pretrain/Learning Rate": 1.4808063137590172e-05, "Pretrain/Loss": 1.9831782579421997, "Pretrain/Loss (Raw)": 1.993659496307373, "Pretrain/Step": 6148, "Pretrain/Step Time": 8.676562825217843} +{"Pretrain/Learning Rate": 1.4800311401607304e-05, "Pretrain/Loss": 1.9819074869155884, "Pretrain/Loss (Raw)": 1.8159255981445312, "Pretrain/Step": 6149, "Pretrain/Step Time": 8.671364957466722} +{"Pretrain/Learning Rate": 1.4792560841900604e-05, "Pretrain/Loss": 1.983197808265686, "Pretrain/Loss (Raw)": 2.1013965606689453, "Pretrain/Step": 6150, "Pretrain/Step Time": 8.670188941061497} +{"Pretrain/Learning Rate": 1.4784811459363873e-05, "Pretrain/Loss": 1.9809054136276245, "Pretrain/Loss (Raw)": 1.8367687463760376, "Pretrain/Step": 6151, "Pretrain/Step Time": 8.676526471972466} +{"Pretrain/Learning Rate": 1.4777063254890833e-05, "Pretrain/Loss": 1.981217622756958, "Pretrain/Loss (Raw)": 2.0723795890808105, "Pretrain/Step": 6152, "Pretrain/Step Time": 8.67570574209094} +{"Pretrain/Learning Rate": 1.4769316229375012e-05, "Pretrain/Loss": 1.9795856475830078, "Pretrain/Loss (Raw)": 1.8487557172775269, "Pretrain/Step": 6153, "Pretrain/Step Time": 8.675367996096611} +{"Pretrain/Learning Rate": 1.4761570383709871e-05, "Pretrain/Loss": 1.9849481582641602, "Pretrain/Loss (Raw)": 2.2821481227874756, "Pretrain/Step": 6154, "Pretrain/Step Time": 8.675551477819681} +{"Pretrain/Learning Rate": 1.4753825718788667e-05, "Pretrain/Loss": 1.9829801321029663, "Pretrain/Loss (Raw)": 1.821065902709961, "Pretrain/Step": 6155, "Pretrain/Step Time": 8.677783699706197} +{"Pretrain/Learning Rate": 1.4746082235504572e-05, "Pretrain/Loss": 1.9823195934295654, "Pretrain/Loss (Raw)": 1.9933158159255981, "Pretrain/Step": 6156, "Pretrain/Step Time": 8.67871911264956} +{"Pretrain/Learning Rate": 1.4738339934750584e-05, "Pretrain/Loss": 1.9834794998168945, "Pretrain/Loss (Raw)": 2.108510732650757, "Pretrain/Step": 6157, "Pretrain/Step Time": 8.676006769761443} +{"Pretrain/Learning Rate": 1.4730598817419593e-05, "Pretrain/Loss": 1.984828233718872, "Pretrain/Loss (Raw)": 2.1589932441711426, "Pretrain/Step": 6158, "Pretrain/Step Time": 8.674711037427187} +{"Pretrain/Learning Rate": 1.4722858884404333e-05, "Pretrain/Loss": 1.9842921495437622, "Pretrain/Loss (Raw)": 2.05084490776062, "Pretrain/Step": 6159, "Pretrain/Step Time": 8.674237603321671} +{"Pretrain/Learning Rate": 1.4715120136597421e-05, "Pretrain/Loss": 1.9857696294784546, "Pretrain/Loss (Raw)": 2.037733793258667, "Pretrain/Step": 6160, "Pretrain/Step Time": 8.674661882221699} +{"Pretrain/Learning Rate": 1.4707382574891312e-05, "Pretrain/Loss": 1.982912302017212, "Pretrain/Loss (Raw)": 1.65152108669281, "Pretrain/Step": 6161, "Pretrain/Step Time": 8.68086438253522} +{"Pretrain/Learning Rate": 1.4699646200178353e-05, "Pretrain/Loss": 1.9819817543029785, "Pretrain/Loss (Raw)": 1.8433886766433716, "Pretrain/Step": 6162, "Pretrain/Step Time": 8.67897298745811} +{"Pretrain/Learning Rate": 1.469191101335072e-05, "Pretrain/Loss": 1.9825975894927979, "Pretrain/Loss (Raw)": 2.1003448963165283, "Pretrain/Step": 6163, "Pretrain/Step Time": 8.681279910728335} +{"Pretrain/Learning Rate": 1.4684177015300491e-05, "Pretrain/Loss": 1.9844191074371338, "Pretrain/Loss (Raw)": 2.198535203933716, "Pretrain/Step": 6164, "Pretrain/Step Time": 8.67861170321703} +{"Pretrain/Learning Rate": 1.467644420691957e-05, "Pretrain/Loss": 1.9860607385635376, "Pretrain/Loss (Raw)": 2.200861930847168, "Pretrain/Step": 6165, "Pretrain/Step Time": 8.677893405780196} +{"Pretrain/Learning Rate": 1.4668712589099753e-05, "Pretrain/Loss": 1.987839937210083, "Pretrain/Loss (Raw)": 1.8922531604766846, "Pretrain/Step": 6166, "Pretrain/Step Time": 8.678469244390726} +{"Pretrain/Learning Rate": 1.466098216273269e-05, "Pretrain/Loss": 1.9849352836608887, "Pretrain/Loss (Raw)": 1.8171632289886475, "Pretrain/Step": 6167, "Pretrain/Step Time": 8.678338354453444} +{"Pretrain/Learning Rate": 1.465325292870987e-05, "Pretrain/Loss": 1.982591152191162, "Pretrain/Loss (Raw)": 2.011035680770874, "Pretrain/Step": 6168, "Pretrain/Step Time": 8.678230002522469} +{"Pretrain/Learning Rate": 1.464552488792269e-05, "Pretrain/Loss": 1.9813117980957031, "Pretrain/Loss (Raw)": 1.7842779159545898, "Pretrain/Step": 6169, "Pretrain/Step Time": 8.675949305295944} +{"Pretrain/Learning Rate": 1.4637798041262363e-05, "Pretrain/Loss": 1.9805846214294434, "Pretrain/Loss (Raw)": 2.042905807495117, "Pretrain/Step": 6170, "Pretrain/Step Time": 8.675943585112691} +{"Pretrain/Learning Rate": 1.4630072389620003e-05, "Pretrain/Loss": 1.9798438549041748, "Pretrain/Loss (Raw)": 1.9337904453277588, "Pretrain/Step": 6171, "Pretrain/Step Time": 8.67561350762844} +{"Pretrain/Learning Rate": 1.462234793388655e-05, "Pretrain/Loss": 1.9777120351791382, "Pretrain/Loss (Raw)": 1.8982363939285278, "Pretrain/Step": 6172, "Pretrain/Step Time": 8.677407866343856} +{"Pretrain/Learning Rate": 1.4614624674952842e-05, "Pretrain/Loss": 1.9784860610961914, "Pretrain/Loss (Raw)": 1.977108359336853, "Pretrain/Step": 6173, "Pretrain/Step Time": 8.675891624763608} +{"Pretrain/Learning Rate": 1.460690261370955e-05, "Pretrain/Loss": 1.9782679080963135, "Pretrain/Loss (Raw)": 1.9713950157165527, "Pretrain/Step": 6174, "Pretrain/Step Time": 8.676645938307047} +{"Pretrain/Learning Rate": 1.4599181751047225e-05, "Pretrain/Loss": 1.9771966934204102, "Pretrain/Loss (Raw)": 2.014739751815796, "Pretrain/Step": 6175, "Pretrain/Step Time": 8.675738643854856} +{"Pretrain/Learning Rate": 1.4591462087856262e-05, "Pretrain/Loss": 1.9762911796569824, "Pretrain/Loss (Raw)": 1.9598712921142578, "Pretrain/Step": 6176, "Pretrain/Step Time": 8.677870389074087} +{"Pretrain/Learning Rate": 1.4583743625026958e-05, "Pretrain/Loss": 1.9765052795410156, "Pretrain/Loss (Raw)": 2.2243754863739014, "Pretrain/Step": 6177, "Pretrain/Step Time": 8.667530614882708} +{"Pretrain/Learning Rate": 1.4576026363449402e-05, "Pretrain/Loss": 1.979142189025879, "Pretrain/Loss (Raw)": 2.133091926574707, "Pretrain/Step": 6178, "Pretrain/Step Time": 8.668862076476216} +{"Pretrain/Learning Rate": 1.4568310304013613e-05, "Pretrain/Loss": 1.9776434898376465, "Pretrain/Loss (Raw)": 1.7570452690124512, "Pretrain/Step": 6179, "Pretrain/Step Time": 8.668270057067275} +{"Pretrain/Learning Rate": 1.4560595447609427e-05, "Pretrain/Loss": 1.9782875776290894, "Pretrain/Loss (Raw)": 2.0594468116760254, "Pretrain/Step": 6180, "Pretrain/Step Time": 8.664044653996825} +{"Pretrain/Learning Rate": 1.4552881795126588e-05, "Pretrain/Loss": 1.977928638458252, "Pretrain/Loss (Raw)": 1.9349101781845093, "Pretrain/Step": 6181, "Pretrain/Step Time": 8.66342144086957} +{"Pretrain/Learning Rate": 1.4545169347454627e-05, "Pretrain/Loss": 1.978616714477539, "Pretrain/Loss (Raw)": 2.1448168754577637, "Pretrain/Step": 6182, "Pretrain/Step Time": 8.667406309396029} +{"Pretrain/Learning Rate": 1.453745810548301e-05, "Pretrain/Loss": 1.977475643157959, "Pretrain/Loss (Raw)": 1.853961706161499, "Pretrain/Step": 6183, "Pretrain/Step Time": 8.668223429471254} +{"Pretrain/Learning Rate": 1.452974807010103e-05, "Pretrain/Loss": 1.9792776107788086, "Pretrain/Loss (Raw)": 1.9694492816925049, "Pretrain/Step": 6184, "Pretrain/Step Time": 8.666403822600842} +{"Pretrain/Learning Rate": 1.4522039242197835e-05, "Pretrain/Loss": 1.9787663221359253, "Pretrain/Loss (Raw)": 1.9175587892532349, "Pretrain/Step": 6185, "Pretrain/Step Time": 8.67044067569077} +{"Pretrain/Learning Rate": 1.4514331622662441e-05, "Pretrain/Loss": 1.9786264896392822, "Pretrain/Loss (Raw)": 2.030273199081421, "Pretrain/Step": 6186, "Pretrain/Step Time": 8.671928763389587} +{"Pretrain/Learning Rate": 1.4506625212383743e-05, "Pretrain/Loss": 1.9781560897827148, "Pretrain/Loss (Raw)": 1.9785383939743042, "Pretrain/Step": 6187, "Pretrain/Step Time": 8.668621685355902} +{"Pretrain/Learning Rate": 1.4498920012250472e-05, "Pretrain/Loss": 1.9772450923919678, "Pretrain/Loss (Raw)": 2.1046528816223145, "Pretrain/Step": 6188, "Pretrain/Step Time": 8.667988289147615} +{"Pretrain/Learning Rate": 1.449121602315123e-05, "Pretrain/Loss": 1.975393533706665, "Pretrain/Loss (Raw)": 1.6856601238250732, "Pretrain/Step": 6189, "Pretrain/Step Time": 8.674750223755836} +{"Pretrain/Learning Rate": 1.4483513245974461e-05, "Pretrain/Loss": 1.97298264503479, "Pretrain/Loss (Raw)": 1.680772066116333, "Pretrain/Step": 6190, "Pretrain/Step Time": 8.67174900881946} +{"Pretrain/Learning Rate": 1.4475811681608515e-05, "Pretrain/Loss": 1.9736888408660889, "Pretrain/Loss (Raw)": 2.136495590209961, "Pretrain/Step": 6191, "Pretrain/Step Time": 8.669980727136135} +{"Pretrain/Learning Rate": 1.4468111330941556e-05, "Pretrain/Loss": 1.9714373350143433, "Pretrain/Loss (Raw)": 1.967169165611267, "Pretrain/Step": 6192, "Pretrain/Step Time": 8.670276936143637} +{"Pretrain/Learning Rate": 1.4460412194861624e-05, "Pretrain/Loss": 1.9722797870635986, "Pretrain/Loss (Raw)": 1.9672757387161255, "Pretrain/Step": 6193, "Pretrain/Step Time": 8.661802029237151} +{"Pretrain/Learning Rate": 1.4452714274256612e-05, "Pretrain/Loss": 1.9735502004623413, "Pretrain/Loss (Raw)": 1.7838999032974243, "Pretrain/Step": 6194, "Pretrain/Step Time": 8.660376152023673} +{"Pretrain/Learning Rate": 1.4445017570014303e-05, "Pretrain/Loss": 1.9735267162322998, "Pretrain/Loss (Raw)": 2.0168769359588623, "Pretrain/Step": 6195, "Pretrain/Step Time": 8.661954935640097} +{"Pretrain/Learning Rate": 1.4437322083022304e-05, "Pretrain/Loss": 1.9759399890899658, "Pretrain/Loss (Raw)": 2.2733359336853027, "Pretrain/Step": 6196, "Pretrain/Step Time": 8.664976093918085} +{"Pretrain/Learning Rate": 1.4429627814168095e-05, "Pretrain/Loss": 1.9763818979263306, "Pretrain/Loss (Raw)": 2.0045461654663086, "Pretrain/Step": 6197, "Pretrain/Step Time": 8.664289558306336} +{"Pretrain/Learning Rate": 1.4421934764339004e-05, "Pretrain/Loss": 1.97381591796875, "Pretrain/Loss (Raw)": 1.560075044631958, "Pretrain/Step": 6198, "Pretrain/Step Time": 8.663079675287008} +{"Pretrain/Learning Rate": 1.4414242934422251e-05, "Pretrain/Loss": 1.9761555194854736, "Pretrain/Loss (Raw)": 2.123546600341797, "Pretrain/Step": 6199, "Pretrain/Step Time": 8.667391860857606} +{"Pretrain/Learning Rate": 1.440655232530489e-05, "Pretrain/Loss": 1.9774885177612305, "Pretrain/Loss (Raw)": 1.9650083780288696, "Pretrain/Step": 6200, "Pretrain/Step Time": 8.673590762540698} +{"Pretrain/Learning Rate": 1.4398862937873825e-05, "Pretrain/Loss": 1.9782302379608154, "Pretrain/Loss (Raw)": 2.03644061088562, "Pretrain/Step": 6201, "Pretrain/Step Time": 8.667413506656885} +{"Pretrain/Learning Rate": 1.4391174773015836e-05, "Pretrain/Loss": 1.977567434310913, "Pretrain/Loss (Raw)": 1.9713741540908813, "Pretrain/Step": 6202, "Pretrain/Step Time": 8.671424951404333} +{"Pretrain/Learning Rate": 1.4383487831617571e-05, "Pretrain/Loss": 1.977608561515808, "Pretrain/Loss (Raw)": 2.1111936569213867, "Pretrain/Step": 6203, "Pretrain/Step Time": 8.668282443657517} +{"Pretrain/Learning Rate": 1.4375802114565515e-05, "Pretrain/Loss": 1.9788954257965088, "Pretrain/Loss (Raw)": 2.166328191757202, "Pretrain/Step": 6204, "Pretrain/Step Time": 8.667161833494902} +{"Pretrain/Learning Rate": 1.4368117622746025e-05, "Pretrain/Loss": 1.9765585660934448, "Pretrain/Loss (Raw)": 1.8610060214996338, "Pretrain/Step": 6205, "Pretrain/Step Time": 8.663380283862352} +{"Pretrain/Learning Rate": 1.4360434357045294e-05, "Pretrain/Loss": 1.9750291109085083, "Pretrain/Loss (Raw)": 1.9284528493881226, "Pretrain/Step": 6206, "Pretrain/Step Time": 8.663508484140038} +{"Pretrain/Learning Rate": 1.4352752318349421e-05, "Pretrain/Loss": 1.9743242263793945, "Pretrain/Loss (Raw)": 1.7895549535751343, "Pretrain/Step": 6207, "Pretrain/Step Time": 8.664027782157063} +{"Pretrain/Learning Rate": 1.4345071507544326e-05, "Pretrain/Loss": 1.9749984741210938, "Pretrain/Loss (Raw)": 2.151005268096924, "Pretrain/Step": 6208, "Pretrain/Step Time": 8.657685801386833} +{"Pretrain/Learning Rate": 1.4337391925515777e-05, "Pretrain/Loss": 1.9742616415023804, "Pretrain/Loss (Raw)": 1.9932774305343628, "Pretrain/Step": 6209, "Pretrain/Step Time": 8.657592674717307} +{"Pretrain/Learning Rate": 1.432971357314945e-05, "Pretrain/Loss": 1.9745750427246094, "Pretrain/Loss (Raw)": 1.9426747560501099, "Pretrain/Step": 6210, "Pretrain/Step Time": 8.65383524633944} +{"Pretrain/Learning Rate": 1.4322036451330828e-05, "Pretrain/Loss": 1.976233720779419, "Pretrain/Loss (Raw)": 2.2421607971191406, "Pretrain/Step": 6211, "Pretrain/Step Time": 8.652912957593799} +{"Pretrain/Learning Rate": 1.4314360560945284e-05, "Pretrain/Loss": 1.9728617668151855, "Pretrain/Loss (Raw)": 1.677470326423645, "Pretrain/Step": 6212, "Pretrain/Step Time": 8.654536563903093} +{"Pretrain/Learning Rate": 1.430668590287802e-05, "Pretrain/Loss": 1.973469614982605, "Pretrain/Loss (Raw)": 2.227475643157959, "Pretrain/Step": 6213, "Pretrain/Step Time": 8.653243081644177} +{"Pretrain/Learning Rate": 1.4299012478014146e-05, "Pretrain/Loss": 1.9729305505752563, "Pretrain/Loss (Raw)": 1.9205073118209839, "Pretrain/Step": 6214, "Pretrain/Step Time": 8.650638699531555} +{"Pretrain/Learning Rate": 1.4291340287238558e-05, "Pretrain/Loss": 1.9735567569732666, "Pretrain/Loss (Raw)": 2.041771173477173, "Pretrain/Step": 6215, "Pretrain/Step Time": 8.652880027890205} +{"Pretrain/Learning Rate": 1.4283669331436078e-05, "Pretrain/Loss": 1.9720059633255005, "Pretrain/Loss (Raw)": 1.8597121238708496, "Pretrain/Step": 6216, "Pretrain/Step Time": 8.649825595319271} +{"Pretrain/Learning Rate": 1.4275999611491342e-05, "Pretrain/Loss": 1.9707090854644775, "Pretrain/Loss (Raw)": 1.9085103273391724, "Pretrain/Step": 6217, "Pretrain/Step Time": 8.650674700737} +{"Pretrain/Learning Rate": 1.4268331128288881e-05, "Pretrain/Loss": 1.971118688583374, "Pretrain/Loss (Raw)": 1.8409385681152344, "Pretrain/Step": 6218, "Pretrain/Step Time": 8.649288035929203} +{"Pretrain/Learning Rate": 1.4260663882713022e-05, "Pretrain/Loss": 1.96986722946167, "Pretrain/Loss (Raw)": 1.8701149225234985, "Pretrain/Step": 6219, "Pretrain/Step Time": 8.637351505458355} +{"Pretrain/Learning Rate": 1.4252997875648021e-05, "Pretrain/Loss": 1.9714868068695068, "Pretrain/Loss (Raw)": 2.0800979137420654, "Pretrain/Step": 6220, "Pretrain/Step Time": 8.634319273754954} +{"Pretrain/Learning Rate": 1.4245333107977937e-05, "Pretrain/Loss": 1.9664685726165771, "Pretrain/Loss (Raw)": 1.373225450515747, "Pretrain/Step": 6221, "Pretrain/Step Time": 8.63833300024271} +{"Pretrain/Learning Rate": 1.4237669580586736e-05, "Pretrain/Loss": 1.9678065776824951, "Pretrain/Loss (Raw)": 1.994106411933899, "Pretrain/Step": 6222, "Pretrain/Step Time": 8.640203434973955} +{"Pretrain/Learning Rate": 1.4230007294358173e-05, "Pretrain/Loss": 1.9691354036331177, "Pretrain/Loss (Raw)": 2.0936522483825684, "Pretrain/Step": 6223, "Pretrain/Step Time": 8.642592370510101} +{"Pretrain/Learning Rate": 1.4222346250175928e-05, "Pretrain/Loss": 1.9694428443908691, "Pretrain/Loss (Raw)": 2.0375185012817383, "Pretrain/Step": 6224, "Pretrain/Step Time": 8.64223294891417} +{"Pretrain/Learning Rate": 1.4214686448923498e-05, "Pretrain/Loss": 1.9726101160049438, "Pretrain/Loss (Raw)": 1.8797338008880615, "Pretrain/Step": 6225, "Pretrain/Step Time": 8.636734316125512} +{"Pretrain/Learning Rate": 1.420702789148425e-05, "Pretrain/Loss": 1.9725513458251953, "Pretrain/Loss (Raw)": 1.9532251358032227, "Pretrain/Step": 6226, "Pretrain/Step Time": 8.635260494425893} +{"Pretrain/Learning Rate": 1.4199370578741395e-05, "Pretrain/Loss": 1.975351333618164, "Pretrain/Loss (Raw)": 2.021029233932495, "Pretrain/Step": 6227, "Pretrain/Step Time": 8.631202002987266} +{"Pretrain/Learning Rate": 1.419171451157803e-05, "Pretrain/Loss": 1.9765291213989258, "Pretrain/Loss (Raw)": 1.8824965953826904, "Pretrain/Step": 6228, "Pretrain/Step Time": 8.637668337672949} +{"Pretrain/Learning Rate": 1.4184059690877075e-05, "Pretrain/Loss": 1.9755443334579468, "Pretrain/Loss (Raw)": 2.035893678665161, "Pretrain/Step": 6229, "Pretrain/Step Time": 8.641730887815356} +{"Pretrain/Learning Rate": 1.4176406117521324e-05, "Pretrain/Loss": 1.9725537300109863, "Pretrain/Loss (Raw)": 1.591312050819397, "Pretrain/Step": 6230, "Pretrain/Step Time": 8.645659428089857} +{"Pretrain/Learning Rate": 1.4168753792393414e-05, "Pretrain/Loss": 1.972829818725586, "Pretrain/Loss (Raw)": 2.1569554805755615, "Pretrain/Step": 6231, "Pretrain/Step Time": 8.643202049657702} +{"Pretrain/Learning Rate": 1.4161102716375863e-05, "Pretrain/Loss": 1.973369836807251, "Pretrain/Loss (Raw)": 2.182486057281494, "Pretrain/Step": 6232, "Pretrain/Step Time": 8.645228462293744} +{"Pretrain/Learning Rate": 1.4153452890351022e-05, "Pretrain/Loss": 1.972236156463623, "Pretrain/Loss (Raw)": 1.7918795347213745, "Pretrain/Step": 6233, "Pretrain/Step Time": 8.644282331690192} +{"Pretrain/Learning Rate": 1.41458043152011e-05, "Pretrain/Loss": 1.972771406173706, "Pretrain/Loss (Raw)": 2.058743953704834, "Pretrain/Step": 6234, "Pretrain/Step Time": 8.642299683764577} +{"Pretrain/Learning Rate": 1.4138156991808165e-05, "Pretrain/Loss": 1.9735257625579834, "Pretrain/Loss (Raw)": 2.1032979488372803, "Pretrain/Step": 6235, "Pretrain/Step Time": 8.646097544580698} +{"Pretrain/Learning Rate": 1.4130510921054157e-05, "Pretrain/Loss": 1.9735524654388428, "Pretrain/Loss (Raw)": 2.0045225620269775, "Pretrain/Step": 6236, "Pretrain/Step Time": 8.644486652687192} +{"Pretrain/Learning Rate": 1.4122866103820854e-05, "Pretrain/Loss": 1.973713994026184, "Pretrain/Loss (Raw)": 2.100149631500244, "Pretrain/Step": 6237, "Pretrain/Step Time": 8.643720585852861} +{"Pretrain/Learning Rate": 1.411522254098988e-05, "Pretrain/Loss": 1.9750192165374756, "Pretrain/Loss (Raw)": 2.0846996307373047, "Pretrain/Step": 6238, "Pretrain/Step Time": 8.646578945219517} +{"Pretrain/Learning Rate": 1.4107580233442725e-05, "Pretrain/Loss": 1.9746549129486084, "Pretrain/Loss (Raw)": 1.841176986694336, "Pretrain/Step": 6239, "Pretrain/Step Time": 8.645529370754957} +{"Pretrain/Learning Rate": 1.4099939182060755e-05, "Pretrain/Loss": 1.982653021812439, "Pretrain/Loss (Raw)": 2.8292624950408936, "Pretrain/Step": 6240, "Pretrain/Step Time": 8.647196101024747} +{"Pretrain/Learning Rate": 1.409229938772516e-05, "Pretrain/Loss": 1.9825429916381836, "Pretrain/Loss (Raw)": 1.9162790775299072, "Pretrain/Step": 6241, "Pretrain/Step Time": 8.644169563427567} +{"Pretrain/Learning Rate": 1.4084660851316999e-05, "Pretrain/Loss": 1.9826844930648804, "Pretrain/Loss (Raw)": 1.9722392559051514, "Pretrain/Step": 6242, "Pretrain/Step Time": 8.644330885261297} +{"Pretrain/Learning Rate": 1.4077023573717174e-05, "Pretrain/Loss": 1.9805384874343872, "Pretrain/Loss (Raw)": 1.5802643299102783, "Pretrain/Step": 6243, "Pretrain/Step Time": 8.645537000149488} +{"Pretrain/Learning Rate": 1.4069387555806473e-05, "Pretrain/Loss": 1.983933687210083, "Pretrain/Loss (Raw)": 2.0997254848480225, "Pretrain/Step": 6244, "Pretrain/Step Time": 8.649774096906185} +{"Pretrain/Learning Rate": 1.4061752798465503e-05, "Pretrain/Loss": 1.982578992843628, "Pretrain/Loss (Raw)": 1.9708155393600464, "Pretrain/Step": 6245, "Pretrain/Step Time": 8.650664618238807} +{"Pretrain/Learning Rate": 1.4054119302574741e-05, "Pretrain/Loss": 1.9829766750335693, "Pretrain/Loss (Raw)": 2.0648036003112793, "Pretrain/Step": 6246, "Pretrain/Step Time": 8.650194318965077} +{"Pretrain/Learning Rate": 1.4046487069014513e-05, "Pretrain/Loss": 1.9825189113616943, "Pretrain/Loss (Raw)": 1.8640949726104736, "Pretrain/Step": 6247, "Pretrain/Step Time": 8.64967262558639} +{"Pretrain/Learning Rate": 1.403885609866502e-05, "Pretrain/Loss": 1.979250192642212, "Pretrain/Loss (Raw)": 1.5314264297485352, "Pretrain/Step": 6248, "Pretrain/Step Time": 8.650284100323915} +{"Pretrain/Learning Rate": 1.4031226392406293e-05, "Pretrain/Loss": 1.9777305126190186, "Pretrain/Loss (Raw)": 1.8478894233703613, "Pretrain/Step": 6249, "Pretrain/Step Time": 8.645418645814061} +{"Pretrain/Learning Rate": 1.4023597951118217e-05, "Pretrain/Loss": 1.9784483909606934, "Pretrain/Loss (Raw)": 2.1309008598327637, "Pretrain/Step": 6250, "Pretrain/Step Time": 8.644629921764135} +{"Pretrain/Learning Rate": 1.4015970775680554e-05, "Pretrain/Loss": 1.979327917098999, "Pretrain/Loss (Raw)": 2.181886911392212, "Pretrain/Step": 6251, "Pretrain/Step Time": 8.647477386519313} +{"Pretrain/Learning Rate": 1.4008344866972902e-05, "Pretrain/Loss": 1.9810140132904053, "Pretrain/Loss (Raw)": 2.088895797729492, "Pretrain/Step": 6252, "Pretrain/Step Time": 8.646745968610048} +{"Pretrain/Learning Rate": 1.4000720225874714e-05, "Pretrain/Loss": 1.9816088676452637, "Pretrain/Loss (Raw)": 2.170498847961426, "Pretrain/Step": 6253, "Pretrain/Step Time": 8.64947253651917} +{"Pretrain/Learning Rate": 1.399309685326529e-05, "Pretrain/Loss": 1.98318350315094, "Pretrain/Loss (Raw)": 2.1037726402282715, "Pretrain/Step": 6254, "Pretrain/Step Time": 8.651522321626544} +{"Pretrain/Learning Rate": 1.3985474750023821e-05, "Pretrain/Loss": 1.983649492263794, "Pretrain/Loss (Raw)": 2.1581950187683105, "Pretrain/Step": 6255, "Pretrain/Step Time": 8.648871432989836} +{"Pretrain/Learning Rate": 1.3977853917029287e-05, "Pretrain/Loss": 1.984216332435608, "Pretrain/Loss (Raw)": 2.0183334350585938, "Pretrain/Step": 6256, "Pretrain/Step Time": 8.642760245129466} +{"Pretrain/Learning Rate": 1.3970234355160588e-05, "Pretrain/Loss": 1.982843041419983, "Pretrain/Loss (Raw)": 1.8617026805877686, "Pretrain/Step": 6257, "Pretrain/Step Time": 8.645038332790136} +{"Pretrain/Learning Rate": 1.3962616065296428e-05, "Pretrain/Loss": 1.9835162162780762, "Pretrain/Loss (Raw)": 1.9708980321884155, "Pretrain/Step": 6258, "Pretrain/Step Time": 8.64322023279965} +{"Pretrain/Learning Rate": 1.395499904831541e-05, "Pretrain/Loss": 1.982972264289856, "Pretrain/Loss (Raw)": 2.034061908721924, "Pretrain/Step": 6259, "Pretrain/Step Time": 8.648708168417215} +{"Pretrain/Learning Rate": 1.394738330509593e-05, "Pretrain/Loss": 1.9830060005187988, "Pretrain/Loss (Raw)": 2.005575656890869, "Pretrain/Step": 6260, "Pretrain/Step Time": 8.646229434758425} +{"Pretrain/Learning Rate": 1.3939768836516299e-05, "Pretrain/Loss": 1.9823405742645264, "Pretrain/Loss (Raw)": 1.9873926639556885, "Pretrain/Step": 6261, "Pretrain/Step Time": 8.651235671713948} +{"Pretrain/Learning Rate": 1.393215564345463e-05, "Pretrain/Loss": 1.98236083984375, "Pretrain/Loss (Raw)": 1.8598700761795044, "Pretrain/Step": 6262, "Pretrain/Step Time": 8.652790391817689} +{"Pretrain/Learning Rate": 1.3924543726788953e-05, "Pretrain/Loss": 1.9813882112503052, "Pretrain/Loss (Raw)": 2.0221595764160156, "Pretrain/Step": 6263, "Pretrain/Step Time": 8.647644964978099} +{"Pretrain/Learning Rate": 1.3916933087397055e-05, "Pretrain/Loss": 1.9802167415618896, "Pretrain/Loss (Raw)": 1.9160964488983154, "Pretrain/Step": 6264, "Pretrain/Step Time": 8.64889058098197} +{"Pretrain/Learning Rate": 1.3909323726156672e-05, "Pretrain/Loss": 1.9801186323165894, "Pretrain/Loss (Raw)": 1.9138442277908325, "Pretrain/Step": 6265, "Pretrain/Step Time": 8.653793705627322} +{"Pretrain/Learning Rate": 1.3901715643945337e-05, "Pretrain/Loss": 1.9804046154022217, "Pretrain/Loss (Raw)": 1.8600265979766846, "Pretrain/Step": 6266, "Pretrain/Step Time": 8.647741734981537} +{"Pretrain/Learning Rate": 1.3894108841640452e-05, "Pretrain/Loss": 1.9775958061218262, "Pretrain/Loss (Raw)": 1.7751822471618652, "Pretrain/Step": 6267, "Pretrain/Step Time": 8.646951626986265} +{"Pretrain/Learning Rate": 1.3886503320119256e-05, "Pretrain/Loss": 1.9784126281738281, "Pretrain/Loss (Raw)": 1.9049677848815918, "Pretrain/Step": 6268, "Pretrain/Step Time": 8.648819733411074} +{"Pretrain/Learning Rate": 1.3878899080258878e-05, "Pretrain/Loss": 1.977154016494751, "Pretrain/Loss (Raw)": 1.8829859495162964, "Pretrain/Step": 6269, "Pretrain/Step Time": 8.646180605515838} +{"Pretrain/Learning Rate": 1.3871296122936261e-05, "Pretrain/Loss": 1.9756712913513184, "Pretrain/Loss (Raw)": 1.8100204467773438, "Pretrain/Step": 6270, "Pretrain/Step Time": 8.646820861846209} +{"Pretrain/Learning Rate": 1.3863694449028214e-05, "Pretrain/Loss": 1.9753059148788452, "Pretrain/Loss (Raw)": 2.0493757724761963, "Pretrain/Step": 6271, "Pretrain/Step Time": 8.64395765401423} +{"Pretrain/Learning Rate": 1.3856094059411392e-05, "Pretrain/Loss": 1.975450038909912, "Pretrain/Loss (Raw)": 1.957610011100769, "Pretrain/Step": 6272, "Pretrain/Step Time": 8.641782216727734} +{"Pretrain/Learning Rate": 1.3848494954962324e-05, "Pretrain/Loss": 1.9756805896759033, "Pretrain/Loss (Raw)": 1.953266978263855, "Pretrain/Step": 6273, "Pretrain/Step Time": 8.640143303200603} +{"Pretrain/Learning Rate": 1.3840897136557366e-05, "Pretrain/Loss": 1.9756861925125122, "Pretrain/Loss (Raw)": 1.9998664855957031, "Pretrain/Step": 6274, "Pretrain/Step Time": 8.647379430010915} +{"Pretrain/Learning Rate": 1.383330060507273e-05, "Pretrain/Loss": 1.9737251996994019, "Pretrain/Loss (Raw)": 1.8447589874267578, "Pretrain/Step": 6275, "Pretrain/Step Time": 8.649250792339444} +{"Pretrain/Learning Rate": 1.382570536138448e-05, "Pretrain/Loss": 1.9704959392547607, "Pretrain/Loss (Raw)": 1.5803080797195435, "Pretrain/Step": 6276, "Pretrain/Step Time": 8.64836360886693} +{"Pretrain/Learning Rate": 1.3818111406368555e-05, "Pretrain/Loss": 1.9707121849060059, "Pretrain/Loss (Raw)": 1.843613624572754, "Pretrain/Step": 6277, "Pretrain/Step Time": 8.654781214892864} +{"Pretrain/Learning Rate": 1.381051874090071e-05, "Pretrain/Loss": 1.969125747680664, "Pretrain/Loss (Raw)": 1.8983370065689087, "Pretrain/Step": 6278, "Pretrain/Step Time": 8.659196522086859} +{"Pretrain/Learning Rate": 1.3802927365856571e-05, "Pretrain/Loss": 1.9722914695739746, "Pretrain/Loss (Raw)": 2.241973876953125, "Pretrain/Step": 6279, "Pretrain/Step Time": 8.652348689734936} +{"Pretrain/Learning Rate": 1.3795337282111604e-05, "Pretrain/Loss": 1.9730067253112793, "Pretrain/Loss (Raw)": 2.163923740386963, "Pretrain/Step": 6280, "Pretrain/Step Time": 8.649949450045824} +{"Pretrain/Learning Rate": 1.3787748490541144e-05, "Pretrain/Loss": 1.974993348121643, "Pretrain/Loss (Raw)": 2.1030466556549072, "Pretrain/Step": 6281, "Pretrain/Step Time": 8.651642348617315} +{"Pretrain/Learning Rate": 1.3780160992020364e-05, "Pretrain/Loss": 1.9721717834472656, "Pretrain/Loss (Raw)": 1.9210041761398315, "Pretrain/Step": 6282, "Pretrain/Step Time": 8.649839919060469} +{"Pretrain/Learning Rate": 1.3772574787424291e-05, "Pretrain/Loss": 1.9744946956634521, "Pretrain/Loss (Raw)": 2.1183793544769287, "Pretrain/Step": 6283, "Pretrain/Step Time": 8.647272378206253} +{"Pretrain/Learning Rate": 1.3764989877627785e-05, "Pretrain/Loss": 1.973676323890686, "Pretrain/Loss (Raw)": 1.8885704278945923, "Pretrain/Step": 6284, "Pretrain/Step Time": 8.653046084567904} +{"Pretrain/Learning Rate": 1.3757406263505602e-05, "Pretrain/Loss": 1.9730890989303589, "Pretrain/Loss (Raw)": 2.0333385467529297, "Pretrain/Step": 6285, "Pretrain/Step Time": 8.653339082375169} +{"Pretrain/Learning Rate": 1.37498239459323e-05, "Pretrain/Loss": 1.9727983474731445, "Pretrain/Loss (Raw)": 2.121772289276123, "Pretrain/Step": 6286, "Pretrain/Step Time": 8.654032211750746} +{"Pretrain/Learning Rate": 1.3742242925782317e-05, "Pretrain/Loss": 1.971944808959961, "Pretrain/Loss (Raw)": 1.941596269607544, "Pretrain/Step": 6287, "Pretrain/Step Time": 8.654489209875464} +{"Pretrain/Learning Rate": 1.3734663203929916e-05, "Pretrain/Loss": 1.9706149101257324, "Pretrain/Loss (Raw)": 1.8675119876861572, "Pretrain/Step": 6288, "Pretrain/Step Time": 8.653080211952329} +{"Pretrain/Learning Rate": 1.372708478124925e-05, "Pretrain/Loss": 1.973860502243042, "Pretrain/Loss (Raw)": 2.06695556640625, "Pretrain/Step": 6289, "Pretrain/Step Time": 8.647805318236351} +{"Pretrain/Learning Rate": 1.3719507658614284e-05, "Pretrain/Loss": 1.9753451347351074, "Pretrain/Loss (Raw)": 2.0334184169769287, "Pretrain/Step": 6290, "Pretrain/Step Time": 8.652020778506994} +{"Pretrain/Learning Rate": 1.3711931836898842e-05, "Pretrain/Loss": 1.9703729152679443, "Pretrain/Loss (Raw)": 1.4639103412628174, "Pretrain/Step": 6291, "Pretrain/Step Time": 8.649527624249458} +{"Pretrain/Learning Rate": 1.3704357316976623e-05, "Pretrain/Loss": 1.9676527976989746, "Pretrain/Loss (Raw)": 1.8503526449203491, "Pretrain/Step": 6292, "Pretrain/Step Time": 8.652529707178473} +{"Pretrain/Learning Rate": 1.3696784099721143e-05, "Pretrain/Loss": 1.9640650749206543, "Pretrain/Loss (Raw)": 1.7416304349899292, "Pretrain/Step": 6293, "Pretrain/Step Time": 8.651346132159233} +{"Pretrain/Learning Rate": 1.3689212186005784e-05, "Pretrain/Loss": 1.9651892185211182, "Pretrain/Loss (Raw)": 2.036142587661743, "Pretrain/Step": 6294, "Pretrain/Step Time": 8.654648933559656} +{"Pretrain/Learning Rate": 1.3681641576703763e-05, "Pretrain/Loss": 1.9653515815734863, "Pretrain/Loss (Raw)": 1.8379651308059692, "Pretrain/Step": 6295, "Pretrain/Step Time": 8.65170837752521} +{"Pretrain/Learning Rate": 1.3674072272688182e-05, "Pretrain/Loss": 1.9653308391571045, "Pretrain/Loss (Raw)": 2.008373975753784, "Pretrain/Step": 6296, "Pretrain/Step Time": 8.652753802016377} +{"Pretrain/Learning Rate": 1.3666504274831954e-05, "Pretrain/Loss": 1.9651070833206177, "Pretrain/Loss (Raw)": 1.7556257247924805, "Pretrain/Step": 6297, "Pretrain/Step Time": 8.650523915886879} +{"Pretrain/Learning Rate": 1.3658937584007859e-05, "Pretrain/Loss": 1.9648826122283936, "Pretrain/Loss (Raw)": 2.0141782760620117, "Pretrain/Step": 6298, "Pretrain/Step Time": 8.652688913047314} +{"Pretrain/Learning Rate": 1.3651372201088508e-05, "Pretrain/Loss": 1.9650614261627197, "Pretrain/Loss (Raw)": 1.9566844701766968, "Pretrain/Step": 6299, "Pretrain/Step Time": 8.647625716403127} +{"Pretrain/Learning Rate": 1.3643808126946417e-05, "Pretrain/Loss": 1.9659862518310547, "Pretrain/Loss (Raw)": 2.0166265964508057, "Pretrain/Step": 6300, "Pretrain/Step Time": 8.660474261268973} +{"Pretrain/Learning Rate": 1.3636245362453865e-05, "Pretrain/Loss": 1.9668469429016113, "Pretrain/Loss (Raw)": 2.087261438369751, "Pretrain/Step": 6301, "Pretrain/Step Time": 8.659299971535802} +{"Pretrain/Learning Rate": 1.3628683908483054e-05, "Pretrain/Loss": 1.9675509929656982, "Pretrain/Loss (Raw)": 2.0615127086639404, "Pretrain/Step": 6302, "Pretrain/Step Time": 8.65804181061685} +{"Pretrain/Learning Rate": 1.3621123765905985e-05, "Pretrain/Loss": 1.9676215648651123, "Pretrain/Loss (Raw)": 2.0237643718719482, "Pretrain/Step": 6303, "Pretrain/Step Time": 8.659135106950998} +{"Pretrain/Learning Rate": 1.3613564935594565e-05, "Pretrain/Loss": 1.9678065776824951, "Pretrain/Loss (Raw)": 1.9835684299468994, "Pretrain/Step": 6304, "Pretrain/Step Time": 8.661306273192167} +{"Pretrain/Learning Rate": 1.3606007418420472e-05, "Pretrain/Loss": 1.9670888185501099, "Pretrain/Loss (Raw)": 2.1324923038482666, "Pretrain/Step": 6305, "Pretrain/Step Time": 8.662252981215715} +{"Pretrain/Learning Rate": 1.3598451215255303e-05, "Pretrain/Loss": 1.9667779207229614, "Pretrain/Loss (Raw)": 2.0933001041412354, "Pretrain/Step": 6306, "Pretrain/Step Time": 8.662871796637774} +{"Pretrain/Learning Rate": 1.3590896326970465e-05, "Pretrain/Loss": 1.9695820808410645, "Pretrain/Loss (Raw)": 2.115990400314331, "Pretrain/Step": 6307, "Pretrain/Step Time": 8.664391424506903} +{"Pretrain/Learning Rate": 1.3583342754437226e-05, "Pretrain/Loss": 1.9700639247894287, "Pretrain/Loss (Raw)": 2.121127128601074, "Pretrain/Step": 6308, "Pretrain/Step Time": 8.666643615812063} +{"Pretrain/Learning Rate": 1.3575790498526687e-05, "Pretrain/Loss": 1.9702517986297607, "Pretrain/Loss (Raw)": 1.9589515924453735, "Pretrain/Step": 6309, "Pretrain/Step Time": 8.669975377619267} +{"Pretrain/Learning Rate": 1.356823956010983e-05, "Pretrain/Loss": 1.9689477682113647, "Pretrain/Loss (Raw)": 1.9778884649276733, "Pretrain/Step": 6310, "Pretrain/Step Time": 8.66566738113761} +{"Pretrain/Learning Rate": 1.3560689940057453e-05, "Pretrain/Loss": 1.969421625137329, "Pretrain/Loss (Raw)": 1.9146116971969604, "Pretrain/Step": 6311, "Pretrain/Step Time": 8.66149415448308} +{"Pretrain/Learning Rate": 1.3553141639240218e-05, "Pretrain/Loss": 1.9683588743209839, "Pretrain/Loss (Raw)": 1.8334330320358276, "Pretrain/Step": 6312, "Pretrain/Step Time": 8.665908135473728} +{"Pretrain/Learning Rate": 1.354559465852862e-05, "Pretrain/Loss": 1.9693684577941895, "Pretrain/Loss (Raw)": 2.046757936477661, "Pretrain/Step": 6313, "Pretrain/Step Time": 8.664407443255186} +{"Pretrain/Learning Rate": 1.353804899879303e-05, "Pretrain/Loss": 1.9678454399108887, "Pretrain/Loss (Raw)": 1.8353545665740967, "Pretrain/Step": 6314, "Pretrain/Step Time": 8.665325148031116} +{"Pretrain/Learning Rate": 1.3530504660903637e-05, "Pretrain/Loss": 1.9685739278793335, "Pretrain/Loss (Raw)": 2.071781873703003, "Pretrain/Step": 6315, "Pretrain/Step Time": 8.667160354554653} +{"Pretrain/Learning Rate": 1.3522961645730498e-05, "Pretrain/Loss": 1.967061996459961, "Pretrain/Loss (Raw)": 1.9111181497573853, "Pretrain/Step": 6316, "Pretrain/Step Time": 8.666604382917285} +{"Pretrain/Learning Rate": 1.3515419954143489e-05, "Pretrain/Loss": 1.9689780473709106, "Pretrain/Loss (Raw)": 1.9309204816818237, "Pretrain/Step": 6317, "Pretrain/Step Time": 8.6615369040519} +{"Pretrain/Learning Rate": 1.3507879587012378e-05, "Pretrain/Loss": 1.9713770151138306, "Pretrain/Loss (Raw)": 1.9878288507461548, "Pretrain/Step": 6318, "Pretrain/Step Time": 8.66221608221531} +{"Pretrain/Learning Rate": 1.3500340545206747e-05, "Pretrain/Loss": 1.9698930978775024, "Pretrain/Loss (Raw)": 1.946555256843567, "Pretrain/Step": 6319, "Pretrain/Step Time": 8.667148020118475} +{"Pretrain/Learning Rate": 1.3492802829596035e-05, "Pretrain/Loss": 1.9731357097625732, "Pretrain/Loss (Raw)": 2.3822197914123535, "Pretrain/Step": 6320, "Pretrain/Step Time": 8.670511750504375} +{"Pretrain/Learning Rate": 1.348526644104951e-05, "Pretrain/Loss": 1.9733572006225586, "Pretrain/Loss (Raw)": 1.995619773864746, "Pretrain/Step": 6321, "Pretrain/Step Time": 8.673611011356115} +{"Pretrain/Learning Rate": 1.3477731380436332e-05, "Pretrain/Loss": 1.9742614030838013, "Pretrain/Loss (Raw)": 1.8996561765670776, "Pretrain/Step": 6322, "Pretrain/Step Time": 8.671196088194847} +{"Pretrain/Learning Rate": 1.3470197648625463e-05, "Pretrain/Loss": 1.9747216701507568, "Pretrain/Loss (Raw)": 2.075782299041748, "Pretrain/Step": 6323, "Pretrain/Step Time": 8.672407990321517} +{"Pretrain/Learning Rate": 1.3462665246485734e-05, "Pretrain/Loss": 1.9701991081237793, "Pretrain/Loss (Raw)": 1.6944630146026611, "Pretrain/Step": 6324, "Pretrain/Step Time": 8.673510938882828} +{"Pretrain/Learning Rate": 1.3455134174885802e-05, "Pretrain/Loss": 1.9647835493087769, "Pretrain/Loss (Raw)": 1.3113515377044678, "Pretrain/Step": 6325, "Pretrain/Step Time": 8.674600698053837} +{"Pretrain/Learning Rate": 1.3447604434694207e-05, "Pretrain/Loss": 1.965989589691162, "Pretrain/Loss (Raw)": 1.7144408226013184, "Pretrain/Step": 6326, "Pretrain/Step Time": 8.677472896873951} +{"Pretrain/Learning Rate": 1.3440076026779309e-05, "Pretrain/Loss": 1.9644758701324463, "Pretrain/Loss (Raw)": 1.9297858476638794, "Pretrain/Step": 6327, "Pretrain/Step Time": 8.673793131485581} +{"Pretrain/Learning Rate": 1.3432548952009313e-05, "Pretrain/Loss": 1.9622553586959839, "Pretrain/Loss (Raw)": 1.680790662765503, "Pretrain/Step": 6328, "Pretrain/Step Time": 8.667612737044692} +{"Pretrain/Learning Rate": 1.3425023211252272e-05, "Pretrain/Loss": 1.9617972373962402, "Pretrain/Loss (Raw)": 1.97780442237854, "Pretrain/Step": 6329, "Pretrain/Step Time": 8.668916936963797} +{"Pretrain/Learning Rate": 1.3417498805376105e-05, "Pretrain/Loss": 1.9633982181549072, "Pretrain/Loss (Raw)": 2.17631196975708, "Pretrain/Step": 6330, "Pretrain/Step Time": 8.666810179129243} +{"Pretrain/Learning Rate": 1.3409975735248556e-05, "Pretrain/Loss": 1.9622836112976074, "Pretrain/Loss (Raw)": 1.9685124158859253, "Pretrain/Step": 6331, "Pretrain/Step Time": 8.66762749478221} +{"Pretrain/Learning Rate": 1.3402454001737209e-05, "Pretrain/Loss": 1.9610021114349365, "Pretrain/Loss (Raw)": 2.002305269241333, "Pretrain/Step": 6332, "Pretrain/Step Time": 8.670254193246365} +{"Pretrain/Learning Rate": 1.3394933605709525e-05, "Pretrain/Loss": 1.9591399431228638, "Pretrain/Loss (Raw)": 1.6226387023925781, "Pretrain/Step": 6333, "Pretrain/Step Time": 8.672072187066078} +{"Pretrain/Learning Rate": 1.3387414548032783e-05, "Pretrain/Loss": 1.960174560546875, "Pretrain/Loss (Raw)": 2.0608818531036377, "Pretrain/Step": 6334, "Pretrain/Step Time": 8.678349535912275} +{"Pretrain/Learning Rate": 1.3379896829574115e-05, "Pretrain/Loss": 1.960334062576294, "Pretrain/Loss (Raw)": 1.8099607229232788, "Pretrain/Step": 6335, "Pretrain/Step Time": 8.67694791033864} +{"Pretrain/Learning Rate": 1.337238045120049e-05, "Pretrain/Loss": 1.9608876705169678, "Pretrain/Loss (Raw)": 2.2218666076660156, "Pretrain/Step": 6336, "Pretrain/Step Time": 8.67698859795928} +{"Pretrain/Learning Rate": 1.3364865413778755e-05, "Pretrain/Loss": 1.9619190692901611, "Pretrain/Loss (Raw)": 2.1252925395965576, "Pretrain/Step": 6337, "Pretrain/Step Time": 8.679560672491789} +{"Pretrain/Learning Rate": 1.3357351718175564e-05, "Pretrain/Loss": 1.9611226320266724, "Pretrain/Loss (Raw)": 1.840751051902771, "Pretrain/Step": 6338, "Pretrain/Step Time": 8.677067896351218} +{"Pretrain/Learning Rate": 1.3349839365257438e-05, "Pretrain/Loss": 1.9588055610656738, "Pretrain/Loss (Raw)": 1.945568561553955, "Pretrain/Step": 6339, "Pretrain/Step Time": 8.684731794521213} +{"Pretrain/Learning Rate": 1.3342328355890721e-05, "Pretrain/Loss": 1.9627171754837036, "Pretrain/Loss (Raw)": 2.1781575679779053, "Pretrain/Step": 6340, "Pretrain/Step Time": 8.683463733643293} +{"Pretrain/Learning Rate": 1.3334818690941652e-05, "Pretrain/Loss": 1.9617748260498047, "Pretrain/Loss (Raw)": 2.1068551540374756, "Pretrain/Step": 6341, "Pretrain/Step Time": 8.67920633777976} +{"Pretrain/Learning Rate": 1.332731037127624e-05, "Pretrain/Loss": 1.9644052982330322, "Pretrain/Loss (Raw)": 2.257204532623291, "Pretrain/Step": 6342, "Pretrain/Step Time": 8.685446485877037} +{"Pretrain/Learning Rate": 1.3319803397760408e-05, "Pretrain/Loss": 1.964083194732666, "Pretrain/Loss (Raw)": 2.000556468963623, "Pretrain/Step": 6343, "Pretrain/Step Time": 8.683029305189848} +{"Pretrain/Learning Rate": 1.331229777125988e-05, "Pretrain/Loss": 1.9658633470535278, "Pretrain/Loss (Raw)": 2.0875651836395264, "Pretrain/Step": 6344, "Pretrain/Step Time": 8.683371799066663} +{"Pretrain/Learning Rate": 1.3304793492640263e-05, "Pretrain/Loss": 1.9670408964157104, "Pretrain/Loss (Raw)": 2.059231758117676, "Pretrain/Step": 6345, "Pretrain/Step Time": 8.682548336684704} +{"Pretrain/Learning Rate": 1.329729056276695e-05, "Pretrain/Loss": 1.9689570665359497, "Pretrain/Loss (Raw)": 2.086214303970337, "Pretrain/Step": 6346, "Pretrain/Step Time": 8.681218789890409} +{"Pretrain/Learning Rate": 1.328978898250525e-05, "Pretrain/Loss": 1.9703377485275269, "Pretrain/Loss (Raw)": 2.046832799911499, "Pretrain/Step": 6347, "Pretrain/Step Time": 8.684085102751851} +{"Pretrain/Learning Rate": 1.3282288752720262e-05, "Pretrain/Loss": 1.9681869745254517, "Pretrain/Loss (Raw)": 1.8048112392425537, "Pretrain/Step": 6348, "Pretrain/Step Time": 8.688270173966885} +{"Pretrain/Learning Rate": 1.3274789874276949e-05, "Pretrain/Loss": 1.9739030599594116, "Pretrain/Loss (Raw)": 2.1048810482025146, "Pretrain/Step": 6349, "Pretrain/Step Time": 8.683740807697177} +{"Pretrain/Learning Rate": 1.3267292348040111e-05, "Pretrain/Loss": 1.9714916944503784, "Pretrain/Loss (Raw)": 1.6854442358016968, "Pretrain/Step": 6350, "Pretrain/Step Time": 8.683416308835149} +{"Pretrain/Learning Rate": 1.3259796174874411e-05, "Pretrain/Loss": 1.9704413414001465, "Pretrain/Loss (Raw)": 1.9591978788375854, "Pretrain/Step": 6351, "Pretrain/Step Time": 8.681978119537234} +{"Pretrain/Learning Rate": 1.3252301355644341e-05, "Pretrain/Loss": 1.969648838043213, "Pretrain/Loss (Raw)": 1.9360928535461426, "Pretrain/Step": 6352, "Pretrain/Step Time": 8.682239931076765} +{"Pretrain/Learning Rate": 1.324480789121424e-05, "Pretrain/Loss": 1.9704229831695557, "Pretrain/Loss (Raw)": 1.9788376092910767, "Pretrain/Step": 6353, "Pretrain/Step Time": 8.686258593574166} +{"Pretrain/Learning Rate": 1.323731578244827e-05, "Pretrain/Loss": 1.970292329788208, "Pretrain/Loss (Raw)": 1.9364863634109497, "Pretrain/Step": 6354, "Pretrain/Step Time": 8.688105186447501} +{"Pretrain/Learning Rate": 1.3229825030210482e-05, "Pretrain/Loss": 1.9704864025115967, "Pretrain/Loss (Raw)": 2.0458743572235107, "Pretrain/Step": 6355, "Pretrain/Step Time": 8.69628232344985} +{"Pretrain/Learning Rate": 1.3222335635364736e-05, "Pretrain/Loss": 1.9720635414123535, "Pretrain/Loss (Raw)": 2.084369659423828, "Pretrain/Step": 6356, "Pretrain/Step Time": 8.689237663522363} +{"Pretrain/Learning Rate": 1.3214847598774744e-05, "Pretrain/Loss": 1.9710216522216797, "Pretrain/Loss (Raw)": 1.9025311470031738, "Pretrain/Step": 6357, "Pretrain/Step Time": 8.68720486946404} +{"Pretrain/Learning Rate": 1.3207360921304046e-05, "Pretrain/Loss": 1.9698511362075806, "Pretrain/Loss (Raw)": 1.441491723060608, "Pretrain/Step": 6358, "Pretrain/Step Time": 8.682026600465178} +{"Pretrain/Learning Rate": 1.319987560381607e-05, "Pretrain/Loss": 1.9695396423339844, "Pretrain/Loss (Raw)": 2.1170833110809326, "Pretrain/Step": 6359, "Pretrain/Step Time": 8.680712670087814} +{"Pretrain/Learning Rate": 1.319239164717404e-05, "Pretrain/Loss": 1.9682645797729492, "Pretrain/Loss (Raw)": 2.0192768573760986, "Pretrain/Step": 6360, "Pretrain/Step Time": 8.682746209204197} +{"Pretrain/Learning Rate": 1.3184909052241046e-05, "Pretrain/Loss": 1.9679300785064697, "Pretrain/Loss (Raw)": 1.7490534782409668, "Pretrain/Step": 6361, "Pretrain/Step Time": 8.68640892766416} +{"Pretrain/Learning Rate": 1.3177427819880002e-05, "Pretrain/Loss": 1.965444803237915, "Pretrain/Loss (Raw)": 1.7406220436096191, "Pretrain/Step": 6362, "Pretrain/Step Time": 8.684749545529485} +{"Pretrain/Learning Rate": 1.3169947950953704e-05, "Pretrain/Loss": 1.9657384157180786, "Pretrain/Loss (Raw)": 2.140882730484009, "Pretrain/Step": 6363, "Pretrain/Step Time": 8.684997200965881} +{"Pretrain/Learning Rate": 1.3162469446324755e-05, "Pretrain/Loss": 1.9654558897018433, "Pretrain/Loss (Raw)": 1.9683727025985718, "Pretrain/Step": 6364, "Pretrain/Step Time": 8.684977693483233} +{"Pretrain/Learning Rate": 1.3154992306855607e-05, "Pretrain/Loss": 1.9654922485351562, "Pretrain/Loss (Raw)": 2.104796886444092, "Pretrain/Step": 6365, "Pretrain/Step Time": 8.683350693434477} +{"Pretrain/Learning Rate": 1.3147516533408552e-05, "Pretrain/Loss": 1.9658772945404053, "Pretrain/Loss (Raw)": 2.1339805126190186, "Pretrain/Step": 6366, "Pretrain/Step Time": 8.679092049598694} +{"Pretrain/Learning Rate": 1.3140042126845753e-05, "Pretrain/Loss": 1.9650661945343018, "Pretrain/Loss (Raw)": 1.7373675107955933, "Pretrain/Step": 6367, "Pretrain/Step Time": 8.679510300979018} +{"Pretrain/Learning Rate": 1.3132569088029179e-05, "Pretrain/Loss": 1.9595354795455933, "Pretrain/Loss (Raw)": 2.121328353881836, "Pretrain/Step": 6368, "Pretrain/Step Time": 8.679005827754736} +{"Pretrain/Learning Rate": 1.312509741782066e-05, "Pretrain/Loss": 1.9586050510406494, "Pretrain/Loss (Raw)": 1.7971974611282349, "Pretrain/Step": 6369, "Pretrain/Step Time": 8.682053625583649} +{"Pretrain/Learning Rate": 1.3117627117081854e-05, "Pretrain/Loss": 1.9591424465179443, "Pretrain/Loss (Raw)": 2.041006326675415, "Pretrain/Step": 6370, "Pretrain/Step Time": 8.67898383922875} +{"Pretrain/Learning Rate": 1.3110158186674293e-05, "Pretrain/Loss": 1.9598290920257568, "Pretrain/Loss (Raw)": 1.6681698560714722, "Pretrain/Step": 6371, "Pretrain/Step Time": 8.68094389885664} +{"Pretrain/Learning Rate": 1.3102690627459314e-05, "Pretrain/Loss": 1.9584054946899414, "Pretrain/Loss (Raw)": 1.9174914360046387, "Pretrain/Step": 6372, "Pretrain/Step Time": 8.67323449254036} +{"Pretrain/Learning Rate": 1.30952244402981e-05, "Pretrain/Loss": 1.9585175514221191, "Pretrain/Loss (Raw)": 1.9851680994033813, "Pretrain/Step": 6373, "Pretrain/Step Time": 8.674358205869794} +{"Pretrain/Learning Rate": 1.3087759626051716e-05, "Pretrain/Loss": 1.9587986469268799, "Pretrain/Loss (Raw)": 2.1007649898529053, "Pretrain/Step": 6374, "Pretrain/Step Time": 8.672470340505242} +{"Pretrain/Learning Rate": 1.308029618558102e-05, "Pretrain/Loss": 1.9592024087905884, "Pretrain/Loss (Raw)": 1.9157869815826416, "Pretrain/Step": 6375, "Pretrain/Step Time": 8.671980921179056} +{"Pretrain/Learning Rate": 1.3072834119746741e-05, "Pretrain/Loss": 1.9636740684509277, "Pretrain/Loss (Raw)": 2.1037979125976562, "Pretrain/Step": 6376, "Pretrain/Step Time": 8.670886095613241} +{"Pretrain/Learning Rate": 1.3065373429409419e-05, "Pretrain/Loss": 1.9648141860961914, "Pretrain/Loss (Raw)": 1.9938243627548218, "Pretrain/Step": 6377, "Pretrain/Step Time": 8.670320378616452} +{"Pretrain/Learning Rate": 1.3057914115429482e-05, "Pretrain/Loss": 1.9641085863113403, "Pretrain/Loss (Raw)": 2.040583848953247, "Pretrain/Step": 6378, "Pretrain/Step Time": 8.672578878700733} +{"Pretrain/Learning Rate": 1.3050456178667165e-05, "Pretrain/Loss": 1.9636468887329102, "Pretrain/Loss (Raw)": 2.122788667678833, "Pretrain/Step": 6379, "Pretrain/Step Time": 8.668942995369434} +{"Pretrain/Learning Rate": 1.3042999619982546e-05, "Pretrain/Loss": 1.9626445770263672, "Pretrain/Loss (Raw)": 1.9606107473373413, "Pretrain/Step": 6380, "Pretrain/Step Time": 8.670295486226678} +{"Pretrain/Learning Rate": 1.3035544440235548e-05, "Pretrain/Loss": 1.96028470993042, "Pretrain/Loss (Raw)": 1.8684231042861938, "Pretrain/Step": 6381, "Pretrain/Step Time": 8.669761652126908} +{"Pretrain/Learning Rate": 1.3028090640285958e-05, "Pretrain/Loss": 1.9593251943588257, "Pretrain/Loss (Raw)": 1.9809483289718628, "Pretrain/Step": 6382, "Pretrain/Step Time": 8.668945632874966} +{"Pretrain/Learning Rate": 1.3020638220993353e-05, "Pretrain/Loss": 1.9580001831054688, "Pretrain/Loss (Raw)": 1.9886022806167603, "Pretrain/Step": 6383, "Pretrain/Step Time": 8.667705023661256} +{"Pretrain/Learning Rate": 1.3013187183217206e-05, "Pretrain/Loss": 1.9580711126327515, "Pretrain/Loss (Raw)": 2.0274155139923096, "Pretrain/Step": 6384, "Pretrain/Step Time": 8.670801378786564} +{"Pretrain/Learning Rate": 1.3005737527816786e-05, "Pretrain/Loss": 1.9600727558135986, "Pretrain/Loss (Raw)": 2.117906093597412, "Pretrain/Step": 6385, "Pretrain/Step Time": 8.671251026913524} +{"Pretrain/Learning Rate": 1.2998289255651253e-05, "Pretrain/Loss": 1.9592845439910889, "Pretrain/Loss (Raw)": 1.8700190782546997, "Pretrain/Step": 6386, "Pretrain/Step Time": 8.67706241644919} +{"Pretrain/Learning Rate": 1.2990842367579539e-05, "Pretrain/Loss": 1.9578354358673096, "Pretrain/Loss (Raw)": 1.848567247390747, "Pretrain/Step": 6387, "Pretrain/Step Time": 8.671257039532065} +{"Pretrain/Learning Rate": 1.2983396864460482e-05, "Pretrain/Loss": 1.958479881286621, "Pretrain/Loss (Raw)": 2.0880539417266846, "Pretrain/Step": 6388, "Pretrain/Step Time": 8.66968871280551} +{"Pretrain/Learning Rate": 1.2975952747152709e-05, "Pretrain/Loss": 1.956525444984436, "Pretrain/Loss (Raw)": 1.7372369766235352, "Pretrain/Step": 6389, "Pretrain/Step Time": 8.6678206641227} +{"Pretrain/Learning Rate": 1.2968510016514749e-05, "Pretrain/Loss": 1.9588606357574463, "Pretrain/Loss (Raw)": 2.1587765216827393, "Pretrain/Step": 6390, "Pretrain/Step Time": 8.667753666639328} +{"Pretrain/Learning Rate": 1.2961068673404886e-05, "Pretrain/Loss": 1.958537220954895, "Pretrain/Loss (Raw)": 1.9807531833648682, "Pretrain/Step": 6391, "Pretrain/Step Time": 8.670085452497005} +{"Pretrain/Learning Rate": 1.295362871868132e-05, "Pretrain/Loss": 1.960067629814148, "Pretrain/Loss (Raw)": 2.1119985580444336, "Pretrain/Step": 6392, "Pretrain/Step Time": 8.66757151670754} +{"Pretrain/Learning Rate": 1.2946190153202059e-05, "Pretrain/Loss": 1.9606494903564453, "Pretrain/Loss (Raw)": 1.9883179664611816, "Pretrain/Step": 6393, "Pretrain/Step Time": 8.664965433999896} +{"Pretrain/Learning Rate": 1.2938752977824947e-05, "Pretrain/Loss": 1.9600305557250977, "Pretrain/Loss (Raw)": 1.7808014154434204, "Pretrain/Step": 6394, "Pretrain/Step Time": 8.66550425812602} +{"Pretrain/Learning Rate": 1.2931317193407665e-05, "Pretrain/Loss": 1.962748646736145, "Pretrain/Loss (Raw)": 2.123106002807617, "Pretrain/Step": 6395, "Pretrain/Step Time": 8.667228700593114} +{"Pretrain/Learning Rate": 1.2923882800807768e-05, "Pretrain/Loss": 1.9632186889648438, "Pretrain/Loss (Raw)": 1.965128779411316, "Pretrain/Step": 6396, "Pretrain/Step Time": 8.668438455089927} +{"Pretrain/Learning Rate": 1.2916449800882607e-05, "Pretrain/Loss": 1.9646661281585693, "Pretrain/Loss (Raw)": 2.068251848220825, "Pretrain/Step": 6397, "Pretrain/Step Time": 8.668592788279057} +{"Pretrain/Learning Rate": 1.2909018194489397e-05, "Pretrain/Loss": 1.9675530195236206, "Pretrain/Loss (Raw)": 2.1795403957366943, "Pretrain/Step": 6398, "Pretrain/Step Time": 8.671145105734468} +{"Pretrain/Learning Rate": 1.2901587982485172e-05, "Pretrain/Loss": 1.9682141542434692, "Pretrain/Loss (Raw)": 2.1340134143829346, "Pretrain/Step": 6399, "Pretrain/Step Time": 8.67458776384592} +{"Pretrain/Learning Rate": 1.289415916572684e-05, "Pretrain/Loss": 1.9672424793243408, "Pretrain/Loss (Raw)": 1.833223819732666, "Pretrain/Step": 6400, "Pretrain/Step Time": 8.675233352929354} +{"Pretrain/Learning Rate": 1.2886731745071117e-05, "Pretrain/Loss": 1.9656727313995361, "Pretrain/Loss (Raw)": 1.7523499727249146, "Pretrain/Step": 6401, "Pretrain/Step Time": 8.675629671663046} +{"Pretrain/Learning Rate": 1.287930572137457e-05, "Pretrain/Loss": 1.9656517505645752, "Pretrain/Loss (Raw)": 1.9971822500228882, "Pretrain/Step": 6402, "Pretrain/Step Time": 8.668533511459827} +{"Pretrain/Learning Rate": 1.2871881095493592e-05, "Pretrain/Loss": 1.9670944213867188, "Pretrain/Loss (Raw)": 2.0294108390808105, "Pretrain/Step": 6403, "Pretrain/Step Time": 8.666942156851292} +{"Pretrain/Learning Rate": 1.2864457868284446e-05, "Pretrain/Loss": 1.9689128398895264, "Pretrain/Loss (Raw)": 1.8130571842193604, "Pretrain/Step": 6404, "Pretrain/Step Time": 8.670301923528314} +{"Pretrain/Learning Rate": 1.2857036040603205e-05, "Pretrain/Loss": 1.971313238143921, "Pretrain/Loss (Raw)": 2.150864839553833, "Pretrain/Step": 6405, "Pretrain/Step Time": 8.666285445913672} +{"Pretrain/Learning Rate": 1.2849615613305782e-05, "Pretrain/Loss": 1.972355842590332, "Pretrain/Loss (Raw)": 2.031806230545044, "Pretrain/Step": 6406, "Pretrain/Step Time": 8.658959059044719} +{"Pretrain/Learning Rate": 1.2842196587247935e-05, "Pretrain/Loss": 1.9702337980270386, "Pretrain/Loss (Raw)": 1.9703428745269775, "Pretrain/Step": 6407, "Pretrain/Step Time": 8.662513146176934} +{"Pretrain/Learning Rate": 1.2834778963285276e-05, "Pretrain/Loss": 1.9695242643356323, "Pretrain/Loss (Raw)": 2.0731232166290283, "Pretrain/Step": 6408, "Pretrain/Step Time": 8.663018241524696} +{"Pretrain/Learning Rate": 1.282736274227323e-05, "Pretrain/Loss": 1.968071460723877, "Pretrain/Loss (Raw)": 1.9170801639556885, "Pretrain/Step": 6409, "Pretrain/Step Time": 8.659387677907944} +{"Pretrain/Learning Rate": 1.2819947925067071e-05, "Pretrain/Loss": 1.9683547019958496, "Pretrain/Loss (Raw)": 1.9572651386260986, "Pretrain/Step": 6410, "Pretrain/Step Time": 8.658980848267674} +{"Pretrain/Learning Rate": 1.2812534512521906e-05, "Pretrain/Loss": 1.9675968885421753, "Pretrain/Loss (Raw)": 2.0213747024536133, "Pretrain/Step": 6411, "Pretrain/Step Time": 8.670101676136255} +{"Pretrain/Learning Rate": 1.2805122505492697e-05, "Pretrain/Loss": 1.9674630165100098, "Pretrain/Loss (Raw)": 1.8714169263839722, "Pretrain/Step": 6412, "Pretrain/Step Time": 8.662313928827643} +{"Pretrain/Learning Rate": 1.2797711904834226e-05, "Pretrain/Loss": 1.967641830444336, "Pretrain/Loss (Raw)": 2.0562405586242676, "Pretrain/Step": 6413, "Pretrain/Step Time": 8.665990874171257} +{"Pretrain/Learning Rate": 1.279030271140111e-05, "Pretrain/Loss": 1.9671452045440674, "Pretrain/Loss (Raw)": 2.0581953525543213, "Pretrain/Step": 6414, "Pretrain/Step Time": 8.66877087764442} +{"Pretrain/Learning Rate": 1.2782894926047822e-05, "Pretrain/Loss": 1.9686880111694336, "Pretrain/Loss (Raw)": 2.1390862464904785, "Pretrain/Step": 6415, "Pretrain/Step Time": 8.668678905814886} +{"Pretrain/Learning Rate": 1.2775488549628667e-05, "Pretrain/Loss": 1.9671313762664795, "Pretrain/Loss (Raw)": 1.6682699918746948, "Pretrain/Step": 6416, "Pretrain/Step Time": 8.67363846115768} +{"Pretrain/Learning Rate": 1.2768083582997772e-05, "Pretrain/Loss": 1.964890718460083, "Pretrain/Loss (Raw)": 1.7801368236541748, "Pretrain/Step": 6417, "Pretrain/Step Time": 8.673555551096797} +{"Pretrain/Learning Rate": 1.2760680027009109e-05, "Pretrain/Loss": 1.9630024433135986, "Pretrain/Loss (Raw)": 1.791717767715454, "Pretrain/Step": 6418, "Pretrain/Step Time": 8.669703360646963} +{"Pretrain/Learning Rate": 1.2753277882516507e-05, "Pretrain/Loss": 1.9656858444213867, "Pretrain/Loss (Raw)": 1.8073943853378296, "Pretrain/Step": 6419, "Pretrain/Step Time": 8.670288955792785} +{"Pretrain/Learning Rate": 1.2745877150373612e-05, "Pretrain/Loss": 1.9674315452575684, "Pretrain/Loss (Raw)": 2.0737874507904053, "Pretrain/Step": 6420, "Pretrain/Step Time": 8.670638035982847} +{"Pretrain/Learning Rate": 1.2738477831433904e-05, "Pretrain/Loss": 1.9675660133361816, "Pretrain/Loss (Raw)": 1.7588527202606201, "Pretrain/Step": 6421, "Pretrain/Step Time": 8.673847565427423} +{"Pretrain/Learning Rate": 1.2731079926550701e-05, "Pretrain/Loss": 1.9693325757980347, "Pretrain/Loss (Raw)": 2.26226806640625, "Pretrain/Step": 6422, "Pretrain/Step Time": 8.67149469256401} +{"Pretrain/Learning Rate": 1.2723683436577195e-05, "Pretrain/Loss": 1.9704444408416748, "Pretrain/Loss (Raw)": 1.9802663326263428, "Pretrain/Step": 6423, "Pretrain/Step Time": 8.675917299464345} +{"Pretrain/Learning Rate": 1.271628836236634e-05, "Pretrain/Loss": 1.9718748331069946, "Pretrain/Loss (Raw)": 2.191488265991211, "Pretrain/Step": 6424, "Pretrain/Step Time": 8.674080291762948} +{"Pretrain/Learning Rate": 1.2708894704771007e-05, "Pretrain/Loss": 1.9723702669143677, "Pretrain/Loss (Raw)": 1.8190314769744873, "Pretrain/Step": 6425, "Pretrain/Step Time": 8.675053335726261} +{"Pretrain/Learning Rate": 1.2701502464643844e-05, "Pretrain/Loss": 1.9718289375305176, "Pretrain/Loss (Raw)": 1.944899082183838, "Pretrain/Step": 6426, "Pretrain/Step Time": 8.672667415812612} +{"Pretrain/Learning Rate": 1.2694111642837386e-05, "Pretrain/Loss": 1.9735807180404663, "Pretrain/Loss (Raw)": 2.180905818939209, "Pretrain/Step": 6427, "Pretrain/Step Time": 8.67629699781537} +{"Pretrain/Learning Rate": 1.2686722240203946e-05, "Pretrain/Loss": 1.9734809398651123, "Pretrain/Loss (Raw)": 2.0038435459136963, "Pretrain/Step": 6428, "Pretrain/Step Time": 8.664665708318353} +{"Pretrain/Learning Rate": 1.2679334257595727e-05, "Pretrain/Loss": 1.9730724096298218, "Pretrain/Loss (Raw)": 2.0349650382995605, "Pretrain/Step": 6429, "Pretrain/Step Time": 8.667376577854156} +{"Pretrain/Learning Rate": 1.2671947695864727e-05, "Pretrain/Loss": 1.9710030555725098, "Pretrain/Loss (Raw)": 1.7966516017913818, "Pretrain/Step": 6430, "Pretrain/Step Time": 8.66745763644576} +{"Pretrain/Learning Rate": 1.266456255586283e-05, "Pretrain/Loss": 1.9707348346710205, "Pretrain/Loss (Raw)": 1.98941171169281, "Pretrain/Step": 6431, "Pretrain/Step Time": 8.670820206403732} +{"Pretrain/Learning Rate": 1.2657178838441686e-05, "Pretrain/Loss": 1.9716193675994873, "Pretrain/Loss (Raw)": 2.096794605255127, "Pretrain/Step": 6432, "Pretrain/Step Time": 8.664092730730772} +{"Pretrain/Learning Rate": 1.2649796544452852e-05, "Pretrain/Loss": 1.9694263935089111, "Pretrain/Loss (Raw)": 1.851792335510254, "Pretrain/Step": 6433, "Pretrain/Step Time": 8.662517350167036} +{"Pretrain/Learning Rate": 1.2642415674747673e-05, "Pretrain/Loss": 1.968983769416809, "Pretrain/Loss (Raw)": 2.036652088165283, "Pretrain/Step": 6434, "Pretrain/Step Time": 8.664237473160028} +{"Pretrain/Learning Rate": 1.263503623017735e-05, "Pretrain/Loss": 1.9660754203796387, "Pretrain/Loss (Raw)": 1.7437140941619873, "Pretrain/Step": 6435, "Pretrain/Step Time": 8.66510734334588} +{"Pretrain/Learning Rate": 1.2627658211592907e-05, "Pretrain/Loss": 1.9646598100662231, "Pretrain/Loss (Raw)": 1.939924955368042, "Pretrain/Step": 6436, "Pretrain/Step Time": 8.660920936614275} +{"Pretrain/Learning Rate": 1.262028161984523e-05, "Pretrain/Loss": 1.9660446643829346, "Pretrain/Loss (Raw)": 2.136214017868042, "Pretrain/Step": 6437, "Pretrain/Step Time": 8.659804198890924} +{"Pretrain/Learning Rate": 1.2612906455785006e-05, "Pretrain/Loss": 1.9657365083694458, "Pretrain/Loss (Raw)": 1.9384547472000122, "Pretrain/Step": 6438, "Pretrain/Step Time": 8.663221469148993} +{"Pretrain/Learning Rate": 1.2605532720262785e-05, "Pretrain/Loss": 1.965749740600586, "Pretrain/Loss (Raw)": 1.9163119792938232, "Pretrain/Step": 6439, "Pretrain/Step Time": 8.662633147090673} +{"Pretrain/Learning Rate": 1.2598160414128924e-05, "Pretrain/Loss": 1.9685382843017578, "Pretrain/Loss (Raw)": 2.1903579235076904, "Pretrain/Step": 6440, "Pretrain/Step Time": 8.662345251068473} +{"Pretrain/Learning Rate": 1.2590789538233652e-05, "Pretrain/Loss": 1.9678459167480469, "Pretrain/Loss (Raw)": 1.9581310749053955, "Pretrain/Step": 6441, "Pretrain/Step Time": 8.658474210649729} +{"Pretrain/Learning Rate": 1.2583420093427006e-05, "Pretrain/Loss": 1.9685933589935303, "Pretrain/Loss (Raw)": 1.931035041809082, "Pretrain/Step": 6442, "Pretrain/Step Time": 8.654006401076913} +{"Pretrain/Learning Rate": 1.2576052080558864e-05, "Pretrain/Loss": 1.968529462814331, "Pretrain/Loss (Raw)": 2.063605308532715, "Pretrain/Step": 6443, "Pretrain/Step Time": 8.656661266461015} +{"Pretrain/Learning Rate": 1.2568685500478927e-05, "Pretrain/Loss": 1.9686617851257324, "Pretrain/Loss (Raw)": 1.9280428886413574, "Pretrain/Step": 6444, "Pretrain/Step Time": 8.66088180989027} +{"Pretrain/Learning Rate": 1.256132035403677e-05, "Pretrain/Loss": 1.969110369682312, "Pretrain/Loss (Raw)": 1.988336205482483, "Pretrain/Step": 6445, "Pretrain/Step Time": 8.657734164968133} +{"Pretrain/Learning Rate": 1.255395664208176e-05, "Pretrain/Loss": 1.9676889181137085, "Pretrain/Loss (Raw)": 1.8058918714523315, "Pretrain/Step": 6446, "Pretrain/Step Time": 8.66372887417674} +{"Pretrain/Learning Rate": 1.2546594365463119e-05, "Pretrain/Loss": 1.9678151607513428, "Pretrain/Loss (Raw)": 1.9627161026000977, "Pretrain/Step": 6447, "Pretrain/Step Time": 8.655555952340364} +{"Pretrain/Learning Rate": 1.2539233525029886e-05, "Pretrain/Loss": 1.9627596139907837, "Pretrain/Loss (Raw)": 1.7351096868515015, "Pretrain/Step": 6448, "Pretrain/Step Time": 8.656041147187352} +{"Pretrain/Learning Rate": 1.2531874121630973e-05, "Pretrain/Loss": 1.9621424674987793, "Pretrain/Loss (Raw)": 1.9166184663772583, "Pretrain/Step": 6449, "Pretrain/Step Time": 8.652681443840265} +{"Pretrain/Learning Rate": 1.2524516156115088e-05, "Pretrain/Loss": 1.9631223678588867, "Pretrain/Loss (Raw)": 2.025083065032959, "Pretrain/Step": 6450, "Pretrain/Step Time": 8.654611570760608} +{"Pretrain/Learning Rate": 1.2517159629330783e-05, "Pretrain/Loss": 1.9617557525634766, "Pretrain/Loss (Raw)": 1.9008616209030151, "Pretrain/Step": 6451, "Pretrain/Step Time": 8.65201379917562} +{"Pretrain/Learning Rate": 1.2509804542126444e-05, "Pretrain/Loss": 1.9637510776519775, "Pretrain/Loss (Raw)": 1.9498647451400757, "Pretrain/Step": 6452, "Pretrain/Step Time": 8.644734619185328} +{"Pretrain/Learning Rate": 1.250245089535031e-05, "Pretrain/Loss": 1.9697675704956055, "Pretrain/Loss (Raw)": 2.0814599990844727, "Pretrain/Step": 6453, "Pretrain/Step Time": 8.642399968579412} +{"Pretrain/Learning Rate": 1.2495098689850429e-05, "Pretrain/Loss": 1.9714477062225342, "Pretrain/Loss (Raw)": 1.9295059442520142, "Pretrain/Step": 6454, "Pretrain/Step Time": 8.646536761894822} +{"Pretrain/Learning Rate": 1.2487747926474683e-05, "Pretrain/Loss": 1.971838355064392, "Pretrain/Loss (Raw)": 1.9797954559326172, "Pretrain/Step": 6455, "Pretrain/Step Time": 8.643879674375057} +{"Pretrain/Learning Rate": 1.2480398606070815e-05, "Pretrain/Loss": 1.9746873378753662, "Pretrain/Loss (Raw)": 2.045440196990967, "Pretrain/Step": 6456, "Pretrain/Step Time": 8.644311362877488} +{"Pretrain/Learning Rate": 1.2473050729486371e-05, "Pretrain/Loss": 1.9752750396728516, "Pretrain/Loss (Raw)": 2.053032398223877, "Pretrain/Step": 6457, "Pretrain/Step Time": 8.642863465473056} +{"Pretrain/Learning Rate": 1.246570429756875e-05, "Pretrain/Loss": 1.974208116531372, "Pretrain/Loss (Raw)": 2.0397398471832275, "Pretrain/Step": 6458, "Pretrain/Step Time": 8.642414519563317} +{"Pretrain/Learning Rate": 1.245835931116516e-05, "Pretrain/Loss": 1.9729712009429932, "Pretrain/Loss (Raw)": 1.8102141618728638, "Pretrain/Step": 6459, "Pretrain/Step Time": 8.642112668603659} +{"Pretrain/Learning Rate": 1.2451015771122684e-05, "Pretrain/Loss": 1.9729923009872437, "Pretrain/Loss (Raw)": 2.0049893856048584, "Pretrain/Step": 6460, "Pretrain/Step Time": 8.643941979855299} +{"Pretrain/Learning Rate": 1.2443673678288204e-05, "Pretrain/Loss": 1.9769678115844727, "Pretrain/Loss (Raw)": 2.1314985752105713, "Pretrain/Step": 6461, "Pretrain/Step Time": 8.644938431680202} +{"Pretrain/Learning Rate": 1.243633303350844e-05, "Pretrain/Loss": 1.9780181646347046, "Pretrain/Loss (Raw)": 2.195342779159546, "Pretrain/Step": 6462, "Pretrain/Step Time": 8.639219097793102} +{"Pretrain/Learning Rate": 1.2428993837629943e-05, "Pretrain/Loss": 1.9795814752578735, "Pretrain/Loss (Raw)": 2.0100631713867188, "Pretrain/Step": 6463, "Pretrain/Step Time": 8.645649461075664} +{"Pretrain/Learning Rate": 1.2421656091499123e-05, "Pretrain/Loss": 1.9734044075012207, "Pretrain/Loss (Raw)": 1.4312081336975098, "Pretrain/Step": 6464, "Pretrain/Step Time": 8.648095378652215} +{"Pretrain/Learning Rate": 1.2414319795962196e-05, "Pretrain/Loss": 1.9710594415664673, "Pretrain/Loss (Raw)": 1.8251270055770874, "Pretrain/Step": 6465, "Pretrain/Step Time": 8.644154602661729} +{"Pretrain/Learning Rate": 1.240698495186521e-05, "Pretrain/Loss": 1.9728131294250488, "Pretrain/Loss (Raw)": 2.0652101039886475, "Pretrain/Step": 6466, "Pretrain/Step Time": 8.645382588729262} +{"Pretrain/Learning Rate": 1.2399651560054056e-05, "Pretrain/Loss": 1.9735459089279175, "Pretrain/Loss (Raw)": 2.0393807888031006, "Pretrain/Step": 6467, "Pretrain/Step Time": 8.638587465509772} +{"Pretrain/Learning Rate": 1.2392319621374476e-05, "Pretrain/Loss": 1.9725620746612549, "Pretrain/Loss (Raw)": 2.052217483520508, "Pretrain/Step": 6468, "Pretrain/Step Time": 8.643254917114973} +{"Pretrain/Learning Rate": 1.2384989136671987e-05, "Pretrain/Loss": 1.9708409309387207, "Pretrain/Loss (Raw)": 1.8865671157836914, "Pretrain/Step": 6469, "Pretrain/Step Time": 8.646046498790383} +{"Pretrain/Learning Rate": 1.2377660106792005e-05, "Pretrain/Loss": 1.9674842357635498, "Pretrain/Loss (Raw)": 1.8275446891784668, "Pretrain/Step": 6470, "Pretrain/Step Time": 8.640171498060226} +{"Pretrain/Learning Rate": 1.2370332532579726e-05, "Pretrain/Loss": 1.9661757946014404, "Pretrain/Loss (Raw)": 1.833089828491211, "Pretrain/Step": 6471, "Pretrain/Step Time": 8.644234465435147} +{"Pretrain/Learning Rate": 1.2363006414880236e-05, "Pretrain/Loss": 1.966619849205017, "Pretrain/Loss (Raw)": 2.144378662109375, "Pretrain/Step": 6472, "Pretrain/Step Time": 8.64505560696125} +{"Pretrain/Learning Rate": 1.235568175453837e-05, "Pretrain/Loss": 1.9659825563430786, "Pretrain/Loss (Raw)": 1.9776670932769775, "Pretrain/Step": 6473, "Pretrain/Step Time": 8.644914159551263} +{"Pretrain/Learning Rate": 1.2348358552398878e-05, "Pretrain/Loss": 1.9650907516479492, "Pretrain/Loss (Raw)": 1.9720464944839478, "Pretrain/Step": 6474, "Pretrain/Step Time": 8.647218151018023} +{"Pretrain/Learning Rate": 1.2341036809306292e-05, "Pretrain/Loss": 1.9636099338531494, "Pretrain/Loss (Raw)": 1.8572947978973389, "Pretrain/Step": 6475, "Pretrain/Step Time": 8.643363267183304} +{"Pretrain/Learning Rate": 1.2333716526104993e-05, "Pretrain/Loss": 1.9652504920959473, "Pretrain/Loss (Raw)": 2.01481556892395, "Pretrain/Step": 6476, "Pretrain/Step Time": 8.646277504041791} +{"Pretrain/Learning Rate": 1.2326397703639181e-05, "Pretrain/Loss": 1.9643791913986206, "Pretrain/Loss (Raw)": 1.993348240852356, "Pretrain/Step": 6477, "Pretrain/Step Time": 8.646536387503147} +{"Pretrain/Learning Rate": 1.2319080342752918e-05, "Pretrain/Loss": 1.9679794311523438, "Pretrain/Loss (Raw)": 2.1462838649749756, "Pretrain/Step": 6478, "Pretrain/Step Time": 8.64474861882627} +{"Pretrain/Learning Rate": 1.2311764444290061e-05, "Pretrain/Loss": 1.9676543474197388, "Pretrain/Loss (Raw)": 1.91757333278656, "Pretrain/Step": 6479, "Pretrain/Step Time": 8.645919358357787} +{"Pretrain/Learning Rate": 1.2304450009094317e-05, "Pretrain/Loss": 1.9635767936706543, "Pretrain/Loss (Raw)": 1.4141614437103271, "Pretrain/Step": 6480, "Pretrain/Step Time": 8.645419280976057} +{"Pretrain/Learning Rate": 1.2297137038009213e-05, "Pretrain/Loss": 1.9629065990447998, "Pretrain/Loss (Raw)": 1.8930745124816895, "Pretrain/Step": 6481, "Pretrain/Step Time": 8.642876647412777} +{"Pretrain/Learning Rate": 1.2289825531878133e-05, "Pretrain/Loss": 1.963578224182129, "Pretrain/Loss (Raw)": 2.022432804107666, "Pretrain/Step": 6482, "Pretrain/Step Time": 8.640504259616137} +{"Pretrain/Learning Rate": 1.2282515491544264e-05, "Pretrain/Loss": 1.9617654085159302, "Pretrain/Loss (Raw)": 1.8138383626937866, "Pretrain/Step": 6483, "Pretrain/Step Time": 8.634290108457208} +{"Pretrain/Learning Rate": 1.2275206917850635e-05, "Pretrain/Loss": 1.9580373764038086, "Pretrain/Loss (Raw)": 1.6071888208389282, "Pretrain/Step": 6484, "Pretrain/Step Time": 8.638189796358347} +{"Pretrain/Learning Rate": 1.22678998116401e-05, "Pretrain/Loss": 1.9580152034759521, "Pretrain/Loss (Raw)": 1.899692416191101, "Pretrain/Step": 6485, "Pretrain/Step Time": 8.636697925627232} +{"Pretrain/Learning Rate": 1.2260594173755358e-05, "Pretrain/Loss": 1.9616899490356445, "Pretrain/Loss (Raw)": 1.911846399307251, "Pretrain/Step": 6486, "Pretrain/Step Time": 8.638948146253824} +{"Pretrain/Learning Rate": 1.2253290005038929e-05, "Pretrain/Loss": 1.9617252349853516, "Pretrain/Loss (Raw)": 2.121607780456543, "Pretrain/Step": 6487, "Pretrain/Step Time": 8.645262196660042} +{"Pretrain/Learning Rate": 1.2245987306333162e-05, "Pretrain/Loss": 1.9618518352508545, "Pretrain/Loss (Raw)": 2.0354764461517334, "Pretrain/Step": 6488, "Pretrain/Step Time": 8.64308524504304} +{"Pretrain/Learning Rate": 1.2238686078480227e-05, "Pretrain/Loss": 1.964364767074585, "Pretrain/Loss (Raw)": 2.0707132816314697, "Pretrain/Step": 6489, "Pretrain/Step Time": 8.639992918819189} +{"Pretrain/Learning Rate": 1.2231386322322155e-05, "Pretrain/Loss": 1.9618960618972778, "Pretrain/Loss (Raw)": 1.4246182441711426, "Pretrain/Step": 6490, "Pretrain/Step Time": 8.64258168451488} +{"Pretrain/Learning Rate": 1.2224088038700782e-05, "Pretrain/Loss": 1.9609870910644531, "Pretrain/Loss (Raw)": 2.0245420932769775, "Pretrain/Step": 6491, "Pretrain/Step Time": 8.638900524005294} +{"Pretrain/Learning Rate": 1.2216791228457778e-05, "Pretrain/Loss": 1.960636019706726, "Pretrain/Loss (Raw)": 1.923439383506775, "Pretrain/Step": 6492, "Pretrain/Step Time": 8.642542868852615} +{"Pretrain/Learning Rate": 1.2209495892434635e-05, "Pretrain/Loss": 1.96023690700531, "Pretrain/Loss (Raw)": 2.0537145137786865, "Pretrain/Step": 6493, "Pretrain/Step Time": 8.646077740937471} +{"Pretrain/Learning Rate": 1.2202202031472707e-05, "Pretrain/Loss": 1.9588477611541748, "Pretrain/Loss (Raw)": 1.9561632871627808, "Pretrain/Step": 6494, "Pretrain/Step Time": 8.649404287338257} +{"Pretrain/Learning Rate": 1.2194909646413147e-05, "Pretrain/Loss": 1.9619715213775635, "Pretrain/Loss (Raw)": 2.137204885482788, "Pretrain/Step": 6495, "Pretrain/Step Time": 8.650345407426357} +{"Pretrain/Learning Rate": 1.2187618738096934e-05, "Pretrain/Loss": 1.95931077003479, "Pretrain/Loss (Raw)": 1.7807538509368896, "Pretrain/Step": 6496, "Pretrain/Step Time": 8.650852927938104} +{"Pretrain/Learning Rate": 1.2180329307364916e-05, "Pretrain/Loss": 1.9617507457733154, "Pretrain/Loss (Raw)": 2.109515428543091, "Pretrain/Step": 6497, "Pretrain/Step Time": 8.650687186047435} +{"Pretrain/Learning Rate": 1.2173041355057727e-05, "Pretrain/Loss": 1.9608486890792847, "Pretrain/Loss (Raw)": 1.9255450963974, "Pretrain/Step": 6498, "Pretrain/Step Time": 8.653255200013518} +{"Pretrain/Learning Rate": 1.216575488201585e-05, "Pretrain/Loss": 1.962575912475586, "Pretrain/Loss (Raw)": 1.88924241065979, "Pretrain/Step": 6499, "Pretrain/Step Time": 8.652813009917736} +{"Pretrain/Learning Rate": 1.215846988907959e-05, "Pretrain/Loss": 1.9639685153961182, "Pretrain/Loss (Raw)": 2.095754384994507, "Pretrain/Step": 6500, "Pretrain/Step Time": 8.654084451496601} +{"Pretrain/Learning Rate": 1.2151186377089105e-05, "Pretrain/Loss": 1.9631870985031128, "Pretrain/Loss (Raw)": 1.8851433992385864, "Pretrain/Step": 6501, "Pretrain/Step Time": 8.652007395401597} +{"Pretrain/Learning Rate": 1.214390434688435e-05, "Pretrain/Loss": 1.9623090028762817, "Pretrain/Loss (Raw)": 1.9883674383163452, "Pretrain/Step": 6502, "Pretrain/Step Time": 8.653802061453462} +{"Pretrain/Learning Rate": 1.2136623799305127e-05, "Pretrain/Loss": 1.9628729820251465, "Pretrain/Loss (Raw)": 1.9879820346832275, "Pretrain/Step": 6503, "Pretrain/Step Time": 8.651302982121706} +{"Pretrain/Learning Rate": 1.212934473519105e-05, "Pretrain/Loss": 1.9613008499145508, "Pretrain/Loss (Raw)": 1.9025774002075195, "Pretrain/Step": 6504, "Pretrain/Step Time": 8.65180353447795} +{"Pretrain/Learning Rate": 1.2122067155381598e-05, "Pretrain/Loss": 1.9613995552062988, "Pretrain/Loss (Raw)": 2.0064537525177, "Pretrain/Step": 6505, "Pretrain/Step Time": 8.652457050979137} +{"Pretrain/Learning Rate": 1.2114791060716043e-05, "Pretrain/Loss": 1.9624849557876587, "Pretrain/Loss (Raw)": 2.1794958114624023, "Pretrain/Step": 6506, "Pretrain/Step Time": 8.652832420542836} +{"Pretrain/Learning Rate": 1.2107516452033502e-05, "Pretrain/Loss": 1.9616358280181885, "Pretrain/Loss (Raw)": 2.0141119956970215, "Pretrain/Step": 6507, "Pretrain/Step Time": 8.654651803895831} +{"Pretrain/Learning Rate": 1.2100243330172905e-05, "Pretrain/Loss": 1.9613330364227295, "Pretrain/Loss (Raw)": 1.9218502044677734, "Pretrain/Step": 6508, "Pretrain/Step Time": 8.65427329018712} +{"Pretrain/Learning Rate": 1.2092971695973052e-05, "Pretrain/Loss": 1.9612336158752441, "Pretrain/Loss (Raw)": 1.855696678161621, "Pretrain/Step": 6509, "Pretrain/Step Time": 8.652698419988155} +{"Pretrain/Learning Rate": 1.2085701550272502e-05, "Pretrain/Loss": 1.9604506492614746, "Pretrain/Loss (Raw)": 1.8807331323623657, "Pretrain/Step": 6510, "Pretrain/Step Time": 8.65450543537736} +{"Pretrain/Learning Rate": 1.2078432893909714e-05, "Pretrain/Loss": 1.959078073501587, "Pretrain/Loss (Raw)": 1.8129154443740845, "Pretrain/Step": 6511, "Pretrain/Step Time": 8.659073309972882} +{"Pretrain/Learning Rate": 1.2071165727722925e-05, "Pretrain/Loss": 1.959594964981079, "Pretrain/Loss (Raw)": 2.0935654640197754, "Pretrain/Step": 6512, "Pretrain/Step Time": 8.661448488011956} +{"Pretrain/Learning Rate": 1.2063900052550246e-05, "Pretrain/Loss": 1.9570926427841187, "Pretrain/Loss (Raw)": 1.7976254224777222, "Pretrain/Step": 6513, "Pretrain/Step Time": 8.65590782649815} +{"Pretrain/Learning Rate": 1.2056635869229549e-05, "Pretrain/Loss": 1.9581044912338257, "Pretrain/Loss (Raw)": 1.999532699584961, "Pretrain/Step": 6514, "Pretrain/Step Time": 8.652147747576237} +{"Pretrain/Learning Rate": 1.2049373178598606e-05, "Pretrain/Loss": 1.9570772647857666, "Pretrain/Loss (Raw)": 1.717079997062683, "Pretrain/Step": 6515, "Pretrain/Step Time": 8.656346529722214} +{"Pretrain/Learning Rate": 1.2042111981494968e-05, "Pretrain/Loss": 1.9565808773040771, "Pretrain/Loss (Raw)": 2.0245115756988525, "Pretrain/Step": 6516, "Pretrain/Step Time": 8.657914379611611} +{"Pretrain/Learning Rate": 1.2034852278756042e-05, "Pretrain/Loss": 1.9594420194625854, "Pretrain/Loss (Raw)": 2.1034674644470215, "Pretrain/Step": 6517, "Pretrain/Step Time": 8.654303718358278} +{"Pretrain/Learning Rate": 1.2027594071219033e-05, "Pretrain/Loss": 1.9579031467437744, "Pretrain/Loss (Raw)": 1.9617846012115479, "Pretrain/Step": 6518, "Pretrain/Step Time": 8.655432097613811} +{"Pretrain/Learning Rate": 1.2020337359721015e-05, "Pretrain/Loss": 1.9593160152435303, "Pretrain/Loss (Raw)": 2.161604404449463, "Pretrain/Step": 6519, "Pretrain/Step Time": 8.657894467934966} +{"Pretrain/Learning Rate": 1.2013082145098852e-05, "Pretrain/Loss": 1.9577040672302246, "Pretrain/Loss (Raw)": 1.9056859016418457, "Pretrain/Step": 6520, "Pretrain/Step Time": 8.655122075229883} +{"Pretrain/Learning Rate": 1.2005828428189256e-05, "Pretrain/Loss": 1.957746982574463, "Pretrain/Loss (Raw)": 1.9938081502914429, "Pretrain/Step": 6521, "Pretrain/Step Time": 8.653494086116552} +{"Pretrain/Learning Rate": 1.1998576209828743e-05, "Pretrain/Loss": 1.9581894874572754, "Pretrain/Loss (Raw)": 1.837432622909546, "Pretrain/Step": 6522, "Pretrain/Step Time": 8.653561675921082} +{"Pretrain/Learning Rate": 1.19913254908537e-05, "Pretrain/Loss": 1.95685875415802, "Pretrain/Loss (Raw)": 1.952771782875061, "Pretrain/Step": 6523, "Pretrain/Step Time": 8.653197044506669} +{"Pretrain/Learning Rate": 1.1984076272100297e-05, "Pretrain/Loss": 1.9554240703582764, "Pretrain/Loss (Raw)": 1.7814844846725464, "Pretrain/Step": 6524, "Pretrain/Step Time": 8.649090340360999} +{"Pretrain/Learning Rate": 1.1976828554404552e-05, "Pretrain/Loss": 1.952889323234558, "Pretrain/Loss (Raw)": 1.7438055276870728, "Pretrain/Step": 6525, "Pretrain/Step Time": 8.651256628334522} +{"Pretrain/Learning Rate": 1.1969582338602295e-05, "Pretrain/Loss": 1.9524705410003662, "Pretrain/Loss (Raw)": 2.125929832458496, "Pretrain/Step": 6526, "Pretrain/Step Time": 8.649859515950084} +{"Pretrain/Learning Rate": 1.1962337625529215e-05, "Pretrain/Loss": 1.9493906497955322, "Pretrain/Loss (Raw)": 1.739801049232483, "Pretrain/Step": 6527, "Pretrain/Step Time": 8.651656931266189} +{"Pretrain/Learning Rate": 1.1955094416020795e-05, "Pretrain/Loss": 1.94992995262146, "Pretrain/Loss (Raw)": 1.9022687673568726, "Pretrain/Step": 6528, "Pretrain/Step Time": 8.651621071621776} +{"Pretrain/Learning Rate": 1.1947852710912355e-05, "Pretrain/Loss": 1.952593445777893, "Pretrain/Loss (Raw)": 2.0932631492614746, "Pretrain/Step": 6529, "Pretrain/Step Time": 8.6516092158854} +{"Pretrain/Learning Rate": 1.1940612511039038e-05, "Pretrain/Loss": 1.9523199796676636, "Pretrain/Loss (Raw)": 1.9621847867965698, "Pretrain/Step": 6530, "Pretrain/Step Time": 8.653975257650018} +{"Pretrain/Learning Rate": 1.1933373817235832e-05, "Pretrain/Loss": 1.9510958194732666, "Pretrain/Loss (Raw)": 1.8727037906646729, "Pretrain/Step": 6531, "Pretrain/Step Time": 8.65405973047018} +{"Pretrain/Learning Rate": 1.1926136630337528e-05, "Pretrain/Loss": 1.9526135921478271, "Pretrain/Loss (Raw)": 2.007349967956543, "Pretrain/Step": 6532, "Pretrain/Step Time": 8.653279788792133} +{"Pretrain/Learning Rate": 1.1918900951178755e-05, "Pretrain/Loss": 1.9514223337173462, "Pretrain/Loss (Raw)": 1.998374104499817, "Pretrain/Step": 6533, "Pretrain/Step Time": 8.650966484099627} +{"Pretrain/Learning Rate": 1.1911666780593955e-05, "Pretrain/Loss": 1.948716163635254, "Pretrain/Loss (Raw)": 1.6854188442230225, "Pretrain/Step": 6534, "Pretrain/Step Time": 8.652744427323341} +{"Pretrain/Learning Rate": 1.1904434119417426e-05, "Pretrain/Loss": 1.9489195346832275, "Pretrain/Loss (Raw)": 1.9963854551315308, "Pretrain/Step": 6535, "Pretrain/Step Time": 8.653338560834527} +{"Pretrain/Learning Rate": 1.1897202968483263e-05, "Pretrain/Loss": 1.9478260278701782, "Pretrain/Loss (Raw)": 1.933142066001892, "Pretrain/Step": 6536, "Pretrain/Step Time": 8.653847355395555} +{"Pretrain/Learning Rate": 1.1889973328625384e-05, "Pretrain/Loss": 1.946871280670166, "Pretrain/Loss (Raw)": 1.7948665618896484, "Pretrain/Step": 6537, "Pretrain/Step Time": 8.653396420180798} +{"Pretrain/Learning Rate": 1.1882745200677569e-05, "Pretrain/Loss": 1.9466195106506348, "Pretrain/Loss (Raw)": 1.9250333309173584, "Pretrain/Step": 6538, "Pretrain/Step Time": 8.654350755736232} +{"Pretrain/Learning Rate": 1.1875518585473389e-05, "Pretrain/Loss": 1.9475414752960205, "Pretrain/Loss (Raw)": 2.1393957138061523, "Pretrain/Step": 6539, "Pretrain/Step Time": 8.646464459598064} +{"Pretrain/Learning Rate": 1.1868293483846247e-05, "Pretrain/Loss": 1.9493310451507568, "Pretrain/Loss (Raw)": 2.100482225418091, "Pretrain/Step": 6540, "Pretrain/Step Time": 8.649419583380222} +{"Pretrain/Learning Rate": 1.186106989662937e-05, "Pretrain/Loss": 1.9473991394042969, "Pretrain/Loss (Raw)": 1.8089559078216553, "Pretrain/Step": 6541, "Pretrain/Step Time": 8.646287273615599} +{"Pretrain/Learning Rate": 1.1853847824655836e-05, "Pretrain/Loss": 1.9460724592208862, "Pretrain/Loss (Raw)": 1.8883744478225708, "Pretrain/Step": 6542, "Pretrain/Step Time": 8.646030358970165} +{"Pretrain/Learning Rate": 1.184662726875852e-05, "Pretrain/Loss": 1.944523811340332, "Pretrain/Loss (Raw)": 1.9408814907073975, "Pretrain/Step": 6543, "Pretrain/Step Time": 8.647328894585371} +{"Pretrain/Learning Rate": 1.1839408229770124e-05, "Pretrain/Loss": 1.9464677572250366, "Pretrain/Loss (Raw)": 1.9170767068862915, "Pretrain/Step": 6544, "Pretrain/Step Time": 8.643006835132837} +{"Pretrain/Learning Rate": 1.183219070852318e-05, "Pretrain/Loss": 1.9457859992980957, "Pretrain/Loss (Raw)": 1.692874789237976, "Pretrain/Step": 6545, "Pretrain/Step Time": 8.645920611917973} +{"Pretrain/Learning Rate": 1.1824974705850058e-05, "Pretrain/Loss": 1.946155309677124, "Pretrain/Loss (Raw)": 1.8389836549758911, "Pretrain/Step": 6546, "Pretrain/Step Time": 8.648040657863021} +{"Pretrain/Learning Rate": 1.1817760222582938e-05, "Pretrain/Loss": 1.9470865726470947, "Pretrain/Loss (Raw)": 1.9266116619110107, "Pretrain/Step": 6547, "Pretrain/Step Time": 8.648884335532784} +{"Pretrain/Learning Rate": 1.1810547259553826e-05, "Pretrain/Loss": 1.9449541568756104, "Pretrain/Loss (Raw)": 1.8008185625076294, "Pretrain/Step": 6548, "Pretrain/Step Time": 8.645194852724671} +{"Pretrain/Learning Rate": 1.1803335817594544e-05, "Pretrain/Loss": 1.9465404748916626, "Pretrain/Loss (Raw)": 1.96190345287323, "Pretrain/Step": 6549, "Pretrain/Step Time": 8.64343841932714} +{"Pretrain/Learning Rate": 1.179612589753678e-05, "Pretrain/Loss": 1.9455857276916504, "Pretrain/Loss (Raw)": 2.1400625705718994, "Pretrain/Step": 6550, "Pretrain/Step Time": 8.643534095957875} +{"Pretrain/Learning Rate": 1.1788917500211976e-05, "Pretrain/Loss": 1.945103645324707, "Pretrain/Loss (Raw)": 1.918582558631897, "Pretrain/Step": 6551, "Pretrain/Step Time": 8.646238565444946} +{"Pretrain/Learning Rate": 1.178171062645147e-05, "Pretrain/Loss": 1.9409101009368896, "Pretrain/Loss (Raw)": 1.654701828956604, "Pretrain/Step": 6552, "Pretrain/Step Time": 8.64606799185276} +{"Pretrain/Learning Rate": 1.177450527708637e-05, "Pretrain/Loss": 1.9430843591690063, "Pretrain/Loss (Raw)": 2.097325086593628, "Pretrain/Step": 6553, "Pretrain/Step Time": 8.646130084991455} +{"Pretrain/Learning Rate": 1.1767301452947663e-05, "Pretrain/Loss": 1.940690279006958, "Pretrain/Loss (Raw)": 1.6384533643722534, "Pretrain/Step": 6554, "Pretrain/Step Time": 8.651544308289886} +{"Pretrain/Learning Rate": 1.1760099154866086e-05, "Pretrain/Loss": 1.9387993812561035, "Pretrain/Loss (Raw)": 1.938894510269165, "Pretrain/Step": 6555, "Pretrain/Step Time": 8.648121055215597} +{"Pretrain/Learning Rate": 1.1752898383672273e-05, "Pretrain/Loss": 1.936111330986023, "Pretrain/Loss (Raw)": 1.6597596406936646, "Pretrain/Step": 6556, "Pretrain/Step Time": 8.64868283085525} +{"Pretrain/Learning Rate": 1.1745699140196632e-05, "Pretrain/Loss": 1.935274362564087, "Pretrain/Loss (Raw)": 1.927841305732727, "Pretrain/Step": 6557, "Pretrain/Step Time": 8.652129638940096} +{"Pretrain/Learning Rate": 1.1738501425269441e-05, "Pretrain/Loss": 1.9369678497314453, "Pretrain/Loss (Raw)": 2.0134007930755615, "Pretrain/Step": 6558, "Pretrain/Step Time": 8.650200050324202} +{"Pretrain/Learning Rate": 1.1731305239720735e-05, "Pretrain/Loss": 1.936598777770996, "Pretrain/Loss (Raw)": 1.9421814680099487, "Pretrain/Step": 6559, "Pretrain/Step Time": 8.648397617042065} +{"Pretrain/Learning Rate": 1.1724110584380444e-05, "Pretrain/Loss": 1.9367023706436157, "Pretrain/Loss (Raw)": 2.1100430488586426, "Pretrain/Step": 6560, "Pretrain/Step Time": 8.648649837821722} +{"Pretrain/Learning Rate": 1.1716917460078278e-05, "Pretrain/Loss": 1.9346882104873657, "Pretrain/Loss (Raw)": 1.5939942598342896, "Pretrain/Step": 6561, "Pretrain/Step Time": 8.649625338613987} +{"Pretrain/Learning Rate": 1.1709725867643784e-05, "Pretrain/Loss": 1.9331142902374268, "Pretrain/Loss (Raw)": 1.8351871967315674, "Pretrain/Step": 6562, "Pretrain/Step Time": 8.646088723093271} +{"Pretrain/Learning Rate": 1.1702535807906318e-05, "Pretrain/Loss": 1.9342231750488281, "Pretrain/Loss (Raw)": 1.885661005973816, "Pretrain/Step": 6563, "Pretrain/Step Time": 8.648382971063256} +{"Pretrain/Learning Rate": 1.1695347281695093e-05, "Pretrain/Loss": 1.9341468811035156, "Pretrain/Loss (Raw)": 1.9301539659500122, "Pretrain/Step": 6564, "Pretrain/Step Time": 8.647743932902813} +{"Pretrain/Learning Rate": 1.1688160289839111e-05, "Pretrain/Loss": 1.933887243270874, "Pretrain/Loss (Raw)": 2.102968454360962, "Pretrain/Step": 6565, "Pretrain/Step Time": 8.648680370301008} +{"Pretrain/Learning Rate": 1.1680974833167214e-05, "Pretrain/Loss": 1.933351755142212, "Pretrain/Loss (Raw)": 1.869908094406128, "Pretrain/Step": 6566, "Pretrain/Step Time": 8.643151037395} +{"Pretrain/Learning Rate": 1.1673790912508051e-05, "Pretrain/Loss": 1.9332890510559082, "Pretrain/Loss (Raw)": 1.9083013534545898, "Pretrain/Step": 6567, "Pretrain/Step Time": 8.645141134038568} +{"Pretrain/Learning Rate": 1.1666608528690123e-05, "Pretrain/Loss": 1.9302563667297363, "Pretrain/Loss (Raw)": 1.8021724224090576, "Pretrain/Step": 6568, "Pretrain/Step Time": 8.641972377896309} +{"Pretrain/Learning Rate": 1.165942768254173e-05, "Pretrain/Loss": 1.9314861297607422, "Pretrain/Loss (Raw)": 2.1155378818511963, "Pretrain/Step": 6569, "Pretrain/Step Time": 8.648483579978347} +{"Pretrain/Learning Rate": 1.1652248374890999e-05, "Pretrain/Loss": 1.932700753211975, "Pretrain/Loss (Raw)": 2.086510181427002, "Pretrain/Step": 6570, "Pretrain/Step Time": 8.647605020552874} +{"Pretrain/Learning Rate": 1.164507060656587e-05, "Pretrain/Loss": 1.9308143854141235, "Pretrain/Loss (Raw)": 1.8221468925476074, "Pretrain/Step": 6571, "Pretrain/Step Time": 8.645665537565947} +{"Pretrain/Learning Rate": 1.163789437839414e-05, "Pretrain/Loss": 1.932501196861267, "Pretrain/Loss (Raw)": 2.1439568996429443, "Pretrain/Step": 6572, "Pretrain/Step Time": 8.647918164730072} +{"Pretrain/Learning Rate": 1.1630719691203395e-05, "Pretrain/Loss": 1.9314217567443848, "Pretrain/Loss (Raw)": 1.8501542806625366, "Pretrain/Step": 6573, "Pretrain/Step Time": 8.65430323034525} +{"Pretrain/Learning Rate": 1.1623546545821054e-05, "Pretrain/Loss": 1.9306977987289429, "Pretrain/Loss (Raw)": 1.7132411003112793, "Pretrain/Step": 6574, "Pretrain/Step Time": 8.648593971505761} +{"Pretrain/Learning Rate": 1.1616374943074349e-05, "Pretrain/Loss": 1.931410551071167, "Pretrain/Loss (Raw)": 2.0539498329162598, "Pretrain/Step": 6575, "Pretrain/Step Time": 8.651901626959443} +{"Pretrain/Learning Rate": 1.1609204883790359e-05, "Pretrain/Loss": 1.9333809614181519, "Pretrain/Loss (Raw)": 1.9873162508010864, "Pretrain/Step": 6576, "Pretrain/Step Time": 8.648414358496666} +{"Pretrain/Learning Rate": 1.1602036368795963e-05, "Pretrain/Loss": 1.9352600574493408, "Pretrain/Loss (Raw)": 2.1571385860443115, "Pretrain/Step": 6577, "Pretrain/Step Time": 8.64875366538763} +{"Pretrain/Learning Rate": 1.1594869398917854e-05, "Pretrain/Loss": 1.9346988201141357, "Pretrain/Loss (Raw)": 1.9532480239868164, "Pretrain/Step": 6578, "Pretrain/Step Time": 8.652009516954422} +{"Pretrain/Learning Rate": 1.1587703974982584e-05, "Pretrain/Loss": 1.9337022304534912, "Pretrain/Loss (Raw)": 1.7733116149902344, "Pretrain/Step": 6579, "Pretrain/Step Time": 8.655655520036817} +{"Pretrain/Learning Rate": 1.1580540097816491e-05, "Pretrain/Loss": 1.9319987297058105, "Pretrain/Loss (Raw)": 1.7318100929260254, "Pretrain/Step": 6580, "Pretrain/Step Time": 8.659756625071168} +{"Pretrain/Learning Rate": 1.157337776824575e-05, "Pretrain/Loss": 1.9301702976226807, "Pretrain/Loss (Raw)": 1.8474208116531372, "Pretrain/Step": 6581, "Pretrain/Step Time": 8.662179585546255} +{"Pretrain/Learning Rate": 1.1566216987096343e-05, "Pretrain/Loss": 1.9312628507614136, "Pretrain/Loss (Raw)": 2.069348096847534, "Pretrain/Step": 6582, "Pretrain/Step Time": 8.659932358190417} +{"Pretrain/Learning Rate": 1.1559057755194105e-05, "Pretrain/Loss": 1.9299383163452148, "Pretrain/Loss (Raw)": 1.8102399110794067, "Pretrain/Step": 6583, "Pretrain/Step Time": 8.660764841362834} +{"Pretrain/Learning Rate": 1.1551900073364663e-05, "Pretrain/Loss": 1.9286022186279297, "Pretrain/Loss (Raw)": 1.8744373321533203, "Pretrain/Step": 6584, "Pretrain/Step Time": 8.662714118137956} +{"Pretrain/Learning Rate": 1.1544743942433473e-05, "Pretrain/Loss": 1.9293582439422607, "Pretrain/Loss (Raw)": 2.1498055458068848, "Pretrain/Step": 6585, "Pretrain/Step Time": 8.667915409430861} +{"Pretrain/Learning Rate": 1.1537589363225806e-05, "Pretrain/Loss": 1.9293205738067627, "Pretrain/Loss (Raw)": 2.034925937652588, "Pretrain/Step": 6586, "Pretrain/Step Time": 8.664498073980212} +{"Pretrain/Learning Rate": 1.153043633656678e-05, "Pretrain/Loss": 1.931833267211914, "Pretrain/Loss (Raw)": 2.1318295001983643, "Pretrain/Step": 6587, "Pretrain/Step Time": 8.664765937253833} +{"Pretrain/Learning Rate": 1.1523284863281306e-05, "Pretrain/Loss": 1.9309487342834473, "Pretrain/Loss (Raw)": 1.891779899597168, "Pretrain/Step": 6588, "Pretrain/Step Time": 8.663694703951478} +{"Pretrain/Learning Rate": 1.1516134944194126e-05, "Pretrain/Loss": 1.9294894933700562, "Pretrain/Loss (Raw)": 1.9447038173675537, "Pretrain/Step": 6589, "Pretrain/Step Time": 8.663534414023161} +{"Pretrain/Learning Rate": 1.1508986580129794e-05, "Pretrain/Loss": 1.9292700290679932, "Pretrain/Loss (Raw)": 2.1672587394714355, "Pretrain/Step": 6590, "Pretrain/Step Time": 8.663734750822186} +{"Pretrain/Learning Rate": 1.1501839771912718e-05, "Pretrain/Loss": 1.9289355278015137, "Pretrain/Loss (Raw)": 1.9672293663024902, "Pretrain/Step": 6591, "Pretrain/Step Time": 8.655698526650667} +{"Pretrain/Learning Rate": 1.1494694520367068e-05, "Pretrain/Loss": 1.9333504438400269, "Pretrain/Loss (Raw)": 1.996335744857788, "Pretrain/Step": 6592, "Pretrain/Step Time": 8.657812340185046} +{"Pretrain/Learning Rate": 1.1487550826316893e-05, "Pretrain/Loss": 1.9338793754577637, "Pretrain/Loss (Raw)": 1.892829418182373, "Pretrain/Step": 6593, "Pretrain/Step Time": 8.660521542653441} +{"Pretrain/Learning Rate": 1.1480408690586022e-05, "Pretrain/Loss": 1.9338703155517578, "Pretrain/Loss (Raw)": 2.0640459060668945, "Pretrain/Step": 6594, "Pretrain/Step Time": 8.661952530965209} +{"Pretrain/Learning Rate": 1.1473268113998146e-05, "Pretrain/Loss": 1.9336283206939697, "Pretrain/Loss (Raw)": 2.0084073543548584, "Pretrain/Step": 6595, "Pretrain/Step Time": 8.663776634261012} +{"Pretrain/Learning Rate": 1.146612909737671e-05, "Pretrain/Loss": 1.9334993362426758, "Pretrain/Loss (Raw)": 2.0357117652893066, "Pretrain/Step": 6596, "Pretrain/Step Time": 8.660533510148525} +{"Pretrain/Learning Rate": 1.145899164154505e-05, "Pretrain/Loss": 1.93346107006073, "Pretrain/Loss (Raw)": 1.8816546201705933, "Pretrain/Step": 6597, "Pretrain/Step Time": 8.65949877165258} +{"Pretrain/Learning Rate": 1.1451855747326273e-05, "Pretrain/Loss": 1.9348530769348145, "Pretrain/Loss (Raw)": 2.005725860595703, "Pretrain/Step": 6598, "Pretrain/Step Time": 8.661854119971395} +{"Pretrain/Learning Rate": 1.1444721415543349e-05, "Pretrain/Loss": 1.936522364616394, "Pretrain/Loss (Raw)": 2.046746015548706, "Pretrain/Step": 6599, "Pretrain/Step Time": 8.65827015414834} +{"Pretrain/Learning Rate": 1.143758864701901e-05, "Pretrain/Loss": 1.9352821111679077, "Pretrain/Loss (Raw)": 1.985643982887268, "Pretrain/Step": 6600, "Pretrain/Step Time": 8.656232995912433} +{"Pretrain/Learning Rate": 1.1430457442575863e-05, "Pretrain/Loss": 1.9338457584381104, "Pretrain/Loss (Raw)": 1.7938061952590942, "Pretrain/Step": 6601, "Pretrain/Step Time": 8.664037216454744} +{"Pretrain/Learning Rate": 1.1423327803036308e-05, "Pretrain/Loss": 1.9335148334503174, "Pretrain/Loss (Raw)": 1.9297003746032715, "Pretrain/Step": 6602, "Pretrain/Step Time": 8.661465672776103} +{"Pretrain/Learning Rate": 1.1416199729222565e-05, "Pretrain/Loss": 1.9359585046768188, "Pretrain/Loss (Raw)": 2.1700708866119385, "Pretrain/Step": 6603, "Pretrain/Step Time": 8.660880032926798} +{"Pretrain/Learning Rate": 1.1409073221956668e-05, "Pretrain/Loss": 1.9361188411712646, "Pretrain/Loss (Raw)": 2.0353517532348633, "Pretrain/Step": 6604, "Pretrain/Step Time": 8.661952152848244} +{"Pretrain/Learning Rate": 1.14019482820605e-05, "Pretrain/Loss": 1.9365432262420654, "Pretrain/Loss (Raw)": 2.047651767730713, "Pretrain/Step": 6605, "Pretrain/Step Time": 8.662673853337765} +{"Pretrain/Learning Rate": 1.1394824910355731e-05, "Pretrain/Loss": 1.9348806142807007, "Pretrain/Loss (Raw)": 1.9334722757339478, "Pretrain/Step": 6606, "Pretrain/Step Time": 8.661605281755328} +{"Pretrain/Learning Rate": 1.1387703107663864e-05, "Pretrain/Loss": 1.9368315935134888, "Pretrain/Loss (Raw)": 2.167309045791626, "Pretrain/Step": 6607, "Pretrain/Step Time": 8.660170286893845} +{"Pretrain/Learning Rate": 1.1380582874806209e-05, "Pretrain/Loss": 1.9430451393127441, "Pretrain/Loss (Raw)": 2.2094876766204834, "Pretrain/Step": 6608, "Pretrain/Step Time": 8.661700630560517} +{"Pretrain/Learning Rate": 1.1373464212603923e-05, "Pretrain/Loss": 1.9444928169250488, "Pretrain/Loss (Raw)": 2.0783796310424805, "Pretrain/Step": 6609, "Pretrain/Step Time": 8.661286812275648} +{"Pretrain/Learning Rate": 1.1366347121877955e-05, "Pretrain/Loss": 1.9430774450302124, "Pretrain/Loss (Raw)": 1.8412734270095825, "Pretrain/Step": 6610, "Pretrain/Step Time": 8.664827825501561} +{"Pretrain/Learning Rate": 1.1359231603449078e-05, "Pretrain/Loss": 1.9454915523529053, "Pretrain/Loss (Raw)": 2.122828245162964, "Pretrain/Step": 6611, "Pretrain/Step Time": 8.669385911896825} +{"Pretrain/Learning Rate": 1.1352117658137884e-05, "Pretrain/Loss": 1.9471973180770874, "Pretrain/Loss (Raw)": 1.825533390045166, "Pretrain/Step": 6612, "Pretrain/Step Time": 8.66590572707355} +{"Pretrain/Learning Rate": 1.1345005286764798e-05, "Pretrain/Loss": 1.945144534111023, "Pretrain/Loss (Raw)": 1.636931300163269, "Pretrain/Step": 6613, "Pretrain/Step Time": 8.6662731282413} +{"Pretrain/Learning Rate": 1.133789449015005e-05, "Pretrain/Loss": 1.9454728364944458, "Pretrain/Loss (Raw)": 1.9538726806640625, "Pretrain/Step": 6614, "Pretrain/Step Time": 8.661501828581095} +{"Pretrain/Learning Rate": 1.1330785269113686e-05, "Pretrain/Loss": 1.944678544998169, "Pretrain/Loss (Raw)": 2.0199525356292725, "Pretrain/Step": 6615, "Pretrain/Step Time": 8.658607402816415} +{"Pretrain/Learning Rate": 1.1323677624475567e-05, "Pretrain/Loss": 1.9450863599777222, "Pretrain/Loss (Raw)": 2.0876669883728027, "Pretrain/Step": 6616, "Pretrain/Step Time": 8.659765603020787} +{"Pretrain/Learning Rate": 1.13165715570554e-05, "Pretrain/Loss": 1.9439741373062134, "Pretrain/Loss (Raw)": 1.928346037864685, "Pretrain/Step": 6617, "Pretrain/Step Time": 8.657883496955037} +{"Pretrain/Learning Rate": 1.1309467067672678e-05, "Pretrain/Loss": 1.9458034038543701, "Pretrain/Loss (Raw)": 1.6587730646133423, "Pretrain/Step": 6618, "Pretrain/Step Time": 8.65621406212449} +{"Pretrain/Learning Rate": 1.1302364157146716e-05, "Pretrain/Loss": 1.945449709892273, "Pretrain/Loss (Raw)": 1.9792633056640625, "Pretrain/Step": 6619, "Pretrain/Step Time": 8.658194040879607} +{"Pretrain/Learning Rate": 1.1295262826296677e-05, "Pretrain/Loss": 1.945997953414917, "Pretrain/Loss (Raw)": 1.9936110973358154, "Pretrain/Step": 6620, "Pretrain/Step Time": 8.65814496204257} +{"Pretrain/Learning Rate": 1.1288163075941505e-05, "Pretrain/Loss": 1.944615364074707, "Pretrain/Loss (Raw)": 1.8767396211624146, "Pretrain/Step": 6621, "Pretrain/Step Time": 8.656114691868424} +{"Pretrain/Learning Rate": 1.128106490689998e-05, "Pretrain/Loss": 1.943472146987915, "Pretrain/Loss (Raw)": 1.809827446937561, "Pretrain/Step": 6622, "Pretrain/Step Time": 8.656179746612906} +{"Pretrain/Learning Rate": 1.1273968319990685e-05, "Pretrain/Loss": 1.9423508644104004, "Pretrain/Loss (Raw)": 1.993697166442871, "Pretrain/Step": 6623, "Pretrain/Step Time": 8.652545215561986} +{"Pretrain/Learning Rate": 1.1266873316032053e-05, "Pretrain/Loss": 1.9444479942321777, "Pretrain/Loss (Raw)": 2.049189329147339, "Pretrain/Step": 6624, "Pretrain/Step Time": 8.652007460594177} +{"Pretrain/Learning Rate": 1.1259779895842304e-05, "Pretrain/Loss": 1.9423712491989136, "Pretrain/Loss (Raw)": 1.8436827659606934, "Pretrain/Step": 6625, "Pretrain/Step Time": 8.654237553477287} +{"Pretrain/Learning Rate": 1.1252688060239481e-05, "Pretrain/Loss": 1.9461966753005981, "Pretrain/Loss (Raw)": 2.41520357131958, "Pretrain/Step": 6626, "Pretrain/Step Time": 8.655622752383351} +{"Pretrain/Learning Rate": 1.1245597810041441e-05, "Pretrain/Loss": 1.9458074569702148, "Pretrain/Loss (Raw)": 1.8394176959991455, "Pretrain/Step": 6627, "Pretrain/Step Time": 8.652544975280762} +{"Pretrain/Learning Rate": 1.1238509146065887e-05, "Pretrain/Loss": 1.943267822265625, "Pretrain/Loss (Raw)": 1.770676612854004, "Pretrain/Step": 6628, "Pretrain/Step Time": 8.654848901554942} +{"Pretrain/Learning Rate": 1.1231422069130302e-05, "Pretrain/Loss": 1.9434361457824707, "Pretrain/Loss (Raw)": 1.9067033529281616, "Pretrain/Step": 6629, "Pretrain/Step Time": 8.652859998866916} +{"Pretrain/Learning Rate": 1.1224336580052005e-05, "Pretrain/Loss": 1.9423654079437256, "Pretrain/Loss (Raw)": 1.8513046503067017, "Pretrain/Step": 6630, "Pretrain/Step Time": 8.653038086369634} +{"Pretrain/Learning Rate": 1.1217252679648116e-05, "Pretrain/Loss": 1.9428963661193848, "Pretrain/Loss (Raw)": 2.055950880050659, "Pretrain/Step": 6631, "Pretrain/Step Time": 8.6524787992239} +{"Pretrain/Learning Rate": 1.1210170368735615e-05, "Pretrain/Loss": 1.9432024955749512, "Pretrain/Loss (Raw)": 1.9417471885681152, "Pretrain/Step": 6632, "Pretrain/Step Time": 8.653287226334214} +{"Pretrain/Learning Rate": 1.1203089648131227e-05, "Pretrain/Loss": 1.9392907619476318, "Pretrain/Loss (Raw)": 1.5057684183120728, "Pretrain/Step": 6633, "Pretrain/Step Time": 8.652872923761606} +{"Pretrain/Learning Rate": 1.1196010518651562e-05, "Pretrain/Loss": 1.9340797662734985, "Pretrain/Loss (Raw)": 1.512477159500122, "Pretrain/Step": 6634, "Pretrain/Step Time": 8.653759030625224} +{"Pretrain/Learning Rate": 1.1188932981113004e-05, "Pretrain/Loss": 1.9313437938690186, "Pretrain/Loss (Raw)": 1.6639056205749512, "Pretrain/Step": 6635, "Pretrain/Step Time": 8.652212738990784} +{"Pretrain/Learning Rate": 1.1181857036331792e-05, "Pretrain/Loss": 1.932179570198059, "Pretrain/Loss (Raw)": 2.0288338661193848, "Pretrain/Step": 6636, "Pretrain/Step Time": 8.651771685108542} +{"Pretrain/Learning Rate": 1.1174782685123918e-05, "Pretrain/Loss": 1.9322391748428345, "Pretrain/Loss (Raw)": 1.8633332252502441, "Pretrain/Step": 6637, "Pretrain/Step Time": 8.655077617615461} +{"Pretrain/Learning Rate": 1.1167709928305265e-05, "Pretrain/Loss": 1.9323031902313232, "Pretrain/Loss (Raw)": 1.888926386833191, "Pretrain/Step": 6638, "Pretrain/Step Time": 8.652812719345093} +{"Pretrain/Learning Rate": 1.1160638766691473e-05, "Pretrain/Loss": 1.932651162147522, "Pretrain/Loss (Raw)": 1.8574533462524414, "Pretrain/Step": 6639, "Pretrain/Step Time": 8.651311131194234} +{"Pretrain/Learning Rate": 1.1153569201098046e-05, "Pretrain/Loss": 1.931349754333496, "Pretrain/Loss (Raw)": 1.9269779920578003, "Pretrain/Step": 6640, "Pretrain/Step Time": 8.653190799057484} +{"Pretrain/Learning Rate": 1.114650123234025e-05, "Pretrain/Loss": 1.9346562623977661, "Pretrain/Loss (Raw)": 2.2208592891693115, "Pretrain/Step": 6641, "Pretrain/Step Time": 8.65734501555562} +{"Pretrain/Learning Rate": 1.1139434861233223e-05, "Pretrain/Loss": 1.934783935546875, "Pretrain/Loss (Raw)": 2.0158841609954834, "Pretrain/Step": 6642, "Pretrain/Step Time": 8.658401258289814} +{"Pretrain/Learning Rate": 1.1132370088591879e-05, "Pretrain/Loss": 1.934570550918579, "Pretrain/Loss (Raw)": 1.6897623538970947, "Pretrain/Step": 6643, "Pretrain/Step Time": 8.65475808084011} +{"Pretrain/Learning Rate": 1.1125306915230963e-05, "Pretrain/Loss": 1.9348695278167725, "Pretrain/Loss (Raw)": 2.0627734661102295, "Pretrain/Step": 6644, "Pretrain/Step Time": 8.655099924653769} +{"Pretrain/Learning Rate": 1.1118245341965022e-05, "Pretrain/Loss": 1.9334907531738281, "Pretrain/Loss (Raw)": 1.9269815683364868, "Pretrain/Step": 6645, "Pretrain/Step Time": 8.652634724974632} +{"Pretrain/Learning Rate": 1.1111185369608454e-05, "Pretrain/Loss": 1.9336400032043457, "Pretrain/Loss (Raw)": 1.9809001684188843, "Pretrain/Step": 6646, "Pretrain/Step Time": 8.654711605980992} +{"Pretrain/Learning Rate": 1.110412699897543e-05, "Pretrain/Loss": 1.9310892820358276, "Pretrain/Loss (Raw)": 1.8351075649261475, "Pretrain/Step": 6647, "Pretrain/Step Time": 8.651023898273706} +{"Pretrain/Learning Rate": 1.1097070230879965e-05, "Pretrain/Loss": 1.9325401782989502, "Pretrain/Loss (Raw)": 2.0914077758789062, "Pretrain/Step": 6648, "Pretrain/Step Time": 8.654794653877616} +{"Pretrain/Learning Rate": 1.1090015066135865e-05, "Pretrain/Loss": 1.9323737621307373, "Pretrain/Loss (Raw)": 1.9724903106689453, "Pretrain/Step": 6649, "Pretrain/Step Time": 8.654569808393717} +{"Pretrain/Learning Rate": 1.108296150555678e-05, "Pretrain/Loss": 1.934179663658142, "Pretrain/Loss (Raw)": 2.0685951709747314, "Pretrain/Step": 6650, "Pretrain/Step Time": 8.658263074234128} +{"Pretrain/Learning Rate": 1.1075909549956154e-05, "Pretrain/Loss": 1.9332748651504517, "Pretrain/Loss (Raw)": 1.8369600772857666, "Pretrain/Step": 6651, "Pretrain/Step Time": 8.656203556805849} +{"Pretrain/Learning Rate": 1.106885920014725e-05, "Pretrain/Loss": 1.934516191482544, "Pretrain/Loss (Raw)": 1.9403867721557617, "Pretrain/Step": 6652, "Pretrain/Step Time": 8.656015142798424} +{"Pretrain/Learning Rate": 1.1061810456943142e-05, "Pretrain/Loss": 1.9323761463165283, "Pretrain/Loss (Raw)": 1.4698660373687744, "Pretrain/Step": 6653, "Pretrain/Step Time": 8.65148513019085} +{"Pretrain/Learning Rate": 1.1054763321156738e-05, "Pretrain/Loss": 1.9319524765014648, "Pretrain/Loss (Raw)": 2.071687936782837, "Pretrain/Step": 6654, "Pretrain/Step Time": 8.651592668145895} +{"Pretrain/Learning Rate": 1.1047717793600743e-05, "Pretrain/Loss": 1.932373285293579, "Pretrain/Loss (Raw)": 1.793688178062439, "Pretrain/Step": 6655, "Pretrain/Step Time": 8.651133367791772} +{"Pretrain/Learning Rate": 1.1040673875087673e-05, "Pretrain/Loss": 1.9326305389404297, "Pretrain/Loss (Raw)": 1.9351750612258911, "Pretrain/Step": 6656, "Pretrain/Step Time": 8.651235077530146} +{"Pretrain/Learning Rate": 1.1033631566429863e-05, "Pretrain/Loss": 1.9329140186309814, "Pretrain/Loss (Raw)": 2.129564046859741, "Pretrain/Step": 6657, "Pretrain/Step Time": 8.652767846360803} +{"Pretrain/Learning Rate": 1.1026590868439482e-05, "Pretrain/Loss": 1.9326939582824707, "Pretrain/Loss (Raw)": 1.9340143203735352, "Pretrain/Step": 6658, "Pretrain/Step Time": 8.656481916084886} +{"Pretrain/Learning Rate": 1.1019551781928489e-05, "Pretrain/Loss": 1.936207890510559, "Pretrain/Loss (Raw)": 2.322486162185669, "Pretrain/Step": 6659, "Pretrain/Step Time": 8.653030624613166} +{"Pretrain/Learning Rate": 1.1012514307708648e-05, "Pretrain/Loss": 1.9359862804412842, "Pretrain/Loss (Raw)": 1.9789888858795166, "Pretrain/Step": 6660, "Pretrain/Step Time": 8.651682041585445} +{"Pretrain/Learning Rate": 1.1005478446591582e-05, "Pretrain/Loss": 1.934805989265442, "Pretrain/Loss (Raw)": 1.8472832441329956, "Pretrain/Step": 6661, "Pretrain/Step Time": 8.654650285840034} +{"Pretrain/Learning Rate": 1.0998444199388686e-05, "Pretrain/Loss": 1.9366211891174316, "Pretrain/Loss (Raw)": 1.917781114578247, "Pretrain/Step": 6662, "Pretrain/Step Time": 8.659098863601685} +{"Pretrain/Learning Rate": 1.099141156691118e-05, "Pretrain/Loss": 1.9370428323745728, "Pretrain/Loss (Raw)": 2.0503437519073486, "Pretrain/Step": 6663, "Pretrain/Step Time": 8.656509447842836} +{"Pretrain/Learning Rate": 1.0984380549970095e-05, "Pretrain/Loss": 1.9371187686920166, "Pretrain/Loss (Raw)": 1.9428555965423584, "Pretrain/Step": 6664, "Pretrain/Step Time": 8.654175981879234} +{"Pretrain/Learning Rate": 1.0977351149376297e-05, "Pretrain/Loss": 1.938382625579834, "Pretrain/Loss (Raw)": 1.9566493034362793, "Pretrain/Step": 6665, "Pretrain/Step Time": 8.658358123153448} +{"Pretrain/Learning Rate": 1.0970323365940444e-05, "Pretrain/Loss": 1.939129114151001, "Pretrain/Loss (Raw)": 2.0205891132354736, "Pretrain/Step": 6666, "Pretrain/Step Time": 8.65765948407352} +{"Pretrain/Learning Rate": 1.0963297200473007e-05, "Pretrain/Loss": 1.9403579235076904, "Pretrain/Loss (Raw)": 2.296685218811035, "Pretrain/Step": 6667, "Pretrain/Step Time": 8.655997527763247} +{"Pretrain/Learning Rate": 1.0956272653784271e-05, "Pretrain/Loss": 1.9391697645187378, "Pretrain/Loss (Raw)": 1.9483909606933594, "Pretrain/Step": 6668, "Pretrain/Step Time": 8.65434822626412} +{"Pretrain/Learning Rate": 1.094924972668436e-05, "Pretrain/Loss": 1.9400341510772705, "Pretrain/Loss (Raw)": 1.9195994138717651, "Pretrain/Step": 6669, "Pretrain/Step Time": 8.654501024633646} +{"Pretrain/Learning Rate": 1.0942228419983177e-05, "Pretrain/Loss": 1.9405556917190552, "Pretrain/Loss (Raw)": 1.9551283121109009, "Pretrain/Step": 6670, "Pretrain/Step Time": 8.650224203243852} +{"Pretrain/Learning Rate": 1.093520873449046e-05, "Pretrain/Loss": 1.9412257671356201, "Pretrain/Loss (Raw)": 2.026656150817871, "Pretrain/Step": 6671, "Pretrain/Step Time": 8.649600287899375} +{"Pretrain/Learning Rate": 1.0928190671015734e-05, "Pretrain/Loss": 1.9424606561660767, "Pretrain/Loss (Raw)": 2.075136423110962, "Pretrain/Step": 6672, "Pretrain/Step Time": 8.652998752892017} +{"Pretrain/Learning Rate": 1.0921174230368378e-05, "Pretrain/Loss": 1.9421968460083008, "Pretrain/Loss (Raw)": 1.6591039896011353, "Pretrain/Step": 6673, "Pretrain/Step Time": 8.650311538949609} +{"Pretrain/Learning Rate": 1.0914159413357553e-05, "Pretrain/Loss": 1.9433743953704834, "Pretrain/Loss (Raw)": 1.9897286891937256, "Pretrain/Step": 6674, "Pretrain/Step Time": 8.656487125903368} +{"Pretrain/Learning Rate": 1.0907146220792236e-05, "Pretrain/Loss": 1.9414643049240112, "Pretrain/Loss (Raw)": 1.6821037530899048, "Pretrain/Step": 6675, "Pretrain/Step Time": 8.655663883313537} +{"Pretrain/Learning Rate": 1.0900134653481217e-05, "Pretrain/Loss": 1.9398983716964722, "Pretrain/Loss (Raw)": 1.6003819704055786, "Pretrain/Step": 6676, "Pretrain/Step Time": 8.656815111637115} +{"Pretrain/Learning Rate": 1.089312471223313e-05, "Pretrain/Loss": 1.9381844997406006, "Pretrain/Loss (Raw)": 1.7425262928009033, "Pretrain/Step": 6677, "Pretrain/Step Time": 8.655790941789746} +{"Pretrain/Learning Rate": 1.0886116397856355e-05, "Pretrain/Loss": 1.935781717300415, "Pretrain/Loss (Raw)": 1.8325104713439941, "Pretrain/Step": 6678, "Pretrain/Step Time": 8.65872336179018} +{"Pretrain/Learning Rate": 1.0879109711159156e-05, "Pretrain/Loss": 1.9374516010284424, "Pretrain/Loss (Raw)": 2.132323741912842, "Pretrain/Step": 6679, "Pretrain/Step Time": 8.651983363553882} +{"Pretrain/Learning Rate": 1.0872104652949552e-05, "Pretrain/Loss": 1.9416735172271729, "Pretrain/Loss (Raw)": 2.195098638534546, "Pretrain/Step": 6680, "Pretrain/Step Time": 8.654229475185275} +{"Pretrain/Learning Rate": 1.0865101224035432e-05, "Pretrain/Loss": 1.940826654434204, "Pretrain/Loss (Raw)": 1.988933801651001, "Pretrain/Step": 6681, "Pretrain/Step Time": 8.65182577073574} +{"Pretrain/Learning Rate": 1.0858099425224427e-05, "Pretrain/Loss": 1.9448593854904175, "Pretrain/Loss (Raw)": 2.154648780822754, "Pretrain/Step": 6682, "Pretrain/Step Time": 8.651561556383967} +{"Pretrain/Learning Rate": 1.0851099257324043e-05, "Pretrain/Loss": 1.9439139366149902, "Pretrain/Loss (Raw)": 1.817865014076233, "Pretrain/Step": 6683, "Pretrain/Step Time": 8.651505107060075} +{"Pretrain/Learning Rate": 1.0844100721141564e-05, "Pretrain/Loss": 1.9466345310211182, "Pretrain/Loss (Raw)": 2.008012294769287, "Pretrain/Step": 6684, "Pretrain/Step Time": 8.650417806580663} +{"Pretrain/Learning Rate": 1.0837103817484096e-05, "Pretrain/Loss": 1.9451770782470703, "Pretrain/Loss (Raw)": 1.7412818670272827, "Pretrain/Step": 6685, "Pretrain/Step Time": 8.649808719754219} +{"Pretrain/Learning Rate": 1.0830108547158544e-05, "Pretrain/Loss": 1.9454479217529297, "Pretrain/Loss (Raw)": 2.0480775833129883, "Pretrain/Step": 6686, "Pretrain/Step Time": 8.650189325213432} +{"Pretrain/Learning Rate": 1.0823114910971654e-05, "Pretrain/Loss": 1.9458132982254028, "Pretrain/Loss (Raw)": 1.9889355897903442, "Pretrain/Step": 6687, "Pretrain/Step Time": 8.655628927052021} +{"Pretrain/Learning Rate": 1.0816122909729957e-05, "Pretrain/Loss": 1.9470198154449463, "Pretrain/Loss (Raw)": 2.264479875564575, "Pretrain/Step": 6688, "Pretrain/Step Time": 8.657295163720846} +{"Pretrain/Learning Rate": 1.0809132544239803e-05, "Pretrain/Loss": 1.950111985206604, "Pretrain/Loss (Raw)": 1.989801287651062, "Pretrain/Step": 6689, "Pretrain/Step Time": 8.661640219390392} +{"Pretrain/Learning Rate": 1.0802143815307342e-05, "Pretrain/Loss": 1.9503214359283447, "Pretrain/Loss (Raw)": 1.8619948625564575, "Pretrain/Step": 6690, "Pretrain/Step Time": 8.663984596729279} +{"Pretrain/Learning Rate": 1.079515672373857e-05, "Pretrain/Loss": 1.9516818523406982, "Pretrain/Loss (Raw)": 2.0597991943359375, "Pretrain/Step": 6691, "Pretrain/Step Time": 8.660667318850756} +{"Pretrain/Learning Rate": 1.078817127033926e-05, "Pretrain/Loss": 1.9530388116836548, "Pretrain/Loss (Raw)": 2.103837251663208, "Pretrain/Step": 6692, "Pretrain/Step Time": 8.659573765471578} +{"Pretrain/Learning Rate": 1.0781187455915007e-05, "Pretrain/Loss": 1.9529163837432861, "Pretrain/Loss (Raw)": 2.0872902870178223, "Pretrain/Step": 6693, "Pretrain/Step Time": 8.661443118005991} +{"Pretrain/Learning Rate": 1.0774205281271208e-05, "Pretrain/Loss": 1.9518086910247803, "Pretrain/Loss (Raw)": 1.7281419038772583, "Pretrain/Step": 6694, "Pretrain/Step Time": 8.666606340557337} +{"Pretrain/Learning Rate": 1.0767224747213101e-05, "Pretrain/Loss": 1.9549212455749512, "Pretrain/Loss (Raw)": 2.306687831878662, "Pretrain/Step": 6695, "Pretrain/Step Time": 8.666018016636372} +{"Pretrain/Learning Rate": 1.07602458545457e-05, "Pretrain/Loss": 1.9576513767242432, "Pretrain/Loss (Raw)": 2.151637315750122, "Pretrain/Step": 6696, "Pretrain/Step Time": 8.672378895804286} +{"Pretrain/Learning Rate": 1.0753268604073849e-05, "Pretrain/Loss": 1.9527297019958496, "Pretrain/Loss (Raw)": 1.4855585098266602, "Pretrain/Step": 6697, "Pretrain/Step Time": 8.668427651748061} +{"Pretrain/Learning Rate": 1.0746292996602187e-05, "Pretrain/Loss": 1.9529452323913574, "Pretrain/Loss (Raw)": 2.114108085632324, "Pretrain/Step": 6698, "Pretrain/Step Time": 8.673324767500162} +{"Pretrain/Learning Rate": 1.0739319032935192e-05, "Pretrain/Loss": 1.952655553817749, "Pretrain/Loss (Raw)": 1.785064458847046, "Pretrain/Step": 6699, "Pretrain/Step Time": 8.671102529391646} +{"Pretrain/Learning Rate": 1.0732346713877123e-05, "Pretrain/Loss": 1.9511849880218506, "Pretrain/Loss (Raw)": 1.9557286500930786, "Pretrain/Step": 6700, "Pretrain/Step Time": 8.664077296853065} +{"Pretrain/Learning Rate": 1.0725376040232052e-05, "Pretrain/Loss": 1.952239990234375, "Pretrain/Loss (Raw)": 1.985193133354187, "Pretrain/Step": 6701, "Pretrain/Step Time": 8.66146594285965} +{"Pretrain/Learning Rate": 1.071840701280389e-05, "Pretrain/Loss": 1.9534212350845337, "Pretrain/Loss (Raw)": 1.8644418716430664, "Pretrain/Step": 6702, "Pretrain/Step Time": 8.664270207285881} +{"Pretrain/Learning Rate": 1.071143963239633e-05, "Pretrain/Loss": 1.9521334171295166, "Pretrain/Loss (Raw)": 1.8891013860702515, "Pretrain/Step": 6703, "Pretrain/Step Time": 8.666986282914877} +{"Pretrain/Learning Rate": 1.0704473899812881e-05, "Pretrain/Loss": 1.95381498336792, "Pretrain/Loss (Raw)": 2.202561378479004, "Pretrain/Step": 6704, "Pretrain/Step Time": 8.667336709797382} +{"Pretrain/Learning Rate": 1.0697509815856858e-05, "Pretrain/Loss": 1.9528143405914307, "Pretrain/Loss (Raw)": 2.029050827026367, "Pretrain/Step": 6705, "Pretrain/Step Time": 8.6712048612535} +{"Pretrain/Learning Rate": 1.0690547381331403e-05, "Pretrain/Loss": 1.9521511793136597, "Pretrain/Loss (Raw)": 1.8683643341064453, "Pretrain/Step": 6706, "Pretrain/Step Time": 8.665770841762424} +{"Pretrain/Learning Rate": 1.0683586597039456e-05, "Pretrain/Loss": 1.9542646408081055, "Pretrain/Loss (Raw)": 2.0438404083251953, "Pretrain/Step": 6707, "Pretrain/Step Time": 8.66288098320365} +{"Pretrain/Learning Rate": 1.0676627463783762e-05, "Pretrain/Loss": 1.9552266597747803, "Pretrain/Loss (Raw)": 1.8549391031265259, "Pretrain/Step": 6708, "Pretrain/Step Time": 8.66209702193737} +{"Pretrain/Learning Rate": 1.0669669982366873e-05, "Pretrain/Loss": 1.9571161270141602, "Pretrain/Loss (Raw)": 2.089272975921631, "Pretrain/Step": 6709, "Pretrain/Step Time": 8.660833213478327} +{"Pretrain/Learning Rate": 1.0662714153591177e-05, "Pretrain/Loss": 1.9524407386779785, "Pretrain/Loss (Raw)": 1.4709086418151855, "Pretrain/Step": 6710, "Pretrain/Step Time": 8.661376528441906} +{"Pretrain/Learning Rate": 1.0655759978258847e-05, "Pretrain/Loss": 1.953101396560669, "Pretrain/Loss (Raw)": 1.8947901725769043, "Pretrain/Step": 6711, "Pretrain/Step Time": 8.661306763067842} +{"Pretrain/Learning Rate": 1.0648807457171867e-05, "Pretrain/Loss": 1.954874038696289, "Pretrain/Loss (Raw)": 2.1013376712799072, "Pretrain/Step": 6712, "Pretrain/Step Time": 8.66194362938404} +{"Pretrain/Learning Rate": 1.0641856591132027e-05, "Pretrain/Loss": 1.952173113822937, "Pretrain/Loss (Raw)": 1.8040882349014282, "Pretrain/Step": 6713, "Pretrain/Step Time": 8.657975455746055} +{"Pretrain/Learning Rate": 1.063490738094095e-05, "Pretrain/Loss": 1.9532790184020996, "Pretrain/Loss (Raw)": 2.1764938831329346, "Pretrain/Step": 6714, "Pretrain/Step Time": 8.66371931694448} +{"Pretrain/Learning Rate": 1.0627959827400047e-05, "Pretrain/Loss": 1.9528330564498901, "Pretrain/Loss (Raw)": 2.0747361183166504, "Pretrain/Step": 6715, "Pretrain/Step Time": 8.661595599725842} +{"Pretrain/Learning Rate": 1.0621013931310541e-05, "Pretrain/Loss": 1.9539055824279785, "Pretrain/Loss (Raw)": 2.0290768146514893, "Pretrain/Step": 6716, "Pretrain/Step Time": 8.661081537604332} +{"Pretrain/Learning Rate": 1.0614069693473452e-05, "Pretrain/Loss": 1.9539704322814941, "Pretrain/Loss (Raw)": 1.9529831409454346, "Pretrain/Step": 6717, "Pretrain/Step Time": 8.657223552465439} +{"Pretrain/Learning Rate": 1.0607127114689655e-05, "Pretrain/Loss": 1.9514559507369995, "Pretrain/Loss (Raw)": 1.8454246520996094, "Pretrain/Step": 6718, "Pretrain/Step Time": 8.656739903613925} +{"Pretrain/Learning Rate": 1.0600186195759762e-05, "Pretrain/Loss": 1.951101303100586, "Pretrain/Loss (Raw)": 1.9218205213546753, "Pretrain/Step": 6719, "Pretrain/Step Time": 8.65923541598022} +{"Pretrain/Learning Rate": 1.0593246937484261e-05, "Pretrain/Loss": 1.9525647163391113, "Pretrain/Loss (Raw)": 2.183661699295044, "Pretrain/Step": 6720, "Pretrain/Step Time": 8.654049545526505} +{"Pretrain/Learning Rate": 1.05863093406634e-05, "Pretrain/Loss": 1.9530365467071533, "Pretrain/Loss (Raw)": 1.9532206058502197, "Pretrain/Step": 6721, "Pretrain/Step Time": 8.656194403767586} +{"Pretrain/Learning Rate": 1.0579373406097284e-05, "Pretrain/Loss": 1.9464118480682373, "Pretrain/Loss (Raw)": 1.2160735130310059, "Pretrain/Step": 6722, "Pretrain/Step Time": 8.655157558619976} +{"Pretrain/Learning Rate": 1.057243913458576e-05, "Pretrain/Loss": 1.9448215961456299, "Pretrain/Loss (Raw)": 1.8048641681671143, "Pretrain/Step": 6723, "Pretrain/Step Time": 8.65328142978251} +{"Pretrain/Learning Rate": 1.0565506526928548e-05, "Pretrain/Loss": 1.9453728199005127, "Pretrain/Loss (Raw)": 2.106278419494629, "Pretrain/Step": 6724, "Pretrain/Step Time": 8.652402026578784} +{"Pretrain/Learning Rate": 1.0558575583925143e-05, "Pretrain/Loss": 1.9461536407470703, "Pretrain/Loss (Raw)": 1.98158597946167, "Pretrain/Step": 6725, "Pretrain/Step Time": 8.656425025314093} +{"Pretrain/Learning Rate": 1.0551646306374851e-05, "Pretrain/Loss": 1.9463698863983154, "Pretrain/Loss (Raw)": 2.0334136486053467, "Pretrain/Step": 6726, "Pretrain/Step Time": 8.653419326990843} +{"Pretrain/Learning Rate": 1.0544718695076783e-05, "Pretrain/Loss": 1.9441357851028442, "Pretrain/Loss (Raw)": 1.7607645988464355, "Pretrain/Step": 6727, "Pretrain/Step Time": 8.656777486205101} +{"Pretrain/Learning Rate": 1.0537792750829875e-05, "Pretrain/Loss": 1.9419769048690796, "Pretrain/Loss (Raw)": 1.7093225717544556, "Pretrain/Step": 6728, "Pretrain/Step Time": 8.65770323202014} +{"Pretrain/Learning Rate": 1.053086847443286e-05, "Pretrain/Loss": 1.943105697631836, "Pretrain/Loss (Raw)": 1.938279628753662, "Pretrain/Step": 6729, "Pretrain/Step Time": 8.651455519720912} +{"Pretrain/Learning Rate": 1.052394586668427e-05, "Pretrain/Loss": 1.9420900344848633, "Pretrain/Loss (Raw)": 1.7997066974639893, "Pretrain/Step": 6730, "Pretrain/Step Time": 8.651706408709288} +{"Pretrain/Learning Rate": 1.0517024928382449e-05, "Pretrain/Loss": 1.9417885541915894, "Pretrain/Loss (Raw)": 2.1314706802368164, "Pretrain/Step": 6731, "Pretrain/Step Time": 8.651336757466197} +{"Pretrain/Learning Rate": 1.0510105660325567e-05, "Pretrain/Loss": 1.9426047801971436, "Pretrain/Loss (Raw)": 2.139840602874756, "Pretrain/Step": 6732, "Pretrain/Step Time": 8.646418031305075} +{"Pretrain/Learning Rate": 1.0503188063311578e-05, "Pretrain/Loss": 1.941793441772461, "Pretrain/Loss (Raw)": 1.9437789916992188, "Pretrain/Step": 6733, "Pretrain/Step Time": 8.647719426080585} +{"Pretrain/Learning Rate": 1.0496272138138255e-05, "Pretrain/Loss": 1.9433460235595703, "Pretrain/Loss (Raw)": 2.1322145462036133, "Pretrain/Step": 6734, "Pretrain/Step Time": 8.649655481800437} +{"Pretrain/Learning Rate": 1.0489357885603162e-05, "Pretrain/Loss": 1.9409759044647217, "Pretrain/Loss (Raw)": 1.8639411926269531, "Pretrain/Step": 6735, "Pretrain/Step Time": 8.652856862172484} +{"Pretrain/Learning Rate": 1.0482445306503705e-05, "Pretrain/Loss": 1.9412769079208374, "Pretrain/Loss (Raw)": 2.2480156421661377, "Pretrain/Step": 6736, "Pretrain/Step Time": 8.65312310680747} +{"Pretrain/Learning Rate": 1.0475534401637063e-05, "Pretrain/Loss": 1.940392017364502, "Pretrain/Loss (Raw)": 1.965105414390564, "Pretrain/Step": 6737, "Pretrain/Step Time": 8.657828046008945} +{"Pretrain/Learning Rate": 1.0468625171800233e-05, "Pretrain/Loss": 1.9417798519134521, "Pretrain/Loss (Raw)": 2.0189101696014404, "Pretrain/Step": 6738, "Pretrain/Step Time": 8.65559083595872} +{"Pretrain/Learning Rate": 1.0461717617790017e-05, "Pretrain/Loss": 1.9405004978179932, "Pretrain/Loss (Raw)": 1.9590849876403809, "Pretrain/Step": 6739, "Pretrain/Step Time": 8.6505733653903} +{"Pretrain/Learning Rate": 1.045481174040304e-05, "Pretrain/Loss": 1.9413474798202515, "Pretrain/Loss (Raw)": 1.9339509010314941, "Pretrain/Step": 6740, "Pretrain/Step Time": 8.654700374230742} +{"Pretrain/Learning Rate": 1.044790754043571e-05, "Pretrain/Loss": 1.9440951347351074, "Pretrain/Loss (Raw)": 1.9886152744293213, "Pretrain/Step": 6741, "Pretrain/Step Time": 8.654005821794271} +{"Pretrain/Learning Rate": 1.044100501868425e-05, "Pretrain/Loss": 1.9448494911193848, "Pretrain/Loss (Raw)": 2.050450563430786, "Pretrain/Step": 6742, "Pretrain/Step Time": 8.660579223185778} +{"Pretrain/Learning Rate": 1.0434104175944701e-05, "Pretrain/Loss": 1.9453330039978027, "Pretrain/Loss (Raw)": 2.0818207263946533, "Pretrain/Step": 6743, "Pretrain/Step Time": 8.656067023053765} +{"Pretrain/Learning Rate": 1.0427205013012894e-05, "Pretrain/Loss": 1.9450452327728271, "Pretrain/Loss (Raw)": 2.050837755203247, "Pretrain/Step": 6744, "Pretrain/Step Time": 8.658509468659759} +{"Pretrain/Learning Rate": 1.0420307530684478e-05, "Pretrain/Loss": 1.9431967735290527, "Pretrain/Loss (Raw)": 1.6917363405227661, "Pretrain/Step": 6745, "Pretrain/Step Time": 8.656271040439606} +{"Pretrain/Learning Rate": 1.0413411729754887e-05, "Pretrain/Loss": 1.9465662240982056, "Pretrain/Loss (Raw)": 2.0900678634643555, "Pretrain/Step": 6746, "Pretrain/Step Time": 8.656875982880592} +{"Pretrain/Learning Rate": 1.0406517611019401e-05, "Pretrain/Loss": 1.9459363222122192, "Pretrain/Loss (Raw)": 1.8986423015594482, "Pretrain/Step": 6747, "Pretrain/Step Time": 8.65675831772387} +{"Pretrain/Learning Rate": 1.039962517527307e-05, "Pretrain/Loss": 1.9453424215316772, "Pretrain/Loss (Raw)": 1.9175899028778076, "Pretrain/Step": 6748, "Pretrain/Step Time": 8.65222735889256} +{"Pretrain/Learning Rate": 1.0392734423310762e-05, "Pretrain/Loss": 1.9451829195022583, "Pretrain/Loss (Raw)": 1.8563169240951538, "Pretrain/Step": 6749, "Pretrain/Step Time": 8.652638485655189} +{"Pretrain/Learning Rate": 1.0385845355927144e-05, "Pretrain/Loss": 1.9464216232299805, "Pretrain/Loss (Raw)": 1.9683971405029297, "Pretrain/Step": 6750, "Pretrain/Step Time": 8.651284212246537} +{"Pretrain/Learning Rate": 1.0378957973916712e-05, "Pretrain/Loss": 1.9463655948638916, "Pretrain/Loss (Raw)": 1.9865117073059082, "Pretrain/Step": 6751, "Pretrain/Step Time": 8.65583142824471} +{"Pretrain/Learning Rate": 1.0372072278073744e-05, "Pretrain/Loss": 1.9464130401611328, "Pretrain/Loss (Raw)": 2.055277109146118, "Pretrain/Step": 6752, "Pretrain/Step Time": 8.658146560192108} +{"Pretrain/Learning Rate": 1.036518826919233e-05, "Pretrain/Loss": 1.9483039379119873, "Pretrain/Loss (Raw)": 2.0856950283050537, "Pretrain/Step": 6753, "Pretrain/Step Time": 8.651480441913009} +{"Pretrain/Learning Rate": 1.0358305948066355e-05, "Pretrain/Loss": 1.9458115100860596, "Pretrain/Loss (Raw)": 2.0961813926696777, "Pretrain/Step": 6754, "Pretrain/Step Time": 8.652995573356748} +{"Pretrain/Learning Rate": 1.0351425315489543e-05, "Pretrain/Loss": 1.9480481147766113, "Pretrain/Loss (Raw)": 2.1257131099700928, "Pretrain/Step": 6755, "Pretrain/Step Time": 8.654136773198843} +{"Pretrain/Learning Rate": 1.034454637225539e-05, "Pretrain/Loss": 1.9499711990356445, "Pretrain/Loss (Raw)": 2.0168206691741943, "Pretrain/Step": 6756, "Pretrain/Step Time": 8.652211494743824} +{"Pretrain/Learning Rate": 1.0337669119157208e-05, "Pretrain/Loss": 1.9512226581573486, "Pretrain/Loss (Raw)": 2.066894054412842, "Pretrain/Step": 6757, "Pretrain/Step Time": 8.65356571227312} +{"Pretrain/Learning Rate": 1.0330793556988106e-05, "Pretrain/Loss": 1.9539302587509155, "Pretrain/Loss (Raw)": 2.1978816986083984, "Pretrain/Step": 6758, "Pretrain/Step Time": 8.64940469712019} +{"Pretrain/Learning Rate": 1.032391968654103e-05, "Pretrain/Loss": 1.9544732570648193, "Pretrain/Loss (Raw)": 2.1254374980926514, "Pretrain/Step": 6759, "Pretrain/Step Time": 8.653473880141973} +{"Pretrain/Learning Rate": 1.0317047508608677e-05, "Pretrain/Loss": 1.9545512199401855, "Pretrain/Loss (Raw)": 1.9517357349395752, "Pretrain/Step": 6760, "Pretrain/Step Time": 8.6558467913419} +{"Pretrain/Learning Rate": 1.03101770239836e-05, "Pretrain/Loss": 1.958451509475708, "Pretrain/Loss (Raw)": 2.005005359649658, "Pretrain/Step": 6761, "Pretrain/Step Time": 8.657937981188297} +{"Pretrain/Learning Rate": 1.0303308233458123e-05, "Pretrain/Loss": 1.9605622291564941, "Pretrain/Loss (Raw)": 1.7826451063156128, "Pretrain/Step": 6762, "Pretrain/Step Time": 8.655877441167831} +{"Pretrain/Learning Rate": 1.029644113782441e-05, "Pretrain/Loss": 1.961315393447876, "Pretrain/Loss (Raw)": 1.7603131532669067, "Pretrain/Step": 6763, "Pretrain/Step Time": 8.654353549703956} +{"Pretrain/Learning Rate": 1.0289575737874372e-05, "Pretrain/Loss": 1.9603593349456787, "Pretrain/Loss (Raw)": 1.9064521789550781, "Pretrain/Step": 6764, "Pretrain/Step Time": 8.656029239296913} +{"Pretrain/Learning Rate": 1.0282712034399785e-05, "Pretrain/Loss": 1.9592511653900146, "Pretrain/Loss (Raw)": 1.7215075492858887, "Pretrain/Step": 6765, "Pretrain/Step Time": 8.65246140025556} +{"Pretrain/Learning Rate": 1.0275850028192192e-05, "Pretrain/Loss": 1.9609582424163818, "Pretrain/Loss (Raw)": 2.1074297428131104, "Pretrain/Step": 6766, "Pretrain/Step Time": 8.657338792458177} +{"Pretrain/Learning Rate": 1.026898972004297e-05, "Pretrain/Loss": 1.9609696865081787, "Pretrain/Loss (Raw)": 1.85891854763031, "Pretrain/Step": 6767, "Pretrain/Step Time": 8.656461954116821} +{"Pretrain/Learning Rate": 1.0262131110743254e-05, "Pretrain/Loss": 1.958777666091919, "Pretrain/Loss (Raw)": 1.6463978290557861, "Pretrain/Step": 6768, "Pretrain/Step Time": 8.654114423319697} +{"Pretrain/Learning Rate": 1.0255274201084031e-05, "Pretrain/Loss": 1.9577178955078125, "Pretrain/Loss (Raw)": 2.0852108001708984, "Pretrain/Step": 6769, "Pretrain/Step Time": 8.651450533419847} +{"Pretrain/Learning Rate": 1.0248418991856068e-05, "Pretrain/Loss": 1.9577968120574951, "Pretrain/Loss (Raw)": 2.0259764194488525, "Pretrain/Step": 6770, "Pretrain/Step Time": 8.651492493227124} +{"Pretrain/Learning Rate": 1.0241565483849939e-05, "Pretrain/Loss": 1.9604928493499756, "Pretrain/Loss (Raw)": 2.0348598957061768, "Pretrain/Step": 6771, "Pretrain/Step Time": 8.651938708499074} +{"Pretrain/Learning Rate": 1.0234713677856011e-05, "Pretrain/Loss": 1.9605090618133545, "Pretrain/Loss (Raw)": 2.06484317779541, "Pretrain/Step": 6772, "Pretrain/Step Time": 8.651177275925875} +{"Pretrain/Learning Rate": 1.022786357466449e-05, "Pretrain/Loss": 1.9635775089263916, "Pretrain/Loss (Raw)": 2.31976056098938, "Pretrain/Step": 6773, "Pretrain/Step Time": 8.655331205576658} +{"Pretrain/Learning Rate": 1.022101517506535e-05, "Pretrain/Loss": 1.9643909931182861, "Pretrain/Loss (Raw)": 2.0850272178649902, "Pretrain/Step": 6774, "Pretrain/Step Time": 8.650297401472926} +{"Pretrain/Learning Rate": 1.021416847984838e-05, "Pretrain/Loss": 1.9607797861099243, "Pretrain/Loss (Raw)": 1.3728491067886353, "Pretrain/Step": 6775, "Pretrain/Step Time": 8.651230121031404} +{"Pretrain/Learning Rate": 1.0207323489803164e-05, "Pretrain/Loss": 1.9585063457489014, "Pretrain/Loss (Raw)": 1.8004237413406372, "Pretrain/Step": 6776, "Pretrain/Step Time": 8.653172004967928} +{"Pretrain/Learning Rate": 1.0200480205719118e-05, "Pretrain/Loss": 1.9593369960784912, "Pretrain/Loss (Raw)": 2.0788180828094482, "Pretrain/Step": 6777, "Pretrain/Step Time": 8.653281493112445} +{"Pretrain/Learning Rate": 1.0193638628385433e-05, "Pretrain/Loss": 1.958299160003662, "Pretrain/Loss (Raw)": 1.9357471466064453, "Pretrain/Step": 6778, "Pretrain/Step Time": 8.647610895335674} +{"Pretrain/Learning Rate": 1.0186798758591112e-05, "Pretrain/Loss": 1.9573664665222168, "Pretrain/Loss (Raw)": 1.717564344406128, "Pretrain/Step": 6779, "Pretrain/Step Time": 8.65120292082429} +{"Pretrain/Learning Rate": 1.017996059712495e-05, "Pretrain/Loss": 1.9576143026351929, "Pretrain/Loss (Raw)": 1.972113847732544, "Pretrain/Step": 6780, "Pretrain/Step Time": 8.650605892762542} +{"Pretrain/Learning Rate": 1.0173124144775576e-05, "Pretrain/Loss": 1.9621074199676514, "Pretrain/Loss (Raw)": 2.044983386993408, "Pretrain/Step": 6781, "Pretrain/Step Time": 8.653155921027064} +{"Pretrain/Learning Rate": 1.0166289402331391e-05, "Pretrain/Loss": 1.960511326789856, "Pretrain/Loss (Raw)": 1.8673957586288452, "Pretrain/Step": 6782, "Pretrain/Step Time": 8.653382677584887} +{"Pretrain/Learning Rate": 1.0159456370580604e-05, "Pretrain/Loss": 1.9616281986236572, "Pretrain/Loss (Raw)": 1.9366350173950195, "Pretrain/Step": 6783, "Pretrain/Step Time": 8.650743436068296} +{"Pretrain/Learning Rate": 1.0152625050311247e-05, "Pretrain/Loss": 1.9601293802261353, "Pretrain/Loss (Raw)": 1.7433346509933472, "Pretrain/Step": 6784, "Pretrain/Step Time": 8.653890388086438} +{"Pretrain/Learning Rate": 1.0145795442311132e-05, "Pretrain/Loss": 1.959792137145996, "Pretrain/Loss (Raw)": 2.0864017009735107, "Pretrain/Step": 6785, "Pretrain/Step Time": 8.654967812821269} +{"Pretrain/Learning Rate": 1.0138967547367882e-05, "Pretrain/Loss": 1.9604823589324951, "Pretrain/Loss (Raw)": 2.0223517417907715, "Pretrain/Step": 6786, "Pretrain/Step Time": 8.653075290843844} +{"Pretrain/Learning Rate": 1.0132141366268913e-05, "Pretrain/Loss": 1.9568219184875488, "Pretrain/Loss (Raw)": 1.8539507389068604, "Pretrain/Step": 6787, "Pretrain/Step Time": 8.654362076893449} +{"Pretrain/Learning Rate": 1.012531689980147e-05, "Pretrain/Loss": 1.9574699401855469, "Pretrain/Loss (Raw)": 2.0619418621063232, "Pretrain/Step": 6788, "Pretrain/Step Time": 8.652854165062308} +{"Pretrain/Learning Rate": 1.0118494148752575e-05, "Pretrain/Loss": 1.9594941139221191, "Pretrain/Loss (Raw)": 2.106384038925171, "Pretrain/Step": 6789, "Pretrain/Step Time": 8.652860367670655} +{"Pretrain/Learning Rate": 1.0111673113909056e-05, "Pretrain/Loss": 1.95943021774292, "Pretrain/Loss (Raw)": 1.9096020460128784, "Pretrain/Step": 6790, "Pretrain/Step Time": 8.653045846149325} +{"Pretrain/Learning Rate": 1.0104853796057546e-05, "Pretrain/Loss": 1.9604392051696777, "Pretrain/Loss (Raw)": 2.1794745922088623, "Pretrain/Step": 6791, "Pretrain/Step Time": 8.661258198320866} +{"Pretrain/Learning Rate": 1.009803619598449e-05, "Pretrain/Loss": 1.959673285484314, "Pretrain/Loss (Raw)": 1.8448295593261719, "Pretrain/Step": 6792, "Pretrain/Step Time": 8.660185420885682} +{"Pretrain/Learning Rate": 1.0091220314476119e-05, "Pretrain/Loss": 1.9600584506988525, "Pretrain/Loss (Raw)": 2.0059618949890137, "Pretrain/Step": 6793, "Pretrain/Step Time": 8.659494072198868} +{"Pretrain/Learning Rate": 1.0084406152318473e-05, "Pretrain/Loss": 1.9605374336242676, "Pretrain/Loss (Raw)": 2.081895351409912, "Pretrain/Step": 6794, "Pretrain/Step Time": 8.658066116273403} +{"Pretrain/Learning Rate": 1.007759371029739e-05, "Pretrain/Loss": 1.9584814310073853, "Pretrain/Loss (Raw)": 2.0335071086883545, "Pretrain/Step": 6795, "Pretrain/Step Time": 8.66015088185668} +{"Pretrain/Learning Rate": 1.0070782989198521e-05, "Pretrain/Loss": 1.9585983753204346, "Pretrain/Loss (Raw)": 1.96335768699646, "Pretrain/Step": 6796, "Pretrain/Step Time": 8.660358563065529} +{"Pretrain/Learning Rate": 1.006397398980731e-05, "Pretrain/Loss": 1.9595110416412354, "Pretrain/Loss (Raw)": 2.03643798828125, "Pretrain/Step": 6797, "Pretrain/Step Time": 8.665030775591731} +{"Pretrain/Learning Rate": 1.0057166712908996e-05, "Pretrain/Loss": 1.9589699506759644, "Pretrain/Loss (Raw)": 1.8858627080917358, "Pretrain/Step": 6798, "Pretrain/Step Time": 8.668257055804133} +{"Pretrain/Learning Rate": 1.0050361159288625e-05, "Pretrain/Loss": 1.9590513706207275, "Pretrain/Loss (Raw)": 2.037069797515869, "Pretrain/Step": 6799, "Pretrain/Step Time": 8.66902468726039} +{"Pretrain/Learning Rate": 1.0043557329731065e-05, "Pretrain/Loss": 1.960005760192871, "Pretrain/Loss (Raw)": 2.197305202484131, "Pretrain/Step": 6800, "Pretrain/Step Time": 8.666764087975025} +{"Pretrain/Learning Rate": 1.0036755225020933e-05, "Pretrain/Loss": 1.9621398448944092, "Pretrain/Loss (Raw)": 1.9322625398635864, "Pretrain/Step": 6801, "Pretrain/Step Time": 8.669150564819574} +{"Pretrain/Learning Rate": 1.0029954845942707e-05, "Pretrain/Loss": 1.96128249168396, "Pretrain/Loss (Raw)": 1.879980206489563, "Pretrain/Step": 6802, "Pretrain/Step Time": 8.662490926682949} +{"Pretrain/Learning Rate": 1.0023156193280622e-05, "Pretrain/Loss": 1.9629991054534912, "Pretrain/Loss (Raw)": 1.9018372297286987, "Pretrain/Step": 6803, "Pretrain/Step Time": 8.663940535858274} +{"Pretrain/Learning Rate": 1.0016359267818754e-05, "Pretrain/Loss": 1.9657803773880005, "Pretrain/Loss (Raw)": 1.9563883543014526, "Pretrain/Step": 6804, "Pretrain/Step Time": 8.668045235797763} +{"Pretrain/Learning Rate": 1.0009564070340924e-05, "Pretrain/Loss": 1.9683157205581665, "Pretrain/Loss (Raw)": 2.067054033279419, "Pretrain/Step": 6805, "Pretrain/Step Time": 8.669511374086142} +{"Pretrain/Learning Rate": 1.0002770601630809e-05, "Pretrain/Loss": 1.968213438987732, "Pretrain/Loss (Raw)": 1.8194200992584229, "Pretrain/Step": 6806, "Pretrain/Step Time": 8.670968720689416} +{"Pretrain/Learning Rate": 9.99597886247185e-06, "Pretrain/Loss": 1.9668731689453125, "Pretrain/Loss (Raw)": 1.9607481956481934, "Pretrain/Step": 6807, "Pretrain/Step Time": 8.672015652060509} +{"Pretrain/Learning Rate": 9.98918885364733e-06, "Pretrain/Loss": 1.9646251201629639, "Pretrain/Loss (Raw)": 1.9073622226715088, "Pretrain/Step": 6808, "Pretrain/Step Time": 8.66931863874197} +{"Pretrain/Learning Rate": 9.982400575940262e-06, "Pretrain/Loss": 1.9624210596084595, "Pretrain/Loss (Raw)": 1.706818699836731, "Pretrain/Step": 6809, "Pretrain/Step Time": 8.670588862150908} +{"Pretrain/Learning Rate": 9.975614030133537e-06, "Pretrain/Loss": 1.9609596729278564, "Pretrain/Loss (Raw)": 1.9675859212875366, "Pretrain/Step": 6810, "Pretrain/Step Time": 8.668217929080129} +{"Pretrain/Learning Rate": 9.968829217009802e-06, "Pretrain/Loss": 1.96064031124115, "Pretrain/Loss (Raw)": 1.7769780158996582, "Pretrain/Step": 6811, "Pretrain/Step Time": 8.66991312801838} +{"Pretrain/Learning Rate": 9.962046137351505e-06, "Pretrain/Loss": 1.9606471061706543, "Pretrain/Loss (Raw)": 2.0088870525360107, "Pretrain/Step": 6812, "Pretrain/Step Time": 8.672439424321055} +{"Pretrain/Learning Rate": 9.955264791940902e-06, "Pretrain/Loss": 1.9618345499038696, "Pretrain/Loss (Raw)": 1.8932828903198242, "Pretrain/Step": 6813, "Pretrain/Step Time": 8.671944849193096} +{"Pretrain/Learning Rate": 9.948485181560066e-06, "Pretrain/Loss": 1.9609681367874146, "Pretrain/Loss (Raw)": 1.9371747970581055, "Pretrain/Step": 6814, "Pretrain/Step Time": 8.673306919634342} +{"Pretrain/Learning Rate": 9.941707306990843e-06, "Pretrain/Loss": 1.9600434303283691, "Pretrain/Loss (Raw)": 1.8705710172653198, "Pretrain/Step": 6815, "Pretrain/Step Time": 8.666730361059308} +{"Pretrain/Learning Rate": 9.934931169014891e-06, "Pretrain/Loss": 1.9581482410430908, "Pretrain/Loss (Raw)": 2.021895408630371, "Pretrain/Step": 6816, "Pretrain/Step Time": 8.668298633769155} +{"Pretrain/Learning Rate": 9.928156768413657e-06, "Pretrain/Loss": 1.957181692123413, "Pretrain/Loss (Raw)": 1.8660876750946045, "Pretrain/Step": 6817, "Pretrain/Step Time": 8.662913776934147} +{"Pretrain/Learning Rate": 9.921384105968415e-06, "Pretrain/Loss": 1.9582353830337524, "Pretrain/Loss (Raw)": 1.996862769126892, "Pretrain/Step": 6818, "Pretrain/Step Time": 8.660133061930537} +{"Pretrain/Learning Rate": 9.914613182460208e-06, "Pretrain/Loss": 1.9595379829406738, "Pretrain/Loss (Raw)": 2.226534605026245, "Pretrain/Step": 6819, "Pretrain/Step Time": 8.659274600446224} +{"Pretrain/Learning Rate": 9.907843998669895e-06, "Pretrain/Loss": 1.9587390422821045, "Pretrain/Loss (Raw)": 2.001563549041748, "Pretrain/Step": 6820, "Pretrain/Step Time": 8.660564744845033} +{"Pretrain/Learning Rate": 9.90107655537812e-06, "Pretrain/Loss": 1.959498405456543, "Pretrain/Loss (Raw)": 2.1844964027404785, "Pretrain/Step": 6821, "Pretrain/Step Time": 8.656767379492521} +{"Pretrain/Learning Rate": 9.894310853365354e-06, "Pretrain/Loss": 1.96205472946167, "Pretrain/Loss (Raw)": 2.0553576946258545, "Pretrain/Step": 6822, "Pretrain/Step Time": 8.652844792231917} +{"Pretrain/Learning Rate": 9.887546893411839e-06, "Pretrain/Loss": 1.9616544246673584, "Pretrain/Loss (Raw)": 2.25543212890625, "Pretrain/Step": 6823, "Pretrain/Step Time": 8.653872646391392} +{"Pretrain/Learning Rate": 9.880784676297622e-06, "Pretrain/Loss": 1.959306001663208, "Pretrain/Loss (Raw)": 1.8510607481002808, "Pretrain/Step": 6824, "Pretrain/Step Time": 8.6479366812855} +{"Pretrain/Learning Rate": 9.874024202802567e-06, "Pretrain/Loss": 1.9635443687438965, "Pretrain/Loss (Raw)": 2.028064489364624, "Pretrain/Step": 6825, "Pretrain/Step Time": 8.64979973807931} +{"Pretrain/Learning Rate": 9.867265473706319e-06, "Pretrain/Loss": 1.9613122940063477, "Pretrain/Loss (Raw)": 1.828400731086731, "Pretrain/Step": 6826, "Pretrain/Step Time": 8.646163076162338} +{"Pretrain/Learning Rate": 9.860508489788323e-06, "Pretrain/Loss": 1.9617197513580322, "Pretrain/Loss (Raw)": 1.8372100591659546, "Pretrain/Step": 6827, "Pretrain/Step Time": 8.648844216018915} +{"Pretrain/Learning Rate": 9.853753251827818e-06, "Pretrain/Loss": 1.9623868465423584, "Pretrain/Loss (Raw)": 2.041133165359497, "Pretrain/Step": 6828, "Pretrain/Step Time": 8.649880092591047} +{"Pretrain/Learning Rate": 9.84699976060387e-06, "Pretrain/Loss": 1.962461233139038, "Pretrain/Loss (Raw)": 1.9947123527526855, "Pretrain/Step": 6829, "Pretrain/Step Time": 8.649015283212066} +{"Pretrain/Learning Rate": 9.840248016895311e-06, "Pretrain/Loss": 1.9622827768325806, "Pretrain/Loss (Raw)": 1.841586947441101, "Pretrain/Step": 6830, "Pretrain/Step Time": 8.647163774818182} +{"Pretrain/Learning Rate": 9.833498021480789e-06, "Pretrain/Loss": 1.9628360271453857, "Pretrain/Loss (Raw)": 1.959926724433899, "Pretrain/Step": 6831, "Pretrain/Step Time": 8.643025748431683} +{"Pretrain/Learning Rate": 9.82674977513873e-06, "Pretrain/Loss": 1.9607045650482178, "Pretrain/Loss (Raw)": 1.9297457933425903, "Pretrain/Step": 6832, "Pretrain/Step Time": 8.645603971555829} +{"Pretrain/Learning Rate": 9.820003278647396e-06, "Pretrain/Loss": 1.9563233852386475, "Pretrain/Loss (Raw)": 1.4682471752166748, "Pretrain/Step": 6833, "Pretrain/Step Time": 8.641341159120202} +{"Pretrain/Learning Rate": 9.813258532784813e-06, "Pretrain/Loss": 1.9575951099395752, "Pretrain/Loss (Raw)": 2.0311429500579834, "Pretrain/Step": 6834, "Pretrain/Step Time": 8.64246646873653} +{"Pretrain/Learning Rate": 9.80651553832882e-06, "Pretrain/Loss": 1.9573765993118286, "Pretrain/Loss (Raw)": 2.015876054763794, "Pretrain/Step": 6835, "Pretrain/Step Time": 8.64749001711607} +{"Pretrain/Learning Rate": 9.79977429605704e-06, "Pretrain/Loss": 1.95638108253479, "Pretrain/Loss (Raw)": 1.7275054454803467, "Pretrain/Step": 6836, "Pretrain/Step Time": 8.651133628562093} +{"Pretrain/Learning Rate": 9.793034806746922e-06, "Pretrain/Loss": 1.9546396732330322, "Pretrain/Loss (Raw)": 1.866376280784607, "Pretrain/Step": 6837, "Pretrain/Step Time": 8.650272468104959} +{"Pretrain/Learning Rate": 9.786297071175687e-06, "Pretrain/Loss": 1.959455132484436, "Pretrain/Loss (Raw)": 2.087284564971924, "Pretrain/Step": 6838, "Pretrain/Step Time": 8.645146688446403} +{"Pretrain/Learning Rate": 9.779561090120366e-06, "Pretrain/Loss": 1.9590775966644287, "Pretrain/Loss (Raw)": 1.846474528312683, "Pretrain/Step": 6839, "Pretrain/Step Time": 8.646195150911808} +{"Pretrain/Learning Rate": 9.77282686435777e-06, "Pretrain/Loss": 1.9529662132263184, "Pretrain/Loss (Raw)": 1.3190635442733765, "Pretrain/Step": 6840, "Pretrain/Step Time": 8.64658616669476} +{"Pretrain/Learning Rate": 9.766094394664551e-06, "Pretrain/Loss": 1.9544684886932373, "Pretrain/Loss (Raw)": 1.9963934421539307, "Pretrain/Step": 6841, "Pretrain/Step Time": 8.647338150069118} +{"Pretrain/Learning Rate": 9.759363681817093e-06, "Pretrain/Loss": 1.9513630867004395, "Pretrain/Loss (Raw)": 1.778993010520935, "Pretrain/Step": 6842, "Pretrain/Step Time": 8.647244801744819} +{"Pretrain/Learning Rate": 9.752634726591642e-06, "Pretrain/Loss": 1.9524242877960205, "Pretrain/Loss (Raw)": 2.2105884552001953, "Pretrain/Step": 6843, "Pretrain/Step Time": 8.648649903014302} +{"Pretrain/Learning Rate": 9.745907529764189e-06, "Pretrain/Loss": 1.9521219730377197, "Pretrain/Loss (Raw)": 1.9903564453125, "Pretrain/Step": 6844, "Pretrain/Step Time": 8.64987607859075} +{"Pretrain/Learning Rate": 9.739182092110583e-06, "Pretrain/Loss": 1.952897548675537, "Pretrain/Loss (Raw)": 2.0522711277008057, "Pretrain/Step": 6845, "Pretrain/Step Time": 8.65331063978374} +{"Pretrain/Learning Rate": 9.732458414406387e-06, "Pretrain/Loss": 1.9529829025268555, "Pretrain/Loss (Raw)": 1.8563355207443237, "Pretrain/Step": 6846, "Pretrain/Step Time": 8.649664681404829} +{"Pretrain/Learning Rate": 9.72573649742704e-06, "Pretrain/Loss": 1.953684687614441, "Pretrain/Loss (Raw)": 2.0116519927978516, "Pretrain/Step": 6847, "Pretrain/Step Time": 8.65231953561306} +{"Pretrain/Learning Rate": 9.719016341947726e-06, "Pretrain/Loss": 1.9510709047317505, "Pretrain/Loss (Raw)": 1.8491108417510986, "Pretrain/Step": 6848, "Pretrain/Step Time": 8.6560177244246} +{"Pretrain/Learning Rate": 9.712297948743473e-06, "Pretrain/Loss": 1.9509962797164917, "Pretrain/Loss (Raw)": 1.943660020828247, "Pretrain/Step": 6849, "Pretrain/Step Time": 8.654007695615292} +{"Pretrain/Learning Rate": 9.705581318589038e-06, "Pretrain/Loss": 1.9575713872909546, "Pretrain/Loss (Raw)": 2.0576910972595215, "Pretrain/Step": 6850, "Pretrain/Step Time": 8.65351203456521} +{"Pretrain/Learning Rate": 9.698866452259048e-06, "Pretrain/Loss": 1.95883309841156, "Pretrain/Loss (Raw)": 1.9663598537445068, "Pretrain/Step": 6851, "Pretrain/Step Time": 8.657867001369596} +{"Pretrain/Learning Rate": 9.692153350527877e-06, "Pretrain/Loss": 1.9579527378082275, "Pretrain/Loss (Raw)": 1.9936052560806274, "Pretrain/Step": 6852, "Pretrain/Step Time": 8.658635411411524} +{"Pretrain/Learning Rate": 9.685442014169715e-06, "Pretrain/Loss": 1.959435224533081, "Pretrain/Loss (Raw)": 2.171332597732544, "Pretrain/Step": 6853, "Pretrain/Step Time": 8.656335089355707} +{"Pretrain/Learning Rate": 9.678732443958535e-06, "Pretrain/Loss": 1.9593372344970703, "Pretrain/Loss (Raw)": 2.0208640098571777, "Pretrain/Step": 6854, "Pretrain/Step Time": 8.65455917455256} +{"Pretrain/Learning Rate": 9.672024640668134e-06, "Pretrain/Loss": 1.958910346031189, "Pretrain/Loss (Raw)": 1.706125020980835, "Pretrain/Step": 6855, "Pretrain/Step Time": 8.652986533939838} +{"Pretrain/Learning Rate": 9.665318605072082e-06, "Pretrain/Loss": 1.9607751369476318, "Pretrain/Loss (Raw)": 1.9480032920837402, "Pretrain/Step": 6856, "Pretrain/Step Time": 8.652039660140872} +{"Pretrain/Learning Rate": 9.658614337943748e-06, "Pretrain/Loss": 1.9619016647338867, "Pretrain/Loss (Raw)": 2.082486391067505, "Pretrain/Step": 6857, "Pretrain/Step Time": 8.651265412569046} +{"Pretrain/Learning Rate": 9.651911840056287e-06, "Pretrain/Loss": 1.9623830318450928, "Pretrain/Loss (Raw)": 1.8613190650939941, "Pretrain/Step": 6858, "Pretrain/Step Time": 8.652178155258298} +{"Pretrain/Learning Rate": 9.645211112182687e-06, "Pretrain/Loss": 1.9605326652526855, "Pretrain/Loss (Raw)": 1.8946263790130615, "Pretrain/Step": 6859, "Pretrain/Step Time": 8.653086796402931} +{"Pretrain/Learning Rate": 9.638512155095694e-06, "Pretrain/Loss": 1.9588717222213745, "Pretrain/Loss (Raw)": 1.9272385835647583, "Pretrain/Step": 6860, "Pretrain/Step Time": 8.652609452605247} +{"Pretrain/Learning Rate": 9.631814969567866e-06, "Pretrain/Loss": 1.9580049514770508, "Pretrain/Loss (Raw)": 1.8328344821929932, "Pretrain/Step": 6861, "Pretrain/Step Time": 8.652028415352106} +{"Pretrain/Learning Rate": 9.625119556371542e-06, "Pretrain/Loss": 1.9566394090652466, "Pretrain/Loss (Raw)": 1.957425832748413, "Pretrain/Step": 6862, "Pretrain/Step Time": 8.651164369657636} +{"Pretrain/Learning Rate": 9.618425916278891e-06, "Pretrain/Loss": 1.9582167863845825, "Pretrain/Loss (Raw)": 2.06583833694458, "Pretrain/Step": 6863, "Pretrain/Step Time": 8.649522930383682} +{"Pretrain/Learning Rate": 9.611734050061844e-06, "Pretrain/Loss": 1.955127239227295, "Pretrain/Loss (Raw)": 1.8525679111480713, "Pretrain/Step": 6864, "Pretrain/Step Time": 8.648847542703152} +{"Pretrain/Learning Rate": 9.605043958492127e-06, "Pretrain/Loss": 1.954408049583435, "Pretrain/Loss (Raw)": 1.8730359077453613, "Pretrain/Step": 6865, "Pretrain/Step Time": 8.64264333061874} +{"Pretrain/Learning Rate": 9.598355642341294e-06, "Pretrain/Loss": 1.954445719718933, "Pretrain/Loss (Raw)": 2.0237417221069336, "Pretrain/Step": 6866, "Pretrain/Step Time": 8.64703856408596} +{"Pretrain/Learning Rate": 9.591669102380666e-06, "Pretrain/Loss": 1.9545893669128418, "Pretrain/Loss (Raw)": 1.9774659872055054, "Pretrain/Step": 6867, "Pretrain/Step Time": 8.65210535004735} +{"Pretrain/Learning Rate": 9.584984339381362e-06, "Pretrain/Loss": 1.9558440446853638, "Pretrain/Loss (Raw)": 2.094555616378784, "Pretrain/Step": 6868, "Pretrain/Step Time": 8.647266255691648} +{"Pretrain/Learning Rate": 9.578301354114291e-06, "Pretrain/Loss": 1.9573547840118408, "Pretrain/Loss (Raw)": 2.181992769241333, "Pretrain/Step": 6869, "Pretrain/Step Time": 8.650441594421864} +{"Pretrain/Learning Rate": 9.571620147350188e-06, "Pretrain/Loss": 1.955580234527588, "Pretrain/Loss (Raw)": 1.8232918977737427, "Pretrain/Step": 6870, "Pretrain/Step Time": 8.648713959380984} +{"Pretrain/Learning Rate": 9.56494071985955e-06, "Pretrain/Loss": 1.9541089534759521, "Pretrain/Loss (Raw)": 1.8934956789016724, "Pretrain/Step": 6871, "Pretrain/Step Time": 8.651596833020449} +{"Pretrain/Learning Rate": 9.558263072412679e-06, "Pretrain/Loss": 1.9519901275634766, "Pretrain/Loss (Raw)": 1.7796332836151123, "Pretrain/Step": 6872, "Pretrain/Step Time": 8.646146541461349} +{"Pretrain/Learning Rate": 9.551587205779666e-06, "Pretrain/Loss": 1.9532815217971802, "Pretrain/Loss (Raw)": 1.8570283651351929, "Pretrain/Step": 6873, "Pretrain/Step Time": 8.64808608777821} +{"Pretrain/Learning Rate": 9.544913120730423e-06, "Pretrain/Loss": 1.9506585597991943, "Pretrain/Loss (Raw)": 1.7543305158615112, "Pretrain/Step": 6874, "Pretrain/Step Time": 8.650268478319049} +{"Pretrain/Learning Rate": 9.538240818034624e-06, "Pretrain/Loss": 1.9514106512069702, "Pretrain/Loss (Raw)": 1.994905948638916, "Pretrain/Step": 6875, "Pretrain/Step Time": 8.64788768440485} +{"Pretrain/Learning Rate": 9.531570298461754e-06, "Pretrain/Loss": 1.9526605606079102, "Pretrain/Loss (Raw)": 2.0775818824768066, "Pretrain/Step": 6876, "Pretrain/Step Time": 8.652399299666286} +{"Pretrain/Learning Rate": 9.524901562781074e-06, "Pretrain/Loss": 1.9522689580917358, "Pretrain/Loss (Raw)": 1.8062063455581665, "Pretrain/Step": 6877, "Pretrain/Step Time": 8.650711793452501} +{"Pretrain/Learning Rate": 9.518234611761678e-06, "Pretrain/Loss": 1.9522366523742676, "Pretrain/Loss (Raw)": 1.9642541408538818, "Pretrain/Step": 6878, "Pretrain/Step Time": 8.650662913918495} +{"Pretrain/Learning Rate": 9.511569446172419e-06, "Pretrain/Loss": 1.9531254768371582, "Pretrain/Loss (Raw)": 2.100271701812744, "Pretrain/Step": 6879, "Pretrain/Step Time": 8.648919316008687} +{"Pretrain/Learning Rate": 9.504906066781954e-06, "Pretrain/Loss": 1.952131986618042, "Pretrain/Loss (Raw)": 1.9281216859817505, "Pretrain/Step": 6880, "Pretrain/Step Time": 8.652609951794147} +{"Pretrain/Learning Rate": 9.49824447435873e-06, "Pretrain/Loss": 1.950939416885376, "Pretrain/Loss (Raw)": 1.9330410957336426, "Pretrain/Step": 6881, "Pretrain/Step Time": 8.656617483124137} +{"Pretrain/Learning Rate": 9.491584669671008e-06, "Pretrain/Loss": 1.951049566268921, "Pretrain/Loss (Raw)": 2.11028790473938, "Pretrain/Step": 6882, "Pretrain/Step Time": 8.65351097472012} +{"Pretrain/Learning Rate": 9.484926653486819e-06, "Pretrain/Loss": 1.9510736465454102, "Pretrain/Loss (Raw)": 2.128798007965088, "Pretrain/Step": 6883, "Pretrain/Step Time": 8.652591690421104} +{"Pretrain/Learning Rate": 9.478270426574002e-06, "Pretrain/Loss": 1.9449307918548584, "Pretrain/Loss (Raw)": 1.230536937713623, "Pretrain/Step": 6884, "Pretrain/Step Time": 8.65278372168541} +{"Pretrain/Learning Rate": 9.471615989700167e-06, "Pretrain/Loss": 1.9431816339492798, "Pretrain/Loss (Raw)": 1.8429999351501465, "Pretrain/Step": 6885, "Pretrain/Step Time": 8.650767153128982} +{"Pretrain/Learning Rate": 9.464963343632766e-06, "Pretrain/Loss": 1.9415987730026245, "Pretrain/Loss (Raw)": 1.9952750205993652, "Pretrain/Step": 6886, "Pretrain/Step Time": 8.655706904828548} +{"Pretrain/Learning Rate": 9.458312489138979e-06, "Pretrain/Loss": 1.9407973289489746, "Pretrain/Loss (Raw)": 2.022840976715088, "Pretrain/Step": 6887, "Pretrain/Step Time": 8.657653307542205} +{"Pretrain/Learning Rate": 9.451663426985838e-06, "Pretrain/Loss": 1.9412997961044312, "Pretrain/Loss (Raw)": 2.0160629749298096, "Pretrain/Step": 6888, "Pretrain/Step Time": 8.6531419493258} +{"Pretrain/Learning Rate": 9.44501615794013e-06, "Pretrain/Loss": 1.9402925968170166, "Pretrain/Loss (Raw)": 1.8760851621627808, "Pretrain/Step": 6889, "Pretrain/Step Time": 8.654718462377787} +{"Pretrain/Learning Rate": 9.438370682768473e-06, "Pretrain/Loss": 1.9358819723129272, "Pretrain/Loss (Raw)": 1.2180790901184082, "Pretrain/Step": 6890, "Pretrain/Step Time": 8.656424034386873} +{"Pretrain/Learning Rate": 9.43172700223722e-06, "Pretrain/Loss": 1.9359846115112305, "Pretrain/Loss (Raw)": 1.7734483480453491, "Pretrain/Step": 6891, "Pretrain/Step Time": 8.658091155812144} +{"Pretrain/Learning Rate": 9.425085117112577e-06, "Pretrain/Loss": 1.9364827871322632, "Pretrain/Loss (Raw)": 1.9702268838882446, "Pretrain/Step": 6892, "Pretrain/Step Time": 8.660928146913648} +{"Pretrain/Learning Rate": 9.41844502816051e-06, "Pretrain/Loss": 1.9365390539169312, "Pretrain/Loss (Raw)": 1.7287166118621826, "Pretrain/Step": 6893, "Pretrain/Step Time": 8.662023808807135} +{"Pretrain/Learning Rate": 9.411806736146788e-06, "Pretrain/Loss": 1.9354381561279297, "Pretrain/Loss (Raw)": 1.9665169715881348, "Pretrain/Step": 6894, "Pretrain/Step Time": 8.657546747475863} +{"Pretrain/Learning Rate": 9.405170241836955e-06, "Pretrain/Loss": 1.936422348022461, "Pretrain/Loss (Raw)": 1.9848945140838623, "Pretrain/Step": 6895, "Pretrain/Step Time": 8.655062997713685} +{"Pretrain/Learning Rate": 9.398535545996386e-06, "Pretrain/Loss": 1.9403953552246094, "Pretrain/Loss (Raw)": 2.154923677444458, "Pretrain/Step": 6896, "Pretrain/Step Time": 8.656161867082119} +{"Pretrain/Learning Rate": 9.391902649390214e-06, "Pretrain/Loss": 1.9370708465576172, "Pretrain/Loss (Raw)": 1.6596848964691162, "Pretrain/Step": 6897, "Pretrain/Step Time": 8.658748542889953} +{"Pretrain/Learning Rate": 9.385271552783375e-06, "Pretrain/Loss": 1.9361374378204346, "Pretrain/Loss (Raw)": 1.9065040349960327, "Pretrain/Step": 6898, "Pretrain/Step Time": 8.656723164021969} +{"Pretrain/Learning Rate": 9.378642256940589e-06, "Pretrain/Loss": 1.935182809829712, "Pretrain/Loss (Raw)": 1.9126583337783813, "Pretrain/Step": 6899, "Pretrain/Step Time": 8.656709142029285} +{"Pretrain/Learning Rate": 9.372014762626401e-06, "Pretrain/Loss": 1.933847188949585, "Pretrain/Loss (Raw)": 1.893895149230957, "Pretrain/Step": 6900, "Pretrain/Step Time": 8.658265672624111} +{"Pretrain/Learning Rate": 9.36538907060511e-06, "Pretrain/Loss": 1.9315803050994873, "Pretrain/Loss (Raw)": 2.029592990875244, "Pretrain/Step": 6901, "Pretrain/Step Time": 8.653308544307947} +{"Pretrain/Learning Rate": 9.358765181640825e-06, "Pretrain/Loss": 1.9317214488983154, "Pretrain/Loss (Raw)": 2.1031038761138916, "Pretrain/Step": 6902, "Pretrain/Step Time": 8.65613909251988} +{"Pretrain/Learning Rate": 9.352143096497435e-06, "Pretrain/Loss": 1.9370954036712646, "Pretrain/Loss (Raw)": 2.060698986053467, "Pretrain/Step": 6903, "Pretrain/Step Time": 8.653740024194121} +{"Pretrain/Learning Rate": 9.345522815938645e-06, "Pretrain/Loss": 1.9381183385849, "Pretrain/Loss (Raw)": 1.9313664436340332, "Pretrain/Step": 6904, "Pretrain/Step Time": 8.662332400679588} +{"Pretrain/Learning Rate": 9.33890434072793e-06, "Pretrain/Loss": 1.9368267059326172, "Pretrain/Loss (Raw)": 1.9134775400161743, "Pretrain/Step": 6905, "Pretrain/Step Time": 8.6605308316648} +{"Pretrain/Learning Rate": 9.332287671628556e-06, "Pretrain/Loss": 1.9372920989990234, "Pretrain/Loss (Raw)": 1.9953323602676392, "Pretrain/Step": 6906, "Pretrain/Step Time": 8.662014681845903} +{"Pretrain/Learning Rate": 9.325672809403606e-06, "Pretrain/Loss": 1.938108205795288, "Pretrain/Loss (Raw)": 1.822016716003418, "Pretrain/Step": 6907, "Pretrain/Step Time": 8.65942201949656} +{"Pretrain/Learning Rate": 9.319059754815926e-06, "Pretrain/Loss": 1.9372899532318115, "Pretrain/Loss (Raw)": 1.8673956394195557, "Pretrain/Step": 6908, "Pretrain/Step Time": 8.662218963727355} +{"Pretrain/Learning Rate": 9.312448508628169e-06, "Pretrain/Loss": 1.9379489421844482, "Pretrain/Loss (Raw)": 2.129326581954956, "Pretrain/Step": 6909, "Pretrain/Step Time": 8.666883826255798} +{"Pretrain/Learning Rate": 9.30583907160276e-06, "Pretrain/Loss": 1.9379914999008179, "Pretrain/Loss (Raw)": 1.8728468418121338, "Pretrain/Step": 6910, "Pretrain/Step Time": 8.665557967498899} +{"Pretrain/Learning Rate": 9.299231444501953e-06, "Pretrain/Loss": 1.9401564598083496, "Pretrain/Loss (Raw)": 2.2137398719787598, "Pretrain/Step": 6911, "Pretrain/Step Time": 8.665600184351206} +{"Pretrain/Learning Rate": 9.29262562808776e-06, "Pretrain/Loss": 1.9420490264892578, "Pretrain/Loss (Raw)": 1.9855839014053345, "Pretrain/Step": 6912, "Pretrain/Step Time": 8.668497115373611} +{"Pretrain/Learning Rate": 9.286021623121993e-06, "Pretrain/Loss": 1.9415841102600098, "Pretrain/Loss (Raw)": 2.026888608932495, "Pretrain/Step": 6913, "Pretrain/Step Time": 8.668498145416379} +{"Pretrain/Learning Rate": 9.279419430366255e-06, "Pretrain/Loss": 1.939316749572754, "Pretrain/Loss (Raw)": 1.732131838798523, "Pretrain/Step": 6914, "Pretrain/Step Time": 8.667501956224442} +{"Pretrain/Learning Rate": 9.272819050581952e-06, "Pretrain/Loss": 1.9409880638122559, "Pretrain/Loss (Raw)": 2.067873477935791, "Pretrain/Step": 6915, "Pretrain/Step Time": 8.66832291521132} +{"Pretrain/Learning Rate": 9.266220484530263e-06, "Pretrain/Loss": 1.9406828880310059, "Pretrain/Loss (Raw)": 2.0228872299194336, "Pretrain/Step": 6916, "Pretrain/Step Time": 8.670867010951042} +{"Pretrain/Learning Rate": 9.259623732972173e-06, "Pretrain/Loss": 1.939730167388916, "Pretrain/Loss (Raw)": 1.9844335317611694, "Pretrain/Step": 6917, "Pretrain/Step Time": 8.667296228930354} +{"Pretrain/Learning Rate": 9.25302879666843e-06, "Pretrain/Loss": 1.940002679824829, "Pretrain/Loss (Raw)": 1.944483757019043, "Pretrain/Step": 6918, "Pretrain/Step Time": 8.663483517244458} +{"Pretrain/Learning Rate": 9.246435676379623e-06, "Pretrain/Loss": 1.9369215965270996, "Pretrain/Loss (Raw)": 1.7851080894470215, "Pretrain/Step": 6919, "Pretrain/Step Time": 8.659093040972948} +{"Pretrain/Learning Rate": 9.239844372866083e-06, "Pretrain/Loss": 1.939368724822998, "Pretrain/Loss (Raw)": 2.158052682876587, "Pretrain/Step": 6920, "Pretrain/Step Time": 8.664375960826874} +{"Pretrain/Learning Rate": 9.233254886887958e-06, "Pretrain/Loss": 1.9387009143829346, "Pretrain/Loss (Raw)": 1.9204856157302856, "Pretrain/Step": 6921, "Pretrain/Step Time": 8.661497699096799} +{"Pretrain/Learning Rate": 9.226667219205163e-06, "Pretrain/Loss": 1.9374775886535645, "Pretrain/Loss (Raw)": 1.9252982139587402, "Pretrain/Step": 6922, "Pretrain/Step Time": 8.665936227887869} +{"Pretrain/Learning Rate": 9.220081370577441e-06, "Pretrain/Loss": 1.9367094039916992, "Pretrain/Loss (Raw)": 1.9351866245269775, "Pretrain/Step": 6923, "Pretrain/Step Time": 8.667523356154561} +{"Pretrain/Learning Rate": 9.21349734176429e-06, "Pretrain/Loss": 1.9375567436218262, "Pretrain/Loss (Raw)": 2.0718047618865967, "Pretrain/Step": 6924, "Pretrain/Step Time": 8.668248480185866} +{"Pretrain/Learning Rate": 9.206915133525016e-06, "Pretrain/Loss": 1.9348700046539307, "Pretrain/Loss (Raw)": 1.6925535202026367, "Pretrain/Step": 6925, "Pretrain/Step Time": 8.66828247345984} +{"Pretrain/Learning Rate": 9.2003347466187e-06, "Pretrain/Loss": 1.9356672763824463, "Pretrain/Loss (Raw)": 1.9879004955291748, "Pretrain/Step": 6926, "Pretrain/Step Time": 8.663940342143178} +{"Pretrain/Learning Rate": 9.193756181804248e-06, "Pretrain/Loss": 1.9348993301391602, "Pretrain/Loss (Raw)": 1.9387834072113037, "Pretrain/Step": 6927, "Pretrain/Step Time": 8.666135590523481} +{"Pretrain/Learning Rate": 9.1871794398403e-06, "Pretrain/Loss": 1.9320793151855469, "Pretrain/Loss (Raw)": 1.836333990097046, "Pretrain/Step": 6928, "Pretrain/Step Time": 8.667155848816037} +{"Pretrain/Learning Rate": 9.180604521485337e-06, "Pretrain/Loss": 1.9333066940307617, "Pretrain/Loss (Raw)": 2.089369535446167, "Pretrain/Step": 6929, "Pretrain/Step Time": 8.667995173484087} +{"Pretrain/Learning Rate": 9.174031427497595e-06, "Pretrain/Loss": 1.933950662612915, "Pretrain/Loss (Raw)": 1.9624193906784058, "Pretrain/Step": 6930, "Pretrain/Step Time": 8.665619159117341} +{"Pretrain/Learning Rate": 9.167460158635141e-06, "Pretrain/Loss": 1.9354318380355835, "Pretrain/Loss (Raw)": 2.091416120529175, "Pretrain/Step": 6931, "Pretrain/Step Time": 8.664101511240005} +{"Pretrain/Learning Rate": 9.16089071565577e-06, "Pretrain/Loss": 1.935396432876587, "Pretrain/Loss (Raw)": 1.9518508911132812, "Pretrain/Step": 6932, "Pretrain/Step Time": 8.664722023531795} +{"Pretrain/Learning Rate": 9.154323099317128e-06, "Pretrain/Loss": 1.9375029802322388, "Pretrain/Loss (Raw)": 2.3367083072662354, "Pretrain/Step": 6933, "Pretrain/Step Time": 8.663041356950998} +{"Pretrain/Learning Rate": 9.147757310376612e-06, "Pretrain/Loss": 1.9394803047180176, "Pretrain/Loss (Raw)": 2.072507619857788, "Pretrain/Step": 6934, "Pretrain/Step Time": 8.658981129527092} +{"Pretrain/Learning Rate": 9.14119334959142e-06, "Pretrain/Loss": 1.9395606517791748, "Pretrain/Loss (Raw)": 1.9710320234298706, "Pretrain/Step": 6935, "Pretrain/Step Time": 8.659256422892213} +{"Pretrain/Learning Rate": 9.134631217718534e-06, "Pretrain/Loss": 1.9409259557724, "Pretrain/Loss (Raw)": 2.0821151733398438, "Pretrain/Step": 6936, "Pretrain/Step Time": 8.661470897495747} +{"Pretrain/Learning Rate": 9.128070915514744e-06, "Pretrain/Loss": 1.9419758319854736, "Pretrain/Loss (Raw)": 1.8412222862243652, "Pretrain/Step": 6937, "Pretrain/Step Time": 8.663246490061283} +{"Pretrain/Learning Rate": 9.121512443736607e-06, "Pretrain/Loss": 1.9439737796783447, "Pretrain/Loss (Raw)": 2.223310947418213, "Pretrain/Step": 6938, "Pretrain/Step Time": 8.660943111404777} +{"Pretrain/Learning Rate": 9.114955803140476e-06, "Pretrain/Loss": 1.9460372924804688, "Pretrain/Loss (Raw)": 2.04111647605896, "Pretrain/Step": 6939, "Pretrain/Step Time": 8.659217830747366} +{"Pretrain/Learning Rate": 9.108400994482485e-06, "Pretrain/Loss": 1.9466533660888672, "Pretrain/Loss (Raw)": 2.0877339839935303, "Pretrain/Step": 6940, "Pretrain/Step Time": 8.659304916858673} +{"Pretrain/Learning Rate": 9.101848018518586e-06, "Pretrain/Loss": 1.9489063024520874, "Pretrain/Loss (Raw)": 2.1816649436950684, "Pretrain/Step": 6941, "Pretrain/Step Time": 8.654794227331877} +{"Pretrain/Learning Rate": 9.09529687600449e-06, "Pretrain/Loss": 1.9474263191223145, "Pretrain/Loss (Raw)": 1.747725248336792, "Pretrain/Step": 6942, "Pretrain/Step Time": 8.658227507025003} +{"Pretrain/Learning Rate": 9.0887475676957e-06, "Pretrain/Loss": 1.949988842010498, "Pretrain/Loss (Raw)": 2.198596715927124, "Pretrain/Step": 6943, "Pretrain/Step Time": 8.658210098743439} +{"Pretrain/Learning Rate": 9.082200094347506e-06, "Pretrain/Loss": 1.9495787620544434, "Pretrain/Loss (Raw)": 1.9693952798843384, "Pretrain/Step": 6944, "Pretrain/Step Time": 8.661664931103587} +{"Pretrain/Learning Rate": 9.075654456715016e-06, "Pretrain/Loss": 1.9499623775482178, "Pretrain/Loss (Raw)": 1.9151947498321533, "Pretrain/Step": 6945, "Pretrain/Step Time": 8.662308955565095} +{"Pretrain/Learning Rate": 9.069110655553093e-06, "Pretrain/Loss": 1.9487563371658325, "Pretrain/Loss (Raw)": 1.8424748182296753, "Pretrain/Step": 6946, "Pretrain/Step Time": 8.66107471100986} +{"Pretrain/Learning Rate": 9.062568691616389e-06, "Pretrain/Loss": 1.947291374206543, "Pretrain/Loss (Raw)": 2.039026975631714, "Pretrain/Step": 6947, "Pretrain/Step Time": 8.660726414993405} +{"Pretrain/Learning Rate": 9.056028565659369e-06, "Pretrain/Loss": 1.9479809999465942, "Pretrain/Loss (Raw)": 2.089829921722412, "Pretrain/Step": 6948, "Pretrain/Step Time": 8.66369566693902} +{"Pretrain/Learning Rate": 9.049490278436269e-06, "Pretrain/Loss": 1.94574773311615, "Pretrain/Loss (Raw)": 1.8986492156982422, "Pretrain/Step": 6949, "Pretrain/Step Time": 8.662707205861807} +{"Pretrain/Learning Rate": 9.04295383070111e-06, "Pretrain/Loss": 1.9469473361968994, "Pretrain/Loss (Raw)": 2.208897113800049, "Pretrain/Step": 6950, "Pretrain/Step Time": 8.664136512205005} +{"Pretrain/Learning Rate": 9.036419223207699e-06, "Pretrain/Loss": 1.945159912109375, "Pretrain/Loss (Raw)": 2.026651620864868, "Pretrain/Step": 6951, "Pretrain/Step Time": 8.663651540875435} +{"Pretrain/Learning Rate": 9.029886456709652e-06, "Pretrain/Loss": 1.9474806785583496, "Pretrain/Loss (Raw)": 2.1481099128723145, "Pretrain/Step": 6952, "Pretrain/Step Time": 8.66690718010068} +{"Pretrain/Learning Rate": 9.023355531960353e-06, "Pretrain/Loss": 1.9478663206100464, "Pretrain/Loss (Raw)": 2.0774359703063965, "Pretrain/Step": 6953, "Pretrain/Step Time": 8.664564307779074} +{"Pretrain/Learning Rate": 9.016826449712981e-06, "Pretrain/Loss": 1.9475746154785156, "Pretrain/Loss (Raw)": 1.7910536527633667, "Pretrain/Step": 6954, "Pretrain/Step Time": 8.666386023163795} +{"Pretrain/Learning Rate": 9.010299210720487e-06, "Pretrain/Loss": 1.9470902681350708, "Pretrain/Loss (Raw)": 1.775219440460205, "Pretrain/Step": 6955, "Pretrain/Step Time": 8.6672049947083} +{"Pretrain/Learning Rate": 9.003773815735644e-06, "Pretrain/Loss": 1.9478877782821655, "Pretrain/Loss (Raw)": 2.1432135105133057, "Pretrain/Step": 6956, "Pretrain/Step Time": 8.668392412364483} +{"Pretrain/Learning Rate": 8.997250265510984e-06, "Pretrain/Loss": 1.9469902515411377, "Pretrain/Loss (Raw)": 1.8798290491104126, "Pretrain/Step": 6957, "Pretrain/Step Time": 8.665563946589828} +{"Pretrain/Learning Rate": 8.990728560798827e-06, "Pretrain/Loss": 1.947120189666748, "Pretrain/Loss (Raw)": 1.8582152128219604, "Pretrain/Step": 6958, "Pretrain/Step Time": 8.666851382702589} +{"Pretrain/Learning Rate": 8.984208702351281e-06, "Pretrain/Loss": 1.9461839199066162, "Pretrain/Loss (Raw)": 1.8400907516479492, "Pretrain/Step": 6959, "Pretrain/Step Time": 8.667905364185572} +{"Pretrain/Learning Rate": 8.977690690920269e-06, "Pretrain/Loss": 1.9475265741348267, "Pretrain/Loss (Raw)": 2.1015961170196533, "Pretrain/Step": 6960, "Pretrain/Step Time": 8.6638272870332} +{"Pretrain/Learning Rate": 8.971174527257464e-06, "Pretrain/Loss": 1.9509742259979248, "Pretrain/Loss (Raw)": 1.909546136856079, "Pretrain/Step": 6961, "Pretrain/Step Time": 8.662753906100988} +{"Pretrain/Learning Rate": 8.964660212114343e-06, "Pretrain/Loss": 1.9508074522018433, "Pretrain/Loss (Raw)": 2.009793281555176, "Pretrain/Step": 6962, "Pretrain/Step Time": 8.66397119499743} +{"Pretrain/Learning Rate": 8.958147746242157e-06, "Pretrain/Loss": 1.9510691165924072, "Pretrain/Loss (Raw)": 2.0493648052215576, "Pretrain/Step": 6963, "Pretrain/Step Time": 8.657109655439854} +{"Pretrain/Learning Rate": 8.951637130391976e-06, "Pretrain/Loss": 1.954033613204956, "Pretrain/Loss (Raw)": 2.1069753170013428, "Pretrain/Step": 6964, "Pretrain/Step Time": 8.652520179748535} +{"Pretrain/Learning Rate": 8.945128365314622e-06, "Pretrain/Loss": 1.9541698694229126, "Pretrain/Loss (Raw)": 1.8838162422180176, "Pretrain/Step": 6965, "Pretrain/Step Time": 8.654951848089695} +{"Pretrain/Learning Rate": 8.938621451760718e-06, "Pretrain/Loss": 1.951744794845581, "Pretrain/Loss (Raw)": 1.7768652439117432, "Pretrain/Step": 6966, "Pretrain/Step Time": 8.655512165278196} +{"Pretrain/Learning Rate": 8.932116390480663e-06, "Pretrain/Loss": 1.9531267881393433, "Pretrain/Loss (Raw)": 2.02337908744812, "Pretrain/Step": 6967, "Pretrain/Step Time": 8.65587368234992} +{"Pretrain/Learning Rate": 8.925613182224678e-06, "Pretrain/Loss": 1.9582154750823975, "Pretrain/Loss (Raw)": 1.9704012870788574, "Pretrain/Step": 6968, "Pretrain/Step Time": 8.653797401115298} +{"Pretrain/Learning Rate": 8.919111827742708e-06, "Pretrain/Loss": 1.9565620422363281, "Pretrain/Loss (Raw)": 1.78477144241333, "Pretrain/Step": 6969, "Pretrain/Step Time": 8.652583779767156} +{"Pretrain/Learning Rate": 8.912612327784547e-06, "Pretrain/Loss": 1.957132339477539, "Pretrain/Loss (Raw)": 1.8519792556762695, "Pretrain/Step": 6970, "Pretrain/Step Time": 8.650305598974228} +{"Pretrain/Learning Rate": 8.906114683099732e-06, "Pretrain/Loss": 1.955854892730713, "Pretrain/Loss (Raw)": 2.0470731258392334, "Pretrain/Step": 6971, "Pretrain/Step Time": 8.651590513065457} +{"Pretrain/Learning Rate": 8.899618894437622e-06, "Pretrain/Loss": 1.9567601680755615, "Pretrain/Loss (Raw)": 2.1062328815460205, "Pretrain/Step": 6972, "Pretrain/Step Time": 8.649517809972167} +{"Pretrain/Learning Rate": 8.893124962547311e-06, "Pretrain/Loss": 1.9562758207321167, "Pretrain/Loss (Raw)": 1.9902790784835815, "Pretrain/Step": 6973, "Pretrain/Step Time": 8.647667249664664} +{"Pretrain/Learning Rate": 8.88663288817774e-06, "Pretrain/Loss": 1.9575281143188477, "Pretrain/Loss (Raw)": 2.016634225845337, "Pretrain/Step": 6974, "Pretrain/Step Time": 8.65068987570703} +{"Pretrain/Learning Rate": 8.880142672077582e-06, "Pretrain/Loss": 1.9581787586212158, "Pretrain/Loss (Raw)": 2.0949299335479736, "Pretrain/Step": 6975, "Pretrain/Step Time": 8.647557202726603} +{"Pretrain/Learning Rate": 8.873654314995348e-06, "Pretrain/Loss": 1.958908200263977, "Pretrain/Loss (Raw)": 1.942478060722351, "Pretrain/Step": 6976, "Pretrain/Step Time": 8.646582750603557} +{"Pretrain/Learning Rate": 8.86716781767927e-06, "Pretrain/Loss": 1.9571762084960938, "Pretrain/Loss (Raw)": 1.7219736576080322, "Pretrain/Step": 6977, "Pretrain/Step Time": 8.645181022584438} +{"Pretrain/Learning Rate": 8.86068318087743e-06, "Pretrain/Loss": 1.9576125144958496, "Pretrain/Loss (Raw)": 2.1135377883911133, "Pretrain/Step": 6978, "Pretrain/Step Time": 8.647947296500206} +{"Pretrain/Learning Rate": 8.854200405337657e-06, "Pretrain/Loss": 1.9577927589416504, "Pretrain/Loss (Raw)": 1.9894194602966309, "Pretrain/Step": 6979, "Pretrain/Step Time": 8.645811619237065} +{"Pretrain/Learning Rate": 8.847719491807572e-06, "Pretrain/Loss": 1.9560198783874512, "Pretrain/Loss (Raw)": 1.7666765451431274, "Pretrain/Step": 6980, "Pretrain/Step Time": 8.647319244220853} +{"Pretrain/Learning Rate": 8.841240441034579e-06, "Pretrain/Loss": 1.9547237157821655, "Pretrain/Loss (Raw)": 2.0054242610931396, "Pretrain/Step": 6981, "Pretrain/Step Time": 8.646421799436212} +{"Pretrain/Learning Rate": 8.83476325376589e-06, "Pretrain/Loss": 1.952929973602295, "Pretrain/Loss (Raw)": 1.7912678718566895, "Pretrain/Step": 6982, "Pretrain/Step Time": 8.653146060183644} +{"Pretrain/Learning Rate": 8.828287930748477e-06, "Pretrain/Loss": 1.9545726776123047, "Pretrain/Loss (Raw)": 1.9163872003555298, "Pretrain/Step": 6983, "Pretrain/Step Time": 8.651879763230681} +{"Pretrain/Learning Rate": 8.821814472729104e-06, "Pretrain/Loss": 1.95352041721344, "Pretrain/Loss (Raw)": 1.8133200407028198, "Pretrain/Step": 6984, "Pretrain/Step Time": 8.6518874745816} +{"Pretrain/Learning Rate": 8.815342880454311e-06, "Pretrain/Loss": 1.9520390033721924, "Pretrain/Loss (Raw)": 1.8928593397140503, "Pretrain/Step": 6985, "Pretrain/Step Time": 8.650553720071912} +{"Pretrain/Learning Rate": 8.80887315467045e-06, "Pretrain/Loss": 1.953005075454712, "Pretrain/Loss (Raw)": 1.984981894493103, "Pretrain/Step": 6986, "Pretrain/Step Time": 8.651845432817936} +{"Pretrain/Learning Rate": 8.80240529612363e-06, "Pretrain/Loss": 1.9544075727462769, "Pretrain/Loss (Raw)": 2.0741429328918457, "Pretrain/Step": 6987, "Pretrain/Step Time": 8.652657004073262} +{"Pretrain/Learning Rate": 8.79593930555975e-06, "Pretrain/Loss": 1.9539401531219482, "Pretrain/Loss (Raw)": 1.8674030303955078, "Pretrain/Step": 6988, "Pretrain/Step Time": 8.654573636129498} +{"Pretrain/Learning Rate": 8.789475183724514e-06, "Pretrain/Loss": 1.955582857131958, "Pretrain/Loss (Raw)": 2.0430991649627686, "Pretrain/Step": 6989, "Pretrain/Step Time": 8.659086778759956} +{"Pretrain/Learning Rate": 8.783012931363385e-06, "Pretrain/Loss": 1.9561424255371094, "Pretrain/Loss (Raw)": 2.0290639400482178, "Pretrain/Step": 6990, "Pretrain/Step Time": 8.657301217317581} +{"Pretrain/Learning Rate": 8.776552549221623e-06, "Pretrain/Loss": 1.9535655975341797, "Pretrain/Loss (Raw)": 1.7360073328018188, "Pretrain/Step": 6991, "Pretrain/Step Time": 8.655712692067027} +{"Pretrain/Learning Rate": 8.770094038044257e-06, "Pretrain/Loss": 1.9546313285827637, "Pretrain/Loss (Raw)": 1.988978385925293, "Pretrain/Step": 6992, "Pretrain/Step Time": 8.658042138442397} +{"Pretrain/Learning Rate": 8.763637398576135e-06, "Pretrain/Loss": 1.9560655355453491, "Pretrain/Loss (Raw)": 2.0566089153289795, "Pretrain/Step": 6993, "Pretrain/Step Time": 8.658022571355104} +{"Pretrain/Learning Rate": 8.757182631561859e-06, "Pretrain/Loss": 1.954495906829834, "Pretrain/Loss (Raw)": 1.8228250741958618, "Pretrain/Step": 6994, "Pretrain/Step Time": 8.65305177308619} +{"Pretrain/Learning Rate": 8.750729737745819e-06, "Pretrain/Loss": 1.9538804292678833, "Pretrain/Loss (Raw)": 1.8986930847167969, "Pretrain/Step": 6995, "Pretrain/Step Time": 8.64852249249816} +{"Pretrain/Learning Rate": 8.744278717872185e-06, "Pretrain/Loss": 1.9537861347198486, "Pretrain/Loss (Raw)": 2.082472324371338, "Pretrain/Step": 6996, "Pretrain/Step Time": 8.65006355382502} +{"Pretrain/Learning Rate": 8.73782957268494e-06, "Pretrain/Loss": 1.9527435302734375, "Pretrain/Loss (Raw)": 2.048549175262451, "Pretrain/Step": 6997, "Pretrain/Step Time": 8.647036913782358} +{"Pretrain/Learning Rate": 8.731382302927813e-06, "Pretrain/Loss": 1.9546600580215454, "Pretrain/Loss (Raw)": 2.0686097145080566, "Pretrain/Step": 6998, "Pretrain/Step Time": 8.647177491337061} +{"Pretrain/Learning Rate": 8.724936909344342e-06, "Pretrain/Loss": 1.9552342891693115, "Pretrain/Loss (Raw)": 1.9669978618621826, "Pretrain/Step": 6999, "Pretrain/Step Time": 8.646343464031816} +{"Pretrain/Learning Rate": 8.718493392677829e-06, "Pretrain/Loss": 1.9576592445373535, "Pretrain/Loss (Raw)": 2.0900323390960693, "Pretrain/Step": 7000, "Pretrain/Step Time": 8.64771917834878} +{"Pretrain/Learning Rate": 8.712051753671389e-06, "Pretrain/Loss": 1.9574429988861084, "Pretrain/Loss (Raw)": 1.8293408155441284, "Pretrain/Step": 7001, "Pretrain/Step Time": 8.649967649951577} +{"Pretrain/Learning Rate": 8.705611993067892e-06, "Pretrain/Loss": 1.9580166339874268, "Pretrain/Loss (Raw)": 1.8277620077133179, "Pretrain/Step": 7002, "Pretrain/Step Time": 8.648972602561116} +{"Pretrain/Learning Rate": 8.699174111609998e-06, "Pretrain/Loss": 1.9572280645370483, "Pretrain/Loss (Raw)": 1.8939629793167114, "Pretrain/Step": 7003, "Pretrain/Step Time": 8.651078892871737} +{"Pretrain/Learning Rate": 8.692738110040152e-06, "Pretrain/Loss": 1.9554939270019531, "Pretrain/Loss (Raw)": 1.855614185333252, "Pretrain/Step": 7004, "Pretrain/Step Time": 8.651515761390328} +{"Pretrain/Learning Rate": 8.686303989100596e-06, "Pretrain/Loss": 1.9571154117584229, "Pretrain/Loss (Raw)": 2.0137548446655273, "Pretrain/Step": 7005, "Pretrain/Step Time": 8.65098361670971} +{"Pretrain/Learning Rate": 8.679871749533338e-06, "Pretrain/Loss": 1.9564266204833984, "Pretrain/Loss (Raw)": 1.8760929107666016, "Pretrain/Step": 7006, "Pretrain/Step Time": 8.648992735892534} +{"Pretrain/Learning Rate": 8.673441392080173e-06, "Pretrain/Loss": 1.9532849788665771, "Pretrain/Loss (Raw)": 1.6981358528137207, "Pretrain/Step": 7007, "Pretrain/Step Time": 8.64818368665874} +{"Pretrain/Learning Rate": 8.667012917482673e-06, "Pretrain/Loss": 1.951741099357605, "Pretrain/Loss (Raw)": 1.7305090427398682, "Pretrain/Step": 7008, "Pretrain/Step Time": 8.63982672803104} +{"Pretrain/Learning Rate": 8.66058632648222e-06, "Pretrain/Loss": 1.953086256980896, "Pretrain/Loss (Raw)": 2.105215072631836, "Pretrain/Step": 7009, "Pretrain/Step Time": 8.637245759367943} +{"Pretrain/Learning Rate": 8.654161619819931e-06, "Pretrain/Loss": 1.9511953592300415, "Pretrain/Loss (Raw)": 1.868255376815796, "Pretrain/Step": 7010, "Pretrain/Step Time": 8.687122944742441} +{"Pretrain/Learning Rate": 8.647738798236757e-06, "Pretrain/Loss": 1.9483258724212646, "Pretrain/Loss (Raw)": 1.7615151405334473, "Pretrain/Step": 7011, "Pretrain/Step Time": 8.68778276629746} +{"Pretrain/Learning Rate": 8.641317862473392e-06, "Pretrain/Loss": 1.9531753063201904, "Pretrain/Loss (Raw)": 1.851251244544983, "Pretrain/Step": 7012, "Pretrain/Step Time": 8.807615863159299} +{"Pretrain/Learning Rate": 8.634898813270348e-06, "Pretrain/Loss": 1.952554702758789, "Pretrain/Loss (Raw)": 1.7635724544525146, "Pretrain/Step": 7013, "Pretrain/Step Time": 8.825805809348822} +{"Pretrain/Learning Rate": 8.628481651367876e-06, "Pretrain/Loss": 1.9522913694381714, "Pretrain/Loss (Raw)": 1.9615710973739624, "Pretrain/Step": 7014, "Pretrain/Step Time": 8.949758185073733} +{"Pretrain/Learning Rate": 8.622066377506049e-06, "Pretrain/Loss": 1.951827883720398, "Pretrain/Loss (Raw)": 1.9635119438171387, "Pretrain/Step": 7015, "Pretrain/Step Time": 8.977873917669058} +{"Pretrain/Learning Rate": 8.615652992424697e-06, "Pretrain/Loss": 1.9508285522460938, "Pretrain/Loss (Raw)": 1.8881441354751587, "Pretrain/Step": 7016, "Pretrain/Step Time": 9.061694763600826} +{"Pretrain/Learning Rate": 8.609241496863463e-06, "Pretrain/Loss": 1.9508509635925293, "Pretrain/Loss (Raw)": 1.8789399862289429, "Pretrain/Step": 7017, "Pretrain/Step Time": 9.059150772169232} +{"Pretrain/Learning Rate": 8.602831891561718e-06, "Pretrain/Loss": 1.9566055536270142, "Pretrain/Loss (Raw)": 1.954681634902954, "Pretrain/Step": 7018, "Pretrain/Step Time": 9.122744800522923} +{"Pretrain/Learning Rate": 8.596424177258677e-06, "Pretrain/Loss": 1.9579912424087524, "Pretrain/Loss (Raw)": 1.9508140087127686, "Pretrain/Step": 7019, "Pretrain/Step Time": 9.120119173079729} +{"Pretrain/Learning Rate": 8.590018354693293e-06, "Pretrain/Loss": 1.9587624073028564, "Pretrain/Loss (Raw)": 2.0689287185668945, "Pretrain/Step": 7020, "Pretrain/Step Time": 9.12010837905109} +{"Pretrain/Learning Rate": 8.583614424604322e-06, "Pretrain/Loss": 1.9607493877410889, "Pretrain/Loss (Raw)": 1.9830621480941772, "Pretrain/Step": 7021, "Pretrain/Step Time": 9.115867478772998} +{"Pretrain/Learning Rate": 8.57721238773028e-06, "Pretrain/Loss": 1.9598571062088013, "Pretrain/Loss (Raw)": 1.852310061454773, "Pretrain/Step": 7022, "Pretrain/Step Time": 9.116037763655186} +{"Pretrain/Learning Rate": 8.570812244809504e-06, "Pretrain/Loss": 1.9600924253463745, "Pretrain/Loss (Raw)": 2.0150091648101807, "Pretrain/Step": 7023, "Pretrain/Step Time": 9.117793951183558} +{"Pretrain/Learning Rate": 8.564413996580073e-06, "Pretrain/Loss": 1.961073875427246, "Pretrain/Loss (Raw)": 2.280548095703125, "Pretrain/Step": 7024, "Pretrain/Step Time": 9.116383643820882} +{"Pretrain/Learning Rate": 8.55801764377987e-06, "Pretrain/Loss": 1.9631757736206055, "Pretrain/Loss (Raw)": 1.9287232160568237, "Pretrain/Step": 7025, "Pretrain/Step Time": 9.114781657233834} +{"Pretrain/Learning Rate": 8.551623187146537e-06, "Pretrain/Loss": 1.9647585153579712, "Pretrain/Loss (Raw)": 2.1090917587280273, "Pretrain/Step": 7026, "Pretrain/Step Time": 9.115928834304214} +{"Pretrain/Learning Rate": 8.545230627417539e-06, "Pretrain/Loss": 1.9645633697509766, "Pretrain/Loss (Raw)": 1.8876862525939941, "Pretrain/Step": 7027, "Pretrain/Step Time": 9.117047308012843} +{"Pretrain/Learning Rate": 8.538839965330079e-06, "Pretrain/Loss": 1.9648805856704712, "Pretrain/Loss (Raw)": 1.934492588043213, "Pretrain/Step": 7028, "Pretrain/Step Time": 9.11744069866836} +{"Pretrain/Learning Rate": 8.532451201621156e-06, "Pretrain/Loss": 1.963854193687439, "Pretrain/Loss (Raw)": 1.898215889930725, "Pretrain/Step": 7029, "Pretrain/Step Time": 9.118494281545281} +{"Pretrain/Learning Rate": 8.526064337027565e-06, "Pretrain/Loss": 1.9632163047790527, "Pretrain/Loss (Raw)": 2.0214693546295166, "Pretrain/Step": 7030, "Pretrain/Step Time": 9.119179707020521} +{"Pretrain/Learning Rate": 8.519679372285861e-06, "Pretrain/Loss": 1.9611576795578003, "Pretrain/Loss (Raw)": 1.797183632850647, "Pretrain/Step": 7031, "Pretrain/Step Time": 9.12190735526383} +{"Pretrain/Learning Rate": 8.51329630813239e-06, "Pretrain/Loss": 1.9599504470825195, "Pretrain/Loss (Raw)": 1.776837944984436, "Pretrain/Step": 7032, "Pretrain/Step Time": 9.111042698845267} +{"Pretrain/Learning Rate": 8.506915145303268e-06, "Pretrain/Loss": 1.9607871770858765, "Pretrain/Loss (Raw)": 2.0205812454223633, "Pretrain/Step": 7033, "Pretrain/Step Time": 9.111838353797793} +{"Pretrain/Learning Rate": 8.50053588453442e-06, "Pretrain/Loss": 1.960457444190979, "Pretrain/Loss (Raw)": 1.953127145767212, "Pretrain/Step": 7034, "Pretrain/Step Time": 9.11187495291233} +{"Pretrain/Learning Rate": 8.49415852656152e-06, "Pretrain/Loss": 1.9618232250213623, "Pretrain/Loss (Raw)": 1.9968385696411133, "Pretrain/Step": 7035, "Pretrain/Step Time": 9.112781703472137} +{"Pretrain/Learning Rate": 8.487783072120036e-06, "Pretrain/Loss": 1.9617345333099365, "Pretrain/Loss (Raw)": 1.856048583984375, "Pretrain/Step": 7036, "Pretrain/Step Time": 9.114219956099987} +{"Pretrain/Learning Rate": 8.48140952194521e-06, "Pretrain/Loss": 1.959063172340393, "Pretrain/Loss (Raw)": 1.7873828411102295, "Pretrain/Step": 7037, "Pretrain/Step Time": 9.106870708987117} +{"Pretrain/Learning Rate": 8.475037876772085e-06, "Pretrain/Loss": 1.9614965915679932, "Pretrain/Loss (Raw)": 2.1843271255493164, "Pretrain/Step": 7038, "Pretrain/Step Time": 9.105617033317685} +{"Pretrain/Learning Rate": 8.468668137335459e-06, "Pretrain/Loss": 1.958635687828064, "Pretrain/Loss (Raw)": 1.8475441932678223, "Pretrain/Step": 7039, "Pretrain/Step Time": 9.110544366762042} +{"Pretrain/Learning Rate": 8.462300304369921e-06, "Pretrain/Loss": 1.9610905647277832, "Pretrain/Loss (Raw)": 2.299811363220215, "Pretrain/Step": 7040, "Pretrain/Step Time": 9.105703806504607} +{"Pretrain/Learning Rate": 8.455934378609834e-06, "Pretrain/Loss": 1.9618542194366455, "Pretrain/Loss (Raw)": 2.124643325805664, "Pretrain/Step": 7041, "Pretrain/Step Time": 9.10661294311285} +{"Pretrain/Learning Rate": 8.449570360789358e-06, "Pretrain/Loss": 1.9638316631317139, "Pretrain/Loss (Raw)": 1.9852312803268433, "Pretrain/Step": 7042, "Pretrain/Step Time": 9.1036317627877} +{"Pretrain/Learning Rate": 8.443208251642417e-06, "Pretrain/Loss": 1.963786244392395, "Pretrain/Loss (Raw)": 2.062063694000244, "Pretrain/Step": 7043, "Pretrain/Step Time": 9.101132296025753} +{"Pretrain/Learning Rate": 8.436848051902721e-06, "Pretrain/Loss": 1.9647268056869507, "Pretrain/Loss (Raw)": 2.1432695388793945, "Pretrain/Step": 7044, "Pretrain/Step Time": 9.101340483874083} +{"Pretrain/Learning Rate": 8.430489762303745e-06, "Pretrain/Loss": 1.9642999172210693, "Pretrain/Loss (Raw)": 1.929789662361145, "Pretrain/Step": 7045, "Pretrain/Step Time": 9.108713332563639} +{"Pretrain/Learning Rate": 8.424133383578778e-06, "Pretrain/Loss": 1.963672399520874, "Pretrain/Loss (Raw)": 1.8641833066940308, "Pretrain/Step": 7046, "Pretrain/Step Time": 9.105873825028539} +{"Pretrain/Learning Rate": 8.417778916460856e-06, "Pretrain/Loss": 1.965597152709961, "Pretrain/Loss (Raw)": 2.0314695835113525, "Pretrain/Step": 7047, "Pretrain/Step Time": 9.101904552429914} +{"Pretrain/Learning Rate": 8.411426361682806e-06, "Pretrain/Loss": 1.9625171422958374, "Pretrain/Loss (Raw)": 1.7638076543807983, "Pretrain/Step": 7048, "Pretrain/Step Time": 9.10431951470673} +{"Pretrain/Learning Rate": 8.40507571997723e-06, "Pretrain/Loss": 1.9632432460784912, "Pretrain/Loss (Raw)": 2.0134329795837402, "Pretrain/Step": 7049, "Pretrain/Step Time": 9.105030419304967} +{"Pretrain/Learning Rate": 8.398726992076534e-06, "Pretrain/Loss": 1.964451551437378, "Pretrain/Loss (Raw)": 2.079968214035034, "Pretrain/Step": 7050, "Pretrain/Step Time": 9.099502826109529} +{"Pretrain/Learning Rate": 8.392380178712852e-06, "Pretrain/Loss": 1.9665842056274414, "Pretrain/Loss (Raw)": 2.2081520557403564, "Pretrain/Step": 7051, "Pretrain/Step Time": 9.099622098729014} +{"Pretrain/Learning Rate": 8.386035280618156e-06, "Pretrain/Loss": 1.9650450944900513, "Pretrain/Loss (Raw)": 1.8748050928115845, "Pretrain/Step": 7052, "Pretrain/Step Time": 9.101701064035296} +{"Pretrain/Learning Rate": 8.37969229852415e-06, "Pretrain/Loss": 1.9671359062194824, "Pretrain/Loss (Raw)": 1.960176944732666, "Pretrain/Step": 7053, "Pretrain/Step Time": 9.095296110957861} +{"Pretrain/Learning Rate": 8.373351233162362e-06, "Pretrain/Loss": 1.9683928489685059, "Pretrain/Loss (Raw)": 2.1487858295440674, "Pretrain/Step": 7054, "Pretrain/Step Time": 9.104440419003367} +{"Pretrain/Learning Rate": 8.367012085264042e-06, "Pretrain/Loss": 1.9685661792755127, "Pretrain/Loss (Raw)": 1.9609589576721191, "Pretrain/Step": 7055, "Pretrain/Step Time": 9.103066084906459} +{"Pretrain/Learning Rate": 8.360674855560274e-06, "Pretrain/Loss": 1.9704339504241943, "Pretrain/Loss (Raw)": 2.075416088104248, "Pretrain/Step": 7056, "Pretrain/Step Time": 9.098658161237836} +{"Pretrain/Learning Rate": 8.354339544781878e-06, "Pretrain/Loss": 1.9720616340637207, "Pretrain/Loss (Raw)": 2.2977118492126465, "Pretrain/Step": 7057, "Pretrain/Step Time": 9.095375273376703} +{"Pretrain/Learning Rate": 8.348006153659502e-06, "Pretrain/Loss": 1.9721662998199463, "Pretrain/Loss (Raw)": 1.975826621055603, "Pretrain/Step": 7058, "Pretrain/Step Time": 9.09882708080113} +{"Pretrain/Learning Rate": 8.341674682923503e-06, "Pretrain/Loss": 1.9724440574645996, "Pretrain/Loss (Raw)": 2.1269643306732178, "Pretrain/Step": 7059, "Pretrain/Step Time": 9.100330157205462} +{"Pretrain/Learning Rate": 8.335345133304088e-06, "Pretrain/Loss": 1.9726288318634033, "Pretrain/Loss (Raw)": 1.9754908084869385, "Pretrain/Step": 7060, "Pretrain/Step Time": 9.099143743515015} +{"Pretrain/Learning Rate": 8.329017505531195e-06, "Pretrain/Loss": 1.972290277481079, "Pretrain/Loss (Raw)": 2.2933828830718994, "Pretrain/Step": 7061, "Pretrain/Step Time": 9.100495908409357} +{"Pretrain/Learning Rate": 8.322691800334562e-06, "Pretrain/Loss": 1.9723036289215088, "Pretrain/Loss (Raw)": 2.0742130279541016, "Pretrain/Step": 7062, "Pretrain/Step Time": 9.101745273917913} +{"Pretrain/Learning Rate": 8.316368018443688e-06, "Pretrain/Loss": 1.972163200378418, "Pretrain/Loss (Raw)": 1.953057050704956, "Pretrain/Step": 7063, "Pretrain/Step Time": 9.105462728068233} +{"Pretrain/Learning Rate": 8.310046160587878e-06, "Pretrain/Loss": 1.9716598987579346, "Pretrain/Loss (Raw)": 2.0177059173583984, "Pretrain/Step": 7064, "Pretrain/Step Time": 9.10420429892838} +{"Pretrain/Learning Rate": 8.303726227496191e-06, "Pretrain/Loss": 1.9717941284179688, "Pretrain/Loss (Raw)": 1.8584038019180298, "Pretrain/Step": 7065, "Pretrain/Step Time": 9.10703287832439} +{"Pretrain/Learning Rate": 8.297408219897471e-06, "Pretrain/Loss": 1.9729554653167725, "Pretrain/Loss (Raw)": 2.371950149536133, "Pretrain/Step": 7066, "Pretrain/Step Time": 9.11039574444294} +{"Pretrain/Learning Rate": 8.291092138520332e-06, "Pretrain/Loss": 1.9723870754241943, "Pretrain/Loss (Raw)": 1.9683493375778198, "Pretrain/Step": 7067, "Pretrain/Step Time": 9.111080715432763} +{"Pretrain/Learning Rate": 8.28477798409319e-06, "Pretrain/Loss": 1.9695806503295898, "Pretrain/Loss (Raw)": 1.728529453277588, "Pretrain/Step": 7068, "Pretrain/Step Time": 9.10713885910809} +{"Pretrain/Learning Rate": 8.278465757344214e-06, "Pretrain/Loss": 1.9685213565826416, "Pretrain/Loss (Raw)": 2.0460736751556396, "Pretrain/Step": 7069, "Pretrain/Step Time": 9.111251134425402} +{"Pretrain/Learning Rate": 8.272155459001366e-06, "Pretrain/Loss": 1.970860481262207, "Pretrain/Loss (Raw)": 2.047138214111328, "Pretrain/Step": 7070, "Pretrain/Step Time": 9.107029793784022} +{"Pretrain/Learning Rate": 8.265847089792362e-06, "Pretrain/Loss": 1.969702959060669, "Pretrain/Loss (Raw)": 2.0504274368286133, "Pretrain/Step": 7071, "Pretrain/Step Time": 9.110818123444915} +{"Pretrain/Learning Rate": 8.259540650444736e-06, "Pretrain/Loss": 1.9706939458847046, "Pretrain/Loss (Raw)": 2.0962462425231934, "Pretrain/Step": 7072, "Pretrain/Step Time": 9.10461468435824} +{"Pretrain/Learning Rate": 8.253236141685764e-06, "Pretrain/Loss": 1.9712724685668945, "Pretrain/Loss (Raw)": 1.9892356395721436, "Pretrain/Step": 7073, "Pretrain/Step Time": 9.106739919632673} +{"Pretrain/Learning Rate": 8.246933564242506e-06, "Pretrain/Loss": 1.9720618724822998, "Pretrain/Loss (Raw)": 1.9435337781906128, "Pretrain/Step": 7074, "Pretrain/Step Time": 9.106189964339137} +{"Pretrain/Learning Rate": 8.240632918841823e-06, "Pretrain/Loss": 1.9733282327651978, "Pretrain/Loss (Raw)": 2.20110821723938, "Pretrain/Step": 7075, "Pretrain/Step Time": 9.109574032947421} +{"Pretrain/Learning Rate": 8.234334206210323e-06, "Pretrain/Loss": 1.9714269638061523, "Pretrain/Loss (Raw)": 1.8464810848236084, "Pretrain/Step": 7076, "Pretrain/Step Time": 9.108257504180074} +{"Pretrain/Learning Rate": 8.228037427074403e-06, "Pretrain/Loss": 1.970349907875061, "Pretrain/Loss (Raw)": 1.7607797384262085, "Pretrain/Step": 7077, "Pretrain/Step Time": 9.110638659447432} +{"Pretrain/Learning Rate": 8.221742582160233e-06, "Pretrain/Loss": 1.9696391820907593, "Pretrain/Loss (Raw)": 2.1179258823394775, "Pretrain/Step": 7078, "Pretrain/Step Time": 9.110524689778686} +{"Pretrain/Learning Rate": 8.215449672193776e-06, "Pretrain/Loss": 1.969287633895874, "Pretrain/Loss (Raw)": 1.981655240058899, "Pretrain/Step": 7079, "Pretrain/Step Time": 9.110011372715235} +{"Pretrain/Learning Rate": 8.209158697900757e-06, "Pretrain/Loss": 1.9653902053833008, "Pretrain/Loss (Raw)": 1.6492325067520142, "Pretrain/Step": 7080, "Pretrain/Step Time": 9.115869646891952} +{"Pretrain/Learning Rate": 8.202869660006676e-06, "Pretrain/Loss": 1.9651250839233398, "Pretrain/Loss (Raw)": 2.0435047149658203, "Pretrain/Step": 7081, "Pretrain/Step Time": 9.121743893250823} +{"Pretrain/Learning Rate": 8.19658255923681e-06, "Pretrain/Loss": 1.9650962352752686, "Pretrain/Loss (Raw)": 1.787353515625, "Pretrain/Step": 7082, "Pretrain/Step Time": 9.120919536799192} +{"Pretrain/Learning Rate": 8.19029739631623e-06, "Pretrain/Loss": 1.9697883129119873, "Pretrain/Loss (Raw)": 2.3758115768432617, "Pretrain/Step": 7083, "Pretrain/Step Time": 9.12187128700316} +{"Pretrain/Learning Rate": 8.184014171969765e-06, "Pretrain/Loss": 1.968762993812561, "Pretrain/Loss (Raw)": 2.011974573135376, "Pretrain/Step": 7084, "Pretrain/Step Time": 9.118074985221028} +{"Pretrain/Learning Rate": 8.177732886922023e-06, "Pretrain/Loss": 1.9684107303619385, "Pretrain/Loss (Raw)": 1.8347432613372803, "Pretrain/Step": 7085, "Pretrain/Step Time": 9.120972398668528} +{"Pretrain/Learning Rate": 8.17145354189739e-06, "Pretrain/Loss": 1.9696080684661865, "Pretrain/Loss (Raw)": 2.011472463607788, "Pretrain/Step": 7086, "Pretrain/Step Time": 9.119949292391539} +{"Pretrain/Learning Rate": 8.16517613762004e-06, "Pretrain/Loss": 1.9701064825057983, "Pretrain/Loss (Raw)": 1.9038828611373901, "Pretrain/Step": 7087, "Pretrain/Step Time": 9.119662433862686} +{"Pretrain/Learning Rate": 8.158900674813904e-06, "Pretrain/Loss": 1.9680880308151245, "Pretrain/Loss (Raw)": 1.8432408571243286, "Pretrain/Step": 7088, "Pretrain/Step Time": 9.120217269286513} +{"Pretrain/Learning Rate": 8.1526271542027e-06, "Pretrain/Loss": 1.9693949222564697, "Pretrain/Loss (Raw)": 2.07681941986084, "Pretrain/Step": 7089, "Pretrain/Step Time": 9.122248601168394} +{"Pretrain/Learning Rate": 8.146355576509915e-06, "Pretrain/Loss": 1.9685773849487305, "Pretrain/Loss (Raw)": 1.905156135559082, "Pretrain/Step": 7090, "Pretrain/Step Time": 9.121114637702703} +{"Pretrain/Learning Rate": 8.140085942458828e-06, "Pretrain/Loss": 1.9684605598449707, "Pretrain/Loss (Raw)": 2.034393310546875, "Pretrain/Step": 7091, "Pretrain/Step Time": 9.120812099426985} +{"Pretrain/Learning Rate": 8.133818252772476e-06, "Pretrain/Loss": 1.9687142372131348, "Pretrain/Loss (Raw)": 2.1394522190093994, "Pretrain/Step": 7092, "Pretrain/Step Time": 9.12690669670701} +{"Pretrain/Learning Rate": 8.12755250817368e-06, "Pretrain/Loss": 1.966684103012085, "Pretrain/Loss (Raw)": 1.6239569187164307, "Pretrain/Step": 7093, "Pretrain/Step Time": 9.129807878285646} +{"Pretrain/Learning Rate": 8.121288709385025e-06, "Pretrain/Loss": 1.969397783279419, "Pretrain/Loss (Raw)": 2.1242263317108154, "Pretrain/Step": 7094, "Pretrain/Step Time": 9.132892100140452} +{"Pretrain/Learning Rate": 8.11502685712891e-06, "Pretrain/Loss": 1.969270944595337, "Pretrain/Loss (Raw)": 2.0071308612823486, "Pretrain/Step": 7095, "Pretrain/Step Time": 9.133170124143362} +{"Pretrain/Learning Rate": 8.108766952127445e-06, "Pretrain/Loss": 1.9683349132537842, "Pretrain/Loss (Raw)": 1.8505940437316895, "Pretrain/Step": 7096, "Pretrain/Step Time": 9.132205665111542} +{"Pretrain/Learning Rate": 8.102508995102576e-06, "Pretrain/Loss": 1.9691693782806396, "Pretrain/Loss (Raw)": 1.8915925025939941, "Pretrain/Step": 7097, "Pretrain/Step Time": 9.132662001997232} +{"Pretrain/Learning Rate": 8.096252986775985e-06, "Pretrain/Loss": 1.9713599681854248, "Pretrain/Loss (Raw)": 2.1323704719543457, "Pretrain/Step": 7098, "Pretrain/Step Time": 9.131879407912493} +{"Pretrain/Learning Rate": 8.089998927869172e-06, "Pretrain/Loss": 1.9712622165679932, "Pretrain/Loss (Raw)": 2.034552574157715, "Pretrain/Step": 7099, "Pretrain/Step Time": 9.13292270898819} +{"Pretrain/Learning Rate": 8.083746819103346e-06, "Pretrain/Loss": 1.9697849750518799, "Pretrain/Loss (Raw)": 1.917160153388977, "Pretrain/Step": 7100, "Pretrain/Step Time": 9.131676694378257} +{"Pretrain/Learning Rate": 8.077496661199557e-06, "Pretrain/Loss": 1.9718983173370361, "Pretrain/Loss (Raw)": 2.260780096054077, "Pretrain/Step": 7101, "Pretrain/Step Time": 9.131585005670786} +{"Pretrain/Learning Rate": 8.071248454878596e-06, "Pretrain/Loss": 1.9718739986419678, "Pretrain/Loss (Raw)": 2.013517379760742, "Pretrain/Step": 7102, "Pretrain/Step Time": 9.134558076038957} +{"Pretrain/Learning Rate": 8.065002200861033e-06, "Pretrain/Loss": 1.9697788953781128, "Pretrain/Loss (Raw)": 1.8267544507980347, "Pretrain/Step": 7103, "Pretrain/Step Time": 9.13422971777618} +{"Pretrain/Learning Rate": 8.058757899867209e-06, "Pretrain/Loss": 1.9712742567062378, "Pretrain/Loss (Raw)": 2.1338958740234375, "Pretrain/Step": 7104, "Pretrain/Step Time": 9.131982572376728} +{"Pretrain/Learning Rate": 8.052515552617262e-06, "Pretrain/Loss": 1.9724980592727661, "Pretrain/Loss (Raw)": 1.8786232471466064, "Pretrain/Step": 7105, "Pretrain/Step Time": 9.135795982554555} +{"Pretrain/Learning Rate": 8.04627515983108e-06, "Pretrain/Loss": 1.9708974361419678, "Pretrain/Loss (Raw)": 1.9086500406265259, "Pretrain/Step": 7106, "Pretrain/Step Time": 9.131116071715951} +{"Pretrain/Learning Rate": 8.040036722228336e-06, "Pretrain/Loss": 1.9710209369659424, "Pretrain/Loss (Raw)": 2.0052170753479004, "Pretrain/Step": 7107, "Pretrain/Step Time": 9.134889977052808} +{"Pretrain/Learning Rate": 8.033800240528466e-06, "Pretrain/Loss": 1.9713231325149536, "Pretrain/Loss (Raw)": 1.8053531646728516, "Pretrain/Step": 7108, "Pretrain/Step Time": 9.136700995266438} +{"Pretrain/Learning Rate": 8.027565715450707e-06, "Pretrain/Loss": 1.9691144227981567, "Pretrain/Loss (Raw)": 1.722724437713623, "Pretrain/Step": 7109, "Pretrain/Step Time": 9.139761377125978} +{"Pretrain/Learning Rate": 8.02133314771405e-06, "Pretrain/Loss": 1.968897819519043, "Pretrain/Loss (Raw)": 1.7635266780853271, "Pretrain/Step": 7110, "Pretrain/Step Time": 9.136851534247398} +{"Pretrain/Learning Rate": 8.015102538037255e-06, "Pretrain/Loss": 1.9691009521484375, "Pretrain/Loss (Raw)": 1.9423989057540894, "Pretrain/Step": 7111, "Pretrain/Step Time": 9.13548175059259} +{"Pretrain/Learning Rate": 8.008873887138868e-06, "Pretrain/Loss": 1.9687426090240479, "Pretrain/Loss (Raw)": 1.7674661874771118, "Pretrain/Step": 7112, "Pretrain/Step Time": 9.13456030189991} +{"Pretrain/Learning Rate": 8.002647195737214e-06, "Pretrain/Loss": 1.966984748840332, "Pretrain/Loss (Raw)": 1.6678414344787598, "Pretrain/Step": 7113, "Pretrain/Step Time": 9.140465646982193} +{"Pretrain/Learning Rate": 7.996422464550382e-06, "Pretrain/Loss": 1.9677376747131348, "Pretrain/Loss (Raw)": 2.081347942352295, "Pretrain/Step": 7114, "Pretrain/Step Time": 9.137245969846845} +{"Pretrain/Learning Rate": 7.990199694296224e-06, "Pretrain/Loss": 1.9650641679763794, "Pretrain/Loss (Raw)": 1.7319377660751343, "Pretrain/Step": 7115, "Pretrain/Step Time": 9.138180846348405} +{"Pretrain/Learning Rate": 7.9839788856924e-06, "Pretrain/Loss": 1.9673936367034912, "Pretrain/Loss (Raw)": 2.1655821800231934, "Pretrain/Step": 7116, "Pretrain/Step Time": 9.13746521808207} +{"Pretrain/Learning Rate": 7.977760039456313e-06, "Pretrain/Loss": 1.9671401977539062, "Pretrain/Loss (Raw)": 2.010664224624634, "Pretrain/Step": 7117, "Pretrain/Step Time": 9.133511250838637} +{"Pretrain/Learning Rate": 7.97154315630515e-06, "Pretrain/Loss": 1.9678449630737305, "Pretrain/Loss (Raw)": 2.1192774772644043, "Pretrain/Step": 7118, "Pretrain/Step Time": 9.134404877200723} +{"Pretrain/Learning Rate": 7.965328236955862e-06, "Pretrain/Loss": 1.967644453048706, "Pretrain/Loss (Raw)": 1.710325837135315, "Pretrain/Step": 7119, "Pretrain/Step Time": 9.137558998540044} +{"Pretrain/Learning Rate": 7.959115282125198e-06, "Pretrain/Loss": 1.9657453298568726, "Pretrain/Loss (Raw)": 1.7458957433700562, "Pretrain/Step": 7120, "Pretrain/Step Time": 9.138655243441463} +{"Pretrain/Learning Rate": 7.952904292529661e-06, "Pretrain/Loss": 1.96401047706604, "Pretrain/Loss (Raw)": 1.8345547914505005, "Pretrain/Step": 7121, "Pretrain/Step Time": 9.137601759284735} +{"Pretrain/Learning Rate": 7.946695268885531e-06, "Pretrain/Loss": 1.963550329208374, "Pretrain/Loss (Raw)": 1.7639172077178955, "Pretrain/Step": 7122, "Pretrain/Step Time": 9.139972163364291} +{"Pretrain/Learning Rate": 7.94048821190885e-06, "Pretrain/Loss": 1.9645971059799194, "Pretrain/Loss (Raw)": 2.0326826572418213, "Pretrain/Step": 7123, "Pretrain/Step Time": 9.140126068145037} +{"Pretrain/Learning Rate": 7.934283122315464e-06, "Pretrain/Loss": 1.9639484882354736, "Pretrain/Loss (Raw)": 1.999440312385559, "Pretrain/Step": 7124, "Pretrain/Step Time": 9.139362841844559} +{"Pretrain/Learning Rate": 7.928080000820968e-06, "Pretrain/Loss": 1.963597059249878, "Pretrain/Loss (Raw)": 2.0035765171051025, "Pretrain/Step": 7125, "Pretrain/Step Time": 9.139343971386552} +{"Pretrain/Learning Rate": 7.921878848140727e-06, "Pretrain/Loss": 1.9626481533050537, "Pretrain/Loss (Raw)": 1.9471449851989746, "Pretrain/Step": 7126, "Pretrain/Step Time": 9.139154637232423} +{"Pretrain/Learning Rate": 7.915679664989887e-06, "Pretrain/Loss": 1.9616243839263916, "Pretrain/Loss (Raw)": 1.8359507322311401, "Pretrain/Step": 7127, "Pretrain/Step Time": 9.138697680085897} +{"Pretrain/Learning Rate": 7.909482452083378e-06, "Pretrain/Loss": 1.9602142572402954, "Pretrain/Loss (Raw)": 1.9095436334609985, "Pretrain/Step": 7128, "Pretrain/Step Time": 9.14093305543065} +{"Pretrain/Learning Rate": 7.903287210135888e-06, "Pretrain/Loss": 1.9607791900634766, "Pretrain/Loss (Raw)": 1.9016728401184082, "Pretrain/Step": 7129, "Pretrain/Step Time": 9.141698487102985} +{"Pretrain/Learning Rate": 7.897093939861877e-06, "Pretrain/Loss": 1.9591234922409058, "Pretrain/Loss (Raw)": 1.6158106327056885, "Pretrain/Step": 7130, "Pretrain/Step Time": 9.140069134533405} +{"Pretrain/Learning Rate": 7.890902641975576e-06, "Pretrain/Loss": 1.9590206146240234, "Pretrain/Loss (Raw)": 1.8807992935180664, "Pretrain/Step": 7131, "Pretrain/Step Time": 9.139902766793966} +{"Pretrain/Learning Rate": 7.884713317191011e-06, "Pretrain/Loss": 1.9612529277801514, "Pretrain/Loss (Raw)": 2.1413464546203613, "Pretrain/Step": 7132, "Pretrain/Step Time": 9.137776730582118} +{"Pretrain/Learning Rate": 7.878525966221958e-06, "Pretrain/Loss": 1.9600380659103394, "Pretrain/Loss (Raw)": 1.8582615852355957, "Pretrain/Step": 7133, "Pretrain/Step Time": 9.141762897372246} +{"Pretrain/Learning Rate": 7.87234058978197e-06, "Pretrain/Loss": 1.9565178155899048, "Pretrain/Loss (Raw)": 1.4255062341690063, "Pretrain/Step": 7134, "Pretrain/Step Time": 9.143084833398461} +{"Pretrain/Learning Rate": 7.866157188584364e-06, "Pretrain/Loss": 1.9596567153930664, "Pretrain/Loss (Raw)": 2.0999062061309814, "Pretrain/Step": 7135, "Pretrain/Step Time": 9.144838247448206} +{"Pretrain/Learning Rate": 7.859975763342264e-06, "Pretrain/Loss": 1.9614346027374268, "Pretrain/Loss (Raw)": 1.9580820798873901, "Pretrain/Step": 7136, "Pretrain/Step Time": 9.145882232114673} +{"Pretrain/Learning Rate": 7.85379631476851e-06, "Pretrain/Loss": 1.9589118957519531, "Pretrain/Loss (Raw)": 1.7823195457458496, "Pretrain/Step": 7137, "Pretrain/Step Time": 9.148154947906733} +{"Pretrain/Learning Rate": 7.847618843575769e-06, "Pretrain/Loss": 1.9560081958770752, "Pretrain/Loss (Raw)": 1.4965664148330688, "Pretrain/Step": 7138, "Pretrain/Step Time": 9.098302610218525} +{"Pretrain/Learning Rate": 7.84144335047644e-06, "Pretrain/Loss": 1.957604169845581, "Pretrain/Loss (Raw)": 1.965808629989624, "Pretrain/Step": 7139, "Pretrain/Step Time": 9.098644070327282} +{"Pretrain/Learning Rate": 7.835269836182733e-06, "Pretrain/Loss": 1.9563305377960205, "Pretrain/Loss (Raw)": 1.688219666481018, "Pretrain/Step": 7140, "Pretrain/Step Time": 8.979498280212283} +{"Pretrain/Learning Rate": 7.829098301406576e-06, "Pretrain/Loss": 1.9571952819824219, "Pretrain/Loss (Raw)": 1.874273419380188, "Pretrain/Step": 7141, "Pretrain/Step Time": 8.963119519874454} +{"Pretrain/Learning Rate": 7.82292874685972e-06, "Pretrain/Loss": 1.9575378894805908, "Pretrain/Loss (Raw)": 2.005406618118286, "Pretrain/Step": 7142, "Pretrain/Step Time": 8.837923597544432} +{"Pretrain/Learning Rate": 7.816761173253665e-06, "Pretrain/Loss": 1.9558143615722656, "Pretrain/Loss (Raw)": 1.7428967952728271, "Pretrain/Step": 7143, "Pretrain/Step Time": 8.808251332491636} +{"Pretrain/Learning Rate": 7.810595581299681e-06, "Pretrain/Loss": 1.9554929733276367, "Pretrain/Loss (Raw)": 1.8470218181610107, "Pretrain/Step": 7144, "Pretrain/Step Time": 8.725224878638983} +{"Pretrain/Learning Rate": 7.804431971708807e-06, "Pretrain/Loss": 1.9555875062942505, "Pretrain/Loss (Raw)": 1.8910354375839233, "Pretrain/Step": 7145, "Pretrain/Step Time": 8.72349869646132} +{"Pretrain/Learning Rate": 7.798270345191871e-06, "Pretrain/Loss": 1.9552749395370483, "Pretrain/Loss (Raw)": 1.914669156074524, "Pretrain/Step": 7146, "Pretrain/Step Time": 8.660611582919955} +{"Pretrain/Learning Rate": 7.792110702459456e-06, "Pretrain/Loss": 1.9554286003112793, "Pretrain/Loss (Raw)": 1.9704874753952026, "Pretrain/Step": 7147, "Pretrain/Step Time": 8.66304419375956} +{"Pretrain/Learning Rate": 7.785953044221924e-06, "Pretrain/Loss": 1.9554791450500488, "Pretrain/Loss (Raw)": 2.0753936767578125, "Pretrain/Step": 7148, "Pretrain/Step Time": 8.659327566623688} +{"Pretrain/Learning Rate": 7.779797371189394e-06, "Pretrain/Loss": 1.9568285942077637, "Pretrain/Loss (Raw)": 2.1557939052581787, "Pretrain/Step": 7149, "Pretrain/Step Time": 8.663289846852422} +{"Pretrain/Learning Rate": 7.77364368407178e-06, "Pretrain/Loss": 1.9554082155227661, "Pretrain/Loss (Raw)": 1.670508861541748, "Pretrain/Step": 7150, "Pretrain/Step Time": 8.66568636521697} +{"Pretrain/Learning Rate": 7.767491983578751e-06, "Pretrain/Loss": 1.9543015956878662, "Pretrain/Loss (Raw)": 1.8733413219451904, "Pretrain/Step": 7151, "Pretrain/Step Time": 8.66497715562582} +{"Pretrain/Learning Rate": 7.76134227041975e-06, "Pretrain/Loss": 1.949288249015808, "Pretrain/Loss (Raw)": 1.6388537883758545, "Pretrain/Step": 7152, "Pretrain/Step Time": 8.664378345012665} +{"Pretrain/Learning Rate": 7.755194545303982e-06, "Pretrain/Loss": 1.9510338306427002, "Pretrain/Loss (Raw)": 2.1521456241607666, "Pretrain/Step": 7153, "Pretrain/Step Time": 8.66867626272142} +{"Pretrain/Learning Rate": 7.749048808940445e-06, "Pretrain/Loss": 1.9507721662521362, "Pretrain/Loss (Raw)": 2.075610876083374, "Pretrain/Step": 7154, "Pretrain/Step Time": 8.666497521102428} +{"Pretrain/Learning Rate": 7.742905062037891e-06, "Pretrain/Loss": 1.9518624544143677, "Pretrain/Loss (Raw)": 2.027238130569458, "Pretrain/Step": 7155, "Pretrain/Step Time": 8.665581364184618} +{"Pretrain/Learning Rate": 7.736763305304834e-06, "Pretrain/Loss": 1.9500337839126587, "Pretrain/Loss (Raw)": 1.700433373451233, "Pretrain/Step": 7156, "Pretrain/Step Time": 8.663153793662786} +{"Pretrain/Learning Rate": 7.730623539449588e-06, "Pretrain/Loss": 1.949831485748291, "Pretrain/Loss (Raw)": 1.872315526008606, "Pretrain/Step": 7157, "Pretrain/Step Time": 8.666807873174548} +{"Pretrain/Learning Rate": 7.724485765180212e-06, "Pretrain/Loss": 1.949199914932251, "Pretrain/Loss (Raw)": 1.9406300783157349, "Pretrain/Step": 7158, "Pretrain/Step Time": 8.665212009102106} +{"Pretrain/Learning Rate": 7.71834998320454e-06, "Pretrain/Loss": 1.9483678340911865, "Pretrain/Loss (Raw)": 1.6906871795654297, "Pretrain/Step": 7159, "Pretrain/Step Time": 8.666317097842693} +{"Pretrain/Learning Rate": 7.712216194230177e-06, "Pretrain/Loss": 1.9497324228286743, "Pretrain/Loss (Raw)": 1.951493263244629, "Pretrain/Step": 7160, "Pretrain/Step Time": 8.665546268224716} +{"Pretrain/Learning Rate": 7.70608439896451e-06, "Pretrain/Loss": 1.94942307472229, "Pretrain/Loss (Raw)": 1.980994462966919, "Pretrain/Step": 7161, "Pretrain/Step Time": 8.667160937562585} +{"Pretrain/Learning Rate": 7.699954598114684e-06, "Pretrain/Loss": 1.9483870267868042, "Pretrain/Loss (Raw)": 1.8205074071884155, "Pretrain/Step": 7162, "Pretrain/Step Time": 8.666478611528873} +{"Pretrain/Learning Rate": 7.693826792387613e-06, "Pretrain/Loss": 1.9490423202514648, "Pretrain/Loss (Raw)": 2.080700635910034, "Pretrain/Step": 7163, "Pretrain/Step Time": 8.670470241457224} +{"Pretrain/Learning Rate": 7.68770098248998e-06, "Pretrain/Loss": 1.9503717422485352, "Pretrain/Loss (Raw)": 2.0262253284454346, "Pretrain/Step": 7164, "Pretrain/Step Time": 8.66649054735899} +{"Pretrain/Learning Rate": 7.681577169128251e-06, "Pretrain/Loss": 1.9509224891662598, "Pretrain/Loss (Raw)": 1.8578768968582153, "Pretrain/Step": 7165, "Pretrain/Step Time": 8.668482072651386} +{"Pretrain/Learning Rate": 7.675455353008653e-06, "Pretrain/Loss": 1.9490431547164917, "Pretrain/Loss (Raw)": 1.9437742233276367, "Pretrain/Step": 7166, "Pretrain/Step Time": 8.67299722880125} +{"Pretrain/Learning Rate": 7.669335534837183e-06, "Pretrain/Loss": 1.9510886669158936, "Pretrain/Loss (Raw)": 2.1093621253967285, "Pretrain/Step": 7167, "Pretrain/Step Time": 8.669758943840861} +{"Pretrain/Learning Rate": 7.66321771531959e-06, "Pretrain/Loss": 1.946725606918335, "Pretrain/Loss (Raw)": 1.741339087486267, "Pretrain/Step": 7168, "Pretrain/Step Time": 8.66959341429174} +{"Pretrain/Learning Rate": 7.657101895161437e-06, "Pretrain/Loss": 1.9455071687698364, "Pretrain/Loss (Raw)": 1.968686580657959, "Pretrain/Step": 7169, "Pretrain/Step Time": 8.6702149361372} +{"Pretrain/Learning Rate": 7.650988075068011e-06, "Pretrain/Loss": 1.944376826286316, "Pretrain/Loss (Raw)": 1.8405531644821167, "Pretrain/Step": 7170, "Pretrain/Step Time": 8.671620596200228} +{"Pretrain/Learning Rate": 7.644876255744393e-06, "Pretrain/Loss": 1.9420760869979858, "Pretrain/Loss (Raw)": 1.7675585746765137, "Pretrain/Step": 7171, "Pretrain/Step Time": 8.674180151894689} +{"Pretrain/Learning Rate": 7.63876643789542e-06, "Pretrain/Loss": 1.9401763677597046, "Pretrain/Loss (Raw)": 1.9001152515411377, "Pretrain/Step": 7172, "Pretrain/Step Time": 8.673001538962126} +{"Pretrain/Learning Rate": 7.632658622225713e-06, "Pretrain/Loss": 1.9408798217773438, "Pretrain/Loss (Raw)": 2.0198261737823486, "Pretrain/Step": 7173, "Pretrain/Step Time": 8.672144575044513} +{"Pretrain/Learning Rate": 7.626552809439655e-06, "Pretrain/Loss": 1.9410548210144043, "Pretrain/Loss (Raw)": 1.8866018056869507, "Pretrain/Step": 7174, "Pretrain/Step Time": 8.676758915185928} +{"Pretrain/Learning Rate": 7.620449000241395e-06, "Pretrain/Loss": 1.941367506980896, "Pretrain/Loss (Raw)": 2.0714755058288574, "Pretrain/Step": 7175, "Pretrain/Step Time": 8.68145140632987} +{"Pretrain/Learning Rate": 7.614347195334839e-06, "Pretrain/Loss": 1.9418792724609375, "Pretrain/Loss (Raw)": 1.8293147087097168, "Pretrain/Step": 7176, "Pretrain/Step Time": 8.67422023229301} +{"Pretrain/Learning Rate": 7.6082473954237066e-06, "Pretrain/Loss": 1.9421831369400024, "Pretrain/Loss (Raw)": 2.052328586578369, "Pretrain/Step": 7177, "Pretrain/Step Time": 8.674001766368747} +{"Pretrain/Learning Rate": 7.602149601211422e-06, "Pretrain/Loss": 1.9413118362426758, "Pretrain/Loss (Raw)": 1.968450665473938, "Pretrain/Step": 7178, "Pretrain/Step Time": 8.67544510960579} +{"Pretrain/Learning Rate": 7.596053813401233e-06, "Pretrain/Loss": 1.9406886100769043, "Pretrain/Loss (Raw)": 2.128355026245117, "Pretrain/Step": 7179, "Pretrain/Step Time": 8.670694783329964} +{"Pretrain/Learning Rate": 7.589960032696122e-06, "Pretrain/Loss": 1.9408996105194092, "Pretrain/Loss (Raw)": 1.9018337726593018, "Pretrain/Step": 7180, "Pretrain/Step Time": 8.6695521697402} +{"Pretrain/Learning Rate": 7.583868259798874e-06, "Pretrain/Loss": 1.9411537647247314, "Pretrain/Loss (Raw)": 1.9927027225494385, "Pretrain/Step": 7181, "Pretrain/Step Time": 8.673832608386874} +{"Pretrain/Learning Rate": 7.5777784954119885e-06, "Pretrain/Loss": 1.9401557445526123, "Pretrain/Loss (Raw)": 2.0210328102111816, "Pretrain/Step": 7182, "Pretrain/Step Time": 8.665253456681967} +{"Pretrain/Learning Rate": 7.5716907402377915e-06, "Pretrain/Loss": 1.9386082887649536, "Pretrain/Loss (Raw)": 1.7628816366195679, "Pretrain/Step": 7183, "Pretrain/Step Time": 8.661490831524134} +{"Pretrain/Learning Rate": 7.565604994978337e-06, "Pretrain/Loss": 1.937841534614563, "Pretrain/Loss (Raw)": 1.9772815704345703, "Pretrain/Step": 7184, "Pretrain/Step Time": 8.666191160678864} +{"Pretrain/Learning Rate": 7.559521260335483e-06, "Pretrain/Loss": 1.9363696575164795, "Pretrain/Loss (Raw)": 2.109314203262329, "Pretrain/Step": 7185, "Pretrain/Step Time": 8.665455125272274} +{"Pretrain/Learning Rate": 7.553439537010803e-06, "Pretrain/Loss": 1.938075304031372, "Pretrain/Loss (Raw)": 2.194154739379883, "Pretrain/Step": 7186, "Pretrain/Step Time": 8.667951930314302} +{"Pretrain/Learning Rate": 7.547359825705696e-06, "Pretrain/Loss": 1.9332334995269775, "Pretrain/Loss (Raw)": 1.5072011947631836, "Pretrain/Step": 7187, "Pretrain/Step Time": 8.665272461250424} +{"Pretrain/Learning Rate": 7.541282127121291e-06, "Pretrain/Loss": 1.933908224105835, "Pretrain/Loss (Raw)": 2.0618581771850586, "Pretrain/Step": 7188, "Pretrain/Step Time": 8.661216765642166} +{"Pretrain/Learning Rate": 7.5352064419585e-06, "Pretrain/Loss": 1.9315872192382812, "Pretrain/Loss (Raw)": 1.996292233467102, "Pretrain/Step": 7189, "Pretrain/Step Time": 8.659996902570128} +{"Pretrain/Learning Rate": 7.529132770917993e-06, "Pretrain/Loss": 1.9326790571212769, "Pretrain/Loss (Raw)": 2.2139689922332764, "Pretrain/Step": 7190, "Pretrain/Step Time": 8.658922558650374} +{"Pretrain/Learning Rate": 7.523061114700228e-06, "Pretrain/Loss": 1.9335672855377197, "Pretrain/Loss (Raw)": 2.0667412281036377, "Pretrain/Step": 7191, "Pretrain/Step Time": 8.657735873013735} +{"Pretrain/Learning Rate": 7.516991474005408e-06, "Pretrain/Loss": 1.931025505065918, "Pretrain/Loss (Raw)": 1.6923625469207764, "Pretrain/Step": 7192, "Pretrain/Step Time": 8.659542258828878} +{"Pretrain/Learning Rate": 7.510923849533513e-06, "Pretrain/Loss": 1.9306682348251343, "Pretrain/Loss (Raw)": 1.8126798868179321, "Pretrain/Step": 7193, "Pretrain/Step Time": 8.657180894166231} +{"Pretrain/Learning Rate": 7.504858241984286e-06, "Pretrain/Loss": 1.9267343282699585, "Pretrain/Loss (Raw)": 1.8684169054031372, "Pretrain/Step": 7194, "Pretrain/Step Time": 8.65315843001008} +{"Pretrain/Learning Rate": 7.498794652057251e-06, "Pretrain/Loss": 1.9264283180236816, "Pretrain/Loss (Raw)": 1.9291584491729736, "Pretrain/Step": 7195, "Pretrain/Step Time": 8.658183505758643} +{"Pretrain/Learning Rate": 7.492733080451686e-06, "Pretrain/Loss": 1.926893711090088, "Pretrain/Loss (Raw)": 1.788100242614746, "Pretrain/Step": 7196, "Pretrain/Step Time": 8.659506421536207} +{"Pretrain/Learning Rate": 7.486673527866633e-06, "Pretrain/Loss": 1.9264945983886719, "Pretrain/Loss (Raw)": 1.9949997663497925, "Pretrain/Step": 7197, "Pretrain/Step Time": 8.655131744220853} +{"Pretrain/Learning Rate": 7.4806159950009196e-06, "Pretrain/Loss": 1.9276649951934814, "Pretrain/Loss (Raw)": 2.196950912475586, "Pretrain/Step": 7198, "Pretrain/Step Time": 8.655785096809268} +{"Pretrain/Learning Rate": 7.474560482553125e-06, "Pretrain/Loss": 1.9277514219284058, "Pretrain/Loss (Raw)": 2.0614778995513916, "Pretrain/Step": 7199, "Pretrain/Step Time": 8.653961496427655} +{"Pretrain/Learning Rate": 7.468506991221599e-06, "Pretrain/Loss": 1.9299044609069824, "Pretrain/Loss (Raw)": 2.371846914291382, "Pretrain/Step": 7200, "Pretrain/Step Time": 8.656875478103757} +{"Pretrain/Learning Rate": 7.462455521704448e-06, "Pretrain/Loss": 1.9289770126342773, "Pretrain/Loss (Raw)": 1.8705155849456787, "Pretrain/Step": 7201, "Pretrain/Step Time": 8.65645332634449} +{"Pretrain/Learning Rate": 7.4564060746995765e-06, "Pretrain/Loss": 1.9279944896697998, "Pretrain/Loss (Raw)": 1.8177692890167236, "Pretrain/Step": 7202, "Pretrain/Step Time": 8.663320939987898} +{"Pretrain/Learning Rate": 7.450358650904621e-06, "Pretrain/Loss": 1.926296353340149, "Pretrain/Loss (Raw)": 1.9837530851364136, "Pretrain/Step": 7203, "Pretrain/Step Time": 8.660662865266204} +{"Pretrain/Learning Rate": 7.444313251017004e-06, "Pretrain/Loss": 1.9285438060760498, "Pretrain/Loss (Raw)": 2.134164571762085, "Pretrain/Step": 7204, "Pretrain/Step Time": 8.655755212530494} +{"Pretrain/Learning Rate": 7.438269875733903e-06, "Pretrain/Loss": 1.9299360513687134, "Pretrain/Loss (Raw)": 1.938970923423767, "Pretrain/Step": 7205, "Pretrain/Step Time": 8.659199515357614} +{"Pretrain/Learning Rate": 7.432228525752277e-06, "Pretrain/Loss": 1.9273573160171509, "Pretrain/Loss (Raw)": 1.7878499031066895, "Pretrain/Step": 7206, "Pretrain/Step Time": 8.663600612431765} +{"Pretrain/Learning Rate": 7.426189201768844e-06, "Pretrain/Loss": 1.9268121719360352, "Pretrain/Loss (Raw)": 1.911871075630188, "Pretrain/Step": 7207, "Pretrain/Step Time": 8.665909325703979} +{"Pretrain/Learning Rate": 7.42015190448008e-06, "Pretrain/Loss": 1.928849220275879, "Pretrain/Loss (Raw)": 1.9099787473678589, "Pretrain/Step": 7208, "Pretrain/Step Time": 8.65707510523498} +{"Pretrain/Learning Rate": 7.4141166345822274e-06, "Pretrain/Loss": 1.9280550479888916, "Pretrain/Loss (Raw)": 1.941854476928711, "Pretrain/Step": 7209, "Pretrain/Step Time": 8.651014007627964} +{"Pretrain/Learning Rate": 7.408083392771323e-06, "Pretrain/Loss": 1.9300826787948608, "Pretrain/Loss (Raw)": 2.0468924045562744, "Pretrain/Step": 7210, "Pretrain/Step Time": 8.654288042336702} +{"Pretrain/Learning Rate": 7.402052179743135e-06, "Pretrain/Loss": 1.9271953105926514, "Pretrain/Loss (Raw)": 2.0062408447265625, "Pretrain/Step": 7211, "Pretrain/Step Time": 8.648228181526065} +{"Pretrain/Learning Rate": 7.396022996193217e-06, "Pretrain/Loss": 1.9241316318511963, "Pretrain/Loss (Raw)": 1.619808554649353, "Pretrain/Step": 7212, "Pretrain/Step Time": 8.654129173606634} +{"Pretrain/Learning Rate": 7.389995842816871e-06, "Pretrain/Loss": 1.9248350858688354, "Pretrain/Loss (Raw)": 1.9247852563858032, "Pretrain/Step": 7213, "Pretrain/Step Time": 8.651843033730984} +{"Pretrain/Learning Rate": 7.383970720309191e-06, "Pretrain/Loss": 1.923022985458374, "Pretrain/Loss (Raw)": 1.7795236110687256, "Pretrain/Step": 7214, "Pretrain/Step Time": 8.653486866503954} +{"Pretrain/Learning Rate": 7.37794762936502e-06, "Pretrain/Loss": 1.9208756685256958, "Pretrain/Loss (Raw)": 1.6290338039398193, "Pretrain/Step": 7215, "Pretrain/Step Time": 8.655768632888794} +{"Pretrain/Learning Rate": 7.371926570678964e-06, "Pretrain/Loss": 1.9212976694107056, "Pretrain/Loss (Raw)": 1.8972445726394653, "Pretrain/Step": 7216, "Pretrain/Step Time": 8.658913731575012} +{"Pretrain/Learning Rate": 7.365907544945397e-06, "Pretrain/Loss": 1.9212228059768677, "Pretrain/Loss (Raw)": 2.067244291305542, "Pretrain/Step": 7217, "Pretrain/Step Time": 8.66118467412889} +{"Pretrain/Learning Rate": 7.359890552858478e-06, "Pretrain/Loss": 1.9213414192199707, "Pretrain/Loss (Raw)": 1.9203424453735352, "Pretrain/Step": 7218, "Pretrain/Step Time": 8.662014858797193} +{"Pretrain/Learning Rate": 7.353875595112092e-06, "Pretrain/Loss": 1.9208629131317139, "Pretrain/Loss (Raw)": 1.9731498956680298, "Pretrain/Step": 7219, "Pretrain/Step Time": 8.665392668917775} +{"Pretrain/Learning Rate": 7.347862672399927e-06, "Pretrain/Loss": 1.9196282625198364, "Pretrain/Loss (Raw)": 1.981410264968872, "Pretrain/Step": 7220, "Pretrain/Step Time": 8.660531364381313} +{"Pretrain/Learning Rate": 7.341851785415415e-06, "Pretrain/Loss": 1.9231610298156738, "Pretrain/Loss (Raw)": 2.0761544704437256, "Pretrain/Step": 7221, "Pretrain/Step Time": 8.655317217111588} +{"Pretrain/Learning Rate": 7.335842934851775e-06, "Pretrain/Loss": 1.9219601154327393, "Pretrain/Loss (Raw)": 1.9704911708831787, "Pretrain/Step": 7222, "Pretrain/Step Time": 8.65797758847475} +{"Pretrain/Learning Rate": 7.329836121401951e-06, "Pretrain/Loss": 1.9246294498443604, "Pretrain/Loss (Raw)": 2.348806858062744, "Pretrain/Step": 7223, "Pretrain/Step Time": 8.657044891268015} +{"Pretrain/Learning Rate": 7.323831345758697e-06, "Pretrain/Loss": 1.9246189594268799, "Pretrain/Loss (Raw)": 1.8492491245269775, "Pretrain/Step": 7224, "Pretrain/Step Time": 8.658696820959449} +{"Pretrain/Learning Rate": 7.317828608614496e-06, "Pretrain/Loss": 1.9251222610473633, "Pretrain/Loss (Raw)": 1.9560245275497437, "Pretrain/Step": 7225, "Pretrain/Step Time": 8.660974726080894} +{"Pretrain/Learning Rate": 7.311827910661639e-06, "Pretrain/Loss": 1.9240800142288208, "Pretrain/Loss (Raw)": 1.9989597797393799, "Pretrain/Step": 7226, "Pretrain/Step Time": 8.658904196694493} +{"Pretrain/Learning Rate": 7.3058292525921195e-06, "Pretrain/Loss": 1.9229562282562256, "Pretrain/Loss (Raw)": 1.890712857246399, "Pretrain/Step": 7227, "Pretrain/Step Time": 8.657211918383837} +{"Pretrain/Learning Rate": 7.299832635097756e-06, "Pretrain/Loss": 1.9223151206970215, "Pretrain/Loss (Raw)": 1.8351134061813354, "Pretrain/Step": 7228, "Pretrain/Step Time": 8.659273287281394} +{"Pretrain/Learning Rate": 7.293838058870098e-06, "Pretrain/Loss": 1.9198110103607178, "Pretrain/Loss (Raw)": 1.940244436264038, "Pretrain/Step": 7229, "Pretrain/Step Time": 8.659916311502457} +{"Pretrain/Learning Rate": 7.2878455246004704e-06, "Pretrain/Loss": 1.9220890998840332, "Pretrain/Loss (Raw)": 2.3051023483276367, "Pretrain/Step": 7230, "Pretrain/Step Time": 8.655645053833723} +{"Pretrain/Learning Rate": 7.281855032979954e-06, "Pretrain/Loss": 1.9203972816467285, "Pretrain/Loss (Raw)": 1.6102088689804077, "Pretrain/Step": 7231, "Pretrain/Step Time": 8.663346663117409} +{"Pretrain/Learning Rate": 7.275866584699409e-06, "Pretrain/Loss": 1.9188082218170166, "Pretrain/Loss (Raw)": 1.930480718612671, "Pretrain/Step": 7232, "Pretrain/Step Time": 8.662684939801693} +{"Pretrain/Learning Rate": 7.269880180449451e-06, "Pretrain/Loss": 1.919234275817871, "Pretrain/Loss (Raw)": 1.9331790208816528, "Pretrain/Step": 7233, "Pretrain/Step Time": 8.66162096709013} +{"Pretrain/Learning Rate": 7.263895820920458e-06, "Pretrain/Loss": 1.919358491897583, "Pretrain/Loss (Raw)": 1.9245508909225464, "Pretrain/Step": 7234, "Pretrain/Step Time": 8.66355494223535} +{"Pretrain/Learning Rate": 7.257913506802566e-06, "Pretrain/Loss": 1.9186445474624634, "Pretrain/Loss (Raw)": 1.9138280153274536, "Pretrain/Step": 7235, "Pretrain/Step Time": 8.65990281663835} +{"Pretrain/Learning Rate": 7.251933238785699e-06, "Pretrain/Loss": 1.9213733673095703, "Pretrain/Loss (Raw)": 2.154642343521118, "Pretrain/Step": 7236, "Pretrain/Step Time": 8.660140186548233} +{"Pretrain/Learning Rate": 7.245955017559522e-06, "Pretrain/Loss": 1.9259231090545654, "Pretrain/Loss (Raw)": 2.3050894737243652, "Pretrain/Step": 7237, "Pretrain/Step Time": 8.657456861808896} +{"Pretrain/Learning Rate": 7.2399788438134665e-06, "Pretrain/Loss": 1.9265315532684326, "Pretrain/Loss (Raw)": 1.8414005041122437, "Pretrain/Step": 7238, "Pretrain/Step Time": 8.66115585155785} +{"Pretrain/Learning Rate": 7.234004718236745e-06, "Pretrain/Loss": 1.9275579452514648, "Pretrain/Loss (Raw)": 2.0737786293029785, "Pretrain/Step": 7239, "Pretrain/Step Time": 8.660841803997755} +{"Pretrain/Learning Rate": 7.228032641518315e-06, "Pretrain/Loss": 1.9283568859100342, "Pretrain/Loss (Raw)": 1.8697301149368286, "Pretrain/Step": 7240, "Pretrain/Step Time": 8.665026878938079} +{"Pretrain/Learning Rate": 7.222062614346906e-06, "Pretrain/Loss": 1.928930640220642, "Pretrain/Loss (Raw)": 1.7412875890731812, "Pretrain/Step": 7241, "Pretrain/Step Time": 8.658957239240408} +{"Pretrain/Learning Rate": 7.216094637411e-06, "Pretrain/Loss": 1.9279624223709106, "Pretrain/Loss (Raw)": 1.9574120044708252, "Pretrain/Step": 7242, "Pretrain/Step Time": 8.659962348639965} +{"Pretrain/Learning Rate": 7.21012871139887e-06, "Pretrain/Loss": 1.9302396774291992, "Pretrain/Loss (Raw)": 2.0234172344207764, "Pretrain/Step": 7243, "Pretrain/Step Time": 8.660237172618508} +{"Pretrain/Learning Rate": 7.204164836998523e-06, "Pretrain/Loss": 1.9271951913833618, "Pretrain/Loss (Raw)": 1.7759006023406982, "Pretrain/Step": 7244, "Pretrain/Step Time": 8.658447725698352} +{"Pretrain/Learning Rate": 7.1982030148977474e-06, "Pretrain/Loss": 1.9267990589141846, "Pretrain/Loss (Raw)": 1.959965705871582, "Pretrain/Step": 7245, "Pretrain/Step Time": 8.657389285042882} +{"Pretrain/Learning Rate": 7.192243245784075e-06, "Pretrain/Loss": 1.9262781143188477, "Pretrain/Loss (Raw)": 2.052584409713745, "Pretrain/Step": 7246, "Pretrain/Step Time": 8.660034660249949} +{"Pretrain/Learning Rate": 7.186285530344833e-06, "Pretrain/Loss": 1.9280130863189697, "Pretrain/Loss (Raw)": 1.932396650314331, "Pretrain/Step": 7247, "Pretrain/Step Time": 8.65584390796721} +{"Pretrain/Learning Rate": 7.1803298692670825e-06, "Pretrain/Loss": 1.929675579071045, "Pretrain/Loss (Raw)": 1.9587037563323975, "Pretrain/Step": 7248, "Pretrain/Step Time": 8.65416688658297} +{"Pretrain/Learning Rate": 7.174376263237664e-06, "Pretrain/Loss": 1.9317257404327393, "Pretrain/Loss (Raw)": 2.096982955932617, "Pretrain/Step": 7249, "Pretrain/Step Time": 8.653459656983614} +{"Pretrain/Learning Rate": 7.1684247129431616e-06, "Pretrain/Loss": 1.9348863363265991, "Pretrain/Loss (Raw)": 2.1684696674346924, "Pretrain/Step": 7250, "Pretrain/Step Time": 8.649430699646473} +{"Pretrain/Learning Rate": 7.162475219069956e-06, "Pretrain/Loss": 1.9328399896621704, "Pretrain/Loss (Raw)": 1.770750641822815, "Pretrain/Step": 7251, "Pretrain/Step Time": 8.656251339241862} +{"Pretrain/Learning Rate": 7.1565277823041596e-06, "Pretrain/Loss": 1.9333112239837646, "Pretrain/Loss (Raw)": 2.0597681999206543, "Pretrain/Step": 7252, "Pretrain/Step Time": 8.656237384304404} +{"Pretrain/Learning Rate": 7.1505824033316596e-06, "Pretrain/Loss": 1.9304319620132446, "Pretrain/Loss (Raw)": 1.6350233554840088, "Pretrain/Step": 7253, "Pretrain/Step Time": 8.657352739945054} +{"Pretrain/Learning Rate": 7.1446390828381e-06, "Pretrain/Loss": 1.9299108982086182, "Pretrain/Loss (Raw)": 1.8804384469985962, "Pretrain/Step": 7254, "Pretrain/Step Time": 8.652881871908903} +{"Pretrain/Learning Rate": 7.138697821508908e-06, "Pretrain/Loss": 1.9315130710601807, "Pretrain/Loss (Raw)": 2.0410306453704834, "Pretrain/Step": 7255, "Pretrain/Step Time": 8.655940284952521} +{"Pretrain/Learning Rate": 7.132758620029248e-06, "Pretrain/Loss": 1.9329817295074463, "Pretrain/Loss (Raw)": 2.0975358486175537, "Pretrain/Step": 7256, "Pretrain/Step Time": 8.653413722291589} +{"Pretrain/Learning Rate": 7.126821479084056e-06, "Pretrain/Loss": 1.932497262954712, "Pretrain/Loss (Raw)": 1.8396673202514648, "Pretrain/Step": 7257, "Pretrain/Step Time": 8.652240181341767} +{"Pretrain/Learning Rate": 7.120886399358023e-06, "Pretrain/Loss": 1.9341719150543213, "Pretrain/Loss (Raw)": 1.830161452293396, "Pretrain/Step": 7258, "Pretrain/Step Time": 8.652813227847219} +{"Pretrain/Learning Rate": 7.114953381535627e-06, "Pretrain/Loss": 1.9359649419784546, "Pretrain/Loss (Raw)": 2.110299825668335, "Pretrain/Step": 7259, "Pretrain/Step Time": 8.652792949229479} +{"Pretrain/Learning Rate": 7.109022426301087e-06, "Pretrain/Loss": 1.932025671005249, "Pretrain/Loss (Raw)": 1.6371134519577026, "Pretrain/Step": 7260, "Pretrain/Step Time": 8.65264874882996} +{"Pretrain/Learning Rate": 7.103093534338384e-06, "Pretrain/Loss": 1.9312598705291748, "Pretrain/Loss (Raw)": 1.7602497339248657, "Pretrain/Step": 7261, "Pretrain/Step Time": 8.652112998068333} +{"Pretrain/Learning Rate": 7.0971667063312624e-06, "Pretrain/Loss": 1.9360401630401611, "Pretrain/Loss (Raw)": 2.0373804569244385, "Pretrain/Step": 7262, "Pretrain/Step Time": 8.65193804167211} +{"Pretrain/Learning Rate": 7.091241942963251e-06, "Pretrain/Loss": 1.9340027570724487, "Pretrain/Loss (Raw)": 1.8391212224960327, "Pretrain/Step": 7263, "Pretrain/Step Time": 8.650310827419162} +{"Pretrain/Learning Rate": 7.0853192449175905e-06, "Pretrain/Loss": 1.934234619140625, "Pretrain/Loss (Raw)": 1.9877547025680542, "Pretrain/Step": 7264, "Pretrain/Step Time": 8.655193174257874} +{"Pretrain/Learning Rate": 7.0793986128773415e-06, "Pretrain/Loss": 1.9360625743865967, "Pretrain/Loss (Raw)": 2.0163044929504395, "Pretrain/Step": 7265, "Pretrain/Step Time": 8.652429638430476} +{"Pretrain/Learning Rate": 7.07348004752528e-06, "Pretrain/Loss": 1.939673662185669, "Pretrain/Loss (Raw)": 1.9587830305099487, "Pretrain/Step": 7266, "Pretrain/Step Time": 8.654637329280376} +{"Pretrain/Learning Rate": 7.067563549543987e-06, "Pretrain/Loss": 1.9406940937042236, "Pretrain/Loss (Raw)": 2.096425771713257, "Pretrain/Step": 7267, "Pretrain/Step Time": 8.657769195735455} +{"Pretrain/Learning Rate": 7.061649119615752e-06, "Pretrain/Loss": 1.9425461292266846, "Pretrain/Loss (Raw)": 1.925291895866394, "Pretrain/Step": 7268, "Pretrain/Step Time": 8.655052522197366} +{"Pretrain/Learning Rate": 7.055736758422676e-06, "Pretrain/Loss": 1.943051815032959, "Pretrain/Loss (Raw)": 1.9389939308166504, "Pretrain/Step": 7269, "Pretrain/Step Time": 8.656758572906256} +{"Pretrain/Learning Rate": 7.049826466646592e-06, "Pretrain/Loss": 1.9422179460525513, "Pretrain/Loss (Raw)": 1.898675560951233, "Pretrain/Step": 7270, "Pretrain/Step Time": 8.656649485230446} +{"Pretrain/Learning Rate": 7.043918244969106e-06, "Pretrain/Loss": 1.9440677165985107, "Pretrain/Loss (Raw)": 1.979664921760559, "Pretrain/Step": 7271, "Pretrain/Step Time": 8.658399935811758} +{"Pretrain/Learning Rate": 7.038012094071572e-06, "Pretrain/Loss": 1.9433296918869019, "Pretrain/Loss (Raw)": 1.7525473833084106, "Pretrain/Step": 7272, "Pretrain/Step Time": 8.659009639173746} +{"Pretrain/Learning Rate": 7.032108014635128e-06, "Pretrain/Loss": 1.9439020156860352, "Pretrain/Loss (Raw)": 1.9643090963363647, "Pretrain/Step": 7273, "Pretrain/Step Time": 8.660913843661547} +{"Pretrain/Learning Rate": 7.026206007340658e-06, "Pretrain/Loss": 1.9437810182571411, "Pretrain/Loss (Raw)": 1.8991719484329224, "Pretrain/Step": 7274, "Pretrain/Step Time": 8.659852895885706} +{"Pretrain/Learning Rate": 7.020306072868804e-06, "Pretrain/Loss": 1.942104697227478, "Pretrain/Loss (Raw)": 1.7559107542037964, "Pretrain/Step": 7275, "Pretrain/Step Time": 8.659387569874525} +{"Pretrain/Learning Rate": 7.014408211899973e-06, "Pretrain/Loss": 1.9408938884735107, "Pretrain/Loss (Raw)": 1.9204074144363403, "Pretrain/Step": 7276, "Pretrain/Step Time": 8.659526279196143} +{"Pretrain/Learning Rate": 7.008512425114333e-06, "Pretrain/Loss": 1.941105604171753, "Pretrain/Loss (Raw)": 2.182896137237549, "Pretrain/Step": 7277, "Pretrain/Step Time": 8.659925006330013} +{"Pretrain/Learning Rate": 7.002618713191839e-06, "Pretrain/Loss": 1.9447238445281982, "Pretrain/Loss (Raw)": 2.1336562633514404, "Pretrain/Step": 7278, "Pretrain/Step Time": 8.656220331788063} +{"Pretrain/Learning Rate": 6.996727076812143e-06, "Pretrain/Loss": 1.944822907447815, "Pretrain/Loss (Raw)": 1.8860149383544922, "Pretrain/Step": 7279, "Pretrain/Step Time": 8.65653245151043} +{"Pretrain/Learning Rate": 6.990837516654722e-06, "Pretrain/Loss": 1.9477012157440186, "Pretrain/Loss (Raw)": 2.0072686672210693, "Pretrain/Step": 7280, "Pretrain/Step Time": 8.65616568364203} +{"Pretrain/Learning Rate": 6.984950033398782e-06, "Pretrain/Loss": 1.9429988861083984, "Pretrain/Loss (Raw)": 1.5502592325210571, "Pretrain/Step": 7281, "Pretrain/Step Time": 8.656557580456138} +{"Pretrain/Learning Rate": 6.979064627723292e-06, "Pretrain/Loss": 1.942152738571167, "Pretrain/Loss (Raw)": 1.967301607131958, "Pretrain/Step": 7282, "Pretrain/Step Time": 8.656816810369492} +{"Pretrain/Learning Rate": 6.97318130030698e-06, "Pretrain/Loss": 1.939151644706726, "Pretrain/Loss (Raw)": 1.643097162246704, "Pretrain/Step": 7283, "Pretrain/Step Time": 8.659712594002485} +{"Pretrain/Learning Rate": 6.967300051828355e-06, "Pretrain/Loss": 1.9402623176574707, "Pretrain/Loss (Raw)": 1.842602252960205, "Pretrain/Step": 7284, "Pretrain/Step Time": 8.665037039667368} +{"Pretrain/Learning Rate": 6.961420882965661e-06, "Pretrain/Loss": 1.940857172012329, "Pretrain/Loss (Raw)": 1.9484646320343018, "Pretrain/Step": 7285, "Pretrain/Step Time": 8.663094695657492} +{"Pretrain/Learning Rate": 6.9555437943969095e-06, "Pretrain/Loss": 1.938961386680603, "Pretrain/Loss (Raw)": 1.6979647874832153, "Pretrain/Step": 7286, "Pretrain/Step Time": 8.66364499181509} +{"Pretrain/Learning Rate": 6.949668786799867e-06, "Pretrain/Loss": 1.9417071342468262, "Pretrain/Loss (Raw)": 2.042132616043091, "Pretrain/Step": 7287, "Pretrain/Step Time": 8.66140541434288} +{"Pretrain/Learning Rate": 6.943795860852087e-06, "Pretrain/Loss": 1.939288854598999, "Pretrain/Loss (Raw)": 1.6419668197631836, "Pretrain/Step": 7288, "Pretrain/Step Time": 8.660083463415504} +{"Pretrain/Learning Rate": 6.937925017230848e-06, "Pretrain/Loss": 1.9394606351852417, "Pretrain/Loss (Raw)": 2.002974510192871, "Pretrain/Step": 7289, "Pretrain/Step Time": 8.66299444437027} +{"Pretrain/Learning Rate": 6.932056256613209e-06, "Pretrain/Loss": 1.9366883039474487, "Pretrain/Loss (Raw)": 1.4656476974487305, "Pretrain/Step": 7290, "Pretrain/Step Time": 8.662363193929195} +{"Pretrain/Learning Rate": 6.926189579675977e-06, "Pretrain/Loss": 1.9345965385437012, "Pretrain/Loss (Raw)": 1.8129560947418213, "Pretrain/Step": 7291, "Pretrain/Step Time": 8.6592624373734} +{"Pretrain/Learning Rate": 6.920324987095733e-06, "Pretrain/Loss": 1.9345248937606812, "Pretrain/Loss (Raw)": 2.0170481204986572, "Pretrain/Step": 7292, "Pretrain/Step Time": 8.661212695762515} +{"Pretrain/Learning Rate": 6.914462479548806e-06, "Pretrain/Loss": 1.9338798522949219, "Pretrain/Loss (Raw)": 1.7753243446350098, "Pretrain/Step": 7293, "Pretrain/Step Time": 8.65973244421184} +{"Pretrain/Learning Rate": 6.908602057711289e-06, "Pretrain/Loss": 1.9355067014694214, "Pretrain/Loss (Raw)": 2.152007818222046, "Pretrain/Step": 7294, "Pretrain/Step Time": 8.655677078291774} +{"Pretrain/Learning Rate": 6.902743722259025e-06, "Pretrain/Loss": 1.9357739686965942, "Pretrain/Loss (Raw)": 2.1435680389404297, "Pretrain/Step": 7295, "Pretrain/Step Time": 8.654924733564258} +{"Pretrain/Learning Rate": 6.8968874738676385e-06, "Pretrain/Loss": 1.936121940612793, "Pretrain/Loss (Raw)": 1.785883903503418, "Pretrain/Step": 7296, "Pretrain/Step Time": 8.657595243304968} +{"Pretrain/Learning Rate": 6.891033313212494e-06, "Pretrain/Loss": 1.935697078704834, "Pretrain/Loss (Raw)": 1.9143038988113403, "Pretrain/Step": 7297, "Pretrain/Step Time": 8.656180473044515} +{"Pretrain/Learning Rate": 6.885181240968719e-06, "Pretrain/Loss": 1.9372634887695312, "Pretrain/Loss (Raw)": 2.0410594940185547, "Pretrain/Step": 7298, "Pretrain/Step Time": 8.652849087491632} +{"Pretrain/Learning Rate": 6.879331257811195e-06, "Pretrain/Loss": 1.9403321743011475, "Pretrain/Loss (Raw)": 2.16033935546875, "Pretrain/Step": 7299, "Pretrain/Step Time": 8.65970721654594} +{"Pretrain/Learning Rate": 6.873483364414588e-06, "Pretrain/Loss": 1.9414465427398682, "Pretrain/Loss (Raw)": 2.0427587032318115, "Pretrain/Step": 7300, "Pretrain/Step Time": 8.658832913264632} +{"Pretrain/Learning Rate": 6.867637561453291e-06, "Pretrain/Loss": 1.9408944845199585, "Pretrain/Loss (Raw)": 1.9491640329360962, "Pretrain/Step": 7301, "Pretrain/Step Time": 8.656159745529294} +{"Pretrain/Learning Rate": 6.861793849601475e-06, "Pretrain/Loss": 1.9399495124816895, "Pretrain/Loss (Raw)": 1.765659213066101, "Pretrain/Step": 7302, "Pretrain/Step Time": 8.65483546629548} +{"Pretrain/Learning Rate": 6.855952229533055e-06, "Pretrain/Loss": 1.9389011859893799, "Pretrain/Loss (Raw)": 1.9372841119766235, "Pretrain/Step": 7303, "Pretrain/Step Time": 8.651568591594696} +{"Pretrain/Learning Rate": 6.8501127019217346e-06, "Pretrain/Loss": 1.9396240711212158, "Pretrain/Loss (Raw)": 1.921839952468872, "Pretrain/Step": 7304, "Pretrain/Step Time": 8.655102847144008} +{"Pretrain/Learning Rate": 6.844275267440931e-06, "Pretrain/Loss": 1.9406870603561401, "Pretrain/Loss (Raw)": 2.1883785724639893, "Pretrain/Step": 7305, "Pretrain/Step Time": 8.656425811350346} +{"Pretrain/Learning Rate": 6.838439926763859e-06, "Pretrain/Loss": 1.9398599863052368, "Pretrain/Loss (Raw)": 1.862591028213501, "Pretrain/Step": 7306, "Pretrain/Step Time": 8.654742110520601} +{"Pretrain/Learning Rate": 6.832606680563472e-06, "Pretrain/Loss": 1.9386351108551025, "Pretrain/Loss (Raw)": 1.9715609550476074, "Pretrain/Step": 7307, "Pretrain/Step Time": 8.66104706376791} +{"Pretrain/Learning Rate": 6.8267755295125024e-06, "Pretrain/Loss": 1.939948558807373, "Pretrain/Loss (Raw)": 2.069972038269043, "Pretrain/Step": 7308, "Pretrain/Step Time": 8.65876447968185} +{"Pretrain/Learning Rate": 6.820946474283399e-06, "Pretrain/Loss": 1.9401774406433105, "Pretrain/Loss (Raw)": 2.0219929218292236, "Pretrain/Step": 7309, "Pretrain/Step Time": 8.66137014515698} +{"Pretrain/Learning Rate": 6.815119515548418e-06, "Pretrain/Loss": 1.9401376247406006, "Pretrain/Loss (Raw)": 2.0159428119659424, "Pretrain/Step": 7310, "Pretrain/Step Time": 8.664224786683917} +{"Pretrain/Learning Rate": 6.809294653979545e-06, "Pretrain/Loss": 1.940961241722107, "Pretrain/Loss (Raw)": 1.868301510810852, "Pretrain/Step": 7311, "Pretrain/Step Time": 8.664851466193795} +{"Pretrain/Learning Rate": 6.803471890248531e-06, "Pretrain/Loss": 1.9442460536956787, "Pretrain/Loss (Raw)": 2.397724151611328, "Pretrain/Step": 7312, "Pretrain/Step Time": 8.66390996798873} +{"Pretrain/Learning Rate": 6.797651225026874e-06, "Pretrain/Loss": 1.9413204193115234, "Pretrain/Loss (Raw)": 1.7348380088806152, "Pretrain/Step": 7313, "Pretrain/Step Time": 8.667052360251546} +{"Pretrain/Learning Rate": 6.791832658985859e-06, "Pretrain/Loss": 1.9402294158935547, "Pretrain/Loss (Raw)": 2.054513931274414, "Pretrain/Step": 7314, "Pretrain/Step Time": 8.664160154759884} +{"Pretrain/Learning Rate": 6.786016192796499e-06, "Pretrain/Loss": 1.9408806562423706, "Pretrain/Loss (Raw)": 1.5905534029006958, "Pretrain/Step": 7315, "Pretrain/Step Time": 8.666721994057298} +{"Pretrain/Learning Rate": 6.7802018271295815e-06, "Pretrain/Loss": 1.939694881439209, "Pretrain/Loss (Raw)": 1.9100815057754517, "Pretrain/Step": 7316, "Pretrain/Step Time": 8.665502777323127} +{"Pretrain/Learning Rate": 6.774389562655634e-06, "Pretrain/Loss": 1.9405630826950073, "Pretrain/Loss (Raw)": 2.107424259185791, "Pretrain/Step": 7317, "Pretrain/Step Time": 8.665339475497603} +{"Pretrain/Learning Rate": 6.768579400044966e-06, "Pretrain/Loss": 1.9390790462493896, "Pretrain/Loss (Raw)": 2.024010419845581, "Pretrain/Step": 7318, "Pretrain/Step Time": 8.662742387503386} +{"Pretrain/Learning Rate": 6.762771339967644e-06, "Pretrain/Loss": 1.937552571296692, "Pretrain/Loss (Raw)": 1.8713537454605103, "Pretrain/Step": 7319, "Pretrain/Step Time": 8.660112161189318} +{"Pretrain/Learning Rate": 6.756965383093455e-06, "Pretrain/Loss": 1.9402742385864258, "Pretrain/Loss (Raw)": 2.040727138519287, "Pretrain/Step": 7320, "Pretrain/Step Time": 8.66135842166841} +{"Pretrain/Learning Rate": 6.751161530091988e-06, "Pretrain/Loss": 1.9416970014572144, "Pretrain/Loss (Raw)": 1.9947998523712158, "Pretrain/Step": 7321, "Pretrain/Step Time": 8.660197492688894} +{"Pretrain/Learning Rate": 6.745359781632565e-06, "Pretrain/Loss": 1.9433398246765137, "Pretrain/Loss (Raw)": 2.0787100791931152, "Pretrain/Step": 7322, "Pretrain/Step Time": 8.66268208809197} +{"Pretrain/Learning Rate": 6.739560138384271e-06, "Pretrain/Loss": 1.9423575401306152, "Pretrain/Loss (Raw)": 1.8034212589263916, "Pretrain/Step": 7323, "Pretrain/Step Time": 8.658097933977842} +{"Pretrain/Learning Rate": 6.733762601015942e-06, "Pretrain/Loss": 1.9439935684204102, "Pretrain/Loss (Raw)": 1.9975128173828125, "Pretrain/Step": 7324, "Pretrain/Step Time": 8.657995566725731} +{"Pretrain/Learning Rate": 6.727967170196186e-06, "Pretrain/Loss": 1.9445736408233643, "Pretrain/Loss (Raw)": 2.069246530532837, "Pretrain/Step": 7325, "Pretrain/Step Time": 8.661345031112432} +{"Pretrain/Learning Rate": 6.72217384659336e-06, "Pretrain/Loss": 1.9423189163208008, "Pretrain/Loss (Raw)": 1.9083572626113892, "Pretrain/Step": 7326, "Pretrain/Step Time": 8.65652123466134} +{"Pretrain/Learning Rate": 6.7163826308755725e-06, "Pretrain/Loss": 1.9423952102661133, "Pretrain/Loss (Raw)": 2.0712194442749023, "Pretrain/Step": 7327, "Pretrain/Step Time": 8.654978938400745} +{"Pretrain/Learning Rate": 6.7105935237106895e-06, "Pretrain/Loss": 1.9376440048217773, "Pretrain/Loss (Raw)": 1.7636973857879639, "Pretrain/Step": 7328, "Pretrain/Step Time": 8.65480018593371} +{"Pretrain/Learning Rate": 6.704806525766353e-06, "Pretrain/Loss": 1.9385117292404175, "Pretrain/Loss (Raw)": 1.981588363647461, "Pretrain/Step": 7329, "Pretrain/Step Time": 8.65622041746974} +{"Pretrain/Learning Rate": 6.699021637709935e-06, "Pretrain/Loss": 1.9404900074005127, "Pretrain/Loss (Raw)": 2.0709846019744873, "Pretrain/Step": 7330, "Pretrain/Step Time": 8.649848764762282} +{"Pretrain/Learning Rate": 6.693238860208578e-06, "Pretrain/Loss": 1.9402070045471191, "Pretrain/Loss (Raw)": 1.9475280046463013, "Pretrain/Step": 7331, "Pretrain/Step Time": 8.650388883426785} +{"Pretrain/Learning Rate": 6.687458193929172e-06, "Pretrain/Loss": 1.9378700256347656, "Pretrain/Loss (Raw)": 1.8350439071655273, "Pretrain/Step": 7332, "Pretrain/Step Time": 8.660053744912148} +{"Pretrain/Learning Rate": 6.681679639538388e-06, "Pretrain/Loss": 1.9372764825820923, "Pretrain/Loss (Raw)": 1.8629907369613647, "Pretrain/Step": 7333, "Pretrain/Step Time": 8.657254097983241} +{"Pretrain/Learning Rate": 6.675903197702627e-06, "Pretrain/Loss": 1.9391523599624634, "Pretrain/Loss (Raw)": 2.0279643535614014, "Pretrain/Step": 7334, "Pretrain/Step Time": 8.654223470017314} +{"Pretrain/Learning Rate": 6.6701288690880545e-06, "Pretrain/Loss": 1.9405739307403564, "Pretrain/Loss (Raw)": 2.093834638595581, "Pretrain/Step": 7335, "Pretrain/Step Time": 8.654838314279914} +{"Pretrain/Learning Rate": 6.664356654360588e-06, "Pretrain/Loss": 1.9387471675872803, "Pretrain/Loss (Raw)": 1.6761490106582642, "Pretrain/Step": 7336, "Pretrain/Step Time": 8.657577559351921} +{"Pretrain/Learning Rate": 6.658586554185916e-06, "Pretrain/Loss": 1.9385554790496826, "Pretrain/Loss (Raw)": 1.917323112487793, "Pretrain/Step": 7337, "Pretrain/Step Time": 8.65806321054697} +{"Pretrain/Learning Rate": 6.652818569229474e-06, "Pretrain/Loss": 1.9370203018188477, "Pretrain/Loss (Raw)": 1.8503823280334473, "Pretrain/Step": 7338, "Pretrain/Step Time": 8.653528228402138} +{"Pretrain/Learning Rate": 6.647052700156447e-06, "Pretrain/Loss": 1.9378243684768677, "Pretrain/Loss (Raw)": 2.1091647148132324, "Pretrain/Step": 7339, "Pretrain/Step Time": 8.657741628587246} +{"Pretrain/Learning Rate": 6.6412889476317765e-06, "Pretrain/Loss": 1.940293550491333, "Pretrain/Loss (Raw)": 1.9358547925949097, "Pretrain/Step": 7340, "Pretrain/Step Time": 8.657154200598598} +{"Pretrain/Learning Rate": 6.635527312320183e-06, "Pretrain/Loss": 1.941413402557373, "Pretrain/Loss (Raw)": 2.068127393722534, "Pretrain/Step": 7341, "Pretrain/Step Time": 8.658656632527709} +{"Pretrain/Learning Rate": 6.629767794886116e-06, "Pretrain/Loss": 1.9409894943237305, "Pretrain/Loss (Raw)": 1.7252734899520874, "Pretrain/Step": 7342, "Pretrain/Step Time": 8.662436749786139} +{"Pretrain/Learning Rate": 6.624010395993791e-06, "Pretrain/Loss": 1.9425671100616455, "Pretrain/Loss (Raw)": 1.8309564590454102, "Pretrain/Step": 7343, "Pretrain/Step Time": 8.659559017047286} +{"Pretrain/Learning Rate": 6.618255116307171e-06, "Pretrain/Loss": 1.9432690143585205, "Pretrain/Loss (Raw)": 1.9871046543121338, "Pretrain/Step": 7344, "Pretrain/Step Time": 8.661147067323327} +{"Pretrain/Learning Rate": 6.61250195649e-06, "Pretrain/Loss": 1.941910982131958, "Pretrain/Loss (Raw)": 1.8934098482131958, "Pretrain/Step": 7345, "Pretrain/Step Time": 8.65631160326302} +{"Pretrain/Learning Rate": 6.606750917205734e-06, "Pretrain/Loss": 1.9368624687194824, "Pretrain/Loss (Raw)": 1.2741444110870361, "Pretrain/Step": 7346, "Pretrain/Step Time": 8.66140483878553} +{"Pretrain/Learning Rate": 6.601001999117634e-06, "Pretrain/Loss": 1.9382410049438477, "Pretrain/Loss (Raw)": 2.1495895385742188, "Pretrain/Step": 7347, "Pretrain/Step Time": 8.65672893077135} +{"Pretrain/Learning Rate": 6.595255202888672e-06, "Pretrain/Loss": 1.9386132955551147, "Pretrain/Loss (Raw)": 2.029053211212158, "Pretrain/Step": 7348, "Pretrain/Step Time": 8.657027665525675} +{"Pretrain/Learning Rate": 6.589510529181622e-06, "Pretrain/Loss": 1.938653588294983, "Pretrain/Loss (Raw)": 2.0813262462615967, "Pretrain/Step": 7349, "Pretrain/Step Time": 8.657510865479708} +{"Pretrain/Learning Rate": 6.583767978658959e-06, "Pretrain/Loss": 1.9367833137512207, "Pretrain/Loss (Raw)": 1.7310903072357178, "Pretrain/Step": 7350, "Pretrain/Step Time": 8.651653667911887} +{"Pretrain/Learning Rate": 6.578027551982957e-06, "Pretrain/Loss": 1.9330499172210693, "Pretrain/Loss (Raw)": 1.8709304332733154, "Pretrain/Step": 7351, "Pretrain/Step Time": 8.653493721038103} +{"Pretrain/Learning Rate": 6.5722892498156165e-06, "Pretrain/Loss": 1.9350488185882568, "Pretrain/Loss (Raw)": 2.1051108837127686, "Pretrain/Step": 7352, "Pretrain/Step Time": 8.651014346629381} +{"Pretrain/Learning Rate": 6.566553072818729e-06, "Pretrain/Loss": 1.9353976249694824, "Pretrain/Loss (Raw)": 2.0006730556488037, "Pretrain/Step": 7353, "Pretrain/Step Time": 8.649578688666224} +{"Pretrain/Learning Rate": 6.560819021653791e-06, "Pretrain/Loss": 1.9360570907592773, "Pretrain/Loss (Raw)": 2.0833675861358643, "Pretrain/Step": 7354, "Pretrain/Step Time": 8.648035187274218} +{"Pretrain/Learning Rate": 6.555087096982096e-06, "Pretrain/Loss": 1.9384868144989014, "Pretrain/Loss (Raw)": 2.2017061710357666, "Pretrain/Step": 7355, "Pretrain/Step Time": 8.647021193057299} +{"Pretrain/Learning Rate": 6.549357299464673e-06, "Pretrain/Loss": 1.9389567375183105, "Pretrain/Loss (Raw)": 1.8952676057815552, "Pretrain/Step": 7356, "Pretrain/Step Time": 8.649364180862904} +{"Pretrain/Learning Rate": 6.54362962976231e-06, "Pretrain/Loss": 1.939095377922058, "Pretrain/Loss (Raw)": 1.9580011367797852, "Pretrain/Step": 7357, "Pretrain/Step Time": 8.645525744184852} +{"Pretrain/Learning Rate": 6.5379040885355376e-06, "Pretrain/Loss": 1.9374761581420898, "Pretrain/Loss (Raw)": 2.097834825515747, "Pretrain/Step": 7358, "Pretrain/Step Time": 8.650829574093223} +{"Pretrain/Learning Rate": 6.532180676444663e-06, "Pretrain/Loss": 1.936969518661499, "Pretrain/Loss (Raw)": 1.5453667640686035, "Pretrain/Step": 7359, "Pretrain/Step Time": 8.647755801677704} +{"Pretrain/Learning Rate": 6.52645939414975e-06, "Pretrain/Loss": 1.9369916915893555, "Pretrain/Loss (Raw)": 1.9333020448684692, "Pretrain/Step": 7360, "Pretrain/Step Time": 8.650563888251781} +{"Pretrain/Learning Rate": 6.5207402423105775e-06, "Pretrain/Loss": 1.9374064207077026, "Pretrain/Loss (Raw)": 1.9862858057022095, "Pretrain/Step": 7361, "Pretrain/Step Time": 8.648844469338655} +{"Pretrain/Learning Rate": 6.515023221586722e-06, "Pretrain/Loss": 1.9377833604812622, "Pretrain/Loss (Raw)": 1.9728004932403564, "Pretrain/Step": 7362, "Pretrain/Step Time": 8.651240846142173} +{"Pretrain/Learning Rate": 6.5093083326374954e-06, "Pretrain/Loss": 1.9386476278305054, "Pretrain/Loss (Raw)": 2.0244457721710205, "Pretrain/Step": 7363, "Pretrain/Step Time": 8.649252466857433} +{"Pretrain/Learning Rate": 6.50359557612196e-06, "Pretrain/Loss": 1.9372496604919434, "Pretrain/Loss (Raw)": 1.9756872653961182, "Pretrain/Step": 7364, "Pretrain/Step Time": 8.647918056696653} +{"Pretrain/Learning Rate": 6.497884952698935e-06, "Pretrain/Loss": 1.9338374137878418, "Pretrain/Loss (Raw)": 1.8683501482009888, "Pretrain/Step": 7365, "Pretrain/Step Time": 8.647060850635171} +{"Pretrain/Learning Rate": 6.492176463027009e-06, "Pretrain/Loss": 1.935298204421997, "Pretrain/Loss (Raw)": 2.0283775329589844, "Pretrain/Step": 7366, "Pretrain/Step Time": 8.640784129500389} +{"Pretrain/Learning Rate": 6.486470107764505e-06, "Pretrain/Loss": 1.9353806972503662, "Pretrain/Loss (Raw)": 2.084322690963745, "Pretrain/Step": 7367, "Pretrain/Step Time": 8.644544791430235} +{"Pretrain/Learning Rate": 6.480765887569506e-06, "Pretrain/Loss": 1.9336915016174316, "Pretrain/Loss (Raw)": 1.6535193920135498, "Pretrain/Step": 7368, "Pretrain/Step Time": 8.643974365666509} +{"Pretrain/Learning Rate": 6.475063803099846e-06, "Pretrain/Loss": 1.9348880052566528, "Pretrain/Loss (Raw)": 1.8944389820098877, "Pretrain/Step": 7369, "Pretrain/Step Time": 8.646744355559349} +{"Pretrain/Learning Rate": 6.469363855013125e-06, "Pretrain/Loss": 1.933955430984497, "Pretrain/Loss (Raw)": 1.8380546569824219, "Pretrain/Step": 7370, "Pretrain/Step Time": 8.64529113471508} +{"Pretrain/Learning Rate": 6.463666043966685e-06, "Pretrain/Loss": 1.9343066215515137, "Pretrain/Loss (Raw)": 2.0683605670928955, "Pretrain/Step": 7371, "Pretrain/Step Time": 8.6422627735883} +{"Pretrain/Learning Rate": 6.457970370617622e-06, "Pretrain/Loss": 1.9344840049743652, "Pretrain/Loss (Raw)": 1.7986027002334595, "Pretrain/Step": 7372, "Pretrain/Step Time": 8.643838519230485} +{"Pretrain/Learning Rate": 6.452276835622781e-06, "Pretrain/Loss": 1.9343780279159546, "Pretrain/Loss (Raw)": 1.9464012384414673, "Pretrain/Step": 7373, "Pretrain/Step Time": 8.645597841590643} +{"Pretrain/Learning Rate": 6.446585439638783e-06, "Pretrain/Loss": 1.9335814714431763, "Pretrain/Loss (Raw)": 1.9506206512451172, "Pretrain/Step": 7374, "Pretrain/Step Time": 8.646124802529812} +{"Pretrain/Learning Rate": 6.440896183321979e-06, "Pretrain/Loss": 1.9331384897232056, "Pretrain/Loss (Raw)": 1.8757059574127197, "Pretrain/Step": 7375, "Pretrain/Step Time": 8.646818483248353} +{"Pretrain/Learning Rate": 6.435209067328479e-06, "Pretrain/Loss": 1.9335715770721436, "Pretrain/Loss (Raw)": 2.014134407043457, "Pretrain/Step": 7376, "Pretrain/Step Time": 8.64611728489399} +{"Pretrain/Learning Rate": 6.429524092314143e-06, "Pretrain/Loss": 1.9325660467147827, "Pretrain/Loss (Raw)": 1.9682738780975342, "Pretrain/Step": 7377, "Pretrain/Step Time": 8.650020953267813} +{"Pretrain/Learning Rate": 6.423841258934604e-06, "Pretrain/Loss": 1.929718255996704, "Pretrain/Loss (Raw)": 1.803963541984558, "Pretrain/Step": 7378, "Pretrain/Step Time": 8.65360589697957} +{"Pretrain/Learning Rate": 6.418160567845224e-06, "Pretrain/Loss": 1.9318927526474, "Pretrain/Loss (Raw)": 2.049071788787842, "Pretrain/Step": 7379, "Pretrain/Step Time": 8.646350000053644} +{"Pretrain/Learning Rate": 6.412482019701127e-06, "Pretrain/Loss": 1.931222677230835, "Pretrain/Loss (Raw)": 1.9739880561828613, "Pretrain/Step": 7380, "Pretrain/Step Time": 8.652803717181087} +{"Pretrain/Learning Rate": 6.4068056151571855e-06, "Pretrain/Loss": 1.935089349746704, "Pretrain/Loss (Raw)": 2.1299736499786377, "Pretrain/Step": 7381, "Pretrain/Step Time": 8.651318497955799} +{"Pretrain/Learning Rate": 6.40113135486804e-06, "Pretrain/Loss": 1.9353587627410889, "Pretrain/Loss (Raw)": 1.9149249792099, "Pretrain/Step": 7382, "Pretrain/Step Time": 8.653454802930355} +{"Pretrain/Learning Rate": 6.395459239488069e-06, "Pretrain/Loss": 1.9323251247406006, "Pretrain/Loss (Raw)": 1.6527135372161865, "Pretrain/Step": 7383, "Pretrain/Step Time": 8.653901593759656} +{"Pretrain/Learning Rate": 6.389789269671403e-06, "Pretrain/Loss": 1.9305663108825684, "Pretrain/Loss (Raw)": 1.8724015951156616, "Pretrain/Step": 7384, "Pretrain/Step Time": 8.65197117626667} +{"Pretrain/Learning Rate": 6.384121446071928e-06, "Pretrain/Loss": 1.9326035976409912, "Pretrain/Loss (Raw)": 2.1004538536071777, "Pretrain/Step": 7385, "Pretrain/Step Time": 8.649463444948196} +{"Pretrain/Learning Rate": 6.378455769343302e-06, "Pretrain/Loss": 1.933828353881836, "Pretrain/Loss (Raw)": 1.9869242906570435, "Pretrain/Step": 7386, "Pretrain/Step Time": 8.648744411766529} +{"Pretrain/Learning Rate": 6.372792240138891e-06, "Pretrain/Loss": 1.9332959651947021, "Pretrain/Loss (Raw)": 2.042163848876953, "Pretrain/Step": 7387, "Pretrain/Step Time": 8.649161126464605} +{"Pretrain/Learning Rate": 6.3671308591118615e-06, "Pretrain/Loss": 1.9370366334915161, "Pretrain/Loss (Raw)": 2.1159205436706543, "Pretrain/Step": 7388, "Pretrain/Step Time": 8.648478155955672} +{"Pretrain/Learning Rate": 6.361471626915091e-06, "Pretrain/Loss": 1.9368960857391357, "Pretrain/Loss (Raw)": 1.7422548532485962, "Pretrain/Step": 7389, "Pretrain/Step Time": 8.646222436800599} +{"Pretrain/Learning Rate": 6.355814544201258e-06, "Pretrain/Loss": 1.9374192953109741, "Pretrain/Loss (Raw)": 2.1043426990509033, "Pretrain/Step": 7390, "Pretrain/Step Time": 8.647116305306554} +{"Pretrain/Learning Rate": 6.35015961162273e-06, "Pretrain/Loss": 1.9381122589111328, "Pretrain/Loss (Raw)": 1.927832841873169, "Pretrain/Step": 7391, "Pretrain/Step Time": 8.645630119368434} +{"Pretrain/Learning Rate": 6.344506829831684e-06, "Pretrain/Loss": 1.9376966953277588, "Pretrain/Loss (Raw)": 1.9345669746398926, "Pretrain/Step": 7392, "Pretrain/Step Time": 8.646808572113514} +{"Pretrain/Learning Rate": 6.3388561994800115e-06, "Pretrain/Loss": 1.9382905960083008, "Pretrain/Loss (Raw)": 2.0923244953155518, "Pretrain/Step": 7393, "Pretrain/Step Time": 8.65160339139402} +{"Pretrain/Learning Rate": 6.333207721219389e-06, "Pretrain/Loss": 1.9395731687545776, "Pretrain/Loss (Raw)": 2.1229403018951416, "Pretrain/Step": 7394, "Pretrain/Step Time": 8.6466324608773} +{"Pretrain/Learning Rate": 6.327561395701201e-06, "Pretrain/Loss": 1.9374256134033203, "Pretrain/Loss (Raw)": 1.821529507637024, "Pretrain/Step": 7395, "Pretrain/Step Time": 8.644776362925768} +{"Pretrain/Learning Rate": 6.321917223576626e-06, "Pretrain/Loss": 1.937671422958374, "Pretrain/Loss (Raw)": 1.9567584991455078, "Pretrain/Step": 7396, "Pretrain/Step Time": 8.646310774609447} +{"Pretrain/Learning Rate": 6.316275205496572e-06, "Pretrain/Loss": 1.9378936290740967, "Pretrain/Loss (Raw)": 1.9674469232559204, "Pretrain/Step": 7397, "Pretrain/Step Time": 8.650568157434464} +{"Pretrain/Learning Rate": 6.310635342111701e-06, "Pretrain/Loss": 1.9356575012207031, "Pretrain/Loss (Raw)": 1.6124398708343506, "Pretrain/Step": 7398, "Pretrain/Step Time": 8.648199189454317} +{"Pretrain/Learning Rate": 6.304997634072421e-06, "Pretrain/Loss": 1.935319423675537, "Pretrain/Loss (Raw)": 1.9363940954208374, "Pretrain/Step": 7399, "Pretrain/Step Time": 8.648312997072935} +{"Pretrain/Learning Rate": 6.299362082028909e-06, "Pretrain/Loss": 1.9356982707977295, "Pretrain/Loss (Raw)": 1.8010321855545044, "Pretrain/Step": 7400, "Pretrain/Step Time": 8.64556061848998} +{"Pretrain/Learning Rate": 6.293728686631095e-06, "Pretrain/Loss": 1.9358514547348022, "Pretrain/Loss (Raw)": 1.9839340448379517, "Pretrain/Step": 7401, "Pretrain/Step Time": 8.645652448758483} +{"Pretrain/Learning Rate": 6.288097448528624e-06, "Pretrain/Loss": 1.935408353805542, "Pretrain/Loss (Raw)": 1.8424535989761353, "Pretrain/Step": 7402, "Pretrain/Step Time": 8.64370259270072} +{"Pretrain/Learning Rate": 6.2824683683709335e-06, "Pretrain/Loss": 1.9344305992126465, "Pretrain/Loss (Raw)": 1.6307580471038818, "Pretrain/Step": 7403, "Pretrain/Step Time": 8.648092778399587} +{"Pretrain/Learning Rate": 6.2768414468071915e-06, "Pretrain/Loss": 1.934248447418213, "Pretrain/Loss (Raw)": 1.8971000909805298, "Pretrain/Step": 7404, "Pretrain/Step Time": 8.647283263504505} +{"Pretrain/Learning Rate": 6.27121668448632e-06, "Pretrain/Loss": 1.92825448513031, "Pretrain/Loss (Raw)": 1.415652871131897, "Pretrain/Step": 7405, "Pretrain/Step Time": 8.649411018937826} +{"Pretrain/Learning Rate": 6.265594082056986e-06, "Pretrain/Loss": 1.926468849182129, "Pretrain/Loss (Raw)": 1.9050973653793335, "Pretrain/Step": 7406, "Pretrain/Step Time": 8.652258405461907} +{"Pretrain/Learning Rate": 6.25997364016763e-06, "Pretrain/Loss": 1.927780270576477, "Pretrain/Loss (Raw)": 2.0538792610168457, "Pretrain/Step": 7407, "Pretrain/Step Time": 8.651928713545203} +{"Pretrain/Learning Rate": 6.254355359466418e-06, "Pretrain/Loss": 1.927915334701538, "Pretrain/Loss (Raw)": 2.0245609283447266, "Pretrain/Step": 7408, "Pretrain/Step Time": 8.648752622306347} +{"Pretrain/Learning Rate": 6.248739240601282e-06, "Pretrain/Loss": 1.9305181503295898, "Pretrain/Loss (Raw)": 1.8834182024002075, "Pretrain/Step": 7409, "Pretrain/Step Time": 8.644972544163465} +{"Pretrain/Learning Rate": 6.243125284219883e-06, "Pretrain/Loss": 1.9306695461273193, "Pretrain/Loss (Raw)": 1.9866852760314941, "Pretrain/Step": 7410, "Pretrain/Step Time": 8.649194749072194} +{"Pretrain/Learning Rate": 6.237513490969674e-06, "Pretrain/Loss": 1.9330201148986816, "Pretrain/Loss (Raw)": 1.9439737796783447, "Pretrain/Step": 7411, "Pretrain/Step Time": 8.646145433187485} +{"Pretrain/Learning Rate": 6.231903861497817e-06, "Pretrain/Loss": 1.9358234405517578, "Pretrain/Loss (Raw)": 2.201416492462158, "Pretrain/Step": 7412, "Pretrain/Step Time": 8.643990639597178} +{"Pretrain/Learning Rate": 6.226296396451245e-06, "Pretrain/Loss": 1.9372665882110596, "Pretrain/Loss (Raw)": 2.133178949356079, "Pretrain/Step": 7413, "Pretrain/Step Time": 8.643941946327686} +{"Pretrain/Learning Rate": 6.2206910964766325e-06, "Pretrain/Loss": 1.935608148574829, "Pretrain/Loss (Raw)": 1.4856789112091064, "Pretrain/Step": 7414, "Pretrain/Step Time": 8.645671058446169} +{"Pretrain/Learning Rate": 6.21508796222042e-06, "Pretrain/Loss": 1.9354424476623535, "Pretrain/Loss (Raw)": 2.020930051803589, "Pretrain/Step": 7415, "Pretrain/Step Time": 8.645474085584283} +{"Pretrain/Learning Rate": 6.2094869943287805e-06, "Pretrain/Loss": 1.9382719993591309, "Pretrain/Loss (Raw)": 2.004162549972534, "Pretrain/Step": 7416, "Pretrain/Step Time": 8.648330034688115} +{"Pretrain/Learning Rate": 6.203888193447646e-06, "Pretrain/Loss": 1.939197301864624, "Pretrain/Loss (Raw)": 2.121406078338623, "Pretrain/Step": 7417, "Pretrain/Step Time": 8.647489519789815} +{"Pretrain/Learning Rate": 6.198291560222685e-06, "Pretrain/Loss": 1.942783236503601, "Pretrain/Loss (Raw)": 1.9246454238891602, "Pretrain/Step": 7418, "Pretrain/Step Time": 8.655959041789174} +{"Pretrain/Learning Rate": 6.192697095299349e-06, "Pretrain/Loss": 1.9428112506866455, "Pretrain/Loss (Raw)": 1.8165597915649414, "Pretrain/Step": 7419, "Pretrain/Step Time": 8.654401022940874} +{"Pretrain/Learning Rate": 6.187104799322804e-06, "Pretrain/Loss": 1.941820502281189, "Pretrain/Loss (Raw)": 1.8902218341827393, "Pretrain/Step": 7420, "Pretrain/Step Time": 8.652554316446185} +{"Pretrain/Learning Rate": 6.1815146729379855e-06, "Pretrain/Loss": 1.941525936126709, "Pretrain/Loss (Raw)": 1.7376152276992798, "Pretrain/Step": 7421, "Pretrain/Step Time": 8.655050544068217} +{"Pretrain/Learning Rate": 6.17592671678956e-06, "Pretrain/Loss": 1.9412124156951904, "Pretrain/Loss (Raw)": 2.1118760108947754, "Pretrain/Step": 7422, "Pretrain/Step Time": 8.65635178424418} +{"Pretrain/Learning Rate": 6.170340931521976e-06, "Pretrain/Loss": 1.9388384819030762, "Pretrain/Loss (Raw)": 1.839707851409912, "Pretrain/Step": 7423, "Pretrain/Step Time": 8.656935047358274} +{"Pretrain/Learning Rate": 6.164757317779404e-06, "Pretrain/Loss": 1.9385768175125122, "Pretrain/Loss (Raw)": 1.7523943185806274, "Pretrain/Step": 7424, "Pretrain/Step Time": 8.653998071327806} +{"Pretrain/Learning Rate": 6.159175876205775e-06, "Pretrain/Loss": 1.9387683868408203, "Pretrain/Loss (Raw)": 1.938823938369751, "Pretrain/Step": 7425, "Pretrain/Step Time": 8.656114151701331} +{"Pretrain/Learning Rate": 6.153596607444756e-06, "Pretrain/Loss": 1.9376976490020752, "Pretrain/Loss (Raw)": 1.9040133953094482, "Pretrain/Step": 7426, "Pretrain/Step Time": 8.659275818616152} +{"Pretrain/Learning Rate": 6.148019512139797e-06, "Pretrain/Loss": 1.9353079795837402, "Pretrain/Loss (Raw)": 1.8544461727142334, "Pretrain/Step": 7427, "Pretrain/Step Time": 8.657322347164154} +{"Pretrain/Learning Rate": 6.142444590934046e-06, "Pretrain/Loss": 1.9346624612808228, "Pretrain/Loss (Raw)": 1.9601458311080933, "Pretrain/Step": 7428, "Pretrain/Step Time": 8.656481290236115} +{"Pretrain/Learning Rate": 6.136871844470454e-06, "Pretrain/Loss": 1.9346158504486084, "Pretrain/Loss (Raw)": 1.9431885480880737, "Pretrain/Step": 7429, "Pretrain/Step Time": 8.657486325129867} +{"Pretrain/Learning Rate": 6.131301273391679e-06, "Pretrain/Loss": 1.9347230195999146, "Pretrain/Loss (Raw)": 1.7793700695037842, "Pretrain/Step": 7430, "Pretrain/Step Time": 8.658584624528885} +{"Pretrain/Learning Rate": 6.125732878340168e-06, "Pretrain/Loss": 1.9345192909240723, "Pretrain/Loss (Raw)": 1.9112133979797363, "Pretrain/Step": 7431, "Pretrain/Step Time": 8.660260995849967} +{"Pretrain/Learning Rate": 6.120166659958065e-06, "Pretrain/Loss": 1.9348950386047363, "Pretrain/Loss (Raw)": 1.9699522256851196, "Pretrain/Step": 7432, "Pretrain/Step Time": 8.660249510779977} +{"Pretrain/Learning Rate": 6.1146026188873134e-06, "Pretrain/Loss": 1.9347645044326782, "Pretrain/Loss (Raw)": 2.171658754348755, "Pretrain/Step": 7433, "Pretrain/Step Time": 8.65974754281342} +{"Pretrain/Learning Rate": 6.1090407557695735e-06, "Pretrain/Loss": 1.9334520101547241, "Pretrain/Loss (Raw)": 1.694580078125, "Pretrain/Step": 7434, "Pretrain/Step Time": 8.664374167099595} +{"Pretrain/Learning Rate": 6.103481071246284e-06, "Pretrain/Loss": 1.9348039627075195, "Pretrain/Loss (Raw)": 2.1446268558502197, "Pretrain/Step": 7435, "Pretrain/Step Time": 8.657645139843225} +{"Pretrain/Learning Rate": 6.097923565958588e-06, "Pretrain/Loss": 1.9334056377410889, "Pretrain/Loss (Raw)": 1.8909868001937866, "Pretrain/Step": 7436, "Pretrain/Step Time": 8.662573242560029} +{"Pretrain/Learning Rate": 6.092368240547422e-06, "Pretrain/Loss": 1.9328371286392212, "Pretrain/Loss (Raw)": 1.9492253065109253, "Pretrain/Step": 7437, "Pretrain/Step Time": 8.657984528690577} +{"Pretrain/Learning Rate": 6.0868150956534445e-06, "Pretrain/Loss": 1.9319732189178467, "Pretrain/Loss (Raw)": 1.9053456783294678, "Pretrain/Step": 7438, "Pretrain/Step Time": 8.65617385134101} +{"Pretrain/Learning Rate": 6.081264131917075e-06, "Pretrain/Loss": 1.9326395988464355, "Pretrain/Loss (Raw)": 1.9535962343215942, "Pretrain/Step": 7439, "Pretrain/Step Time": 8.65801564231515} +{"Pretrain/Learning Rate": 6.075715349978464e-06, "Pretrain/Loss": 1.9269195795059204, "Pretrain/Loss (Raw)": 1.6655757427215576, "Pretrain/Step": 7440, "Pretrain/Step Time": 8.657668899744749} +{"Pretrain/Learning Rate": 6.070168750477534e-06, "Pretrain/Loss": 1.9265666007995605, "Pretrain/Loss (Raw)": 1.6896636486053467, "Pretrain/Step": 7441, "Pretrain/Step Time": 8.658750481903553} +{"Pretrain/Learning Rate": 6.0646243340539584e-06, "Pretrain/Loss": 1.9243981838226318, "Pretrain/Loss (Raw)": 1.7769454717636108, "Pretrain/Step": 7442, "Pretrain/Step Time": 8.6582122258842} +{"Pretrain/Learning Rate": 6.059082101347119e-06, "Pretrain/Loss": 1.9273812770843506, "Pretrain/Loss (Raw)": 1.9723799228668213, "Pretrain/Step": 7443, "Pretrain/Step Time": 8.657652342692018} +{"Pretrain/Learning Rate": 6.053542052996189e-06, "Pretrain/Loss": 1.9279382228851318, "Pretrain/Loss (Raw)": 1.9813724756240845, "Pretrain/Step": 7444, "Pretrain/Step Time": 8.656389674171805} +{"Pretrain/Learning Rate": 6.048004189640061e-06, "Pretrain/Loss": 1.9292527437210083, "Pretrain/Loss (Raw)": 2.275692939758301, "Pretrain/Step": 7445, "Pretrain/Step Time": 8.660151176154613} +{"Pretrain/Learning Rate": 6.0424685119174095e-06, "Pretrain/Loss": 1.9306037425994873, "Pretrain/Loss (Raw)": 2.1969363689422607, "Pretrain/Step": 7446, "Pretrain/Step Time": 8.663388688117266} +{"Pretrain/Learning Rate": 6.036935020466605e-06, "Pretrain/Loss": 1.931107997894287, "Pretrain/Loss (Raw)": 1.9358975887298584, "Pretrain/Step": 7447, "Pretrain/Step Time": 8.663202309980989} +{"Pretrain/Learning Rate": 6.031403715925818e-06, "Pretrain/Loss": 1.9297153949737549, "Pretrain/Loss (Raw)": 1.8624814748764038, "Pretrain/Step": 7448, "Pretrain/Step Time": 8.661667885258794} +{"Pretrain/Learning Rate": 6.025874598932937e-06, "Pretrain/Loss": 1.9294030666351318, "Pretrain/Loss (Raw)": 1.954813838005066, "Pretrain/Step": 7449, "Pretrain/Step Time": 8.662382503971457} +{"Pretrain/Learning Rate": 6.020347670125606e-06, "Pretrain/Loss": 1.9283922910690308, "Pretrain/Loss (Raw)": 1.9493287801742554, "Pretrain/Step": 7450, "Pretrain/Step Time": 8.662060510367155} +{"Pretrain/Learning Rate": 6.014822930141212e-06, "Pretrain/Loss": 1.9303257465362549, "Pretrain/Loss (Raw)": 2.050912380218506, "Pretrain/Step": 7451, "Pretrain/Step Time": 8.663574207574129} +{"Pretrain/Learning Rate": 6.0093003796169026e-06, "Pretrain/Loss": 1.9286694526672363, "Pretrain/Loss (Raw)": 1.785494327545166, "Pretrain/Step": 7452, "Pretrain/Step Time": 8.66202418319881} +{"Pretrain/Learning Rate": 6.003780019189565e-06, "Pretrain/Loss": 1.9272855520248413, "Pretrain/Loss (Raw)": 1.892113447189331, "Pretrain/Step": 7453, "Pretrain/Step Time": 8.65878919325769} +{"Pretrain/Learning Rate": 5.998261849495826e-06, "Pretrain/Loss": 1.9311226606369019, "Pretrain/Loss (Raw)": 2.3995039463043213, "Pretrain/Step": 7454, "Pretrain/Step Time": 8.661269107833505} +{"Pretrain/Learning Rate": 5.9927458711720615e-06, "Pretrain/Loss": 1.9307342767715454, "Pretrain/Loss (Raw)": 2.0215084552764893, "Pretrain/Step": 7455, "Pretrain/Step Time": 8.664640014991164} +{"Pretrain/Learning Rate": 5.9872320848544165e-06, "Pretrain/Loss": 1.9314589500427246, "Pretrain/Loss (Raw)": 1.8564623594284058, "Pretrain/Step": 7456, "Pretrain/Step Time": 8.665646469220519} +{"Pretrain/Learning Rate": 5.9817204911787576e-06, "Pretrain/Loss": 1.929226279258728, "Pretrain/Loss (Raw)": 1.695802092552185, "Pretrain/Step": 7457, "Pretrain/Step Time": 8.667079612612724} +{"Pretrain/Learning Rate": 5.976211090780712e-06, "Pretrain/Loss": 1.9272637367248535, "Pretrain/Loss (Raw)": 1.8197777271270752, "Pretrain/Step": 7458, "Pretrain/Step Time": 8.673036403954029} +{"Pretrain/Learning Rate": 5.970703884295636e-06, "Pretrain/Loss": 1.9266748428344727, "Pretrain/Loss (Raw)": 1.8721486330032349, "Pretrain/Step": 7459, "Pretrain/Step Time": 8.674351409077644} +{"Pretrain/Learning Rate": 5.965198872358665e-06, "Pretrain/Loss": 1.929875373840332, "Pretrain/Loss (Raw)": 2.2446999549865723, "Pretrain/Step": 7460, "Pretrain/Step Time": 8.667909884825349} +{"Pretrain/Learning Rate": 5.959696055604655e-06, "Pretrain/Loss": 1.9258198738098145, "Pretrain/Loss (Raw)": 1.3438990116119385, "Pretrain/Step": 7461, "Pretrain/Step Time": 8.66645989753306} +{"Pretrain/Learning Rate": 5.9541954346682165e-06, "Pretrain/Loss": 1.922441005706787, "Pretrain/Loss (Raw)": 1.5954796075820923, "Pretrain/Step": 7462, "Pretrain/Step Time": 8.665848281234503} +{"Pretrain/Learning Rate": 5.948697010183701e-06, "Pretrain/Loss": 1.9223817586898804, "Pretrain/Loss (Raw)": 2.086235761642456, "Pretrain/Step": 7463, "Pretrain/Step Time": 8.663841336965561} +{"Pretrain/Learning Rate": 5.943200782785227e-06, "Pretrain/Loss": 1.9246149063110352, "Pretrain/Loss (Raw)": 1.9619938135147095, "Pretrain/Step": 7464, "Pretrain/Step Time": 8.658576404675841} +{"Pretrain/Learning Rate": 5.937706753106634e-06, "Pretrain/Loss": 1.9249475002288818, "Pretrain/Loss (Raw)": 1.959902286529541, "Pretrain/Step": 7465, "Pretrain/Step Time": 8.660592496395111} +{"Pretrain/Learning Rate": 5.932214921781526e-06, "Pretrain/Loss": 1.9245126247406006, "Pretrain/Loss (Raw)": 1.7947218418121338, "Pretrain/Step": 7466, "Pretrain/Step Time": 8.673439096659422} +{"Pretrain/Learning Rate": 5.9267252894432355e-06, "Pretrain/Loss": 1.9223006963729858, "Pretrain/Loss (Raw)": 1.826036810874939, "Pretrain/Step": 7467, "Pretrain/Step Time": 8.671447318047285} +{"Pretrain/Learning Rate": 5.921237856724867e-06, "Pretrain/Loss": 1.9236972332000732, "Pretrain/Loss (Raw)": 2.1146059036254883, "Pretrain/Step": 7468, "Pretrain/Step Time": 8.665970969945192} +{"Pretrain/Learning Rate": 5.915752624259252e-06, "Pretrain/Loss": 1.9248480796813965, "Pretrain/Loss (Raw)": 2.215435028076172, "Pretrain/Step": 7469, "Pretrain/Step Time": 8.665764717385173} +{"Pretrain/Learning Rate": 5.910269592678971e-06, "Pretrain/Loss": 1.9271960258483887, "Pretrain/Loss (Raw)": 2.0258126258850098, "Pretrain/Step": 7470, "Pretrain/Step Time": 8.66096450202167} +{"Pretrain/Learning Rate": 5.904788762616348e-06, "Pretrain/Loss": 1.9290542602539062, "Pretrain/Loss (Raw)": 2.0688140392303467, "Pretrain/Step": 7471, "Pretrain/Step Time": 8.665321167558432} +{"Pretrain/Learning Rate": 5.899310134703479e-06, "Pretrain/Loss": 1.9295055866241455, "Pretrain/Loss (Raw)": 2.0448687076568604, "Pretrain/Step": 7472, "Pretrain/Step Time": 8.662058552727103} +{"Pretrain/Learning Rate": 5.893833709572155e-06, "Pretrain/Loss": 1.9311277866363525, "Pretrain/Loss (Raw)": 2.101057767868042, "Pretrain/Step": 7473, "Pretrain/Step Time": 8.665718514472246} +{"Pretrain/Learning Rate": 5.88835948785397e-06, "Pretrain/Loss": 1.9370291233062744, "Pretrain/Loss (Raw)": 2.0295088291168213, "Pretrain/Step": 7474, "Pretrain/Step Time": 8.661220751702785} +{"Pretrain/Learning Rate": 5.882887470180215e-06, "Pretrain/Loss": 1.9338186979293823, "Pretrain/Loss (Raw)": 1.7386562824249268, "Pretrain/Step": 7475, "Pretrain/Step Time": 8.66207586787641} +{"Pretrain/Learning Rate": 5.877417657181975e-06, "Pretrain/Loss": 1.9321825504302979, "Pretrain/Loss (Raw)": 1.8196299076080322, "Pretrain/Step": 7476, "Pretrain/Step Time": 8.663681242614985} +{"Pretrain/Learning Rate": 5.871950049490024e-06, "Pretrain/Loss": 1.9316227436065674, "Pretrain/Loss (Raw)": 2.0096755027770996, "Pretrain/Step": 7477, "Pretrain/Step Time": 8.664575522765517} +{"Pretrain/Learning Rate": 5.866484647734935e-06, "Pretrain/Loss": 1.932462215423584, "Pretrain/Loss (Raw)": 1.8385350704193115, "Pretrain/Step": 7478, "Pretrain/Step Time": 8.66629472374916} +{"Pretrain/Learning Rate": 5.861021452546997e-06, "Pretrain/Loss": 1.9323811531066895, "Pretrain/Loss (Raw)": 1.860549807548523, "Pretrain/Step": 7479, "Pretrain/Step Time": 8.662799928337336} +{"Pretrain/Learning Rate": 5.855560464556253e-06, "Pretrain/Loss": 1.9304423332214355, "Pretrain/Loss (Raw)": 1.8569356203079224, "Pretrain/Step": 7480, "Pretrain/Step Time": 8.663560690358281} +{"Pretrain/Learning Rate": 5.8501016843924785e-06, "Pretrain/Loss": 1.9312238693237305, "Pretrain/Loss (Raw)": 2.1007080078125, "Pretrain/Step": 7481, "Pretrain/Step Time": 8.666760064661503} +{"Pretrain/Learning Rate": 5.844645112685215e-06, "Pretrain/Loss": 1.9313722848892212, "Pretrain/Loss (Raw)": 2.1023809909820557, "Pretrain/Step": 7482, "Pretrain/Step Time": 8.674240095540881} +{"Pretrain/Learning Rate": 5.839190750063756e-06, "Pretrain/Loss": 1.929439902305603, "Pretrain/Loss (Raw)": 1.9543535709381104, "Pretrain/Step": 7483, "Pretrain/Step Time": 8.673980075865984} +{"Pretrain/Learning Rate": 5.833738597157093e-06, "Pretrain/Loss": 1.929809331893921, "Pretrain/Loss (Raw)": 1.9425703287124634, "Pretrain/Step": 7484, "Pretrain/Step Time": 8.674423485994339} +{"Pretrain/Learning Rate": 5.828288654594016e-06, "Pretrain/Loss": 1.9295355081558228, "Pretrain/Loss (Raw)": 1.9229369163513184, "Pretrain/Step": 7485, "Pretrain/Step Time": 8.676711717620492} +{"Pretrain/Learning Rate": 5.822840923003023e-06, "Pretrain/Loss": 1.9290322065353394, "Pretrain/Loss (Raw)": 2.033416271209717, "Pretrain/Step": 7486, "Pretrain/Step Time": 8.673748072236776} +{"Pretrain/Learning Rate": 5.817395403012396e-06, "Pretrain/Loss": 1.933270812034607, "Pretrain/Loss (Raw)": 2.0879013538360596, "Pretrain/Step": 7487, "Pretrain/Step Time": 8.668195629492402} +{"Pretrain/Learning Rate": 5.8119520952501085e-06, "Pretrain/Loss": 1.932724118232727, "Pretrain/Loss (Raw)": 1.8633251190185547, "Pretrain/Step": 7488, "Pretrain/Step Time": 8.666914505884051} +{"Pretrain/Learning Rate": 5.806511000343931e-06, "Pretrain/Loss": 1.9325768947601318, "Pretrain/Loss (Raw)": 1.9674445390701294, "Pretrain/Step": 7489, "Pretrain/Step Time": 8.664605256170034} +{"Pretrain/Learning Rate": 5.801072118921347e-06, "Pretrain/Loss": 1.9330308437347412, "Pretrain/Loss (Raw)": 2.0309059619903564, "Pretrain/Step": 7490, "Pretrain/Step Time": 8.664575098082423} +{"Pretrain/Learning Rate": 5.7956354516095935e-06, "Pretrain/Loss": 1.932340145111084, "Pretrain/Loss (Raw)": 1.936028003692627, "Pretrain/Step": 7491, "Pretrain/Step Time": 8.667448580265045} +{"Pretrain/Learning Rate": 5.790200999035647e-06, "Pretrain/Loss": 1.932680368423462, "Pretrain/Loss (Raw)": 2.019252300262451, "Pretrain/Step": 7492, "Pretrain/Step Time": 8.666248366236687} +{"Pretrain/Learning Rate": 5.784768761826248e-06, "Pretrain/Loss": 1.9340726137161255, "Pretrain/Loss (Raw)": 2.046549081802368, "Pretrain/Step": 7493, "Pretrain/Step Time": 8.665539490059018} +{"Pretrain/Learning Rate": 5.779338740607859e-06, "Pretrain/Loss": 1.934309482574463, "Pretrain/Loss (Raw)": 2.058696985244751, "Pretrain/Step": 7494, "Pretrain/Step Time": 8.667517812922597} +{"Pretrain/Learning Rate": 5.773910936006699e-06, "Pretrain/Loss": 1.9325872659683228, "Pretrain/Loss (Raw)": 1.8638830184936523, "Pretrain/Step": 7495, "Pretrain/Step Time": 8.666029652580619} +{"Pretrain/Learning Rate": 5.768485348648719e-06, "Pretrain/Loss": 1.9347925186157227, "Pretrain/Loss (Raw)": 1.935788631439209, "Pretrain/Step": 7496, "Pretrain/Step Time": 8.664333498105407} +{"Pretrain/Learning Rate": 5.763061979159637e-06, "Pretrain/Loss": 1.9346609115600586, "Pretrain/Loss (Raw)": 1.8775832653045654, "Pretrain/Step": 7497, "Pretrain/Step Time": 8.67129236459732} +{"Pretrain/Learning Rate": 5.757640828164895e-06, "Pretrain/Loss": 1.9366533756256104, "Pretrain/Loss (Raw)": 2.093106269836426, "Pretrain/Step": 7498, "Pretrain/Step Time": 8.67342589981854} +{"Pretrain/Learning Rate": 5.7522218962896865e-06, "Pretrain/Loss": 1.9344656467437744, "Pretrain/Loss (Raw)": 1.7883200645446777, "Pretrain/Step": 7499, "Pretrain/Step Time": 8.680285232141614} +{"Pretrain/Learning Rate": 5.746805184158941e-06, "Pretrain/Loss": 1.937694787979126, "Pretrain/Loss (Raw)": 2.211942434310913, "Pretrain/Step": 7500, "Pretrain/Step Time": 8.676678452640772} +{"Pretrain/Learning Rate": 5.74139069239735e-06, "Pretrain/Loss": 1.9351913928985596, "Pretrain/Loss (Raw)": 1.6259552240371704, "Pretrain/Step": 7501, "Pretrain/Step Time": 8.677780756726861} +{"Pretrain/Learning Rate": 5.735978421629337e-06, "Pretrain/Loss": 1.9328583478927612, "Pretrain/Loss (Raw)": 1.651989459991455, "Pretrain/Step": 7502, "Pretrain/Step Time": 8.675254318863153} +{"Pretrain/Learning Rate": 5.730568372479064e-06, "Pretrain/Loss": 1.9339505434036255, "Pretrain/Loss (Raw)": 2.015514850616455, "Pretrain/Step": 7503, "Pretrain/Step Time": 8.676774768158793} +{"Pretrain/Learning Rate": 5.725160545570443e-06, "Pretrain/Loss": 1.9351632595062256, "Pretrain/Loss (Raw)": 2.169353723526001, "Pretrain/Step": 7504, "Pretrain/Step Time": 8.677380342036486} +{"Pretrain/Learning Rate": 5.719754941527139e-06, "Pretrain/Loss": 1.9325859546661377, "Pretrain/Loss (Raw)": 1.6383776664733887, "Pretrain/Step": 7505, "Pretrain/Step Time": 8.679145051166415} +{"Pretrain/Learning Rate": 5.7143515609725475e-06, "Pretrain/Loss": 1.9341740608215332, "Pretrain/Loss (Raw)": 2.007251739501953, "Pretrain/Step": 7506, "Pretrain/Step Time": 8.67691277526319} +{"Pretrain/Learning Rate": 5.7089504045298115e-06, "Pretrain/Loss": 1.9345593452453613, "Pretrain/Loss (Raw)": 2.0983810424804688, "Pretrain/Step": 7507, "Pretrain/Step Time": 8.679528733715415} +{"Pretrain/Learning Rate": 5.703551472821808e-06, "Pretrain/Loss": 1.9319570064544678, "Pretrain/Loss (Raw)": 1.6408969163894653, "Pretrain/Step": 7508, "Pretrain/Step Time": 8.675113186240196} +{"Pretrain/Learning Rate": 5.698154766471186e-06, "Pretrain/Loss": 1.9311168193817139, "Pretrain/Loss (Raw)": 2.0224194526672363, "Pretrain/Step": 7509, "Pretrain/Step Time": 8.675160147249699} +{"Pretrain/Learning Rate": 5.692760286100307e-06, "Pretrain/Loss": 1.9320809841156006, "Pretrain/Loss (Raw)": 2.0383334159851074, "Pretrain/Step": 7510, "Pretrain/Step Time": 8.678256692364812} +{"Pretrain/Learning Rate": 5.6873680323312916e-06, "Pretrain/Loss": 1.935354232788086, "Pretrain/Loss (Raw)": 2.071712017059326, "Pretrain/Step": 7511, "Pretrain/Step Time": 8.675106402486563} +{"Pretrain/Learning Rate": 5.681978005785993e-06, "Pretrain/Loss": 1.936894416809082, "Pretrain/Loss (Raw)": 2.0695149898529053, "Pretrain/Step": 7512, "Pretrain/Step Time": 8.679900106042624} +{"Pretrain/Learning Rate": 5.676590207086035e-06, "Pretrain/Loss": 1.9374606609344482, "Pretrain/Loss (Raw)": 2.1729540824890137, "Pretrain/Step": 7513, "Pretrain/Step Time": 8.679409984499216} +{"Pretrain/Learning Rate": 5.671204636852734e-06, "Pretrain/Loss": 1.9361114501953125, "Pretrain/Loss (Raw)": 1.814228892326355, "Pretrain/Step": 7514, "Pretrain/Step Time": 8.68602529540658} +{"Pretrain/Learning Rate": 5.6658212957071995e-06, "Pretrain/Loss": 1.9360008239746094, "Pretrain/Loss (Raw)": 2.0279927253723145, "Pretrain/Step": 7515, "Pretrain/Step Time": 8.685839522629976} +{"Pretrain/Learning Rate": 5.6604401842702545e-06, "Pretrain/Loss": 1.9362566471099854, "Pretrain/Loss (Raw)": 2.1486704349517822, "Pretrain/Step": 7516, "Pretrain/Step Time": 8.68527497164905} +{"Pretrain/Learning Rate": 5.6550613031624925e-06, "Pretrain/Loss": 1.9377115964889526, "Pretrain/Loss (Raw)": 1.9284887313842773, "Pretrain/Step": 7517, "Pretrain/Step Time": 8.685904916375875} +{"Pretrain/Learning Rate": 5.649684653004203e-06, "Pretrain/Loss": 1.9313123226165771, "Pretrain/Loss (Raw)": 1.2852274179458618, "Pretrain/Step": 7518, "Pretrain/Step Time": 8.688881497830153} +{"Pretrain/Learning Rate": 5.644310234415467e-06, "Pretrain/Loss": 1.9328150749206543, "Pretrain/Loss (Raw)": 2.1202034950256348, "Pretrain/Step": 7519, "Pretrain/Step Time": 8.687809906899929} +{"Pretrain/Learning Rate": 5.638938048016082e-06, "Pretrain/Loss": 1.9324016571044922, "Pretrain/Loss (Raw)": 1.8816274404525757, "Pretrain/Step": 7520, "Pretrain/Step Time": 8.686329808086157} +{"Pretrain/Learning Rate": 5.633568094425593e-06, "Pretrain/Loss": 1.9318742752075195, "Pretrain/Loss (Raw)": 2.024834394454956, "Pretrain/Step": 7521, "Pretrain/Step Time": 8.681211046874523} +{"Pretrain/Learning Rate": 5.6282003742632846e-06, "Pretrain/Loss": 1.931300401687622, "Pretrain/Loss (Raw)": 2.049475908279419, "Pretrain/Step": 7522, "Pretrain/Step Time": 8.684433076530695} +{"Pretrain/Learning Rate": 5.622834888148188e-06, "Pretrain/Loss": 1.931822657585144, "Pretrain/Loss (Raw)": 1.8883917331695557, "Pretrain/Step": 7523, "Pretrain/Step Time": 8.683852711692452} +{"Pretrain/Learning Rate": 5.617471636699098e-06, "Pretrain/Loss": 1.9322922229766846, "Pretrain/Loss (Raw)": 2.0168614387512207, "Pretrain/Step": 7524, "Pretrain/Step Time": 8.68533713184297} +{"Pretrain/Learning Rate": 5.612110620534497e-06, "Pretrain/Loss": 1.9306155443191528, "Pretrain/Loss (Raw)": 1.7528234720230103, "Pretrain/Step": 7525, "Pretrain/Step Time": 8.68179938942194} +{"Pretrain/Learning Rate": 5.606751840272664e-06, "Pretrain/Loss": 1.9340828657150269, "Pretrain/Loss (Raw)": 2.0562593936920166, "Pretrain/Step": 7526, "Pretrain/Step Time": 8.68183808028698} +{"Pretrain/Learning Rate": 5.601395296531586e-06, "Pretrain/Loss": 1.9342377185821533, "Pretrain/Loss (Raw)": 1.956229567527771, "Pretrain/Step": 7527, "Pretrain/Step Time": 8.679028753191233} +{"Pretrain/Learning Rate": 5.596040989929027e-06, "Pretrain/Loss": 1.9360861778259277, "Pretrain/Loss (Raw)": 2.037611722946167, "Pretrain/Step": 7528, "Pretrain/Step Time": 8.685613889247179} +{"Pretrain/Learning Rate": 5.5906889210824405e-06, "Pretrain/Loss": 1.9345899820327759, "Pretrain/Loss (Raw)": 1.7924294471740723, "Pretrain/Step": 7529, "Pretrain/Step Time": 8.681438732892275} +{"Pretrain/Learning Rate": 5.585339090609073e-06, "Pretrain/Loss": 1.9353771209716797, "Pretrain/Loss (Raw)": 1.943200707435608, "Pretrain/Step": 7530, "Pretrain/Step Time": 8.689508467912674} +{"Pretrain/Learning Rate": 5.579991499125889e-06, "Pretrain/Loss": 1.9366798400878906, "Pretrain/Loss (Raw)": 1.7975053787231445, "Pretrain/Step": 7531, "Pretrain/Step Time": 8.685199404135346} +{"Pretrain/Learning Rate": 5.574646147249596e-06, "Pretrain/Loss": 1.93817937374115, "Pretrain/Loss (Raw)": 2.0890493392944336, "Pretrain/Step": 7532, "Pretrain/Step Time": 8.683522211387753} +{"Pretrain/Learning Rate": 5.569303035596635e-06, "Pretrain/Loss": 1.940883755683899, "Pretrain/Loss (Raw)": 1.76181161403656, "Pretrain/Step": 7533, "Pretrain/Step Time": 8.681822020560503} +{"Pretrain/Learning Rate": 5.563962164783215e-06, "Pretrain/Loss": 1.9416673183441162, "Pretrain/Loss (Raw)": 2.005385637283325, "Pretrain/Step": 7534, "Pretrain/Step Time": 8.684668930247426} +{"Pretrain/Learning Rate": 5.558623535425267e-06, "Pretrain/Loss": 1.9411211013793945, "Pretrain/Loss (Raw)": 1.9839732646942139, "Pretrain/Step": 7535, "Pretrain/Step Time": 8.684403160586953} +{"Pretrain/Learning Rate": 5.553287148138461e-06, "Pretrain/Loss": 1.9370129108428955, "Pretrain/Loss (Raw)": 1.4987045526504517, "Pretrain/Step": 7536, "Pretrain/Step Time": 8.685928575694561} +{"Pretrain/Learning Rate": 5.5479530035382115e-06, "Pretrain/Loss": 1.93723464012146, "Pretrain/Loss (Raw)": 1.9118176698684692, "Pretrain/Step": 7537, "Pretrain/Step Time": 8.683434626087546} +{"Pretrain/Learning Rate": 5.542621102239686e-06, "Pretrain/Loss": 1.9380122423171997, "Pretrain/Loss (Raw)": 2.086211919784546, "Pretrain/Step": 7538, "Pretrain/Step Time": 8.680747577920556} +{"Pretrain/Learning Rate": 5.537291444857787e-06, "Pretrain/Loss": 1.9367631673812866, "Pretrain/Loss (Raw)": 1.7840877771377563, "Pretrain/Step": 7539, "Pretrain/Step Time": 8.679360022768378} +{"Pretrain/Learning Rate": 5.531964032007144e-06, "Pretrain/Loss": 1.9337377548217773, "Pretrain/Loss (Raw)": 1.8141666650772095, "Pretrain/Step": 7540, "Pretrain/Step Time": 8.679429164156318} +{"Pretrain/Learning Rate": 5.526638864302144e-06, "Pretrain/Loss": 1.933149814605713, "Pretrain/Loss (Raw)": 2.0579075813293457, "Pretrain/Step": 7541, "Pretrain/Step Time": 8.677841503173113} +{"Pretrain/Learning Rate": 5.521315942356914e-06, "Pretrain/Loss": 1.935778260231018, "Pretrain/Loss (Raw)": 1.822131633758545, "Pretrain/Step": 7542, "Pretrain/Step Time": 8.679874250665307} +{"Pretrain/Learning Rate": 5.5159952667853204e-06, "Pretrain/Loss": 1.931910753250122, "Pretrain/Loss (Raw)": 1.525896668434143, "Pretrain/Step": 7543, "Pretrain/Step Time": 8.679161924868822} +{"Pretrain/Learning Rate": 5.510676838200959e-06, "Pretrain/Loss": 1.9299026727676392, "Pretrain/Loss (Raw)": 1.74712073802948, "Pretrain/Step": 7544, "Pretrain/Step Time": 8.675055922940373} +{"Pretrain/Learning Rate": 5.505360657217179e-06, "Pretrain/Loss": 1.9284125566482544, "Pretrain/Loss (Raw)": 1.930677890777588, "Pretrain/Step": 7545, "Pretrain/Step Time": 8.672645933926105} +{"Pretrain/Learning Rate": 5.5000467244470745e-06, "Pretrain/Loss": 1.9287595748901367, "Pretrain/Loss (Raw)": 1.9690502882003784, "Pretrain/Step": 7546, "Pretrain/Step Time": 8.662008751183748} +{"Pretrain/Learning Rate": 5.494735040503468e-06, "Pretrain/Loss": 1.9316637516021729, "Pretrain/Loss (Raw)": 2.188295841217041, "Pretrain/Step": 7547, "Pretrain/Step Time": 8.663433281704783} +{"Pretrain/Learning Rate": 5.48942560599893e-06, "Pretrain/Loss": 1.932410717010498, "Pretrain/Loss (Raw)": 1.9858343601226807, "Pretrain/Step": 7548, "Pretrain/Step Time": 8.664220111444592} +{"Pretrain/Learning Rate": 5.4841184215457615e-06, "Pretrain/Loss": 1.933414101600647, "Pretrain/Loss (Raw)": 1.86604905128479, "Pretrain/Step": 7549, "Pretrain/Step Time": 8.66577779315412} +{"Pretrain/Learning Rate": 5.478813487756024e-06, "Pretrain/Loss": 1.9318222999572754, "Pretrain/Loss (Raw)": 1.908139705657959, "Pretrain/Step": 7550, "Pretrain/Step Time": 8.664576180279255} +{"Pretrain/Learning Rate": 5.473510805241502e-06, "Pretrain/Loss": 1.9325430393218994, "Pretrain/Loss (Raw)": 1.9319632053375244, "Pretrain/Step": 7551, "Pretrain/Step Time": 8.663957819342613} +{"Pretrain/Learning Rate": 5.468210374613727e-06, "Pretrain/Loss": 1.9348636865615845, "Pretrain/Loss (Raw)": 2.0494279861450195, "Pretrain/Step": 7552, "Pretrain/Step Time": 8.66072908975184} +{"Pretrain/Learning Rate": 5.46291219648396e-06, "Pretrain/Loss": 1.9354212284088135, "Pretrain/Loss (Raw)": 2.010195016860962, "Pretrain/Step": 7553, "Pretrain/Step Time": 8.6598900873214} +{"Pretrain/Learning Rate": 5.457616271463234e-06, "Pretrain/Loss": 1.9338865280151367, "Pretrain/Loss (Raw)": 1.707572340965271, "Pretrain/Step": 7554, "Pretrain/Step Time": 8.659552736207843} +{"Pretrain/Learning Rate": 5.452322600162274e-06, "Pretrain/Loss": 1.9334303140640259, "Pretrain/Loss (Raw)": 1.7960385084152222, "Pretrain/Step": 7555, "Pretrain/Step Time": 8.654421303421259} +{"Pretrain/Learning Rate": 5.447031183191589e-06, "Pretrain/Loss": 1.932755947113037, "Pretrain/Loss (Raw)": 1.8738150596618652, "Pretrain/Step": 7556, "Pretrain/Step Time": 8.656890699639916} +{"Pretrain/Learning Rate": 5.441742021161398e-06, "Pretrain/Loss": 1.9313668012619019, "Pretrain/Loss (Raw)": 1.7653931379318237, "Pretrain/Step": 7557, "Pretrain/Step Time": 8.656596587970853} +{"Pretrain/Learning Rate": 5.436455114681693e-06, "Pretrain/Loss": 1.9349466562271118, "Pretrain/Loss (Raw)": 2.237588405609131, "Pretrain/Step": 7558, "Pretrain/Step Time": 8.651587687432766} +{"Pretrain/Learning Rate": 5.431170464362157e-06, "Pretrain/Loss": 1.9359673261642456, "Pretrain/Loss (Raw)": 2.041865825653076, "Pretrain/Step": 7559, "Pretrain/Step Time": 8.651952523738146} +{"Pretrain/Learning Rate": 5.42588807081226e-06, "Pretrain/Loss": 1.9361618757247925, "Pretrain/Loss (Raw)": 1.994848370552063, "Pretrain/Step": 7560, "Pretrain/Step Time": 8.6520936768502} +{"Pretrain/Learning Rate": 5.420607934641181e-06, "Pretrain/Loss": 1.9341578483581543, "Pretrain/Loss (Raw)": 1.9151506423950195, "Pretrain/Step": 7561, "Pretrain/Step Time": 8.656391490250826} +{"Pretrain/Learning Rate": 5.415330056457871e-06, "Pretrain/Loss": 1.9349544048309326, "Pretrain/Loss (Raw)": 1.7965389490127563, "Pretrain/Step": 7562, "Pretrain/Step Time": 8.653841754421592} +{"Pretrain/Learning Rate": 5.410054436870968e-06, "Pretrain/Loss": 1.9345417022705078, "Pretrain/Loss (Raw)": 2.091784715652466, "Pretrain/Step": 7563, "Pretrain/Step Time": 8.657019760459661} +{"Pretrain/Learning Rate": 5.404781076488901e-06, "Pretrain/Loss": 1.9338414669036865, "Pretrain/Loss (Raw)": 1.8013619184494019, "Pretrain/Step": 7564, "Pretrain/Step Time": 8.656373258680105} +{"Pretrain/Learning Rate": 5.399509975919828e-06, "Pretrain/Loss": 1.9326045513153076, "Pretrain/Loss (Raw)": 1.7909163236618042, "Pretrain/Step": 7565, "Pretrain/Step Time": 8.65564438700676} +{"Pretrain/Learning Rate": 5.394241135771613e-06, "Pretrain/Loss": 1.932223916053772, "Pretrain/Loss (Raw)": 1.8566160202026367, "Pretrain/Step": 7566, "Pretrain/Step Time": 8.657253496348858} +{"Pretrain/Learning Rate": 5.388974556651902e-06, "Pretrain/Loss": 1.931363821029663, "Pretrain/Loss (Raw)": 1.8435112237930298, "Pretrain/Step": 7567, "Pretrain/Step Time": 8.658103564754128} +{"Pretrain/Learning Rate": 5.3837102391680465e-06, "Pretrain/Loss": 1.9346957206726074, "Pretrain/Loss (Raw)": 2.09206223487854, "Pretrain/Step": 7568, "Pretrain/Step Time": 8.654452895745635} +{"Pretrain/Learning Rate": 5.378448183927176e-06, "Pretrain/Loss": 1.9363758563995361, "Pretrain/Loss (Raw)": 1.904719352722168, "Pretrain/Step": 7569, "Pretrain/Step Time": 8.651471870020032} +{"Pretrain/Learning Rate": 5.373188391536108e-06, "Pretrain/Loss": 1.9367752075195312, "Pretrain/Loss (Raw)": 1.828039526939392, "Pretrain/Step": 7570, "Pretrain/Step Time": 8.652320630848408} +{"Pretrain/Learning Rate": 5.3679308626014445e-06, "Pretrain/Loss": 1.9352483749389648, "Pretrain/Loss (Raw)": 1.7769606113433838, "Pretrain/Step": 7571, "Pretrain/Step Time": 8.65583599358797} +{"Pretrain/Learning Rate": 5.362675597729505e-06, "Pretrain/Loss": 1.9327489137649536, "Pretrain/Loss (Raw)": 1.6614326238632202, "Pretrain/Step": 7572, "Pretrain/Step Time": 8.658373838290572} +{"Pretrain/Learning Rate": 5.357422597526349e-06, "Pretrain/Loss": 1.9296053647994995, "Pretrain/Loss (Raw)": 1.873331904411316, "Pretrain/Step": 7573, "Pretrain/Step Time": 8.65840751491487} +{"Pretrain/Learning Rate": 5.3521718625977715e-06, "Pretrain/Loss": 1.929165244102478, "Pretrain/Loss (Raw)": 2.1405866146087646, "Pretrain/Step": 7574, "Pretrain/Step Time": 8.659750252962112} +{"Pretrain/Learning Rate": 5.346923393549325e-06, "Pretrain/Loss": 1.9287655353546143, "Pretrain/Loss (Raw)": 1.8847492933273315, "Pretrain/Step": 7575, "Pretrain/Step Time": 8.66053032502532} +{"Pretrain/Learning Rate": 5.34167719098628e-06, "Pretrain/Loss": 1.9293252229690552, "Pretrain/Loss (Raw)": 1.9341120719909668, "Pretrain/Step": 7576, "Pretrain/Step Time": 8.657153528183699} +{"Pretrain/Learning Rate": 5.336433255513656e-06, "Pretrain/Loss": 1.9271142482757568, "Pretrain/Loss (Raw)": 1.6718064546585083, "Pretrain/Step": 7577, "Pretrain/Step Time": 8.655501425266266} +{"Pretrain/Learning Rate": 5.331191587736198e-06, "Pretrain/Loss": 1.9266464710235596, "Pretrain/Loss (Raw)": 1.88945472240448, "Pretrain/Step": 7578, "Pretrain/Step Time": 8.654281148687005} +{"Pretrain/Learning Rate": 5.325952188258418e-06, "Pretrain/Loss": 1.9264109134674072, "Pretrain/Loss (Raw)": 2.020775318145752, "Pretrain/Step": 7579, "Pretrain/Step Time": 8.653495088219643} +{"Pretrain/Learning Rate": 5.320715057684536e-06, "Pretrain/Loss": 1.9291162490844727, "Pretrain/Loss (Raw)": 2.1317572593688965, "Pretrain/Step": 7580, "Pretrain/Step Time": 8.657109813764691} +{"Pretrain/Learning Rate": 5.315480196618527e-06, "Pretrain/Loss": 1.9297255277633667, "Pretrain/Loss (Raw)": 1.9701120853424072, "Pretrain/Step": 7581, "Pretrain/Step Time": 8.657749965786934} +{"Pretrain/Learning Rate": 5.310247605664093e-06, "Pretrain/Loss": 1.9265133142471313, "Pretrain/Loss (Raw)": 1.9883451461791992, "Pretrain/Step": 7582, "Pretrain/Step Time": 8.657656591385603} +{"Pretrain/Learning Rate": 5.30501728542469e-06, "Pretrain/Loss": 1.924546480178833, "Pretrain/Loss (Raw)": 1.7697629928588867, "Pretrain/Step": 7583, "Pretrain/Step Time": 8.652881771326065} +{"Pretrain/Learning Rate": 5.299789236503503e-06, "Pretrain/Loss": 1.9265339374542236, "Pretrain/Loss (Raw)": 2.110853910446167, "Pretrain/Step": 7584, "Pretrain/Step Time": 8.647500650957227} +{"Pretrain/Learning Rate": 5.294563459503449e-06, "Pretrain/Loss": 1.927819013595581, "Pretrain/Loss (Raw)": 1.8602896928787231, "Pretrain/Step": 7585, "Pretrain/Step Time": 8.652862653136253} +{"Pretrain/Learning Rate": 5.2893399550271835e-06, "Pretrain/Loss": 1.9290316104888916, "Pretrain/Loss (Raw)": 1.974985122680664, "Pretrain/Step": 7586, "Pretrain/Step Time": 8.64684583991766} +{"Pretrain/Learning Rate": 5.2841187236771226e-06, "Pretrain/Loss": 1.9305660724639893, "Pretrain/Loss (Raw)": 2.0685617923736572, "Pretrain/Step": 7587, "Pretrain/Step Time": 8.6454022154212} +{"Pretrain/Learning Rate": 5.278899766055395e-06, "Pretrain/Loss": 1.9278085231781006, "Pretrain/Loss (Raw)": 1.891714096069336, "Pretrain/Step": 7588, "Pretrain/Step Time": 8.64553389325738} +{"Pretrain/Learning Rate": 5.273683082763875e-06, "Pretrain/Loss": 1.9329724311828613, "Pretrain/Loss (Raw)": 2.004896402359009, "Pretrain/Step": 7589, "Pretrain/Step Time": 8.64509098418057} +{"Pretrain/Learning Rate": 5.26846867440417e-06, "Pretrain/Loss": 1.9347493648529053, "Pretrain/Loss (Raw)": 1.8229180574417114, "Pretrain/Step": 7590, "Pretrain/Step Time": 8.643858021125197} +{"Pretrain/Learning Rate": 5.263256541577641e-06, "Pretrain/Loss": 1.9349677562713623, "Pretrain/Loss (Raw)": 2.114210367202759, "Pretrain/Step": 7591, "Pretrain/Step Time": 8.643103970214725} +{"Pretrain/Learning Rate": 5.25804668488537e-06, "Pretrain/Loss": 1.934985637664795, "Pretrain/Loss (Raw)": 1.9642771482467651, "Pretrain/Step": 7592, "Pretrain/Step Time": 8.64830574579537} +{"Pretrain/Learning Rate": 5.252839104928184e-06, "Pretrain/Loss": 1.9338972568511963, "Pretrain/Loss (Raw)": 1.8205692768096924, "Pretrain/Step": 7593, "Pretrain/Step Time": 8.646562861278653} +{"Pretrain/Learning Rate": 5.247633802306637e-06, "Pretrain/Loss": 1.9368630647659302, "Pretrain/Loss (Raw)": 2.174356698989868, "Pretrain/Step": 7594, "Pretrain/Step Time": 8.634658936411142} +{"Pretrain/Learning Rate": 5.242430777621049e-06, "Pretrain/Loss": 1.938254475593567, "Pretrain/Loss (Raw)": 2.004141330718994, "Pretrain/Step": 7595, "Pretrain/Step Time": 8.638282595202327} +{"Pretrain/Learning Rate": 5.2372300314714295e-06, "Pretrain/Loss": 1.9381568431854248, "Pretrain/Loss (Raw)": 2.1021029949188232, "Pretrain/Step": 7596, "Pretrain/Step Time": 8.642155539244413} +{"Pretrain/Learning Rate": 5.232031564457576e-06, "Pretrain/Loss": 1.9335567951202393, "Pretrain/Loss (Raw)": 1.626613736152649, "Pretrain/Step": 7597, "Pretrain/Step Time": 8.642507074400783} +{"Pretrain/Learning Rate": 5.226835377178984e-06, "Pretrain/Loss": 1.9343929290771484, "Pretrain/Loss (Raw)": 2.1328587532043457, "Pretrain/Step": 7598, "Pretrain/Step Time": 8.641089737415314} +{"Pretrain/Learning Rate": 5.221641470234928e-06, "Pretrain/Loss": 1.9311728477478027, "Pretrain/Loss (Raw)": 1.6566394567489624, "Pretrain/Step": 7599, "Pretrain/Step Time": 8.6374297067523} +{"Pretrain/Learning Rate": 5.216449844224358e-06, "Pretrain/Loss": 1.9311444759368896, "Pretrain/Loss (Raw)": 2.0412352085113525, "Pretrain/Step": 7600, "Pretrain/Step Time": 8.639740904793143} +{"Pretrain/Learning Rate": 5.211260499746026e-06, "Pretrain/Loss": 1.9311152696609497, "Pretrain/Loss (Raw)": 2.097317695617676, "Pretrain/Step": 7601, "Pretrain/Step Time": 8.636776426807046} +{"Pretrain/Learning Rate": 5.206073437398371e-06, "Pretrain/Loss": 1.9309771060943604, "Pretrain/Loss (Raw)": 2.011824607849121, "Pretrain/Step": 7602, "Pretrain/Step Time": 8.63824212923646} +{"Pretrain/Learning Rate": 5.200888657779615e-06, "Pretrain/Loss": 1.9328744411468506, "Pretrain/Loss (Raw)": 1.9815279245376587, "Pretrain/Step": 7603, "Pretrain/Step Time": 8.639690617099404} +{"Pretrain/Learning Rate": 5.19570616148766e-06, "Pretrain/Loss": 1.9325804710388184, "Pretrain/Loss (Raw)": 1.7819865942001343, "Pretrain/Step": 7604, "Pretrain/Step Time": 8.644012335687876} +{"Pretrain/Learning Rate": 5.190525949120193e-06, "Pretrain/Loss": 1.9315285682678223, "Pretrain/Loss (Raw)": 1.8750364780426025, "Pretrain/Step": 7605, "Pretrain/Step Time": 8.640770614147186} +{"Pretrain/Learning Rate": 5.18534802127463e-06, "Pretrain/Loss": 1.931965708732605, "Pretrain/Loss (Raw)": 1.8944839239120483, "Pretrain/Step": 7606, "Pretrain/Step Time": 8.641840951517224} +{"Pretrain/Learning Rate": 5.1801723785480925e-06, "Pretrain/Loss": 1.9335968494415283, "Pretrain/Loss (Raw)": 2.069338321685791, "Pretrain/Step": 7607, "Pretrain/Step Time": 8.643264746293426} +{"Pretrain/Learning Rate": 5.174999021537475e-06, "Pretrain/Loss": 1.932481288909912, "Pretrain/Loss (Raw)": 1.7141364812850952, "Pretrain/Step": 7608, "Pretrain/Step Time": 8.644947381690145} +{"Pretrain/Learning Rate": 5.169827950839384e-06, "Pretrain/Loss": 1.932085633277893, "Pretrain/Loss (Raw)": 2.0500707626342773, "Pretrain/Step": 7609, "Pretrain/Step Time": 8.641511287540197} +{"Pretrain/Learning Rate": 5.164659167050187e-06, "Pretrain/Loss": 1.931167721748352, "Pretrain/Loss (Raw)": 1.984886884689331, "Pretrain/Step": 7610, "Pretrain/Step Time": 8.640644440427423} +{"Pretrain/Learning Rate": 5.15949267076595e-06, "Pretrain/Loss": 1.9332629442214966, "Pretrain/Loss (Raw)": 2.222551107406616, "Pretrain/Step": 7611, "Pretrain/Step Time": 8.645155031234026} +{"Pretrain/Learning Rate": 5.1543284625825165e-06, "Pretrain/Loss": 1.9362555742263794, "Pretrain/Loss (Raw)": 2.3256213665008545, "Pretrain/Step": 7612, "Pretrain/Step Time": 8.6410302054137} +{"Pretrain/Learning Rate": 5.149166543095444e-06, "Pretrain/Loss": 1.9373224973678589, "Pretrain/Loss (Raw)": 2.059493064880371, "Pretrain/Step": 7613, "Pretrain/Step Time": 8.640434401109815} +{"Pretrain/Learning Rate": 5.144006912900021e-06, "Pretrain/Loss": 1.9374483823776245, "Pretrain/Loss (Raw)": 2.0495429039001465, "Pretrain/Step": 7614, "Pretrain/Step Time": 8.63969412818551} +{"Pretrain/Learning Rate": 5.138849572591281e-06, "Pretrain/Loss": 1.9352867603302002, "Pretrain/Loss (Raw)": 1.8112274408340454, "Pretrain/Step": 7615, "Pretrain/Step Time": 8.64386598020792} +{"Pretrain/Learning Rate": 5.133694522764002e-06, "Pretrain/Loss": 1.932870864868164, "Pretrain/Loss (Raw)": 1.554073691368103, "Pretrain/Step": 7616, "Pretrain/Step Time": 8.643974056467414} +{"Pretrain/Learning Rate": 5.128541764012687e-06, "Pretrain/Loss": 1.932352900505066, "Pretrain/Loss (Raw)": 1.901146411895752, "Pretrain/Step": 7617, "Pretrain/Step Time": 8.643946759402752} +{"Pretrain/Learning Rate": 5.123391296931571e-06, "Pretrain/Loss": 1.9311349391937256, "Pretrain/Loss (Raw)": 1.8750052452087402, "Pretrain/Step": 7618, "Pretrain/Step Time": 8.642795892432332} +{"Pretrain/Learning Rate": 5.118243122114625e-06, "Pretrain/Loss": 1.9311625957489014, "Pretrain/Loss (Raw)": 1.939573884010315, "Pretrain/Step": 7619, "Pretrain/Step Time": 8.645461667329073} +{"Pretrain/Learning Rate": 5.113097240155576e-06, "Pretrain/Loss": 1.9287453889846802, "Pretrain/Loss (Raw)": 1.7098515033721924, "Pretrain/Step": 7620, "Pretrain/Step Time": 8.645521873608232} +{"Pretrain/Learning Rate": 5.107953651647862e-06, "Pretrain/Loss": 1.9272366762161255, "Pretrain/Loss (Raw)": 1.8534256219863892, "Pretrain/Step": 7621, "Pretrain/Step Time": 8.646058555692434} +{"Pretrain/Learning Rate": 5.10281235718467e-06, "Pretrain/Loss": 1.925553321838379, "Pretrain/Loss (Raw)": 1.8432278633117676, "Pretrain/Step": 7622, "Pretrain/Step Time": 8.644941156730056} +{"Pretrain/Learning Rate": 5.097673357358907e-06, "Pretrain/Loss": 1.9265145063400269, "Pretrain/Loss (Raw)": 1.9869276285171509, "Pretrain/Step": 7623, "Pretrain/Step Time": 8.646433614194393} +{"Pretrain/Learning Rate": 5.092536652763241e-06, "Pretrain/Loss": 1.9268243312835693, "Pretrain/Loss (Raw)": 1.975440263748169, "Pretrain/Step": 7624, "Pretrain/Step Time": 8.646086629480124} +{"Pretrain/Learning Rate": 5.087402243990056e-06, "Pretrain/Loss": 1.9254639148712158, "Pretrain/Loss (Raw)": 1.703449010848999, "Pretrain/Step": 7625, "Pretrain/Step Time": 8.641835557296872} +{"Pretrain/Learning Rate": 5.0822701316314755e-06, "Pretrain/Loss": 1.9236088991165161, "Pretrain/Loss (Raw)": 1.85566246509552, "Pretrain/Step": 7626, "Pretrain/Step Time": 8.642345124855638} +{"Pretrain/Learning Rate": 5.0771403162793525e-06, "Pretrain/Loss": 1.9266114234924316, "Pretrain/Loss (Raw)": 2.172650098800659, "Pretrain/Step": 7627, "Pretrain/Step Time": 8.637130128219724} +{"Pretrain/Learning Rate": 5.072012798525294e-06, "Pretrain/Loss": 1.9250221252441406, "Pretrain/Loss (Raw)": 2.0085060596466064, "Pretrain/Step": 7628, "Pretrain/Step Time": 8.642971377819777} +{"Pretrain/Learning Rate": 5.0668875789606245e-06, "Pretrain/Loss": 1.926632046699524, "Pretrain/Loss (Raw)": 1.8320138454437256, "Pretrain/Step": 7629, "Pretrain/Step Time": 8.64084828644991} +{"Pretrain/Learning Rate": 5.061764658176407e-06, "Pretrain/Loss": 1.9298715591430664, "Pretrain/Loss (Raw)": 2.066667079925537, "Pretrain/Step": 7630, "Pretrain/Step Time": 8.63702529668808} +{"Pretrain/Learning Rate": 5.056644036763433e-06, "Pretrain/Loss": 1.9284486770629883, "Pretrain/Loss (Raw)": 1.8333929777145386, "Pretrain/Step": 7631, "Pretrain/Step Time": 8.64187272824347} +{"Pretrain/Learning Rate": 5.051525715312253e-06, "Pretrain/Loss": 1.927475929260254, "Pretrain/Loss (Raw)": 2.04482364654541, "Pretrain/Step": 7632, "Pretrain/Step Time": 8.640798550099134} +{"Pretrain/Learning Rate": 5.046409694413129e-06, "Pretrain/Loss": 1.931570291519165, "Pretrain/Loss (Raw)": 2.162458658218384, "Pretrain/Step": 7633, "Pretrain/Step Time": 8.642007468268275} +{"Pretrain/Learning Rate": 5.04129597465606e-06, "Pretrain/Loss": 1.9286868572235107, "Pretrain/Loss (Raw)": 1.6381829977035522, "Pretrain/Step": 7634, "Pretrain/Step Time": 8.643865093588829} +{"Pretrain/Learning Rate": 5.0361845566307825e-06, "Pretrain/Loss": 1.9272048473358154, "Pretrain/Loss (Raw)": 1.90868079662323, "Pretrain/Step": 7635, "Pretrain/Step Time": 8.643894476816058} +{"Pretrain/Learning Rate": 5.0310754409267886e-06, "Pretrain/Loss": 1.9306578636169434, "Pretrain/Loss (Raw)": 2.082878589630127, "Pretrain/Step": 7636, "Pretrain/Step Time": 8.640236116945744} +{"Pretrain/Learning Rate": 5.025968628133259e-06, "Pretrain/Loss": 1.9301083087921143, "Pretrain/Loss (Raw)": 1.9520738124847412, "Pretrain/Step": 7637, "Pretrain/Step Time": 8.644526777788997} +{"Pretrain/Learning Rate": 5.020864118839152e-06, "Pretrain/Loss": 1.929168939590454, "Pretrain/Loss (Raw)": 1.9181040525436401, "Pretrain/Step": 7638, "Pretrain/Step Time": 8.64141170680523} +{"Pretrain/Learning Rate": 5.015761913633135e-06, "Pretrain/Loss": 1.927276611328125, "Pretrain/Loss (Raw)": 1.8294912576675415, "Pretrain/Step": 7639, "Pretrain/Step Time": 8.650284150615335} +{"Pretrain/Learning Rate": 5.010662013103637e-06, "Pretrain/Loss": 1.9255402088165283, "Pretrain/Loss (Raw)": 1.8472342491149902, "Pretrain/Step": 7640, "Pretrain/Step Time": 8.649508966132998} +{"Pretrain/Learning Rate": 5.0055644178387735e-06, "Pretrain/Loss": 1.9253032207489014, "Pretrain/Loss (Raw)": 2.1426284313201904, "Pretrain/Step": 7641, "Pretrain/Step Time": 8.651056276634336} +{"Pretrain/Learning Rate": 5.0004691284264435e-06, "Pretrain/Loss": 1.927538275718689, "Pretrain/Loss (Raw)": 2.1003262996673584, "Pretrain/Step": 7642, "Pretrain/Step Time": 8.643490528687835} +{"Pretrain/Learning Rate": 4.99537614545425e-06, "Pretrain/Loss": 1.9273412227630615, "Pretrain/Loss (Raw)": 2.0027778148651123, "Pretrain/Step": 7643, "Pretrain/Step Time": 8.642640992999077} +{"Pretrain/Learning Rate": 4.990285469509559e-06, "Pretrain/Loss": 1.9244024753570557, "Pretrain/Loss (Raw)": 1.7725110054016113, "Pretrain/Step": 7644, "Pretrain/Step Time": 8.643674936145544} +{"Pretrain/Learning Rate": 4.98519710117942e-06, "Pretrain/Loss": 1.9255123138427734, "Pretrain/Loss (Raw)": 2.070526361465454, "Pretrain/Step": 7645, "Pretrain/Step Time": 8.64365810342133} +{"Pretrain/Learning Rate": 4.980111041050667e-06, "Pretrain/Loss": 1.9291270971298218, "Pretrain/Loss (Raw)": 1.747928261756897, "Pretrain/Step": 7646, "Pretrain/Step Time": 8.63989307358861} +{"Pretrain/Learning Rate": 4.975027289709855e-06, "Pretrain/Loss": 1.9281952381134033, "Pretrain/Loss (Raw)": 2.0009355545043945, "Pretrain/Step": 7647, "Pretrain/Step Time": 8.642781060189009} +{"Pretrain/Learning Rate": 4.969945847743246e-06, "Pretrain/Loss": 1.9282046556472778, "Pretrain/Loss (Raw)": 1.8828247785568237, "Pretrain/Step": 7648, "Pretrain/Step Time": 8.640965092927217} +{"Pretrain/Learning Rate": 4.964866715736874e-06, "Pretrain/Loss": 1.928755283355713, "Pretrain/Loss (Raw)": 2.095304012298584, "Pretrain/Step": 7649, "Pretrain/Step Time": 8.642167694866657} +{"Pretrain/Learning Rate": 4.959789894276473e-06, "Pretrain/Loss": 1.924542784690857, "Pretrain/Loss (Raw)": 1.5102941989898682, "Pretrain/Step": 7650, "Pretrain/Step Time": 8.64103010110557} +{"Pretrain/Learning Rate": 4.9547153839475476e-06, "Pretrain/Loss": 1.9234325885772705, "Pretrain/Loss (Raw)": 1.7462775707244873, "Pretrain/Step": 7651, "Pretrain/Step Time": 8.644900700077415} +{"Pretrain/Learning Rate": 4.949643185335287e-06, "Pretrain/Loss": 1.9243223667144775, "Pretrain/Loss (Raw)": 2.130751132965088, "Pretrain/Step": 7652, "Pretrain/Step Time": 8.644014379009604} +{"Pretrain/Learning Rate": 4.944573299024663e-06, "Pretrain/Loss": 1.9274733066558838, "Pretrain/Loss (Raw)": 2.1561505794525146, "Pretrain/Step": 7653, "Pretrain/Step Time": 8.64314460195601} +{"Pretrain/Learning Rate": 4.939505725600341e-06, "Pretrain/Loss": 1.9282300472259521, "Pretrain/Loss (Raw)": 2.15312123298645, "Pretrain/Step": 7654, "Pretrain/Step Time": 8.65037008561194} +{"Pretrain/Learning Rate": 4.934440465646762e-06, "Pretrain/Loss": 1.9288607835769653, "Pretrain/Loss (Raw)": 2.036961793899536, "Pretrain/Step": 7655, "Pretrain/Step Time": 8.647003630176187} +{"Pretrain/Learning Rate": 4.929377519748046e-06, "Pretrain/Loss": 1.9299771785736084, "Pretrain/Loss (Raw)": 2.1805098056793213, "Pretrain/Step": 7656, "Pretrain/Step Time": 8.643790293484926} +{"Pretrain/Learning Rate": 4.924316888488098e-06, "Pretrain/Loss": 1.932554006576538, "Pretrain/Loss (Raw)": 2.1222662925720215, "Pretrain/Step": 7657, "Pretrain/Step Time": 8.64659515209496} +{"Pretrain/Learning Rate": 4.919258572450527e-06, "Pretrain/Loss": 1.9335274696350098, "Pretrain/Loss (Raw)": 2.067812204360962, "Pretrain/Step": 7658, "Pretrain/Step Time": 8.641110045835376} +{"Pretrain/Learning Rate": 4.914202572218679e-06, "Pretrain/Loss": 1.9341782331466675, "Pretrain/Loss (Raw)": 1.8807915449142456, "Pretrain/Step": 7659, "Pretrain/Step Time": 8.641998512670398} +{"Pretrain/Learning Rate": 4.909148888375631e-06, "Pretrain/Loss": 1.9332458972930908, "Pretrain/Loss (Raw)": 1.969710111618042, "Pretrain/Step": 7660, "Pretrain/Step Time": 8.643130276352167} +{"Pretrain/Learning Rate": 4.904097521504214e-06, "Pretrain/Loss": 1.9337520599365234, "Pretrain/Loss (Raw)": 1.82659912109375, "Pretrain/Step": 7661, "Pretrain/Step Time": 8.641728034242988} +{"Pretrain/Learning Rate": 4.899048472186962e-06, "Pretrain/Loss": 1.933201551437378, "Pretrain/Loss (Raw)": 1.9349279403686523, "Pretrain/Step": 7662, "Pretrain/Step Time": 8.637306900694966} +{"Pretrain/Learning Rate": 4.8940017410061625e-06, "Pretrain/Loss": 1.932547926902771, "Pretrain/Loss (Raw)": 1.9002983570098877, "Pretrain/Step": 7663, "Pretrain/Step Time": 8.63689961656928} +{"Pretrain/Learning Rate": 4.888957328543817e-06, "Pretrain/Loss": 1.9367755651474, "Pretrain/Loss (Raw)": 2.0398471355438232, "Pretrain/Step": 7664, "Pretrain/Step Time": 8.636818530038} +{"Pretrain/Learning Rate": 4.8839152353816835e-06, "Pretrain/Loss": 1.9352259635925293, "Pretrain/Loss (Raw)": 1.713475227355957, "Pretrain/Step": 7665, "Pretrain/Step Time": 8.639914214611053} +{"Pretrain/Learning Rate": 4.8788754621012375e-06, "Pretrain/Loss": 1.935288429260254, "Pretrain/Loss (Raw)": 2.094207525253296, "Pretrain/Step": 7666, "Pretrain/Step Time": 8.641568709164858} +{"Pretrain/Learning Rate": 4.873838009283685e-06, "Pretrain/Loss": 1.9349045753479004, "Pretrain/Loss (Raw)": 1.734950065612793, "Pretrain/Step": 7667, "Pretrain/Step Time": 8.643804343417287} +{"Pretrain/Learning Rate": 4.868802877509965e-06, "Pretrain/Loss": 1.937584400177002, "Pretrain/Loss (Raw)": 2.1571781635284424, "Pretrain/Step": 7668, "Pretrain/Step Time": 8.643317988142371} +{"Pretrain/Learning Rate": 4.863770067360765e-06, "Pretrain/Loss": 1.9383890628814697, "Pretrain/Loss (Raw)": 2.160900831222534, "Pretrain/Step": 7669, "Pretrain/Step Time": 8.64389236830175} +{"Pretrain/Learning Rate": 4.858739579416488e-06, "Pretrain/Loss": 1.9402929544448853, "Pretrain/Loss (Raw)": 2.065833806991577, "Pretrain/Step": 7670, "Pretrain/Step Time": 8.639894450083375} +{"Pretrain/Learning Rate": 4.85371141425727e-06, "Pretrain/Loss": 1.9435274600982666, "Pretrain/Loss (Raw)": 1.939923644065857, "Pretrain/Step": 7671, "Pretrain/Step Time": 8.645805610343814} +{"Pretrain/Learning Rate": 4.848685572462977e-06, "Pretrain/Loss": 1.9443318843841553, "Pretrain/Loss (Raw)": 1.8500748872756958, "Pretrain/Step": 7672, "Pretrain/Step Time": 8.646019879728556} +{"Pretrain/Learning Rate": 4.843662054613227e-06, "Pretrain/Loss": 1.9451820850372314, "Pretrain/Loss (Raw)": 2.0395073890686035, "Pretrain/Step": 7673, "Pretrain/Step Time": 8.646493058651686} +{"Pretrain/Learning Rate": 4.838640861287347e-06, "Pretrain/Loss": 1.944809913635254, "Pretrain/Loss (Raw)": 1.9214215278625488, "Pretrain/Step": 7674, "Pretrain/Step Time": 8.651506340131164} +{"Pretrain/Learning Rate": 4.833621993064408e-06, "Pretrain/Loss": 1.9420137405395508, "Pretrain/Loss (Raw)": 1.8303654193878174, "Pretrain/Step": 7675, "Pretrain/Step Time": 8.651640191674232} +{"Pretrain/Learning Rate": 4.8286054505231994e-06, "Pretrain/Loss": 1.941899061203003, "Pretrain/Loss (Raw)": 1.971155047416687, "Pretrain/Step": 7676, "Pretrain/Step Time": 8.6540218424052} +{"Pretrain/Learning Rate": 4.823591234242269e-06, "Pretrain/Loss": 1.942089319229126, "Pretrain/Loss (Raw)": 1.890399694442749, "Pretrain/Step": 7677, "Pretrain/Step Time": 8.652448955923319} +{"Pretrain/Learning Rate": 4.818579344799873e-06, "Pretrain/Loss": 1.9426732063293457, "Pretrain/Loss (Raw)": 1.982893943786621, "Pretrain/Step": 7678, "Pretrain/Step Time": 8.651911087334156} +{"Pretrain/Learning Rate": 4.813569782774005e-06, "Pretrain/Loss": 1.9436089992523193, "Pretrain/Loss (Raw)": 2.051731824874878, "Pretrain/Step": 7679, "Pretrain/Step Time": 8.651515504345298} +{"Pretrain/Learning Rate": 4.808562548742382e-06, "Pretrain/Loss": 1.9411187171936035, "Pretrain/Loss (Raw)": 1.730679988861084, "Pretrain/Step": 7680, "Pretrain/Step Time": 8.655548874288797} +{"Pretrain/Learning Rate": 4.803557643282486e-06, "Pretrain/Loss": 1.9421828985214233, "Pretrain/Loss (Raw)": 2.1464154720306396, "Pretrain/Step": 7681, "Pretrain/Step Time": 8.651192855089903} +{"Pretrain/Learning Rate": 4.798555066971478e-06, "Pretrain/Loss": 1.9439117908477783, "Pretrain/Loss (Raw)": 1.928861141204834, "Pretrain/Step": 7682, "Pretrain/Step Time": 8.654980773106217} +{"Pretrain/Learning Rate": 4.793554820386298e-06, "Pretrain/Loss": 1.9447572231292725, "Pretrain/Loss (Raw)": 1.904250144958496, "Pretrain/Step": 7683, "Pretrain/Step Time": 8.654721299186349} +{"Pretrain/Learning Rate": 4.788556904103586e-06, "Pretrain/Loss": 1.946394681930542, "Pretrain/Loss (Raw)": 2.08341908454895, "Pretrain/Step": 7684, "Pretrain/Step Time": 8.656894514337182} +{"Pretrain/Learning Rate": 4.783561318699745e-06, "Pretrain/Loss": 1.9489809274673462, "Pretrain/Loss (Raw)": 2.0964317321777344, "Pretrain/Step": 7685, "Pretrain/Step Time": 8.659623231738806} +{"Pretrain/Learning Rate": 4.778568064750863e-06, "Pretrain/Loss": 1.9467241764068604, "Pretrain/Loss (Raw)": 1.9487248659133911, "Pretrain/Step": 7686, "Pretrain/Step Time": 8.66544046998024} +{"Pretrain/Learning Rate": 4.773577142832797e-06, "Pretrain/Loss": 1.9470150470733643, "Pretrain/Loss (Raw)": 2.079094409942627, "Pretrain/Step": 7687, "Pretrain/Step Time": 8.661987196654081} +{"Pretrain/Learning Rate": 4.768588553521136e-06, "Pretrain/Loss": 1.9455511569976807, "Pretrain/Loss (Raw)": 1.80747389793396, "Pretrain/Step": 7688, "Pretrain/Step Time": 8.659830711781979} +{"Pretrain/Learning Rate": 4.763602297391167e-06, "Pretrain/Loss": 1.9462816715240479, "Pretrain/Loss (Raw)": 2.008657455444336, "Pretrain/Step": 7689, "Pretrain/Step Time": 8.656411623582244} +{"Pretrain/Learning Rate": 4.758618375017943e-06, "Pretrain/Loss": 1.9462029933929443, "Pretrain/Loss (Raw)": 1.7864623069763184, "Pretrain/Step": 7690, "Pretrain/Step Time": 8.655491760000587} +{"Pretrain/Learning Rate": 4.753636786976223e-06, "Pretrain/Loss": 1.9458403587341309, "Pretrain/Loss (Raw)": 2.045369863510132, "Pretrain/Step": 7691, "Pretrain/Step Time": 8.653693346306682} +{"Pretrain/Learning Rate": 4.748657533840525e-06, "Pretrain/Loss": 1.94826078414917, "Pretrain/Loss (Raw)": 2.111168622970581, "Pretrain/Step": 7692, "Pretrain/Step Time": 8.652171332389116} +{"Pretrain/Learning Rate": 4.743680616185053e-06, "Pretrain/Loss": 1.948042869567871, "Pretrain/Loss (Raw)": 1.763026237487793, "Pretrain/Step": 7693, "Pretrain/Step Time": 8.651168486103415} +{"Pretrain/Learning Rate": 4.738706034583793e-06, "Pretrain/Loss": 1.9500374794006348, "Pretrain/Loss (Raw)": 2.1119277477264404, "Pretrain/Step": 7694, "Pretrain/Step Time": 8.650881126523018} +{"Pretrain/Learning Rate": 4.73373378961042e-06, "Pretrain/Loss": 1.9521024227142334, "Pretrain/Loss (Raw)": 2.1078262329101562, "Pretrain/Step": 7695, "Pretrain/Step Time": 8.649912407621741} +{"Pretrain/Learning Rate": 4.728763881838375e-06, "Pretrain/Loss": 1.9510186910629272, "Pretrain/Loss (Raw)": 1.9533478021621704, "Pretrain/Step": 7696, "Pretrain/Step Time": 8.649681093171239} +{"Pretrain/Learning Rate": 4.723796311840789e-06, "Pretrain/Loss": 1.951038122177124, "Pretrain/Loss (Raw)": 1.9072016477584839, "Pretrain/Step": 7697, "Pretrain/Step Time": 8.654810843989253} +{"Pretrain/Learning Rate": 4.7188310801905635e-06, "Pretrain/Loss": 1.9515846967697144, "Pretrain/Loss (Raw)": 1.8980010747909546, "Pretrain/Step": 7698, "Pretrain/Step Time": 8.651283394545317} +{"Pretrain/Learning Rate": 4.713868187460307e-06, "Pretrain/Loss": 1.9557969570159912, "Pretrain/Loss (Raw)": 2.3161165714263916, "Pretrain/Step": 7699, "Pretrain/Step Time": 8.653818180784583} +{"Pretrain/Learning Rate": 4.708907634222359e-06, "Pretrain/Loss": 1.959153175354004, "Pretrain/Loss (Raw)": 2.091052293777466, "Pretrain/Step": 7700, "Pretrain/Step Time": 8.658103102818131} +{"Pretrain/Learning Rate": 4.703949421048795e-06, "Pretrain/Loss": 1.95978844165802, "Pretrain/Loss (Raw)": 1.9546445608139038, "Pretrain/Step": 7701, "Pretrain/Step Time": 8.652222013100982} +{"Pretrain/Learning Rate": 4.698993548511427e-06, "Pretrain/Loss": 1.9568085670471191, "Pretrain/Loss (Raw)": 1.7591472864151, "Pretrain/Step": 7702, "Pretrain/Step Time": 8.648808483034372} +{"Pretrain/Learning Rate": 4.6940400171817835e-06, "Pretrain/Loss": 1.957329511642456, "Pretrain/Loss (Raw)": 1.9514394998550415, "Pretrain/Step": 7703, "Pretrain/Step Time": 8.65103304386139} +{"Pretrain/Learning Rate": 4.68908882763113e-06, "Pretrain/Loss": 1.9580312967300415, "Pretrain/Loss (Raw)": 2.0239365100860596, "Pretrain/Step": 7704, "Pretrain/Step Time": 8.652527652680874} +{"Pretrain/Learning Rate": 4.684139980430455e-06, "Pretrain/Loss": 1.9558510780334473, "Pretrain/Loss (Raw)": 1.392746090888977, "Pretrain/Step": 7705, "Pretrain/Step Time": 8.65664129331708} +{"Pretrain/Learning Rate": 4.679193476150495e-06, "Pretrain/Loss": 1.9570670127868652, "Pretrain/Loss (Raw)": 2.0450987815856934, "Pretrain/Step": 7706, "Pretrain/Step Time": 8.654865523800254} +{"Pretrain/Learning Rate": 4.674249315361698e-06, "Pretrain/Loss": 1.9567091464996338, "Pretrain/Loss (Raw)": 1.9749507904052734, "Pretrain/Step": 7707, "Pretrain/Step Time": 8.654832728207111} +{"Pretrain/Learning Rate": 4.669307498634251e-06, "Pretrain/Loss": 1.9501261711120605, "Pretrain/Loss (Raw)": 1.2891391515731812, "Pretrain/Step": 7708, "Pretrain/Step Time": 8.655813992023468} +{"Pretrain/Learning Rate": 4.664368026538054e-06, "Pretrain/Loss": 1.9514873027801514, "Pretrain/Loss (Raw)": 2.144338369369507, "Pretrain/Step": 7709, "Pretrain/Step Time": 8.656951257959008} +{"Pretrain/Learning Rate": 4.6594308996427694e-06, "Pretrain/Loss": 1.95157790184021, "Pretrain/Loss (Raw)": 1.9999370574951172, "Pretrain/Step": 7710, "Pretrain/Step Time": 8.658822814002633} +{"Pretrain/Learning Rate": 4.654496118517762e-06, "Pretrain/Loss": 1.947603702545166, "Pretrain/Loss (Raw)": 1.2610783576965332, "Pretrain/Step": 7711, "Pretrain/Step Time": 8.665845913812518} +{"Pretrain/Learning Rate": 4.64956368373213e-06, "Pretrain/Loss": 1.9479420185089111, "Pretrain/Loss (Raw)": 2.1541593074798584, "Pretrain/Step": 7712, "Pretrain/Step Time": 8.6728206127882} +{"Pretrain/Learning Rate": 4.644633595854706e-06, "Pretrain/Loss": 1.947817325592041, "Pretrain/Loss (Raw)": 1.8443238735198975, "Pretrain/Step": 7713, "Pretrain/Step Time": 8.664054807275534} +{"Pretrain/Learning Rate": 4.6397058554540575e-06, "Pretrain/Loss": 1.9456368684768677, "Pretrain/Loss (Raw)": 1.6958839893341064, "Pretrain/Step": 7714, "Pretrain/Step Time": 8.669070648029447} +{"Pretrain/Learning Rate": 4.6347804630984735e-06, "Pretrain/Loss": 1.9442590475082397, "Pretrain/Loss (Raw)": 1.8921971321105957, "Pretrain/Step": 7715, "Pretrain/Step Time": 8.669285310432315} +{"Pretrain/Learning Rate": 4.629857419355968e-06, "Pretrain/Loss": 1.9475085735321045, "Pretrain/Loss (Raw)": 2.3076486587524414, "Pretrain/Step": 7716, "Pretrain/Step Time": 8.670131660997868} +{"Pretrain/Learning Rate": 4.624936724794285e-06, "Pretrain/Loss": 1.9470183849334717, "Pretrain/Loss (Raw)": 1.9421656131744385, "Pretrain/Step": 7717, "Pretrain/Step Time": 8.668521353974938} +{"Pretrain/Learning Rate": 4.620018379980917e-06, "Pretrain/Loss": 1.9480645656585693, "Pretrain/Loss (Raw)": 1.95681631565094, "Pretrain/Step": 7718, "Pretrain/Step Time": 8.674322333186865} +{"Pretrain/Learning Rate": 4.6151023854830635e-06, "Pretrain/Loss": 1.9456249475479126, "Pretrain/Loss (Raw)": 1.8019521236419678, "Pretrain/Step": 7719, "Pretrain/Step Time": 8.673380423337221} +{"Pretrain/Learning Rate": 4.610188741867657e-06, "Pretrain/Loss": 1.9426813125610352, "Pretrain/Loss (Raw)": 1.5874956846237183, "Pretrain/Step": 7720, "Pretrain/Step Time": 8.670443870127201} +{"Pretrain/Learning Rate": 4.6052774497013615e-06, "Pretrain/Loss": 1.9452029466629028, "Pretrain/Loss (Raw)": 2.1433281898498535, "Pretrain/Step": 7721, "Pretrain/Step Time": 8.671183574944735} +{"Pretrain/Learning Rate": 4.600368509550584e-06, "Pretrain/Loss": 1.9432694911956787, "Pretrain/Loss (Raw)": 1.9268766641616821, "Pretrain/Step": 7722, "Pretrain/Step Time": 8.67618764564395} +{"Pretrain/Learning Rate": 4.5954619219814254e-06, "Pretrain/Loss": 1.9432967901229858, "Pretrain/Loss (Raw)": 2.0076358318328857, "Pretrain/Step": 7723, "Pretrain/Step Time": 8.67281474545598} +{"Pretrain/Learning Rate": 4.590557687559754e-06, "Pretrain/Loss": 1.9412696361541748, "Pretrain/Loss (Raw)": 1.8426167964935303, "Pretrain/Step": 7724, "Pretrain/Step Time": 8.674228316172957} +{"Pretrain/Learning Rate": 4.585655806851136e-06, "Pretrain/Loss": 1.944272518157959, "Pretrain/Loss (Raw)": 2.0110011100769043, "Pretrain/Step": 7725, "Pretrain/Step Time": 8.672728879377246} +{"Pretrain/Learning Rate": 4.5807562804208975e-06, "Pretrain/Loss": 1.943648099899292, "Pretrain/Loss (Raw)": 2.0529258251190186, "Pretrain/Step": 7726, "Pretrain/Step Time": 8.670821594074368} +{"Pretrain/Learning Rate": 4.575859108834049e-06, "Pretrain/Loss": 1.946312665939331, "Pretrain/Loss (Raw)": 1.9977061748504639, "Pretrain/Step": 7727, "Pretrain/Step Time": 8.671379122883081} +{"Pretrain/Learning Rate": 4.570964292655372e-06, "Pretrain/Loss": 1.9473464488983154, "Pretrain/Loss (Raw)": 2.1735668182373047, "Pretrain/Step": 7728, "Pretrain/Step Time": 8.671666331589222} +{"Pretrain/Learning Rate": 4.56607183244937e-06, "Pretrain/Loss": 1.9477365016937256, "Pretrain/Loss (Raw)": 2.147247076034546, "Pretrain/Step": 7729, "Pretrain/Step Time": 8.671632159501314} +{"Pretrain/Learning Rate": 4.56118172878024e-06, "Pretrain/Loss": 1.9457948207855225, "Pretrain/Loss (Raw)": 1.763277530670166, "Pretrain/Step": 7730, "Pretrain/Step Time": 8.677909262478352} +{"Pretrain/Learning Rate": 4.556293982211951e-06, "Pretrain/Loss": 1.9458470344543457, "Pretrain/Loss (Raw)": 1.9882166385650635, "Pretrain/Step": 7731, "Pretrain/Step Time": 8.678509211167693} +{"Pretrain/Learning Rate": 4.551408593308165e-06, "Pretrain/Loss": 1.9477386474609375, "Pretrain/Loss (Raw)": 2.0241098403930664, "Pretrain/Step": 7732, "Pretrain/Step Time": 8.67073467001319} +{"Pretrain/Learning Rate": 4.5465255626323116e-06, "Pretrain/Loss": 1.947704553604126, "Pretrain/Loss (Raw)": 1.8706706762313843, "Pretrain/Step": 7733, "Pretrain/Step Time": 8.675755705684423} +{"Pretrain/Learning Rate": 4.541644890747495e-06, "Pretrain/Loss": 1.9482409954071045, "Pretrain/Loss (Raw)": 1.9631412029266357, "Pretrain/Step": 7734, "Pretrain/Step Time": 8.67369924671948} +{"Pretrain/Learning Rate": 4.536766578216603e-06, "Pretrain/Loss": 1.9483654499053955, "Pretrain/Loss (Raw)": 2.085289478302002, "Pretrain/Step": 7735, "Pretrain/Step Time": 8.673624485731125} +{"Pretrain/Learning Rate": 4.531890625602206e-06, "Pretrain/Loss": 1.9496573209762573, "Pretrain/Loss (Raw)": 1.8794817924499512, "Pretrain/Step": 7736, "Pretrain/Step Time": 8.67734506726265} +{"Pretrain/Learning Rate": 4.5270170334666435e-06, "Pretrain/Loss": 1.9493250846862793, "Pretrain/Loss (Raw)": 2.007542848587036, "Pretrain/Step": 7737, "Pretrain/Step Time": 8.68300579674542} +{"Pretrain/Learning Rate": 4.522145802371936e-06, "Pretrain/Loss": 1.949629783630371, "Pretrain/Loss (Raw)": 2.023894786834717, "Pretrain/Step": 7738, "Pretrain/Step Time": 8.678121205419302} +{"Pretrain/Learning Rate": 4.517276932879877e-06, "Pretrain/Loss": 1.9474985599517822, "Pretrain/Loss (Raw)": 1.9497532844543457, "Pretrain/Step": 7739, "Pretrain/Step Time": 8.672617353498936} +{"Pretrain/Learning Rate": 4.512410425551958e-06, "Pretrain/Loss": 1.9425170421600342, "Pretrain/Loss (Raw)": 1.6879721879959106, "Pretrain/Step": 7740, "Pretrain/Step Time": 8.677385104820132} +{"Pretrain/Learning Rate": 4.507546280949413e-06, "Pretrain/Loss": 1.941532850265503, "Pretrain/Loss (Raw)": 1.9335330724716187, "Pretrain/Step": 7741, "Pretrain/Step Time": 8.67681585624814} +{"Pretrain/Learning Rate": 4.502684499633183e-06, "Pretrain/Loss": 1.9415496587753296, "Pretrain/Loss (Raw)": 2.0516865253448486, "Pretrain/Step": 7742, "Pretrain/Step Time": 8.677250484004617} +{"Pretrain/Learning Rate": 4.4978250821639725e-06, "Pretrain/Loss": 1.9431517124176025, "Pretrain/Loss (Raw)": 2.016291379928589, "Pretrain/Step": 7743, "Pretrain/Step Time": 8.674485391005874} +{"Pretrain/Learning Rate": 4.492968029102182e-06, "Pretrain/Loss": 1.9466980695724487, "Pretrain/Loss (Raw)": 2.0080161094665527, "Pretrain/Step": 7744, "Pretrain/Step Time": 8.677033619955182} +{"Pretrain/Learning Rate": 4.488113341007951e-06, "Pretrain/Loss": 1.9462069272994995, "Pretrain/Loss (Raw)": 1.8382813930511475, "Pretrain/Step": 7745, "Pretrain/Step Time": 8.682426558807492} +{"Pretrain/Learning Rate": 4.48326101844114e-06, "Pretrain/Loss": 1.9462302923202515, "Pretrain/Loss (Raw)": 1.8780001401901245, "Pretrain/Step": 7746, "Pretrain/Step Time": 8.680137868970633} +{"Pretrain/Learning Rate": 4.4784110619613514e-06, "Pretrain/Loss": 1.9464154243469238, "Pretrain/Loss (Raw)": 1.9632636308670044, "Pretrain/Step": 7747, "Pretrain/Step Time": 8.67648889310658} +{"Pretrain/Learning Rate": 4.473563472127898e-06, "Pretrain/Loss": 1.9481027126312256, "Pretrain/Loss (Raw)": 1.9258249998092651, "Pretrain/Step": 7748, "Pretrain/Step Time": 8.674291618168354} +{"Pretrain/Learning Rate": 4.468718249499831e-06, "Pretrain/Loss": 1.9451589584350586, "Pretrain/Loss (Raw)": 1.476610541343689, "Pretrain/Step": 7749, "Pretrain/Step Time": 8.675531465560198} +{"Pretrain/Learning Rate": 4.463875394635916e-06, "Pretrain/Loss": 1.9473110437393188, "Pretrain/Loss (Raw)": 2.1187033653259277, "Pretrain/Step": 7750, "Pretrain/Step Time": 8.675214979797602} +{"Pretrain/Learning Rate": 4.459034908094664e-06, "Pretrain/Loss": 1.9468742609024048, "Pretrain/Loss (Raw)": 1.931028127670288, "Pretrain/Step": 7751, "Pretrain/Step Time": 8.672243291512132} +{"Pretrain/Learning Rate": 4.454196790434301e-06, "Pretrain/Loss": 1.9470694065093994, "Pretrain/Loss (Raw)": 2.0004124641418457, "Pretrain/Step": 7752, "Pretrain/Step Time": 8.675537457689643} +{"Pretrain/Learning Rate": 4.44936104221278e-06, "Pretrain/Loss": 1.9504282474517822, "Pretrain/Loss (Raw)": 2.133376359939575, "Pretrain/Step": 7753, "Pretrain/Step Time": 8.670721270143986} +{"Pretrain/Learning Rate": 4.444527663987771e-06, "Pretrain/Loss": 1.9535350799560547, "Pretrain/Loss (Raw)": 2.253352165222168, "Pretrain/Step": 7754, "Pretrain/Step Time": 8.668928107246757} +{"Pretrain/Learning Rate": 4.439696656316703e-06, "Pretrain/Loss": 1.951338529586792, "Pretrain/Loss (Raw)": 1.8914928436279297, "Pretrain/Step": 7755, "Pretrain/Step Time": 8.672237444669008} +{"Pretrain/Learning Rate": 4.434868019756697e-06, "Pretrain/Loss": 1.9499409198760986, "Pretrain/Loss (Raw)": 1.829604148864746, "Pretrain/Step": 7756, "Pretrain/Step Time": 8.670658299699426} +{"Pretrain/Learning Rate": 4.430041754864617e-06, "Pretrain/Loss": 1.9511972665786743, "Pretrain/Loss (Raw)": 1.9928219318389893, "Pretrain/Step": 7757, "Pretrain/Step Time": 8.669839171692729} +{"Pretrain/Learning Rate": 4.4252178621970455e-06, "Pretrain/Loss": 1.9493811130523682, "Pretrain/Loss (Raw)": 1.8342007398605347, "Pretrain/Step": 7758, "Pretrain/Step Time": 8.673847991973162} +{"Pretrain/Learning Rate": 4.420396342310309e-06, "Pretrain/Loss": 1.951865792274475, "Pretrain/Loss (Raw)": 2.1514334678649902, "Pretrain/Step": 7759, "Pretrain/Step Time": 8.672243373468518} +{"Pretrain/Learning Rate": 4.41557719576044e-06, "Pretrain/Loss": 1.9505287408828735, "Pretrain/Loss (Raw)": 1.8736804723739624, "Pretrain/Step": 7760, "Pretrain/Step Time": 8.673589313402772} +{"Pretrain/Learning Rate": 4.410760423103205e-06, "Pretrain/Loss": 1.9477527141571045, "Pretrain/Loss (Raw)": 1.8071247339248657, "Pretrain/Step": 7761, "Pretrain/Step Time": 8.66729779727757} +{"Pretrain/Learning Rate": 4.405946024894092e-06, "Pretrain/Loss": 1.950090765953064, "Pretrain/Loss (Raw)": 1.9374628067016602, "Pretrain/Step": 7762, "Pretrain/Step Time": 8.666930129751563} +{"Pretrain/Learning Rate": 4.401134001688337e-06, "Pretrain/Loss": 1.949760913848877, "Pretrain/Loss (Raw)": 1.8664603233337402, "Pretrain/Step": 7763, "Pretrain/Step Time": 8.663861062377691} +{"Pretrain/Learning Rate": 4.396324354040862e-06, "Pretrain/Loss": 1.9494796991348267, "Pretrain/Loss (Raw)": 2.0468733310699463, "Pretrain/Step": 7764, "Pretrain/Step Time": 8.67137978039682} +{"Pretrain/Learning Rate": 4.391517082506358e-06, "Pretrain/Loss": 1.9486913681030273, "Pretrain/Loss (Raw)": 1.8511719703674316, "Pretrain/Step": 7765, "Pretrain/Step Time": 8.666344134137034} +{"Pretrain/Learning Rate": 4.386712187639205e-06, "Pretrain/Loss": 1.9478269815444946, "Pretrain/Loss (Raw)": 1.8074662685394287, "Pretrain/Step": 7766, "Pretrain/Step Time": 8.669044688344002} +{"Pretrain/Learning Rate": 4.38190966999355e-06, "Pretrain/Loss": 1.9467196464538574, "Pretrain/Loss (Raw)": 1.6877490282058716, "Pretrain/Step": 7767, "Pretrain/Step Time": 8.659122690558434} +{"Pretrain/Learning Rate": 4.377109530123217e-06, "Pretrain/Loss": 1.94700026512146, "Pretrain/Loss (Raw)": 1.8831636905670166, "Pretrain/Step": 7768, "Pretrain/Step Time": 8.659511080011725} +{"Pretrain/Learning Rate": 4.372311768581794e-06, "Pretrain/Loss": 1.9468843936920166, "Pretrain/Loss (Raw)": 2.127786159515381, "Pretrain/Step": 7769, "Pretrain/Step Time": 8.66457180865109} +{"Pretrain/Learning Rate": 4.367516385922574e-06, "Pretrain/Loss": 1.9463999271392822, "Pretrain/Loss (Raw)": 2.0383212566375732, "Pretrain/Step": 7770, "Pretrain/Step Time": 8.666353028267622} +{"Pretrain/Learning Rate": 4.362723382698594e-06, "Pretrain/Loss": 1.9458779096603394, "Pretrain/Loss (Raw)": 1.935950517654419, "Pretrain/Step": 7771, "Pretrain/Step Time": 8.66547985188663} +{"Pretrain/Learning Rate": 4.357932759462599e-06, "Pretrain/Loss": 1.9471852779388428, "Pretrain/Loss (Raw)": 1.9398603439331055, "Pretrain/Step": 7772, "Pretrain/Step Time": 8.665976034477353} +{"Pretrain/Learning Rate": 4.35314451676706e-06, "Pretrain/Loss": 1.9473179578781128, "Pretrain/Loss (Raw)": 2.087509870529175, "Pretrain/Step": 7773, "Pretrain/Step Time": 8.665803471580148} +{"Pretrain/Learning Rate": 4.348358655164203e-06, "Pretrain/Loss": 1.9500229358673096, "Pretrain/Loss (Raw)": 2.0941593647003174, "Pretrain/Step": 7774, "Pretrain/Step Time": 8.66821924969554} +{"Pretrain/Learning Rate": 4.343575175205922e-06, "Pretrain/Loss": 1.9504318237304688, "Pretrain/Loss (Raw)": 2.053278684616089, "Pretrain/Step": 7775, "Pretrain/Step Time": 8.664303936064243} +{"Pretrain/Learning Rate": 4.338794077443897e-06, "Pretrain/Loss": 1.9512300491333008, "Pretrain/Loss (Raw)": 1.9849801063537598, "Pretrain/Step": 7776, "Pretrain/Step Time": 8.66734648682177} +{"Pretrain/Learning Rate": 4.334015362429491e-06, "Pretrain/Loss": 1.9496572017669678, "Pretrain/Loss (Raw)": 1.8940006494522095, "Pretrain/Step": 7777, "Pretrain/Step Time": 8.66708343103528} +{"Pretrain/Learning Rate": 4.329239030713827e-06, "Pretrain/Loss": 1.953231930732727, "Pretrain/Loss (Raw)": 1.9678573608398438, "Pretrain/Step": 7778, "Pretrain/Step Time": 8.667788561433554} +{"Pretrain/Learning Rate": 4.3244650828477114e-06, "Pretrain/Loss": 1.9558520317077637, "Pretrain/Loss (Raw)": 2.0816307067871094, "Pretrain/Step": 7779, "Pretrain/Step Time": 8.663716796785593} +{"Pretrain/Learning Rate": 4.319693519381712e-06, "Pretrain/Loss": 1.9567129611968994, "Pretrain/Loss (Raw)": 2.2409534454345703, "Pretrain/Step": 7780, "Pretrain/Step Time": 8.66106416657567} +{"Pretrain/Learning Rate": 4.314924340866105e-06, "Pretrain/Loss": 1.954298496246338, "Pretrain/Loss (Raw)": 1.847114086151123, "Pretrain/Step": 7781, "Pretrain/Step Time": 8.660712661221623} +{"Pretrain/Learning Rate": 4.310157547850896e-06, "Pretrain/Loss": 1.951159954071045, "Pretrain/Loss (Raw)": 1.7513939142227173, "Pretrain/Step": 7782, "Pretrain/Step Time": 8.660404186695814} +{"Pretrain/Learning Rate": 4.3053931408858055e-06, "Pretrain/Loss": 1.9491279125213623, "Pretrain/Loss (Raw)": 1.776839256286621, "Pretrain/Step": 7783, "Pretrain/Step Time": 8.664747446775436} +{"Pretrain/Learning Rate": 4.300631120520301e-06, "Pretrain/Loss": 1.9475736618041992, "Pretrain/Loss (Raw)": 1.9815752506256104, "Pretrain/Step": 7784, "Pretrain/Step Time": 8.662933697924018} +{"Pretrain/Learning Rate": 4.295871487303554e-06, "Pretrain/Loss": 1.9430341720581055, "Pretrain/Loss (Raw)": 1.5412126779556274, "Pretrain/Step": 7785, "Pretrain/Step Time": 8.66738822683692} +{"Pretrain/Learning Rate": 4.291114241784467e-06, "Pretrain/Loss": 1.9426817893981934, "Pretrain/Loss (Raw)": 2.0227043628692627, "Pretrain/Step": 7786, "Pretrain/Step Time": 8.664946060627699} +{"Pretrain/Learning Rate": 4.286359384511662e-06, "Pretrain/Loss": 1.9421221017837524, "Pretrain/Loss (Raw)": 1.8091440200805664, "Pretrain/Step": 7787, "Pretrain/Step Time": 8.66501354239881} +{"Pretrain/Learning Rate": 4.281606916033507e-06, "Pretrain/Loss": 1.942806601524353, "Pretrain/Loss (Raw)": 2.057333469390869, "Pretrain/Step": 7788, "Pretrain/Step Time": 8.665491867810488} +{"Pretrain/Learning Rate": 4.276856836898072e-06, "Pretrain/Loss": 1.9445650577545166, "Pretrain/Loss (Raw)": 2.0516855716705322, "Pretrain/Step": 7789, "Pretrain/Step Time": 8.665595876052976} +{"Pretrain/Learning Rate": 4.272109147653155e-06, "Pretrain/Loss": 1.9453049898147583, "Pretrain/Loss (Raw)": 2.029635190963745, "Pretrain/Step": 7790, "Pretrain/Step Time": 8.668171491473913} +{"Pretrain/Learning Rate": 4.267363848846278e-06, "Pretrain/Loss": 1.9447674751281738, "Pretrain/Loss (Raw)": 1.8314982652664185, "Pretrain/Step": 7791, "Pretrain/Step Time": 8.673371370881796} +{"Pretrain/Learning Rate": 4.262620941024703e-06, "Pretrain/Loss": 1.9428634643554688, "Pretrain/Loss (Raw)": 1.7961409091949463, "Pretrain/Step": 7792, "Pretrain/Step Time": 8.671996925026178} +{"Pretrain/Learning Rate": 4.2578804247353996e-06, "Pretrain/Loss": 1.9451627731323242, "Pretrain/Loss (Raw)": 2.0077755451202393, "Pretrain/Step": 7793, "Pretrain/Step Time": 8.670410400256515} +{"Pretrain/Learning Rate": 4.253142300525068e-06, "Pretrain/Loss": 1.945059061050415, "Pretrain/Loss (Raw)": 2.080944538116455, "Pretrain/Step": 7794, "Pretrain/Step Time": 8.666944177821279} +{"Pretrain/Learning Rate": 4.248406568940119e-06, "Pretrain/Loss": 1.9475343227386475, "Pretrain/Loss (Raw)": 2.0517711639404297, "Pretrain/Step": 7795, "Pretrain/Step Time": 8.670030001550913} +{"Pretrain/Learning Rate": 4.243673230526715e-06, "Pretrain/Loss": 1.9467427730560303, "Pretrain/Loss (Raw)": 2.0558526515960693, "Pretrain/Step": 7796, "Pretrain/Step Time": 8.666505610570312} +{"Pretrain/Learning Rate": 4.238942285830724e-06, "Pretrain/Loss": 1.9458413124084473, "Pretrain/Loss (Raw)": 2.0455150604248047, "Pretrain/Step": 7797, "Pretrain/Step Time": 8.667021790519357} +{"Pretrain/Learning Rate": 4.234213735397738e-06, "Pretrain/Loss": 1.9446172714233398, "Pretrain/Loss (Raw)": 1.9091551303863525, "Pretrain/Step": 7798, "Pretrain/Step Time": 8.668026411905885} +{"Pretrain/Learning Rate": 4.229487579773067e-06, "Pretrain/Loss": 1.9433562755584717, "Pretrain/Loss (Raw)": 1.778528094291687, "Pretrain/Step": 7799, "Pretrain/Step Time": 8.664178751409054} +{"Pretrain/Learning Rate": 4.22476381950177e-06, "Pretrain/Loss": 1.9441859722137451, "Pretrain/Loss (Raw)": 1.9562675952911377, "Pretrain/Step": 7800, "Pretrain/Step Time": 8.663819201290607} +{"Pretrain/Learning Rate": 4.220042455128603e-06, "Pretrain/Loss": 1.9429352283477783, "Pretrain/Loss (Raw)": 1.87942636013031, "Pretrain/Step": 7801, "Pretrain/Step Time": 8.664981620386243} +{"Pretrain/Learning Rate": 4.215323487198061e-06, "Pretrain/Loss": 1.9405174255371094, "Pretrain/Loss (Raw)": 1.6119266748428345, "Pretrain/Step": 7802, "Pretrain/Step Time": 8.66095188818872} +{"Pretrain/Learning Rate": 4.210606916254348e-06, "Pretrain/Loss": 1.9427345991134644, "Pretrain/Loss (Raw)": 2.114168167114258, "Pretrain/Step": 7803, "Pretrain/Step Time": 8.656952356919646} +{"Pretrain/Learning Rate": 4.205892742841422e-06, "Pretrain/Loss": 1.9437098503112793, "Pretrain/Loss (Raw)": 2.095994234085083, "Pretrain/Step": 7804, "Pretrain/Step Time": 8.659484464675188} +{"Pretrain/Learning Rate": 4.2011809675029154e-06, "Pretrain/Loss": 1.9440069198608398, "Pretrain/Loss (Raw)": 1.928431510925293, "Pretrain/Step": 7805, "Pretrain/Step Time": 8.656481213867664} +{"Pretrain/Learning Rate": 4.196471590782236e-06, "Pretrain/Loss": 1.9430787563323975, "Pretrain/Loss (Raw)": 1.8640813827514648, "Pretrain/Step": 7806, "Pretrain/Step Time": 8.661041816696525} +{"Pretrain/Learning Rate": 4.191764613222474e-06, "Pretrain/Loss": 1.942610740661621, "Pretrain/Loss (Raw)": 1.9918177127838135, "Pretrain/Step": 7807, "Pretrain/Step Time": 8.659606466069818} +{"Pretrain/Learning Rate": 4.18706003536648e-06, "Pretrain/Loss": 1.9453562498092651, "Pretrain/Loss (Raw)": 2.0821099281311035, "Pretrain/Step": 7808, "Pretrain/Step Time": 8.661465620622039} +{"Pretrain/Learning Rate": 4.182357857756786e-06, "Pretrain/Loss": 1.9435951709747314, "Pretrain/Loss (Raw)": 1.921007752418518, "Pretrain/Step": 7809, "Pretrain/Step Time": 8.662730425596237} +{"Pretrain/Learning Rate": 4.1776580809356845e-06, "Pretrain/Loss": 1.942724347114563, "Pretrain/Loss (Raw)": 1.8173977136611938, "Pretrain/Step": 7810, "Pretrain/Step Time": 8.657879685983062} +{"Pretrain/Learning Rate": 4.172960705445164e-06, "Pretrain/Loss": 1.94412100315094, "Pretrain/Loss (Raw)": 2.083009958267212, "Pretrain/Step": 7811, "Pretrain/Step Time": 8.66038984246552} +{"Pretrain/Learning Rate": 4.168265731826965e-06, "Pretrain/Loss": 1.9417424201965332, "Pretrain/Loss (Raw)": 1.7789567708969116, "Pretrain/Step": 7812, "Pretrain/Step Time": 8.659218449145555} +{"Pretrain/Learning Rate": 4.163573160622522e-06, "Pretrain/Loss": 1.9398126602172852, "Pretrain/Loss (Raw)": 1.8494207859039307, "Pretrain/Step": 7813, "Pretrain/Step Time": 8.654920952394605} +{"Pretrain/Learning Rate": 4.1588829923730005e-06, "Pretrain/Loss": 1.93900728225708, "Pretrain/Loss (Raw)": 1.845645546913147, "Pretrain/Step": 7814, "Pretrain/Step Time": 8.661726396530867} +{"Pretrain/Learning Rate": 4.1541952276193095e-06, "Pretrain/Loss": 1.9360052347183228, "Pretrain/Loss (Raw)": 1.694831132888794, "Pretrain/Step": 7815, "Pretrain/Step Time": 8.662437092512846} +{"Pretrain/Learning Rate": 4.149509866902043e-06, "Pretrain/Loss": 1.938539743423462, "Pretrain/Loss (Raw)": 2.131892442703247, "Pretrain/Step": 7816, "Pretrain/Step Time": 8.668198492377996} +{"Pretrain/Learning Rate": 4.144826910761556e-06, "Pretrain/Loss": 1.9384273290634155, "Pretrain/Loss (Raw)": 1.9942729473114014, "Pretrain/Step": 7817, "Pretrain/Step Time": 8.669879376888275} +{"Pretrain/Learning Rate": 4.140146359737895e-06, "Pretrain/Loss": 1.9404222965240479, "Pretrain/Loss (Raw)": 2.0418193340301514, "Pretrain/Step": 7818, "Pretrain/Step Time": 8.668398598209023} +{"Pretrain/Learning Rate": 4.135468214370864e-06, "Pretrain/Loss": 1.937667965888977, "Pretrain/Loss (Raw)": 1.6928095817565918, "Pretrain/Step": 7819, "Pretrain/Step Time": 8.671348648145795} +{"Pretrain/Learning Rate": 4.130792475199943e-06, "Pretrain/Loss": 1.9342399835586548, "Pretrain/Loss (Raw)": 1.67238450050354, "Pretrain/Step": 7820, "Pretrain/Step Time": 8.669828854501247} +{"Pretrain/Learning Rate": 4.126119142764379e-06, "Pretrain/Loss": 1.9376837015151978, "Pretrain/Loss (Raw)": 2.2038278579711914, "Pretrain/Step": 7821, "Pretrain/Step Time": 8.673043055459857} +{"Pretrain/Learning Rate": 4.121448217603116e-06, "Pretrain/Loss": 1.9351576566696167, "Pretrain/Loss (Raw)": 1.7885912656784058, "Pretrain/Step": 7822, "Pretrain/Step Time": 8.672511564567685} +{"Pretrain/Learning Rate": 4.116779700254828e-06, "Pretrain/Loss": 1.9341838359832764, "Pretrain/Loss (Raw)": 1.983176827430725, "Pretrain/Step": 7823, "Pretrain/Step Time": 8.67374330945313} +{"Pretrain/Learning Rate": 4.1121135912579044e-06, "Pretrain/Loss": 1.93434739112854, "Pretrain/Loss (Raw)": 1.974283218383789, "Pretrain/Step": 7824, "Pretrain/Step Time": 8.676365291699767} +{"Pretrain/Learning Rate": 4.1074498911504725e-06, "Pretrain/Loss": 1.9332995414733887, "Pretrain/Loss (Raw)": 1.7730718851089478, "Pretrain/Step": 7825, "Pretrain/Step Time": 8.672015545889735} +{"Pretrain/Learning Rate": 4.102788600470369e-06, "Pretrain/Loss": 1.933898687362671, "Pretrain/Loss (Raw)": 1.9747060537338257, "Pretrain/Step": 7826, "Pretrain/Step Time": 8.68029922246933} +{"Pretrain/Learning Rate": 4.098129719755156e-06, "Pretrain/Loss": 1.931347131729126, "Pretrain/Loss (Raw)": 1.9894955158233643, "Pretrain/Step": 7827, "Pretrain/Step Time": 8.674033422023058} +{"Pretrain/Learning Rate": 4.093473249542109e-06, "Pretrain/Loss": 1.9307481050491333, "Pretrain/Loss (Raw)": 2.0143871307373047, "Pretrain/Step": 7828, "Pretrain/Step Time": 8.67071488685906} +{"Pretrain/Learning Rate": 4.0888191903682485e-06, "Pretrain/Loss": 1.9306437969207764, "Pretrain/Loss (Raw)": 1.9412837028503418, "Pretrain/Step": 7829, "Pretrain/Step Time": 8.67337340861559} +{"Pretrain/Learning Rate": 4.084167542770295e-06, "Pretrain/Loss": 1.931526780128479, "Pretrain/Loss (Raw)": 1.8721848726272583, "Pretrain/Step": 7830, "Pretrain/Step Time": 8.674103887751698} +{"Pretrain/Learning Rate": 4.079518307284699e-06, "Pretrain/Loss": 1.9326510429382324, "Pretrain/Loss (Raw)": 2.095329761505127, "Pretrain/Step": 7831, "Pretrain/Step Time": 8.671505639329553} +{"Pretrain/Learning Rate": 4.074871484447626e-06, "Pretrain/Loss": 1.932536244392395, "Pretrain/Loss (Raw)": 2.0092523097991943, "Pretrain/Step": 7832, "Pretrain/Step Time": 8.671784395352006} +{"Pretrain/Learning Rate": 4.070227074794983e-06, "Pretrain/Loss": 1.936399221420288, "Pretrain/Loss (Raw)": 1.8872014284133911, "Pretrain/Step": 7833, "Pretrain/Step Time": 8.667686838656664} +{"Pretrain/Learning Rate": 4.06558507886238e-06, "Pretrain/Loss": 1.9370516538619995, "Pretrain/Loss (Raw)": 2.128617286682129, "Pretrain/Step": 7834, "Pretrain/Step Time": 8.674469906836748} +{"Pretrain/Learning Rate": 4.0609454971851476e-06, "Pretrain/Loss": 1.936425805091858, "Pretrain/Loss (Raw)": 1.8948391675949097, "Pretrain/Step": 7835, "Pretrain/Step Time": 8.676720159128308} +{"Pretrain/Learning Rate": 4.0563083302983444e-06, "Pretrain/Loss": 1.9402958154678345, "Pretrain/Loss (Raw)": 1.7845014333724976, "Pretrain/Step": 7836, "Pretrain/Step Time": 8.67737266793847} +{"Pretrain/Learning Rate": 4.051673578736761e-06, "Pretrain/Loss": 1.9381651878356934, "Pretrain/Loss (Raw)": 1.8716274499893188, "Pretrain/Step": 7837, "Pretrain/Step Time": 8.680852241814137} +{"Pretrain/Learning Rate": 4.047041243034894e-06, "Pretrain/Loss": 1.9374158382415771, "Pretrain/Loss (Raw)": 1.9040042161941528, "Pretrain/Step": 7838, "Pretrain/Step Time": 8.677199017256498} +{"Pretrain/Learning Rate": 4.04241132372696e-06, "Pretrain/Loss": 1.94465172290802, "Pretrain/Loss (Raw)": 2.1872706413269043, "Pretrain/Step": 7839, "Pretrain/Step Time": 8.673364654183388} +{"Pretrain/Learning Rate": 4.037783821346905e-06, "Pretrain/Loss": 1.9428786039352417, "Pretrain/Loss (Raw)": 1.927201509475708, "Pretrain/Step": 7840, "Pretrain/Step Time": 8.66899412497878} +{"Pretrain/Learning Rate": 4.033158736428402e-06, "Pretrain/Loss": 1.9450284242630005, "Pretrain/Loss (Raw)": 2.1195058822631836, "Pretrain/Step": 7841, "Pretrain/Step Time": 8.676546603441238} +{"Pretrain/Learning Rate": 4.0285360695048316e-06, "Pretrain/Loss": 1.9475398063659668, "Pretrain/Loss (Raw)": 2.0173470973968506, "Pretrain/Step": 7842, "Pretrain/Step Time": 8.672704432159662} +{"Pretrain/Learning Rate": 4.023915821109306e-06, "Pretrain/Loss": 1.9496710300445557, "Pretrain/Loss (Raw)": 2.1649842262268066, "Pretrain/Step": 7843, "Pretrain/Step Time": 8.670920683071017} +{"Pretrain/Learning Rate": 4.01929799177464e-06, "Pretrain/Loss": 1.9483447074890137, "Pretrain/Loss (Raw)": 2.137890577316284, "Pretrain/Step": 7844, "Pretrain/Step Time": 8.670729914680123} +{"Pretrain/Learning Rate": 4.014682582033407e-06, "Pretrain/Loss": 1.9469966888427734, "Pretrain/Loss (Raw)": 1.76960027217865, "Pretrain/Step": 7845, "Pretrain/Step Time": 8.67637169547379} +{"Pretrain/Learning Rate": 4.010069592417853e-06, "Pretrain/Loss": 1.9464936256408691, "Pretrain/Loss (Raw)": 1.8924400806427002, "Pretrain/Step": 7846, "Pretrain/Step Time": 8.673981823027134} +{"Pretrain/Learning Rate": 4.00545902345999e-06, "Pretrain/Loss": 1.947305679321289, "Pretrain/Loss (Raw)": 1.9058929681777954, "Pretrain/Step": 7847, "Pretrain/Step Time": 8.676941649988294} +{"Pretrain/Learning Rate": 4.000850875691514e-06, "Pretrain/Loss": 1.9498374462127686, "Pretrain/Loss (Raw)": 1.9115526676177979, "Pretrain/Step": 7848, "Pretrain/Step Time": 8.67780201509595} +{"Pretrain/Learning Rate": 3.9962451496438765e-06, "Pretrain/Loss": 1.9487359523773193, "Pretrain/Loss (Raw)": 2.0023317337036133, "Pretrain/Step": 7849, "Pretrain/Step Time": 8.677749991416931} +{"Pretrain/Learning Rate": 3.99164184584821e-06, "Pretrain/Loss": 1.9487053155899048, "Pretrain/Loss (Raw)": 1.9229661226272583, "Pretrain/Step": 7850, "Pretrain/Step Time": 8.671027306467295} +{"Pretrain/Learning Rate": 3.987040964835409e-06, "Pretrain/Loss": 1.9475696086883545, "Pretrain/Loss (Raw)": 1.8622568845748901, "Pretrain/Step": 7851, "Pretrain/Step Time": 8.671313090249896} +{"Pretrain/Learning Rate": 3.9824425071360525e-06, "Pretrain/Loss": 1.9474486112594604, "Pretrain/Loss (Raw)": 1.8271400928497314, "Pretrain/Step": 7852, "Pretrain/Step Time": 8.67013313062489} +{"Pretrain/Learning Rate": 3.977846473280469e-06, "Pretrain/Loss": 1.945753574371338, "Pretrain/Loss (Raw)": 1.794033408164978, "Pretrain/Step": 7853, "Pretrain/Step Time": 8.671745661646128} +{"Pretrain/Learning Rate": 3.973252863798691e-06, "Pretrain/Loss": 1.942356824874878, "Pretrain/Loss (Raw)": 1.6181418895721436, "Pretrain/Step": 7854, "Pretrain/Step Time": 8.674654534086585} +{"Pretrain/Learning Rate": 3.968661679220468e-06, "Pretrain/Loss": 1.9448107481002808, "Pretrain/Loss (Raw)": 2.311811923980713, "Pretrain/Step": 7855, "Pretrain/Step Time": 8.676052242517471} +{"Pretrain/Learning Rate": 3.964072920075296e-06, "Pretrain/Loss": 1.9444046020507812, "Pretrain/Loss (Raw)": 2.1215648651123047, "Pretrain/Step": 7856, "Pretrain/Step Time": 8.67134546302259} +{"Pretrain/Learning Rate": 3.959486586892344e-06, "Pretrain/Loss": 1.9413223266601562, "Pretrain/Loss (Raw)": 1.7527213096618652, "Pretrain/Step": 7857, "Pretrain/Step Time": 8.676309393718839} +{"Pretrain/Learning Rate": 3.954902680200553e-06, "Pretrain/Loss": 1.939942717552185, "Pretrain/Loss (Raw)": 1.5866907835006714, "Pretrain/Step": 7858, "Pretrain/Step Time": 8.669013230130076} +{"Pretrain/Learning Rate": 3.950321200528548e-06, "Pretrain/Loss": 1.9383480548858643, "Pretrain/Loss (Raw)": 1.7841098308563232, "Pretrain/Step": 7859, "Pretrain/Step Time": 8.670021064579487} +{"Pretrain/Learning Rate": 3.9457421484047015e-06, "Pretrain/Loss": 1.9372073411941528, "Pretrain/Loss (Raw)": 1.8780896663665771, "Pretrain/Step": 7860, "Pretrain/Step Time": 8.667533023282886} +{"Pretrain/Learning Rate": 3.941165524357071e-06, "Pretrain/Loss": 1.9361281394958496, "Pretrain/Loss (Raw)": 1.7325369119644165, "Pretrain/Step": 7861, "Pretrain/Step Time": 8.668201135471463} +{"Pretrain/Learning Rate": 3.936591328913472e-06, "Pretrain/Loss": 1.936647653579712, "Pretrain/Loss (Raw)": 2.0296411514282227, "Pretrain/Step": 7862, "Pretrain/Step Time": 8.66829395852983} +{"Pretrain/Learning Rate": 3.932019562601405e-06, "Pretrain/Loss": 1.9345166683197021, "Pretrain/Loss (Raw)": 1.8125208616256714, "Pretrain/Step": 7863, "Pretrain/Step Time": 8.669785723090172} +{"Pretrain/Learning Rate": 3.927450225948132e-06, "Pretrain/Loss": 1.9342834949493408, "Pretrain/Loss (Raw)": 1.8496335744857788, "Pretrain/Step": 7864, "Pretrain/Step Time": 8.663126459345222} +{"Pretrain/Learning Rate": 3.922883319480586e-06, "Pretrain/Loss": 1.9341447353363037, "Pretrain/Loss (Raw)": 1.9897798299789429, "Pretrain/Step": 7865, "Pretrain/Step Time": 8.658372456207871} +{"Pretrain/Learning Rate": 3.9183188437254576e-06, "Pretrain/Loss": 1.9345487356185913, "Pretrain/Loss (Raw)": 2.0756020545959473, "Pretrain/Step": 7866, "Pretrain/Step Time": 8.660264207050204} +{"Pretrain/Learning Rate": 3.9137567992091394e-06, "Pretrain/Loss": 1.9347820281982422, "Pretrain/Loss (Raw)": 1.9796257019042969, "Pretrain/Step": 7867, "Pretrain/Step Time": 8.663639141246676} +{"Pretrain/Learning Rate": 3.90919718645775e-06, "Pretrain/Loss": 1.935869812965393, "Pretrain/Loss (Raw)": 1.8272075653076172, "Pretrain/Step": 7868, "Pretrain/Step Time": 8.667724080383778} +{"Pretrain/Learning Rate": 3.904640005997118e-06, "Pretrain/Loss": 1.935786247253418, "Pretrain/Loss (Raw)": 1.9228339195251465, "Pretrain/Step": 7869, "Pretrain/Step Time": 8.666821600869298} +{"Pretrain/Learning Rate": 3.900085258352812e-06, "Pretrain/Loss": 1.9351561069488525, "Pretrain/Loss (Raw)": 1.9710140228271484, "Pretrain/Step": 7870, "Pretrain/Step Time": 8.670894602313638} +{"Pretrain/Learning Rate": 3.895532944050098e-06, "Pretrain/Loss": 1.9343392848968506, "Pretrain/Loss (Raw)": 1.9117622375488281, "Pretrain/Step": 7871, "Pretrain/Step Time": 8.669219009578228} +{"Pretrain/Learning Rate": 3.890983063613976e-06, "Pretrain/Loss": 1.935095191001892, "Pretrain/Loss (Raw)": 2.1047606468200684, "Pretrain/Step": 7872, "Pretrain/Step Time": 8.668922314420342} +{"Pretrain/Learning Rate": 3.886435617569148e-06, "Pretrain/Loss": 1.9355926513671875, "Pretrain/Loss (Raw)": 1.901950478553772, "Pretrain/Step": 7873, "Pretrain/Step Time": 8.664022151380777} +{"Pretrain/Learning Rate": 3.881890606440058e-06, "Pretrain/Loss": 1.9375377893447876, "Pretrain/Loss (Raw)": 2.126978874206543, "Pretrain/Step": 7874, "Pretrain/Step Time": 8.666681855916977} +{"Pretrain/Learning Rate": 3.87734803075086e-06, "Pretrain/Loss": 1.9392564296722412, "Pretrain/Loss (Raw)": 2.1832516193389893, "Pretrain/Step": 7875, "Pretrain/Step Time": 8.66361828893423} +{"Pretrain/Learning Rate": 3.872807891025418e-06, "Pretrain/Loss": 1.9389235973358154, "Pretrain/Loss (Raw)": 1.883225679397583, "Pretrain/Step": 7876, "Pretrain/Step Time": 8.665732368826866} +{"Pretrain/Learning Rate": 3.868270187787318e-06, "Pretrain/Loss": 1.943063497543335, "Pretrain/Loss (Raw)": 2.0065128803253174, "Pretrain/Step": 7877, "Pretrain/Step Time": 8.6650205347687} +{"Pretrain/Learning Rate": 3.863734921559884e-06, "Pretrain/Loss": 1.9410955905914307, "Pretrain/Loss (Raw)": 1.8668235540390015, "Pretrain/Step": 7878, "Pretrain/Step Time": 8.66623792052269} +{"Pretrain/Learning Rate": 3.859202092866135e-06, "Pretrain/Loss": 1.9393378496170044, "Pretrain/Loss (Raw)": 1.7060331106185913, "Pretrain/Step": 7879, "Pretrain/Step Time": 8.669026389718056} +{"Pretrain/Learning Rate": 3.854671702228818e-06, "Pretrain/Loss": 1.9397073984146118, "Pretrain/Loss (Raw)": 2.047718048095703, "Pretrain/Step": 7880, "Pretrain/Step Time": 8.66511632502079} +{"Pretrain/Learning Rate": 3.850143750170395e-06, "Pretrain/Loss": 1.9395157098770142, "Pretrain/Loss (Raw)": 2.1088271141052246, "Pretrain/Step": 7881, "Pretrain/Step Time": 8.66643893532455} +{"Pretrain/Learning Rate": 3.8456182372130636e-06, "Pretrain/Loss": 1.9375983476638794, "Pretrain/Loss (Raw)": 2.0079329013824463, "Pretrain/Step": 7882, "Pretrain/Step Time": 8.665979260578752} +{"Pretrain/Learning Rate": 3.841095163878719e-06, "Pretrain/Loss": 1.9372501373291016, "Pretrain/Loss (Raw)": 1.846935749053955, "Pretrain/Step": 7883, "Pretrain/Step Time": 8.664665754884481} +{"Pretrain/Learning Rate": 3.836574530688983e-06, "Pretrain/Loss": 1.9385381937026978, "Pretrain/Loss (Raw)": 1.9944642782211304, "Pretrain/Step": 7884, "Pretrain/Step Time": 8.660731874406338} +{"Pretrain/Learning Rate": 3.832056338165193e-06, "Pretrain/Loss": 1.9368013143539429, "Pretrain/Loss (Raw)": 1.7704966068267822, "Pretrain/Step": 7885, "Pretrain/Step Time": 8.661635100841522} +{"Pretrain/Learning Rate": 3.827540586828418e-06, "Pretrain/Loss": 1.9370369911193848, "Pretrain/Loss (Raw)": 1.864365816116333, "Pretrain/Step": 7886, "Pretrain/Step Time": 8.65968369692564} +{"Pretrain/Learning Rate": 3.823027277199432e-06, "Pretrain/Loss": 1.935388445854187, "Pretrain/Loss (Raw)": 1.940429449081421, "Pretrain/Step": 7887, "Pretrain/Step Time": 8.6582818813622} +{"Pretrain/Learning Rate": 3.818516409798728e-06, "Pretrain/Loss": 1.9339982271194458, "Pretrain/Loss (Raw)": 1.6957268714904785, "Pretrain/Step": 7888, "Pretrain/Step Time": 8.658062014728785} +{"Pretrain/Learning Rate": 3.814007985146517e-06, "Pretrain/Loss": 1.933335542678833, "Pretrain/Loss (Raw)": 1.7223063707351685, "Pretrain/Step": 7889, "Pretrain/Step Time": 8.662391724064946} +{"Pretrain/Learning Rate": 3.8095020037627467e-06, "Pretrain/Loss": 1.9326903820037842, "Pretrain/Loss (Raw)": 1.854886770248413, "Pretrain/Step": 7890, "Pretrain/Step Time": 8.661599574610591} +{"Pretrain/Learning Rate": 3.8049984661670477e-06, "Pretrain/Loss": 1.9336802959442139, "Pretrain/Loss (Raw)": 1.9931654930114746, "Pretrain/Step": 7891, "Pretrain/Step Time": 8.661453349515796} +{"Pretrain/Learning Rate": 3.8004973728788057e-06, "Pretrain/Loss": 1.9336072206497192, "Pretrain/Loss (Raw)": 2.0375118255615234, "Pretrain/Step": 7892, "Pretrain/Step Time": 8.659474346786737} +{"Pretrain/Learning Rate": 3.795998724417096e-06, "Pretrain/Loss": 1.9347290992736816, "Pretrain/Loss (Raw)": 1.9947755336761475, "Pretrain/Step": 7893, "Pretrain/Step Time": 8.663267713040113} +{"Pretrain/Learning Rate": 3.7915025213007354e-06, "Pretrain/Loss": 1.9362822771072388, "Pretrain/Loss (Raw)": 2.006275177001953, "Pretrain/Step": 7894, "Pretrain/Step Time": 8.66149639338255} +{"Pretrain/Learning Rate": 3.7870087640482444e-06, "Pretrain/Loss": 1.9371800422668457, "Pretrain/Loss (Raw)": 1.8026543855667114, "Pretrain/Step": 7895, "Pretrain/Step Time": 8.664549645036459} +{"Pretrain/Learning Rate": 3.782517453177853e-06, "Pretrain/Loss": 1.9380624294281006, "Pretrain/Loss (Raw)": 1.9961152076721191, "Pretrain/Step": 7896, "Pretrain/Step Time": 8.663239007815719} +{"Pretrain/Learning Rate": 3.778028589207541e-06, "Pretrain/Loss": 1.9367144107818604, "Pretrain/Loss (Raw)": 1.9552242755889893, "Pretrain/Step": 7897, "Pretrain/Step Time": 8.656699385493994} +{"Pretrain/Learning Rate": 3.773542172654962e-06, "Pretrain/Loss": 1.9359712600708008, "Pretrain/Loss (Raw)": 1.9432191848754883, "Pretrain/Step": 7898, "Pretrain/Step Time": 8.655708337202668} +{"Pretrain/Learning Rate": 3.769058204037526e-06, "Pretrain/Loss": 1.937117576599121, "Pretrain/Loss (Raw)": 2.0826709270477295, "Pretrain/Step": 7899, "Pretrain/Step Time": 8.658114003017545} +{"Pretrain/Learning Rate": 3.7645766838723395e-06, "Pretrain/Loss": 1.9370981454849243, "Pretrain/Loss (Raw)": 1.9373794794082642, "Pretrain/Step": 7900, "Pretrain/Step Time": 8.658208474516869} +{"Pretrain/Learning Rate": 3.7600976126762415e-06, "Pretrain/Loss": 1.9384760856628418, "Pretrain/Loss (Raw)": 2.263878345489502, "Pretrain/Step": 7901, "Pretrain/Step Time": 8.656976686790586} +{"Pretrain/Learning Rate": 3.7556209909657635e-06, "Pretrain/Loss": 1.9382095336914062, "Pretrain/Loss (Raw)": 2.060059070587158, "Pretrain/Step": 7902, "Pretrain/Step Time": 8.650887185707688} +{"Pretrain/Learning Rate": 3.751146819257187e-06, "Pretrain/Loss": 1.938854694366455, "Pretrain/Loss (Raw)": 2.13584566116333, "Pretrain/Step": 7903, "Pretrain/Step Time": 8.658831052482128} +{"Pretrain/Learning Rate": 3.7466750980664795e-06, "Pretrain/Loss": 1.9374405145645142, "Pretrain/Loss (Raw)": 1.8039575815200806, "Pretrain/Step": 7904, "Pretrain/Step Time": 8.655481666326523} +{"Pretrain/Learning Rate": 3.7422058279093593e-06, "Pretrain/Loss": 1.936884880065918, "Pretrain/Loss (Raw)": 1.8228801488876343, "Pretrain/Step": 7905, "Pretrain/Step Time": 8.655897185206413} +{"Pretrain/Learning Rate": 3.737739009301222e-06, "Pretrain/Loss": 1.9378337860107422, "Pretrain/Loss (Raw)": 2.089334726333618, "Pretrain/Step": 7906, "Pretrain/Step Time": 8.653927624225616} +{"Pretrain/Learning Rate": 3.73327464275722e-06, "Pretrain/Loss": 1.937436580657959, "Pretrain/Loss (Raw)": 2.0307838916778564, "Pretrain/Step": 7907, "Pretrain/Step Time": 8.655610013753176} +{"Pretrain/Learning Rate": 3.728812728792197e-06, "Pretrain/Loss": 1.93497896194458, "Pretrain/Loss (Raw)": 1.9263676404953003, "Pretrain/Step": 7908, "Pretrain/Step Time": 8.661503186449409} +{"Pretrain/Learning Rate": 3.7243532679207242e-06, "Pretrain/Loss": 1.935346245765686, "Pretrain/Loss (Raw)": 1.894132137298584, "Pretrain/Step": 7909, "Pretrain/Step Time": 8.659895054996014} +{"Pretrain/Learning Rate": 3.7198962606570826e-06, "Pretrain/Loss": 1.9368733167648315, "Pretrain/Loss (Raw)": 1.9468625783920288, "Pretrain/Step": 7910, "Pretrain/Step Time": 8.66201133467257} +{"Pretrain/Learning Rate": 3.7154417075152826e-06, "Pretrain/Loss": 1.938079595565796, "Pretrain/Loss (Raw)": 1.931235909461975, "Pretrain/Step": 7911, "Pretrain/Step Time": 8.65993913449347} +{"Pretrain/Learning Rate": 3.7109896090090413e-06, "Pretrain/Loss": 1.9359173774719238, "Pretrain/Loss (Raw)": 1.7048068046569824, "Pretrain/Step": 7912, "Pretrain/Step Time": 8.660681625828147} +{"Pretrain/Learning Rate": 3.7065399656517953e-06, "Pretrain/Loss": 1.9391998052597046, "Pretrain/Loss (Raw)": 1.9613704681396484, "Pretrain/Step": 7913, "Pretrain/Step Time": 8.653126137331128} +{"Pretrain/Learning Rate": 3.702092777956692e-06, "Pretrain/Loss": 1.9397319555282593, "Pretrain/Loss (Raw)": 2.0908257961273193, "Pretrain/Step": 7914, "Pretrain/Step Time": 8.657923091202974} +{"Pretrain/Learning Rate": 3.6976480464366162e-06, "Pretrain/Loss": 1.9430720806121826, "Pretrain/Loss (Raw)": 2.2366724014282227, "Pretrain/Step": 7915, "Pretrain/Step Time": 8.656889852136374} +{"Pretrain/Learning Rate": 3.693205771604147e-06, "Pretrain/Loss": 1.9422646760940552, "Pretrain/Loss (Raw)": 1.9539971351623535, "Pretrain/Step": 7916, "Pretrain/Step Time": 8.656570570543408} +{"Pretrain/Learning Rate": 3.68876595397159e-06, "Pretrain/Loss": 1.9420318603515625, "Pretrain/Loss (Raw)": 2.0218892097473145, "Pretrain/Step": 7917, "Pretrain/Step Time": 8.655382944270968} +{"Pretrain/Learning Rate": 3.6843285940509594e-06, "Pretrain/Loss": 1.9416065216064453, "Pretrain/Loss (Raw)": 1.9751780033111572, "Pretrain/Step": 7918, "Pretrain/Step Time": 8.656009815633297} +{"Pretrain/Learning Rate": 3.6798936923540027e-06, "Pretrain/Loss": 1.9421501159667969, "Pretrain/Loss (Raw)": 1.9010741710662842, "Pretrain/Step": 7919, "Pretrain/Step Time": 8.650551466271281} +{"Pretrain/Learning Rate": 3.6754612493921675e-06, "Pretrain/Loss": 1.9437029361724854, "Pretrain/Loss (Raw)": 1.9949054718017578, "Pretrain/Step": 7920, "Pretrain/Step Time": 8.65690384991467} +{"Pretrain/Learning Rate": 3.6710312656766276e-06, "Pretrain/Loss": 1.944291353225708, "Pretrain/Loss (Raw)": 2.0831027030944824, "Pretrain/Step": 7921, "Pretrain/Step Time": 8.654598902910948} +{"Pretrain/Learning Rate": 3.6666037417182607e-06, "Pretrain/Loss": 1.9411020278930664, "Pretrain/Loss (Raw)": 1.6727008819580078, "Pretrain/Step": 7922, "Pretrain/Step Time": 8.658607225865126} +{"Pretrain/Learning Rate": 3.6621786780276834e-06, "Pretrain/Loss": 1.9366734027862549, "Pretrain/Loss (Raw)": 1.48491370677948, "Pretrain/Step": 7923, "Pretrain/Step Time": 8.66029697842896} +{"Pretrain/Learning Rate": 3.6577560751152096e-06, "Pretrain/Loss": 1.9358320236206055, "Pretrain/Loss (Raw)": 1.9481544494628906, "Pretrain/Step": 7924, "Pretrain/Step Time": 8.663001500070095} +{"Pretrain/Learning Rate": 3.65333593349087e-06, "Pretrain/Loss": 1.9348163604736328, "Pretrain/Loss (Raw)": 1.9155066013336182, "Pretrain/Step": 7925, "Pretrain/Step Time": 8.663555346429348} +{"Pretrain/Learning Rate": 3.6489182536644156e-06, "Pretrain/Loss": 1.9353840351104736, "Pretrain/Loss (Raw)": 1.9818317890167236, "Pretrain/Step": 7926, "Pretrain/Step Time": 8.66111603192985} +{"Pretrain/Learning Rate": 3.644503036145322e-06, "Pretrain/Loss": 1.9381299018859863, "Pretrain/Loss (Raw)": 2.12998366355896, "Pretrain/Step": 7927, "Pretrain/Step Time": 8.6604008898139} +{"Pretrain/Learning Rate": 3.6400902814427707e-06, "Pretrain/Loss": 1.9359605312347412, "Pretrain/Loss (Raw)": 1.6785963773727417, "Pretrain/Step": 7928, "Pretrain/Step Time": 8.662303959950805} +{"Pretrain/Learning Rate": 3.6356799900656576e-06, "Pretrain/Loss": 1.9357285499572754, "Pretrain/Loss (Raw)": 1.8497436046600342, "Pretrain/Step": 7929, "Pretrain/Step Time": 8.662507327273488} +{"Pretrain/Learning Rate": 3.6312721625225947e-06, "Pretrain/Loss": 1.938938856124878, "Pretrain/Loss (Raw)": 2.0228254795074463, "Pretrain/Step": 7930, "Pretrain/Step Time": 8.6656338814646} +{"Pretrain/Learning Rate": 3.626866799321929e-06, "Pretrain/Loss": 1.9373681545257568, "Pretrain/Loss (Raw)": 1.9131147861480713, "Pretrain/Step": 7931, "Pretrain/Step Time": 8.66784126125276} +{"Pretrain/Learning Rate": 3.622463900971687e-06, "Pretrain/Loss": 1.9347859621047974, "Pretrain/Loss (Raw)": 1.765484094619751, "Pretrain/Step": 7932, "Pretrain/Step Time": 8.661254283040762} +{"Pretrain/Learning Rate": 3.618063467979649e-06, "Pretrain/Loss": 1.9336533546447754, "Pretrain/Loss (Raw)": 1.783455491065979, "Pretrain/Step": 7933, "Pretrain/Step Time": 8.66283487714827} +{"Pretrain/Learning Rate": 3.6136655008532807e-06, "Pretrain/Loss": 1.9352089166641235, "Pretrain/Loss (Raw)": 2.063190460205078, "Pretrain/Step": 7934, "Pretrain/Step Time": 8.6592639349401} +{"Pretrain/Learning Rate": 3.6092700000997876e-06, "Pretrain/Loss": 1.9351271390914917, "Pretrain/Loss (Raw)": 1.9813464879989624, "Pretrain/Step": 7935, "Pretrain/Step Time": 8.66558102145791} +{"Pretrain/Learning Rate": 3.6048769662260757e-06, "Pretrain/Loss": 1.9350281953811646, "Pretrain/Loss (Raw)": 2.0694496631622314, "Pretrain/Step": 7936, "Pretrain/Step Time": 8.661507543176413} +{"Pretrain/Learning Rate": 3.600486399738762e-06, "Pretrain/Loss": 1.9336516857147217, "Pretrain/Loss (Raw)": 1.744824767112732, "Pretrain/Step": 7937, "Pretrain/Step Time": 8.666185667738318} +{"Pretrain/Learning Rate": 3.596098301144207e-06, "Pretrain/Loss": 1.9348928928375244, "Pretrain/Loss (Raw)": 1.9762706756591797, "Pretrain/Step": 7938, "Pretrain/Step Time": 8.66849315725267} +{"Pretrain/Learning Rate": 3.591712670948444e-06, "Pretrain/Loss": 1.933441162109375, "Pretrain/Loss (Raw)": 1.897190809249878, "Pretrain/Step": 7939, "Pretrain/Step Time": 8.665743915364146} +{"Pretrain/Learning Rate": 3.5873295096572583e-06, "Pretrain/Loss": 1.9350039958953857, "Pretrain/Loss (Raw)": 1.9790019989013672, "Pretrain/Step": 7940, "Pretrain/Step Time": 8.666058225557208} +{"Pretrain/Learning Rate": 3.58294881777613e-06, "Pretrain/Loss": 1.9338326454162598, "Pretrain/Loss (Raw)": 1.6994738578796387, "Pretrain/Step": 7941, "Pretrain/Step Time": 8.6674541272223} +{"Pretrain/Learning Rate": 3.578570595810274e-06, "Pretrain/Loss": 1.9345349073410034, "Pretrain/Loss (Raw)": 1.935532808303833, "Pretrain/Step": 7942, "Pretrain/Step Time": 8.656371429562569} +{"Pretrain/Learning Rate": 3.5741948442645864e-06, "Pretrain/Loss": 1.9343225955963135, "Pretrain/Loss (Raw)": 1.667675256729126, "Pretrain/Step": 7943, "Pretrain/Step Time": 8.65751351043582} +{"Pretrain/Learning Rate": 3.569821563643719e-06, "Pretrain/Loss": 1.9329445362091064, "Pretrain/Loss (Raw)": 1.9554823637008667, "Pretrain/Step": 7944, "Pretrain/Step Time": 8.652234859764576} +{"Pretrain/Learning Rate": 3.5654507544520016e-06, "Pretrain/Loss": 1.932002067565918, "Pretrain/Loss (Raw)": 1.873635172843933, "Pretrain/Step": 7945, "Pretrain/Step Time": 8.647328652441502} +{"Pretrain/Learning Rate": 3.5610824171935205e-06, "Pretrain/Loss": 1.9312596321105957, "Pretrain/Loss (Raw)": 1.9467899799346924, "Pretrain/Step": 7946, "Pretrain/Step Time": 8.649962840601802} +{"Pretrain/Learning Rate": 3.5567165523720275e-06, "Pretrain/Loss": 1.934504508972168, "Pretrain/Loss (Raw)": 2.1081478595733643, "Pretrain/Step": 7947, "Pretrain/Step Time": 8.649555873125792} +{"Pretrain/Learning Rate": 3.552353160491029e-06, "Pretrain/Loss": 1.9365029335021973, "Pretrain/Loss (Raw)": 1.92818021774292, "Pretrain/Step": 7948, "Pretrain/Step Time": 8.653057180345058} +{"Pretrain/Learning Rate": 3.54799224205373e-06, "Pretrain/Loss": 1.9318723678588867, "Pretrain/Loss (Raw)": 1.6111259460449219, "Pretrain/Step": 7949, "Pretrain/Step Time": 8.650820141658187} +{"Pretrain/Learning Rate": 3.5436337975630536e-06, "Pretrain/Loss": 1.9323312044143677, "Pretrain/Loss (Raw)": 1.8473149538040161, "Pretrain/Step": 7950, "Pretrain/Step Time": 8.655640350654721} +{"Pretrain/Learning Rate": 3.5392778275216227e-06, "Pretrain/Loss": 1.929365634918213, "Pretrain/Loss (Raw)": 1.603603482246399, "Pretrain/Step": 7951, "Pretrain/Step Time": 8.654737412929535} +{"Pretrain/Learning Rate": 3.5349243324318076e-06, "Pretrain/Loss": 1.9262003898620605, "Pretrain/Loss (Raw)": 1.5691144466400146, "Pretrain/Step": 7952, "Pretrain/Step Time": 8.6570945084095} +{"Pretrain/Learning Rate": 3.5305733127956654e-06, "Pretrain/Loss": 1.9282433986663818, "Pretrain/Loss (Raw)": 2.034583806991577, "Pretrain/Step": 7953, "Pretrain/Step Time": 8.659034933894873} +{"Pretrain/Learning Rate": 3.5262247691149747e-06, "Pretrain/Loss": 1.9280760288238525, "Pretrain/Loss (Raw)": 1.953284740447998, "Pretrain/Step": 7954, "Pretrain/Step Time": 8.651655061170459} +{"Pretrain/Learning Rate": 3.5218787018912263e-06, "Pretrain/Loss": 1.9270122051239014, "Pretrain/Loss (Raw)": 1.8533318042755127, "Pretrain/Step": 7955, "Pretrain/Step Time": 8.65375467389822} +{"Pretrain/Learning Rate": 3.517535111625639e-06, "Pretrain/Loss": 1.9256962537765503, "Pretrain/Loss (Raw)": 1.845934271812439, "Pretrain/Step": 7956, "Pretrain/Step Time": 8.651501460000873} +{"Pretrain/Learning Rate": 3.5131939988191335e-06, "Pretrain/Loss": 1.9267358779907227, "Pretrain/Loss (Raw)": 2.0743603706359863, "Pretrain/Step": 7957, "Pretrain/Step Time": 8.658442538231611} +{"Pretrain/Learning Rate": 3.508855363972344e-06, "Pretrain/Loss": 1.9250273704528809, "Pretrain/Loss (Raw)": 1.653478741645813, "Pretrain/Step": 7958, "Pretrain/Step Time": 8.660000629723072} +{"Pretrain/Learning Rate": 3.5045192075856186e-06, "Pretrain/Loss": 1.9241712093353271, "Pretrain/Loss (Raw)": 1.9857661724090576, "Pretrain/Step": 7959, "Pretrain/Step Time": 8.664217283949256} +{"Pretrain/Learning Rate": 3.5001855301590336e-06, "Pretrain/Loss": 1.9247231483459473, "Pretrain/Loss (Raw)": 2.0798745155334473, "Pretrain/Step": 7960, "Pretrain/Step Time": 8.662682089954615} +{"Pretrain/Learning Rate": 3.495854332192361e-06, "Pretrain/Loss": 1.9245243072509766, "Pretrain/Loss (Raw)": 1.8617686033248901, "Pretrain/Step": 7961, "Pretrain/Step Time": 8.663585210219026} +{"Pretrain/Learning Rate": 3.491525614185101e-06, "Pretrain/Loss": 1.9223711490631104, "Pretrain/Loss (Raw)": 1.853017807006836, "Pretrain/Step": 7962, "Pretrain/Step Time": 8.660296218469739} +{"Pretrain/Learning Rate": 3.4871993766364518e-06, "Pretrain/Loss": 1.9240626096725464, "Pretrain/Loss (Raw)": 2.1113383769989014, "Pretrain/Step": 7963, "Pretrain/Step Time": 8.660601526498795} +{"Pretrain/Learning Rate": 3.482875620045348e-06, "Pretrain/Loss": 1.9258346557617188, "Pretrain/Loss (Raw)": 2.011319160461426, "Pretrain/Step": 7964, "Pretrain/Step Time": 8.655549244955182} +{"Pretrain/Learning Rate": 3.4785543449104173e-06, "Pretrain/Loss": 1.9231631755828857, "Pretrain/Loss (Raw)": 1.5296810865402222, "Pretrain/Step": 7965, "Pretrain/Step Time": 8.653412399813533} +{"Pretrain/Learning Rate": 3.474235551730015e-06, "Pretrain/Loss": 1.9228720664978027, "Pretrain/Loss (Raw)": 1.866748332977295, "Pretrain/Step": 7966, "Pretrain/Step Time": 8.65460830181837} +{"Pretrain/Learning Rate": 3.4699192410021953e-06, "Pretrain/Loss": 1.9190196990966797, "Pretrain/Loss (Raw)": 1.6941587924957275, "Pretrain/Step": 7967, "Pretrain/Step Time": 8.654884660616517} +{"Pretrain/Learning Rate": 3.4656054132247483e-06, "Pretrain/Loss": 1.916670560836792, "Pretrain/Loss (Raw)": 1.626508355140686, "Pretrain/Step": 7968, "Pretrain/Step Time": 8.654434842988849} +{"Pretrain/Learning Rate": 3.4612940688951574e-06, "Pretrain/Loss": 1.9159854650497437, "Pretrain/Loss (Raw)": 2.031815528869629, "Pretrain/Step": 7969, "Pretrain/Step Time": 8.646163906902075} +{"Pretrain/Learning Rate": 3.456985208510627e-06, "Pretrain/Loss": 1.9150798320770264, "Pretrain/Loss (Raw)": 1.9014294147491455, "Pretrain/Step": 7970, "Pretrain/Step Time": 8.650765212252736} +{"Pretrain/Learning Rate": 3.452678832568071e-06, "Pretrain/Loss": 1.9121001958847046, "Pretrain/Loss (Raw)": 1.7835960388183594, "Pretrain/Step": 7971, "Pretrain/Step Time": 8.653447920456529} +{"Pretrain/Learning Rate": 3.448374941564139e-06, "Pretrain/Loss": 1.9108530282974243, "Pretrain/Loss (Raw)": 1.9782514572143555, "Pretrain/Step": 7972, "Pretrain/Step Time": 8.651744470000267} +{"Pretrain/Learning Rate": 3.4440735359951515e-06, "Pretrain/Loss": 1.9128577709197998, "Pretrain/Loss (Raw)": 2.0262012481689453, "Pretrain/Step": 7973, "Pretrain/Step Time": 8.647048870101571} +{"Pretrain/Learning Rate": 3.439774616357183e-06, "Pretrain/Loss": 1.9137842655181885, "Pretrain/Loss (Raw)": 2.011031150817871, "Pretrain/Step": 7974, "Pretrain/Step Time": 8.646200304850936} +{"Pretrain/Learning Rate": 3.4354781831459985e-06, "Pretrain/Loss": 1.9143142700195312, "Pretrain/Loss (Raw)": 1.973737359046936, "Pretrain/Step": 7975, "Pretrain/Step Time": 8.647133057937026} +{"Pretrain/Learning Rate": 3.431184236857088e-06, "Pretrain/Loss": 1.915523886680603, "Pretrain/Loss (Raw)": 2.0663795471191406, "Pretrain/Step": 7976, "Pretrain/Step Time": 8.64666093699634} +{"Pretrain/Learning Rate": 3.426892777985646e-06, "Pretrain/Loss": 1.915766716003418, "Pretrain/Loss (Raw)": 2.0334181785583496, "Pretrain/Step": 7977, "Pretrain/Step Time": 8.64773459918797} +{"Pretrain/Learning Rate": 3.4226038070265837e-06, "Pretrain/Loss": 1.9117062091827393, "Pretrain/Loss (Raw)": 1.4032145738601685, "Pretrain/Step": 7978, "Pretrain/Step Time": 8.649859985336661} +{"Pretrain/Learning Rate": 3.418317324474529e-06, "Pretrain/Loss": 1.9105193614959717, "Pretrain/Loss (Raw)": 1.7103533744812012, "Pretrain/Step": 7979, "Pretrain/Step Time": 8.651141833513975} +{"Pretrain/Learning Rate": 3.414033330823815e-06, "Pretrain/Loss": 1.9129877090454102, "Pretrain/Loss (Raw)": 2.143097400665283, "Pretrain/Step": 7980, "Pretrain/Step Time": 8.650236425921321} +{"Pretrain/Learning Rate": 3.409751826568497e-06, "Pretrain/Loss": 1.9141755104064941, "Pretrain/Loss (Raw)": 1.9460623264312744, "Pretrain/Step": 7981, "Pretrain/Step Time": 8.64695524610579} +{"Pretrain/Learning Rate": 3.405472812202326e-06, "Pretrain/Loss": 1.9172124862670898, "Pretrain/Loss (Raw)": 2.006866216659546, "Pretrain/Step": 7982, "Pretrain/Step Time": 8.64860112965107} +{"Pretrain/Learning Rate": 3.4011962882188024e-06, "Pretrain/Loss": 1.9135704040527344, "Pretrain/Loss (Raw)": 1.845624566078186, "Pretrain/Step": 7983, "Pretrain/Step Time": 8.648652374744415} +{"Pretrain/Learning Rate": 3.3969222551110845e-06, "Pretrain/Loss": 1.912335991859436, "Pretrain/Loss (Raw)": 1.9635645151138306, "Pretrain/Step": 7984, "Pretrain/Step Time": 8.648884795606136} +{"Pretrain/Learning Rate": 3.3926507133720973e-06, "Pretrain/Loss": 1.9133155345916748, "Pretrain/Loss (Raw)": 1.8781040906906128, "Pretrain/Step": 7985, "Pretrain/Step Time": 8.646375177428126} +{"Pretrain/Learning Rate": 3.3883816634944416e-06, "Pretrain/Loss": 1.9173601865768433, "Pretrain/Loss (Raw)": 2.1044106483459473, "Pretrain/Step": 7986, "Pretrain/Step Time": 8.645657097920775} +{"Pretrain/Learning Rate": 3.384115105970459e-06, "Pretrain/Loss": 1.9204202890396118, "Pretrain/Loss (Raw)": 2.175800085067749, "Pretrain/Step": 7987, "Pretrain/Step Time": 8.64473656564951} +{"Pretrain/Learning Rate": 3.3798510412921702e-06, "Pretrain/Loss": 1.9209179878234863, "Pretrain/Loss (Raw)": 1.9418057203292847, "Pretrain/Step": 7988, "Pretrain/Step Time": 8.647318398579955} +{"Pretrain/Learning Rate": 3.37558946995134e-06, "Pretrain/Loss": 1.923622965812683, "Pretrain/Loss (Raw)": 2.078766345977783, "Pretrain/Step": 7989, "Pretrain/Step Time": 8.646993050351739} +{"Pretrain/Learning Rate": 3.371330392439434e-06, "Pretrain/Loss": 1.921041488647461, "Pretrain/Loss (Raw)": 1.6992087364196777, "Pretrain/Step": 7990, "Pretrain/Step Time": 8.644474513828754} +{"Pretrain/Learning Rate": 3.36707380924762e-06, "Pretrain/Loss": 1.923742413520813, "Pretrain/Loss (Raw)": 2.1582367420196533, "Pretrain/Step": 7991, "Pretrain/Step Time": 8.646942192688584} +{"Pretrain/Learning Rate": 3.362819720866789e-06, "Pretrain/Loss": 1.9248600006103516, "Pretrain/Loss (Raw)": 1.9926880598068237, "Pretrain/Step": 7992, "Pretrain/Step Time": 8.648298528045416} +{"Pretrain/Learning Rate": 3.358568127787551e-06, "Pretrain/Loss": 1.9247827529907227, "Pretrain/Loss (Raw)": 1.9798898696899414, "Pretrain/Step": 7993, "Pretrain/Step Time": 8.650471542030573} +{"Pretrain/Learning Rate": 3.3543190305002136e-06, "Pretrain/Loss": 1.9247139692306519, "Pretrain/Loss (Raw)": 2.066796064376831, "Pretrain/Step": 7994, "Pretrain/Step Time": 8.649288671091199} +{"Pretrain/Learning Rate": 3.350072429494805e-06, "Pretrain/Loss": 1.9230514764785767, "Pretrain/Loss (Raw)": 1.7668379545211792, "Pretrain/Step": 7995, "Pretrain/Step Time": 8.648694733157754} +{"Pretrain/Learning Rate": 3.345828325261055e-06, "Pretrain/Loss": 1.9242780208587646, "Pretrain/Loss (Raw)": 1.9842004776000977, "Pretrain/Step": 7996, "Pretrain/Step Time": 8.642396630719304} +{"Pretrain/Learning Rate": 3.341586718288425e-06, "Pretrain/Loss": 1.9261246919631958, "Pretrain/Loss (Raw)": 2.159203290939331, "Pretrain/Step": 7997, "Pretrain/Step Time": 8.64222607202828} +{"Pretrain/Learning Rate": 3.3373476090660745e-06, "Pretrain/Loss": 1.9255199432373047, "Pretrain/Loss (Raw)": 1.8936165571212769, "Pretrain/Step": 7998, "Pretrain/Step Time": 8.639177463948727} +{"Pretrain/Learning Rate": 3.333110998082875e-06, "Pretrain/Loss": 1.925794005393982, "Pretrain/Loss (Raw)": 1.9468302726745605, "Pretrain/Step": 7999, "Pretrain/Step Time": 8.640476893633604} +{"Pretrain/Learning Rate": 3.3288768858274063e-06, "Pretrain/Loss": 1.9244325160980225, "Pretrain/Loss (Raw)": 1.9304770231246948, "Pretrain/Step": 8000, "Pretrain/Step Time": 8.637455871328712} +{"Pretrain/Learning Rate": 3.3246452727879797e-06, "Pretrain/Loss": 1.924370288848877, "Pretrain/Loss (Raw)": 1.8939968347549438, "Pretrain/Step": 8001, "Pretrain/Step Time": 8.637566987425089} +{"Pretrain/Learning Rate": 3.3204161594525967e-06, "Pretrain/Loss": 1.9234929084777832, "Pretrain/Loss (Raw)": 2.014667272567749, "Pretrain/Step": 8002, "Pretrain/Step Time": 8.638062965124846} +{"Pretrain/Learning Rate": 3.3161895463089787e-06, "Pretrain/Loss": 1.9214222431182861, "Pretrain/Loss (Raw)": 1.9182181358337402, "Pretrain/Step": 8003, "Pretrain/Step Time": 8.639193272218108} +{"Pretrain/Learning Rate": 3.311965433844555e-06, "Pretrain/Loss": 1.9228510856628418, "Pretrain/Loss (Raw)": 2.0661215782165527, "Pretrain/Step": 8004, "Pretrain/Step Time": 8.642129223793745} +{"Pretrain/Learning Rate": 3.3077438225464803e-06, "Pretrain/Loss": 1.9230785369873047, "Pretrain/Loss (Raw)": 2.035614490509033, "Pretrain/Step": 8005, "Pretrain/Step Time": 8.643853675574064} +{"Pretrain/Learning Rate": 3.3035247129016065e-06, "Pretrain/Loss": 1.9231114387512207, "Pretrain/Loss (Raw)": 1.8710523843765259, "Pretrain/Step": 8006, "Pretrain/Step Time": 8.644252283498645} +{"Pretrain/Learning Rate": 3.2993081053964982e-06, "Pretrain/Loss": 1.925051212310791, "Pretrain/Loss (Raw)": 1.9543155431747437, "Pretrain/Step": 8007, "Pretrain/Step Time": 8.640651194378734} +{"Pretrain/Learning Rate": 3.295094000517432e-06, "Pretrain/Loss": 1.9247069358825684, "Pretrain/Loss (Raw)": 2.003631353378296, "Pretrain/Step": 8008, "Pretrain/Step Time": 8.642313683405519} +{"Pretrain/Learning Rate": 3.2908823987504085e-06, "Pretrain/Loss": 1.9236226081848145, "Pretrain/Loss (Raw)": 1.9700464010238647, "Pretrain/Step": 8009, "Pretrain/Step Time": 8.642273977398872} +{"Pretrain/Learning Rate": 3.286673300581122e-06, "Pretrain/Loss": 1.9223047494888306, "Pretrain/Loss (Raw)": 1.839248538017273, "Pretrain/Step": 8010, "Pretrain/Step Time": 8.64634806662798} +{"Pretrain/Learning Rate": 3.2824667064949883e-06, "Pretrain/Loss": 1.9240702390670776, "Pretrain/Loss (Raw)": 2.0729241371154785, "Pretrain/Step": 8011, "Pretrain/Step Time": 8.647816555574536} +{"Pretrain/Learning Rate": 3.2782626169771236e-06, "Pretrain/Loss": 1.9237223863601685, "Pretrain/Loss (Raw)": 1.949928641319275, "Pretrain/Step": 8012, "Pretrain/Step Time": 8.646272517740726} +{"Pretrain/Learning Rate": 3.2740610325123823e-06, "Pretrain/Loss": 1.924363374710083, "Pretrain/Loss (Raw)": 1.8525404930114746, "Pretrain/Step": 8013, "Pretrain/Step Time": 8.652633043006063} +{"Pretrain/Learning Rate": 3.2698619535852877e-06, "Pretrain/Loss": 1.9245638847351074, "Pretrain/Loss (Raw)": 1.8900372982025146, "Pretrain/Step": 8014, "Pretrain/Step Time": 8.652299620211124} +{"Pretrain/Learning Rate": 3.2656653806801134e-06, "Pretrain/Loss": 1.9241549968719482, "Pretrain/Loss (Raw)": 1.8880904912948608, "Pretrain/Step": 8015, "Pretrain/Step Time": 8.650882601737976} +{"Pretrain/Learning Rate": 3.261471314280817e-06, "Pretrain/Loss": 1.9251114130020142, "Pretrain/Loss (Raw)": 1.8181382417678833, "Pretrain/Step": 8016, "Pretrain/Step Time": 8.651238782331347} +{"Pretrain/Learning Rate": 3.2572797548710897e-06, "Pretrain/Loss": 1.9268162250518799, "Pretrain/Loss (Raw)": 1.9405258893966675, "Pretrain/Step": 8017, "Pretrain/Step Time": 8.651236396282911} +{"Pretrain/Learning Rate": 3.2530907029343165e-06, "Pretrain/Loss": 1.9276695251464844, "Pretrain/Loss (Raw)": 1.964118480682373, "Pretrain/Step": 8018, "Pretrain/Step Time": 8.652934916317463} +{"Pretrain/Learning Rate": 3.2489041589535948e-06, "Pretrain/Loss": 1.926727294921875, "Pretrain/Loss (Raw)": 1.8725650310516357, "Pretrain/Step": 8019, "Pretrain/Step Time": 8.656492657959461} +{"Pretrain/Learning Rate": 3.244720123411743e-06, "Pretrain/Loss": 1.9277781248092651, "Pretrain/Loss (Raw)": 2.1720125675201416, "Pretrain/Step": 8020, "Pretrain/Step Time": 8.654421830549836} +{"Pretrain/Learning Rate": 3.2405385967912787e-06, "Pretrain/Loss": 1.9300572872161865, "Pretrain/Loss (Raw)": 2.2865028381347656, "Pretrain/Step": 8021, "Pretrain/Step Time": 8.652755469083786} +{"Pretrain/Learning Rate": 3.2363595795744413e-06, "Pretrain/Loss": 1.9296557903289795, "Pretrain/Loss (Raw)": 1.9548896551132202, "Pretrain/Step": 8022, "Pretrain/Step Time": 8.652178462594748} +{"Pretrain/Learning Rate": 3.232183072243164e-06, "Pretrain/Loss": 1.9314284324645996, "Pretrain/Loss (Raw)": 2.029541015625, "Pretrain/Step": 8023, "Pretrain/Step Time": 8.65228376723826} +{"Pretrain/Learning Rate": 3.2280090752791175e-06, "Pretrain/Loss": 1.9311007261276245, "Pretrain/Loss (Raw)": 1.9541802406311035, "Pretrain/Step": 8024, "Pretrain/Step Time": 8.654775809496641} +{"Pretrain/Learning Rate": 3.2238375891636504e-06, "Pretrain/Loss": 1.9304205179214478, "Pretrain/Loss (Raw)": 1.8681401014328003, "Pretrain/Step": 8025, "Pretrain/Step Time": 8.659475395455956} +{"Pretrain/Learning Rate": 3.2196686143778467e-06, "Pretrain/Loss": 1.930356740951538, "Pretrain/Loss (Raw)": 1.9350783824920654, "Pretrain/Step": 8026, "Pretrain/Step Time": 8.662175238132477} +{"Pretrain/Learning Rate": 3.2155021514024857e-06, "Pretrain/Loss": 1.9286768436431885, "Pretrain/Loss (Raw)": 1.8676321506500244, "Pretrain/Step": 8027, "Pretrain/Step Time": 8.658818313851953} +{"Pretrain/Learning Rate": 3.211338200718081e-06, "Pretrain/Loss": 1.9287371635437012, "Pretrain/Loss (Raw)": 1.9451048374176025, "Pretrain/Step": 8028, "Pretrain/Step Time": 8.659887753427029} +{"Pretrain/Learning Rate": 3.2071767628048145e-06, "Pretrain/Loss": 1.9271637201309204, "Pretrain/Loss (Raw)": 2.0624704360961914, "Pretrain/Step": 8029, "Pretrain/Step Time": 8.661966506391764} +{"Pretrain/Learning Rate": 3.203017838142622e-06, "Pretrain/Loss": 1.9253818988800049, "Pretrain/Loss (Raw)": 1.8319957256317139, "Pretrain/Step": 8030, "Pretrain/Step Time": 8.666601166129112} +{"Pretrain/Learning Rate": 3.198861427211122e-06, "Pretrain/Loss": 1.9227166175842285, "Pretrain/Loss (Raw)": 1.7946885824203491, "Pretrain/Step": 8031, "Pretrain/Step Time": 8.664820298552513} +{"Pretrain/Learning Rate": 3.1947075304896516e-06, "Pretrain/Loss": 1.9227838516235352, "Pretrain/Loss (Raw)": 1.812549114227295, "Pretrain/Step": 8032, "Pretrain/Step Time": 8.664012214168906} +{"Pretrain/Learning Rate": 3.190556148457255e-06, "Pretrain/Loss": 1.924030065536499, "Pretrain/Loss (Raw)": 1.9824120998382568, "Pretrain/Step": 8033, "Pretrain/Step Time": 8.667310336604714} +{"Pretrain/Learning Rate": 3.1864072815926988e-06, "Pretrain/Loss": 1.923417091369629, "Pretrain/Loss (Raw)": 2.010871171951294, "Pretrain/Step": 8034, "Pretrain/Step Time": 8.666020845994353} +{"Pretrain/Learning Rate": 3.1822609303744423e-06, "Pretrain/Loss": 1.9218852519989014, "Pretrain/Loss (Raw)": 1.8347022533416748, "Pretrain/Step": 8035, "Pretrain/Step Time": 8.66617595218122} +{"Pretrain/Learning Rate": 3.178117095280664e-06, "Pretrain/Loss": 1.9231266975402832, "Pretrain/Loss (Raw)": 2.085280656814575, "Pretrain/Step": 8036, "Pretrain/Step Time": 8.661993138492107} +{"Pretrain/Learning Rate": 3.173975776789245e-06, "Pretrain/Loss": 1.9248077869415283, "Pretrain/Loss (Raw)": 2.1092939376831055, "Pretrain/Step": 8037, "Pretrain/Step Time": 8.663032313808799} +{"Pretrain/Learning Rate": 3.1698369753777933e-06, "Pretrain/Loss": 1.925369381904602, "Pretrain/Loss (Raw)": 2.0187716484069824, "Pretrain/Step": 8038, "Pretrain/Step Time": 8.654250998049974} +{"Pretrain/Learning Rate": 3.165700691523607e-06, "Pretrain/Loss": 1.9250028133392334, "Pretrain/Loss (Raw)": 1.884303092956543, "Pretrain/Step": 8039, "Pretrain/Step Time": 8.660786068066955} +{"Pretrain/Learning Rate": 3.1615669257037045e-06, "Pretrain/Loss": 1.9280731678009033, "Pretrain/Loss (Raw)": 2.097820997238159, "Pretrain/Step": 8040, "Pretrain/Step Time": 8.66177219338715} +{"Pretrain/Learning Rate": 3.1574356783948047e-06, "Pretrain/Loss": 1.927932620048523, "Pretrain/Loss (Raw)": 1.943367600440979, "Pretrain/Step": 8041, "Pretrain/Step Time": 8.667198242619634} +{"Pretrain/Learning Rate": 3.1533069500733534e-06, "Pretrain/Loss": 1.9265341758728027, "Pretrain/Loss (Raw)": 1.911846399307251, "Pretrain/Step": 8042, "Pretrain/Step Time": 8.661535492166877} +{"Pretrain/Learning Rate": 3.1491807412154905e-06, "Pretrain/Loss": 1.9253230094909668, "Pretrain/Loss (Raw)": 2.0816261768341064, "Pretrain/Step": 8043, "Pretrain/Step Time": 8.664247293025255} +{"Pretrain/Learning Rate": 3.145057052297068e-06, "Pretrain/Loss": 1.9259916543960571, "Pretrain/Loss (Raw)": 2.039588451385498, "Pretrain/Step": 8044, "Pretrain/Step Time": 8.66627817414701} +{"Pretrain/Learning Rate": 3.140935883793644e-06, "Pretrain/Loss": 1.923236608505249, "Pretrain/Loss (Raw)": 1.669237732887268, "Pretrain/Step": 8045, "Pretrain/Step Time": 8.666007086634636} +{"Pretrain/Learning Rate": 3.136817236180503e-06, "Pretrain/Loss": 1.9249074459075928, "Pretrain/Loss (Raw)": 2.189058780670166, "Pretrain/Step": 8046, "Pretrain/Step Time": 8.665521098300815} +{"Pretrain/Learning Rate": 3.1327011099326233e-06, "Pretrain/Loss": 1.926081895828247, "Pretrain/Loss (Raw)": 2.0513980388641357, "Pretrain/Step": 8047, "Pretrain/Step Time": 8.663744606077671} +{"Pretrain/Learning Rate": 3.128587505524691e-06, "Pretrain/Loss": 1.9271845817565918, "Pretrain/Loss (Raw)": 2.136039972305298, "Pretrain/Step": 8048, "Pretrain/Step Time": 8.662858325988054} +{"Pretrain/Learning Rate": 3.124476423431105e-06, "Pretrain/Loss": 1.9280362129211426, "Pretrain/Loss (Raw)": 2.1921186447143555, "Pretrain/Step": 8049, "Pretrain/Step Time": 8.666705487295985} +{"Pretrain/Learning Rate": 3.1203678641259836e-06, "Pretrain/Loss": 1.9334217309951782, "Pretrain/Loss (Raw)": 2.3620498180389404, "Pretrain/Step": 8050, "Pretrain/Step Time": 8.660645116120577} +{"Pretrain/Learning Rate": 3.116261828083139e-06, "Pretrain/Loss": 1.9395999908447266, "Pretrain/Loss (Raw)": 2.27573561668396, "Pretrain/Step": 8051, "Pretrain/Step Time": 8.657579271122813} +{"Pretrain/Learning Rate": 3.112158315776104e-06, "Pretrain/Loss": 1.9409078359603882, "Pretrain/Loss (Raw)": 2.115550994873047, "Pretrain/Step": 8052, "Pretrain/Step Time": 8.658805144950747} +{"Pretrain/Learning Rate": 3.108057327678102e-06, "Pretrain/Loss": 1.941004753112793, "Pretrain/Loss (Raw)": 1.927916169166565, "Pretrain/Step": 8053, "Pretrain/Step Time": 8.657799359411001} +{"Pretrain/Learning Rate": 3.1039588642620937e-06, "Pretrain/Loss": 1.9411756992340088, "Pretrain/Loss (Raw)": 2.0037119388580322, "Pretrain/Step": 8054, "Pretrain/Step Time": 8.660557666793466} +{"Pretrain/Learning Rate": 3.099862926000724e-06, "Pretrain/Loss": 1.94194757938385, "Pretrain/Loss (Raw)": 2.228787422180176, "Pretrain/Step": 8055, "Pretrain/Step Time": 8.661833375692368} +{"Pretrain/Learning Rate": 3.0957695133663616e-06, "Pretrain/Loss": 1.9436662197113037, "Pretrain/Loss (Raw)": 1.8985837697982788, "Pretrain/Step": 8056, "Pretrain/Step Time": 8.66224424354732} +{"Pretrain/Learning Rate": 3.091678626831071e-06, "Pretrain/Loss": 1.9460474252700806, "Pretrain/Loss (Raw)": 2.1545326709747314, "Pretrain/Step": 8057, "Pretrain/Step Time": 8.662997171282768} +{"Pretrain/Learning Rate": 3.0875902668666383e-06, "Pretrain/Loss": 1.9463902711868286, "Pretrain/Loss (Raw)": 2.066706418991089, "Pretrain/Step": 8058, "Pretrain/Step Time": 8.663295719772577} +{"Pretrain/Learning Rate": 3.0835044339445536e-06, "Pretrain/Loss": 1.947438359260559, "Pretrain/Loss (Raw)": 2.0472781658172607, "Pretrain/Step": 8059, "Pretrain/Step Time": 8.662673709914088} +{"Pretrain/Learning Rate": 3.079421128536003e-06, "Pretrain/Loss": 1.9497857093811035, "Pretrain/Loss (Raw)": 2.0659472942352295, "Pretrain/Step": 8060, "Pretrain/Step Time": 8.662499906495214} +{"Pretrain/Learning Rate": 3.075340351111908e-06, "Pretrain/Loss": 1.9500668048858643, "Pretrain/Loss (Raw)": 1.8194230794906616, "Pretrain/Step": 8061, "Pretrain/Step Time": 8.663209743797779} +{"Pretrain/Learning Rate": 3.071262102142877e-06, "Pretrain/Loss": 1.948512315750122, "Pretrain/Loss (Raw)": 1.8642127513885498, "Pretrain/Step": 8062, "Pretrain/Step Time": 8.66244445182383} +{"Pretrain/Learning Rate": 3.0671863820992324e-06, "Pretrain/Loss": 1.9487409591674805, "Pretrain/Loss (Raw)": 2.0106146335601807, "Pretrain/Step": 8063, "Pretrain/Step Time": 8.659913547337055} +{"Pretrain/Learning Rate": 3.0631131914509977e-06, "Pretrain/Loss": 1.9462757110595703, "Pretrain/Loss (Raw)": 1.7538965940475464, "Pretrain/Step": 8064, "Pretrain/Step Time": 8.665004961192608} +{"Pretrain/Learning Rate": 3.0590425306679327e-06, "Pretrain/Loss": 1.9496099948883057, "Pretrain/Loss (Raw)": 2.1716058254241943, "Pretrain/Step": 8065, "Pretrain/Step Time": 8.658885838463902} +{"Pretrain/Learning Rate": 3.0549744002194597e-06, "Pretrain/Loss": 1.949334740638733, "Pretrain/Loss (Raw)": 1.9410488605499268, "Pretrain/Step": 8066, "Pretrain/Step Time": 8.654854748398066} +{"Pretrain/Learning Rate": 3.0509088005747534e-06, "Pretrain/Loss": 1.9502588510513306, "Pretrain/Loss (Raw)": 2.015471935272217, "Pretrain/Step": 8067, "Pretrain/Step Time": 8.657026030123234} +{"Pretrain/Learning Rate": 3.0468457322026663e-06, "Pretrain/Loss": 1.9498927593231201, "Pretrain/Loss (Raw)": 1.9321577548980713, "Pretrain/Step": 8068, "Pretrain/Step Time": 8.653883431106806} +{"Pretrain/Learning Rate": 3.0427851955717846e-06, "Pretrain/Loss": 1.9535701274871826, "Pretrain/Loss (Raw)": 2.1701791286468506, "Pretrain/Step": 8069, "Pretrain/Step Time": 8.655634965747595} +{"Pretrain/Learning Rate": 3.0387271911503728e-06, "Pretrain/Loss": 1.951216459274292, "Pretrain/Loss (Raw)": 1.6342471837997437, "Pretrain/Step": 8070, "Pretrain/Step Time": 8.655771298334002} +{"Pretrain/Learning Rate": 3.034671719406429e-06, "Pretrain/Loss": 1.9537899494171143, "Pretrain/Loss (Raw)": 1.9970849752426147, "Pretrain/Step": 8071, "Pretrain/Step Time": 8.658410284668207} +{"Pretrain/Learning Rate": 3.0306187808076423e-06, "Pretrain/Loss": 1.9519407749176025, "Pretrain/Loss (Raw)": 1.7187957763671875, "Pretrain/Step": 8072, "Pretrain/Step Time": 8.660307733342052} +{"Pretrain/Learning Rate": 3.0265683758214315e-06, "Pretrain/Loss": 1.9534924030303955, "Pretrain/Loss (Raw)": 2.072234630584717, "Pretrain/Step": 8073, "Pretrain/Step Time": 8.664195638149977} +{"Pretrain/Learning Rate": 3.022520504914886e-06, "Pretrain/Loss": 1.955275058746338, "Pretrain/Loss (Raw)": 2.1749701499938965, "Pretrain/Step": 8074, "Pretrain/Step Time": 8.664983619004488} +{"Pretrain/Learning Rate": 3.0184751685548435e-06, "Pretrain/Loss": 1.95367431640625, "Pretrain/Loss (Raw)": 1.9032504558563232, "Pretrain/Step": 8075, "Pretrain/Step Time": 8.663908183574677} +{"Pretrain/Learning Rate": 3.0144323672078256e-06, "Pretrain/Loss": 1.9547492265701294, "Pretrain/Loss (Raw)": 2.0657756328582764, "Pretrain/Step": 8076, "Pretrain/Step Time": 8.661825427785516} +{"Pretrain/Learning Rate": 3.0103921013400647e-06, "Pretrain/Loss": 1.9582467079162598, "Pretrain/Loss (Raw)": 2.0588018894195557, "Pretrain/Step": 8077, "Pretrain/Step Time": 8.65959589742124} +{"Pretrain/Learning Rate": 3.0063543714175024e-06, "Pretrain/Loss": 1.9587786197662354, "Pretrain/Loss (Raw)": 1.9154044389724731, "Pretrain/Step": 8078, "Pretrain/Step Time": 8.657323557883501} +{"Pretrain/Learning Rate": 3.0023191779057963e-06, "Pretrain/Loss": 1.9620659351348877, "Pretrain/Loss (Raw)": 2.0243852138519287, "Pretrain/Step": 8079, "Pretrain/Step Time": 8.657174089923501} +{"Pretrain/Learning Rate": 2.9982865212702965e-06, "Pretrain/Loss": 1.966019630432129, "Pretrain/Loss (Raw)": 2.0751733779907227, "Pretrain/Step": 8080, "Pretrain/Step Time": 8.655046006664634} +{"Pretrain/Learning Rate": 2.994256401976073e-06, "Pretrain/Loss": 1.96586275100708, "Pretrain/Loss (Raw)": 2.0144970417022705, "Pretrain/Step": 8081, "Pretrain/Step Time": 8.651395285502076} +{"Pretrain/Learning Rate": 2.9902288204878894e-06, "Pretrain/Loss": 1.9653695821762085, "Pretrain/Loss (Raw)": 1.8901695013046265, "Pretrain/Step": 8082, "Pretrain/Step Time": 8.652847409248352} +{"Pretrain/Learning Rate": 2.9862037772702356e-06, "Pretrain/Loss": 1.9651172161102295, "Pretrain/Loss (Raw)": 1.8210203647613525, "Pretrain/Step": 8083, "Pretrain/Step Time": 8.651612086221576} +{"Pretrain/Learning Rate": 2.982181272787296e-06, "Pretrain/Loss": 1.9669275283813477, "Pretrain/Loss (Raw)": 2.077669382095337, "Pretrain/Step": 8084, "Pretrain/Step Time": 8.653517287224531} +{"Pretrain/Learning Rate": 2.9781613075029636e-06, "Pretrain/Loss": 1.9645882844924927, "Pretrain/Loss (Raw)": 1.774932622909546, "Pretrain/Step": 8085, "Pretrain/Step Time": 8.645870381966233} +{"Pretrain/Learning Rate": 2.9741438818808366e-06, "Pretrain/Loss": 1.966442346572876, "Pretrain/Loss (Raw)": 1.8908096551895142, "Pretrain/Step": 8086, "Pretrain/Step Time": 8.654359515756369} +{"Pretrain/Learning Rate": 2.9701289963842276e-06, "Pretrain/Loss": 1.9669538736343384, "Pretrain/Loss (Raw)": 2.051227331161499, "Pretrain/Step": 8087, "Pretrain/Step Time": 8.646724024787545} +{"Pretrain/Learning Rate": 2.966116651476153e-06, "Pretrain/Loss": 1.9642384052276611, "Pretrain/Loss (Raw)": 1.7323007583618164, "Pretrain/Step": 8088, "Pretrain/Step Time": 8.65253147482872} +{"Pretrain/Learning Rate": 2.9621068476193335e-06, "Pretrain/Loss": 1.962946891784668, "Pretrain/Loss (Raw)": 1.6964397430419922, "Pretrain/Step": 8089, "Pretrain/Step Time": 8.65008444339037} +{"Pretrain/Learning Rate": 2.958099585276192e-06, "Pretrain/Loss": 1.9631013870239258, "Pretrain/Loss (Raw)": 1.8728009462356567, "Pretrain/Step": 8090, "Pretrain/Step Time": 8.647842701524496} +{"Pretrain/Learning Rate": 2.9540948649088767e-06, "Pretrain/Loss": 1.9624931812286377, "Pretrain/Loss (Raw)": 2.0334975719451904, "Pretrain/Step": 8091, "Pretrain/Step Time": 8.64674643613398} +{"Pretrain/Learning Rate": 2.950092686979225e-06, "Pretrain/Loss": 1.962313175201416, "Pretrain/Loss (Raw)": 1.988254189491272, "Pretrain/Step": 8092, "Pretrain/Step Time": 8.646138533949852} +{"Pretrain/Learning Rate": 2.9460930519487865e-06, "Pretrain/Loss": 1.965240240097046, "Pretrain/Loss (Raw)": 1.904353141784668, "Pretrain/Step": 8093, "Pretrain/Step Time": 8.648636693134904} +{"Pretrain/Learning Rate": 2.942095960278815e-06, "Pretrain/Loss": 1.967252492904663, "Pretrain/Loss (Raw)": 2.1243364810943604, "Pretrain/Step": 8094, "Pretrain/Step Time": 8.650148209184408} +{"Pretrain/Learning Rate": 2.938101412430283e-06, "Pretrain/Loss": 1.9690955877304077, "Pretrain/Loss (Raw)": 1.930060625076294, "Pretrain/Step": 8095, "Pretrain/Step Time": 8.649939861148596} +{"Pretrain/Learning Rate": 2.9341094088638527e-06, "Pretrain/Loss": 1.9713964462280273, "Pretrain/Loss (Raw)": 1.9210140705108643, "Pretrain/Step": 8096, "Pretrain/Step Time": 8.654383739456534} +{"Pretrain/Learning Rate": 2.9301199500399057e-06, "Pretrain/Loss": 1.9713034629821777, "Pretrain/Loss (Raw)": 2.019911050796509, "Pretrain/Step": 8097, "Pretrain/Step Time": 8.653721494600177} +{"Pretrain/Learning Rate": 2.9261330364185184e-06, "Pretrain/Loss": 1.9704856872558594, "Pretrain/Loss (Raw)": 1.7967602014541626, "Pretrain/Step": 8098, "Pretrain/Step Time": 8.651904374361038} +{"Pretrain/Learning Rate": 2.9221486684594873e-06, "Pretrain/Loss": 1.9708645343780518, "Pretrain/Loss (Raw)": 1.8320914506912231, "Pretrain/Step": 8099, "Pretrain/Step Time": 8.651640381664038} +{"Pretrain/Learning Rate": 2.9181668466223084e-06, "Pretrain/Loss": 1.970054268836975, "Pretrain/Loss (Raw)": 1.8745348453521729, "Pretrain/Step": 8100, "Pretrain/Step Time": 8.653646290302277} +{"Pretrain/Learning Rate": 2.914187571366175e-06, "Pretrain/Loss": 1.9679689407348633, "Pretrain/Loss (Raw)": 1.759289026260376, "Pretrain/Step": 8101, "Pretrain/Step Time": 8.655641179531813} +{"Pretrain/Learning Rate": 2.9102108431500076e-06, "Pretrain/Loss": 1.9665896892547607, "Pretrain/Loss (Raw)": 1.8344851732254028, "Pretrain/Step": 8102, "Pretrain/Step Time": 8.65551932901144} +{"Pretrain/Learning Rate": 2.9062366624324154e-06, "Pretrain/Loss": 1.9640297889709473, "Pretrain/Loss (Raw)": 1.6460585594177246, "Pretrain/Step": 8103, "Pretrain/Step Time": 8.654658081009984} +{"Pretrain/Learning Rate": 2.9022650296717245e-06, "Pretrain/Loss": 1.9636698961257935, "Pretrain/Loss (Raw)": 2.0203211307525635, "Pretrain/Step": 8104, "Pretrain/Step Time": 8.657069073989987} +{"Pretrain/Learning Rate": 2.898295945325949e-06, "Pretrain/Loss": 1.962154507637024, "Pretrain/Loss (Raw)": 1.8394396305084229, "Pretrain/Step": 8105, "Pretrain/Step Time": 8.659500604495406} +{"Pretrain/Learning Rate": 2.8943294098528447e-06, "Pretrain/Loss": 1.9665567874908447, "Pretrain/Loss (Raw)": 1.9667152166366577, "Pretrain/Step": 8106, "Pretrain/Step Time": 8.658683203160763} +{"Pretrain/Learning Rate": 2.890365423709826e-06, "Pretrain/Loss": 1.9650123119354248, "Pretrain/Loss (Raw)": 1.5126701593399048, "Pretrain/Step": 8107, "Pretrain/Step Time": 8.660151027143002} +{"Pretrain/Learning Rate": 2.8864039873540583e-06, "Pretrain/Loss": 1.9636212587356567, "Pretrain/Loss (Raw)": 1.9650300741195679, "Pretrain/Step": 8108, "Pretrain/Step Time": 8.65909630805254} +{"Pretrain/Learning Rate": 2.8824451012423786e-06, "Pretrain/Loss": 1.964475154876709, "Pretrain/Loss (Raw)": 2.0553739070892334, "Pretrain/Step": 8109, "Pretrain/Step Time": 8.661452814936638} +{"Pretrain/Learning Rate": 2.878488765831361e-06, "Pretrain/Loss": 1.9632623195648193, "Pretrain/Loss (Raw)": 1.8516228199005127, "Pretrain/Step": 8110, "Pretrain/Step Time": 8.659494187682867} +{"Pretrain/Learning Rate": 2.874534981577248e-06, "Pretrain/Loss": 1.96470046043396, "Pretrain/Loss (Raw)": 2.029696226119995, "Pretrain/Step": 8111, "Pretrain/Step Time": 8.657578125596046} +{"Pretrain/Learning Rate": 2.870583748936026e-06, "Pretrain/Loss": 1.9636082649230957, "Pretrain/Loss (Raw)": 1.8237736225128174, "Pretrain/Step": 8112, "Pretrain/Step Time": 8.66257675550878} +{"Pretrain/Learning Rate": 2.8666350683633576e-06, "Pretrain/Loss": 1.9653189182281494, "Pretrain/Loss (Raw)": 2.0970520973205566, "Pretrain/Step": 8113, "Pretrain/Step Time": 8.661545734852552} +{"Pretrain/Learning Rate": 2.8626889403146395e-06, "Pretrain/Loss": 1.9627293348312378, "Pretrain/Loss (Raw)": 1.7729445695877075, "Pretrain/Step": 8114, "Pretrain/Step Time": 8.662231346592307} +{"Pretrain/Learning Rate": 2.8587453652449386e-06, "Pretrain/Loss": 1.960802435874939, "Pretrain/Loss (Raw)": 1.9291638135910034, "Pretrain/Step": 8115, "Pretrain/Step Time": 8.664417700842023} +{"Pretrain/Learning Rate": 2.8548043436090577e-06, "Pretrain/Loss": 1.9604856967926025, "Pretrain/Loss (Raw)": 1.9012665748596191, "Pretrain/Step": 8116, "Pretrain/Step Time": 8.668324761092663} +{"Pretrain/Learning Rate": 2.8508658758614944e-06, "Pretrain/Loss": 1.9593555927276611, "Pretrain/Loss (Raw)": 1.9341011047363281, "Pretrain/Step": 8117, "Pretrain/Step Time": 8.667093830183148} +{"Pretrain/Learning Rate": 2.846929962456446e-06, "Pretrain/Loss": 1.9621882438659668, "Pretrain/Loss (Raw)": 2.061803102493286, "Pretrain/Step": 8118, "Pretrain/Step Time": 8.66893289797008} +{"Pretrain/Learning Rate": 2.8429966038478196e-06, "Pretrain/Loss": 1.9598840475082397, "Pretrain/Loss (Raw)": 1.8632893562316895, "Pretrain/Step": 8119, "Pretrain/Step Time": 8.669731348752975} +{"Pretrain/Learning Rate": 2.839065800489235e-06, "Pretrain/Loss": 1.9589383602142334, "Pretrain/Loss (Raw)": 1.8716479539871216, "Pretrain/Step": 8120, "Pretrain/Step Time": 8.669501876458526} +{"Pretrain/Learning Rate": 2.835137552834008e-06, "Pretrain/Loss": 1.9612115621566772, "Pretrain/Loss (Raw)": 2.2708489894866943, "Pretrain/Step": 8121, "Pretrain/Step Time": 8.666593171656132} +{"Pretrain/Learning Rate": 2.8312118613351644e-06, "Pretrain/Loss": 1.959377408027649, "Pretrain/Loss (Raw)": 1.8320324420928955, "Pretrain/Step": 8122, "Pretrain/Step Time": 8.668619530275464} +{"Pretrain/Learning Rate": 2.8272887264454262e-06, "Pretrain/Loss": 1.9633677005767822, "Pretrain/Loss (Raw)": 2.2775990962982178, "Pretrain/Step": 8123, "Pretrain/Step Time": 8.664336122572422} +{"Pretrain/Learning Rate": 2.8233681486172393e-06, "Pretrain/Loss": 1.9640789031982422, "Pretrain/Loss (Raw)": 2.075230121612549, "Pretrain/Step": 8124, "Pretrain/Step Time": 8.664954595267773} +{"Pretrain/Learning Rate": 2.8194501283027366e-06, "Pretrain/Loss": 1.960985779762268, "Pretrain/Loss (Raw)": 1.7632765769958496, "Pretrain/Step": 8125, "Pretrain/Step Time": 8.664887281134725} +{"Pretrain/Learning Rate": 2.815534665953762e-06, "Pretrain/Loss": 1.9618009328842163, "Pretrain/Loss (Raw)": 1.9979708194732666, "Pretrain/Step": 8126, "Pretrain/Step Time": 8.664744578301907} +{"Pretrain/Learning Rate": 2.8116217620218626e-06, "Pretrain/Loss": 1.9628679752349854, "Pretrain/Loss (Raw)": 2.0833985805511475, "Pretrain/Step": 8127, "Pretrain/Step Time": 8.665157916024327} +{"Pretrain/Learning Rate": 2.8077114169583e-06, "Pretrain/Loss": 1.9634182453155518, "Pretrain/Loss (Raw)": 2.0009143352508545, "Pretrain/Step": 8128, "Pretrain/Step Time": 8.670810259878635} +{"Pretrain/Learning Rate": 2.8038036312140333e-06, "Pretrain/Loss": 1.9631643295288086, "Pretrain/Loss (Raw)": 1.8614915609359741, "Pretrain/Step": 8129, "Pretrain/Step Time": 8.669475024566054} +{"Pretrain/Learning Rate": 2.79989840523972e-06, "Pretrain/Loss": 1.9604028463363647, "Pretrain/Loss (Raw)": 1.6611979007720947, "Pretrain/Step": 8130, "Pretrain/Step Time": 8.669789381325245} +{"Pretrain/Learning Rate": 2.795995739485732e-06, "Pretrain/Loss": 1.9602904319763184, "Pretrain/Loss (Raw)": 1.9038282632827759, "Pretrain/Step": 8131, "Pretrain/Step Time": 8.669197233393788} +{"Pretrain/Learning Rate": 2.7920956344021475e-06, "Pretrain/Loss": 1.9578608274459839, "Pretrain/Loss (Raw)": 1.7551372051239014, "Pretrain/Step": 8132, "Pretrain/Step Time": 8.671231070533395} +{"Pretrain/Learning Rate": 2.78819809043874e-06, "Pretrain/Loss": 1.957125186920166, "Pretrain/Loss (Raw)": 1.9414442777633667, "Pretrain/Step": 8133, "Pretrain/Step Time": 8.668515728786588} +{"Pretrain/Learning Rate": 2.7843031080449944e-06, "Pretrain/Loss": 1.9581607580184937, "Pretrain/Loss (Raw)": 2.0036206245422363, "Pretrain/Step": 8134, "Pretrain/Step Time": 8.673963548615575} +{"Pretrain/Learning Rate": 2.780410687670096e-06, "Pretrain/Loss": 1.960780143737793, "Pretrain/Loss (Raw)": 2.2895750999450684, "Pretrain/Step": 8135, "Pretrain/Step Time": 8.673200402408838} +{"Pretrain/Learning Rate": 2.776520829762941e-06, "Pretrain/Loss": 1.9597755670547485, "Pretrain/Loss (Raw)": 1.8750633001327515, "Pretrain/Step": 8136, "Pretrain/Step Time": 8.672659965232015} +{"Pretrain/Learning Rate": 2.7726335347721263e-06, "Pretrain/Loss": 1.9580276012420654, "Pretrain/Loss (Raw)": 1.7463029623031616, "Pretrain/Step": 8137, "Pretrain/Step Time": 8.671673711389303} +{"Pretrain/Learning Rate": 2.7687488031459484e-06, "Pretrain/Loss": 1.9593443870544434, "Pretrain/Loss (Raw)": 2.0077998638153076, "Pretrain/Step": 8138, "Pretrain/Step Time": 8.669342700392008} +{"Pretrain/Learning Rate": 2.7648666353324136e-06, "Pretrain/Loss": 1.9589247703552246, "Pretrain/Loss (Raw)": 2.019211530685425, "Pretrain/Step": 8139, "Pretrain/Step Time": 8.665551299229264} +{"Pretrain/Learning Rate": 2.7609870317792385e-06, "Pretrain/Loss": 1.9582024812698364, "Pretrain/Loss (Raw)": 1.8574793338775635, "Pretrain/Step": 8140, "Pretrain/Step Time": 8.669373923912644} +{"Pretrain/Learning Rate": 2.757109992933832e-06, "Pretrain/Loss": 1.9595438241958618, "Pretrain/Loss (Raw)": 2.024221658706665, "Pretrain/Step": 8141, "Pretrain/Step Time": 8.662204632535577} +{"Pretrain/Learning Rate": 2.753235519243308e-06, "Pretrain/Loss": 1.9610413312911987, "Pretrain/Loss (Raw)": 2.0817270278930664, "Pretrain/Step": 8142, "Pretrain/Step Time": 8.662249928340316} +{"Pretrain/Learning Rate": 2.7493636111544985e-06, "Pretrain/Loss": 1.9620341062545776, "Pretrain/Loss (Raw)": 2.015165328979492, "Pretrain/Step": 8143, "Pretrain/Step Time": 8.66387589648366} +{"Pretrain/Learning Rate": 2.745494269113927e-06, "Pretrain/Loss": 1.963538408279419, "Pretrain/Loss (Raw)": 2.0106911659240723, "Pretrain/Step": 8144, "Pretrain/Step Time": 8.661606697365642} +{"Pretrain/Learning Rate": 2.741627493567822e-06, "Pretrain/Loss": 1.9637317657470703, "Pretrain/Loss (Raw)": 1.965258240699768, "Pretrain/Step": 8145, "Pretrain/Step Time": 8.660940321162343} +{"Pretrain/Learning Rate": 2.7377632849621164e-06, "Pretrain/Loss": 1.9640755653381348, "Pretrain/Loss (Raw)": 2.008132219314575, "Pretrain/Step": 8146, "Pretrain/Step Time": 8.658568441867828} +{"Pretrain/Learning Rate": 2.7339016437424535e-06, "Pretrain/Loss": 1.9633448123931885, "Pretrain/Loss (Raw)": 1.779038429260254, "Pretrain/Step": 8147, "Pretrain/Step Time": 8.658540273085237} +{"Pretrain/Learning Rate": 2.7300425703541773e-06, "Pretrain/Loss": 1.9611129760742188, "Pretrain/Loss (Raw)": 1.8863165378570557, "Pretrain/Step": 8148, "Pretrain/Step Time": 8.655028717592359} +{"Pretrain/Learning Rate": 2.726186065242331e-06, "Pretrain/Loss": 1.95749831199646, "Pretrain/Loss (Raw)": 1.82384192943573, "Pretrain/Step": 8149, "Pretrain/Step Time": 8.655240388587117} +{"Pretrain/Learning Rate": 2.7223321288516597e-06, "Pretrain/Loss": 1.957558035850525, "Pretrain/Loss (Raw)": 1.9625283479690552, "Pretrain/Step": 8150, "Pretrain/Step Time": 8.658612890169024} +{"Pretrain/Learning Rate": 2.7184807616266323e-06, "Pretrain/Loss": 1.957440733909607, "Pretrain/Loss (Raw)": 2.014530897140503, "Pretrain/Step": 8151, "Pretrain/Step Time": 8.659512668848038} +{"Pretrain/Learning Rate": 2.714631964011388e-06, "Pretrain/Loss": 1.9595701694488525, "Pretrain/Loss (Raw)": 2.2267560958862305, "Pretrain/Step": 8152, "Pretrain/Step Time": 8.65720334649086} +{"Pretrain/Learning Rate": 2.7107857364498027e-06, "Pretrain/Loss": 1.9598619937896729, "Pretrain/Loss (Raw)": 1.905480980873108, "Pretrain/Step": 8153, "Pretrain/Step Time": 8.65388847514987} +{"Pretrain/Learning Rate": 2.7069420793854298e-06, "Pretrain/Loss": 1.959319829940796, "Pretrain/Loss (Raw)": 1.8656800985336304, "Pretrain/Step": 8154, "Pretrain/Step Time": 8.651352381333709} +{"Pretrain/Learning Rate": 2.7031009932615563e-06, "Pretrain/Loss": 1.960362195968628, "Pretrain/Loss (Raw)": 2.0010693073272705, "Pretrain/Step": 8155, "Pretrain/Step Time": 8.654019122943282} +{"Pretrain/Learning Rate": 2.6992624785211334e-06, "Pretrain/Loss": 1.9585758447647095, "Pretrain/Loss (Raw)": 1.7164431810379028, "Pretrain/Step": 8156, "Pretrain/Step Time": 8.650367490947247} +{"Pretrain/Learning Rate": 2.6954265356068515e-06, "Pretrain/Loss": 1.9570538997650146, "Pretrain/Loss (Raw)": 1.8676652908325195, "Pretrain/Step": 8157, "Pretrain/Step Time": 8.649629596620798} +{"Pretrain/Learning Rate": 2.691593164961084e-06, "Pretrain/Loss": 1.9587522745132446, "Pretrain/Loss (Raw)": 2.049381732940674, "Pretrain/Step": 8158, "Pretrain/Step Time": 8.653078891336918} +{"Pretrain/Learning Rate": 2.6877623670259115e-06, "Pretrain/Loss": 1.960472583770752, "Pretrain/Loss (Raw)": 2.0148932933807373, "Pretrain/Step": 8159, "Pretrain/Step Time": 8.647692942991853} +{"Pretrain/Learning Rate": 2.6839341422431165e-06, "Pretrain/Loss": 1.9602913856506348, "Pretrain/Loss (Raw)": 1.7893480062484741, "Pretrain/Step": 8160, "Pretrain/Step Time": 8.657515112310648} +{"Pretrain/Learning Rate": 2.6801084910542008e-06, "Pretrain/Loss": 1.9617199897766113, "Pretrain/Loss (Raw)": 2.1652777194976807, "Pretrain/Step": 8161, "Pretrain/Step Time": 8.655331932008266} +{"Pretrain/Learning Rate": 2.6762854139003452e-06, "Pretrain/Loss": 1.9616599082946777, "Pretrain/Loss (Raw)": 2.003185272216797, "Pretrain/Step": 8162, "Pretrain/Step Time": 8.658138547092676} +{"Pretrain/Learning Rate": 2.6724649112224496e-06, "Pretrain/Loss": 1.9636411666870117, "Pretrain/Loss (Raw)": 2.0882930755615234, "Pretrain/Step": 8163, "Pretrain/Step Time": 8.655956709757447} +{"Pretrain/Learning Rate": 2.6686469834611066e-06, "Pretrain/Loss": 1.9627666473388672, "Pretrain/Loss (Raw)": 1.9733344316482544, "Pretrain/Step": 8164, "Pretrain/Step Time": 8.658695120364428} +{"Pretrain/Learning Rate": 2.66483163105663e-06, "Pretrain/Loss": 1.9618303775787354, "Pretrain/Loss (Raw)": 1.9894723892211914, "Pretrain/Step": 8165, "Pretrain/Step Time": 8.658238556236029} +{"Pretrain/Learning Rate": 2.6610188544490126e-06, "Pretrain/Loss": 1.9614417552947998, "Pretrain/Loss (Raw)": 1.9690266847610474, "Pretrain/Step": 8166, "Pretrain/Step Time": 8.660021828487515} +{"Pretrain/Learning Rate": 2.657208654077967e-06, "Pretrain/Loss": 1.962930679321289, "Pretrain/Loss (Raw)": 2.0748744010925293, "Pretrain/Step": 8167, "Pretrain/Step Time": 8.654162036255002} +{"Pretrain/Learning Rate": 2.653401030382896e-06, "Pretrain/Loss": 1.9617891311645508, "Pretrain/Loss (Raw)": 1.9517043828964233, "Pretrain/Step": 8168, "Pretrain/Step Time": 8.655709067359567} +{"Pretrain/Learning Rate": 2.649595983802927e-06, "Pretrain/Loss": 1.9613780975341797, "Pretrain/Loss (Raw)": 1.8907593488693237, "Pretrain/Step": 8169, "Pretrain/Step Time": 8.652430936694145} +{"Pretrain/Learning Rate": 2.645793514776865e-06, "Pretrain/Loss": 1.9603114128112793, "Pretrain/Loss (Raw)": 1.7753069400787354, "Pretrain/Step": 8170, "Pretrain/Step Time": 8.657472560182214} +{"Pretrain/Learning Rate": 2.64199362374323e-06, "Pretrain/Loss": 1.961976170539856, "Pretrain/Loss (Raw)": 2.29472017288208, "Pretrain/Step": 8171, "Pretrain/Step Time": 8.653308428823948} +{"Pretrain/Learning Rate": 2.6381963111402423e-06, "Pretrain/Loss": 1.960472822189331, "Pretrain/Loss (Raw)": 1.8471522331237793, "Pretrain/Step": 8172, "Pretrain/Step Time": 8.65059968456626} +{"Pretrain/Learning Rate": 2.6344015774058345e-06, "Pretrain/Loss": 1.962950587272644, "Pretrain/Loss (Raw)": 1.9864039421081543, "Pretrain/Step": 8173, "Pretrain/Step Time": 8.654827654361725} +{"Pretrain/Learning Rate": 2.630609422977623e-06, "Pretrain/Loss": 1.9600627422332764, "Pretrain/Loss (Raw)": 1.8194175958633423, "Pretrain/Step": 8174, "Pretrain/Step Time": 8.649977844208479} +{"Pretrain/Learning Rate": 2.6268198482929442e-06, "Pretrain/Loss": 1.957876205444336, "Pretrain/Loss (Raw)": 1.7715035676956177, "Pretrain/Step": 8175, "Pretrain/Step Time": 8.656448924914002} +{"Pretrain/Learning Rate": 2.6230328537888204e-06, "Pretrain/Loss": 1.9559986591339111, "Pretrain/Loss (Raw)": 1.895731806755066, "Pretrain/Step": 8176, "Pretrain/Step Time": 8.650918930768967} +{"Pretrain/Learning Rate": 2.6192484399019947e-06, "Pretrain/Loss": 1.9514888525009155, "Pretrain/Loss (Raw)": 1.6148649454116821, "Pretrain/Step": 8177, "Pretrain/Step Time": 8.652011409401894} +{"Pretrain/Learning Rate": 2.615466607068903e-06, "Pretrain/Loss": 1.9490474462509155, "Pretrain/Loss (Raw)": 2.049544095993042, "Pretrain/Step": 8178, "Pretrain/Step Time": 8.65767978131771} +{"Pretrain/Learning Rate": 2.611687355725681e-06, "Pretrain/Loss": 1.9455065727233887, "Pretrain/Loss (Raw)": 1.822513222694397, "Pretrain/Step": 8179, "Pretrain/Step Time": 8.65738781914115} +{"Pretrain/Learning Rate": 2.6079106863081655e-06, "Pretrain/Loss": 1.9435522556304932, "Pretrain/Loss (Raw)": 1.865400791168213, "Pretrain/Step": 8180, "Pretrain/Step Time": 8.659132922068238} +{"Pretrain/Learning Rate": 2.604136599251908e-06, "Pretrain/Loss": 1.9408248662948608, "Pretrain/Loss (Raw)": 1.5787992477416992, "Pretrain/Step": 8181, "Pretrain/Step Time": 8.6606335490942} +{"Pretrain/Learning Rate": 2.600365094992152e-06, "Pretrain/Loss": 1.9391403198242188, "Pretrain/Loss (Raw)": 1.7880957126617432, "Pretrain/Step": 8182, "Pretrain/Step Time": 8.659529019147158} +{"Pretrain/Learning Rate": 2.596596173963839e-06, "Pretrain/Loss": 1.9367172718048096, "Pretrain/Loss (Raw)": 1.918617844581604, "Pretrain/Step": 8183, "Pretrain/Step Time": 8.661510838195682} +{"Pretrain/Learning Rate": 2.592829836601629e-06, "Pretrain/Loss": 1.9365510940551758, "Pretrain/Loss (Raw)": 1.8773325681686401, "Pretrain/Step": 8184, "Pretrain/Step Time": 8.66340165771544} +{"Pretrain/Learning Rate": 2.5890660833398667e-06, "Pretrain/Loss": 1.9356428384780884, "Pretrain/Loss (Raw)": 2.03826642036438, "Pretrain/Step": 8185, "Pretrain/Step Time": 8.660363122820854} +{"Pretrain/Learning Rate": 2.5853049146126076e-06, "Pretrain/Loss": 1.9341635704040527, "Pretrain/Loss (Raw)": 1.8773541450500488, "Pretrain/Step": 8186, "Pretrain/Step Time": 8.66176780499518} +{"Pretrain/Learning Rate": 2.581546330853604e-06, "Pretrain/Loss": 1.934229850769043, "Pretrain/Loss (Raw)": 2.055777072906494, "Pretrain/Step": 8187, "Pretrain/Step Time": 8.662932800129056} +{"Pretrain/Learning Rate": 2.5777903324963187e-06, "Pretrain/Loss": 1.9342955350875854, "Pretrain/Loss (Raw)": 2.074345827102661, "Pretrain/Step": 8188, "Pretrain/Step Time": 8.664873488247395} +{"Pretrain/Learning Rate": 2.574036919973913e-06, "Pretrain/Loss": 1.9373266696929932, "Pretrain/Loss (Raw)": 2.2074170112609863, "Pretrain/Step": 8189, "Pretrain/Step Time": 8.664598058909178} +{"Pretrain/Learning Rate": 2.5702860937192403e-06, "Pretrain/Loss": 1.940347671508789, "Pretrain/Loss (Raw)": 2.250889539718628, "Pretrain/Step": 8190, "Pretrain/Step Time": 8.665568012744188} +{"Pretrain/Learning Rate": 2.566537854164866e-06, "Pretrain/Loss": 1.9368507862091064, "Pretrain/Loss (Raw)": 1.5630193948745728, "Pretrain/Step": 8191, "Pretrain/Step Time": 8.664511354640126} +{"Pretrain/Learning Rate": 2.5627922017430637e-06, "Pretrain/Loss": 1.937502384185791, "Pretrain/Loss (Raw)": 1.8373017311096191, "Pretrain/Step": 8192, "Pretrain/Step Time": 8.660610621795058} +{"Pretrain/Learning Rate": 2.559049136885783e-06, "Pretrain/Loss": 1.9372777938842773, "Pretrain/Loss (Raw)": 2.142848491668701, "Pretrain/Step": 8193, "Pretrain/Step Time": 8.667389644309878} +{"Pretrain/Learning Rate": 2.555308660024708e-06, "Pretrain/Loss": 1.9371838569641113, "Pretrain/Loss (Raw)": 1.9290300607681274, "Pretrain/Step": 8194, "Pretrain/Step Time": 8.6689546816051} +{"Pretrain/Learning Rate": 2.551570771591194e-06, "Pretrain/Loss": 1.9365935325622559, "Pretrain/Loss (Raw)": 1.939909815788269, "Pretrain/Step": 8195, "Pretrain/Step Time": 8.674529429525137} +{"Pretrain/Learning Rate": 2.54783547201633e-06, "Pretrain/Loss": 1.9370200634002686, "Pretrain/Loss (Raw)": 1.9867618083953857, "Pretrain/Step": 8196, "Pretrain/Step Time": 8.681403543800116} +{"Pretrain/Learning Rate": 2.5441027617308684e-06, "Pretrain/Loss": 1.9377981424331665, "Pretrain/Loss (Raw)": 2.2697606086730957, "Pretrain/Step": 8197, "Pretrain/Step Time": 8.674390217289329} +{"Pretrain/Learning Rate": 2.540372641165295e-06, "Pretrain/Loss": 1.9389622211456299, "Pretrain/Loss (Raw)": 1.7832506895065308, "Pretrain/Step": 8198, "Pretrain/Step Time": 8.679077591747046} +{"Pretrain/Learning Rate": 2.536645110749783e-06, "Pretrain/Loss": 1.938685655593872, "Pretrain/Loss (Raw)": 1.9616889953613281, "Pretrain/Step": 8199, "Pretrain/Step Time": 8.673675930127501} +{"Pretrain/Learning Rate": 2.5329201709142074e-06, "Pretrain/Loss": 1.9418623447418213, "Pretrain/Loss (Raw)": 2.1254191398620605, "Pretrain/Step": 8200, "Pretrain/Step Time": 8.669415837153792} +{"Pretrain/Learning Rate": 2.5291978220881416e-06, "Pretrain/Loss": 1.9417493343353271, "Pretrain/Loss (Raw)": 2.0577552318573, "Pretrain/Step": 8201, "Pretrain/Step Time": 8.669979339465499} +{"Pretrain/Learning Rate": 2.525478064700873e-06, "Pretrain/Loss": 1.9388258457183838, "Pretrain/Loss (Raw)": 1.8007676601409912, "Pretrain/Step": 8202, "Pretrain/Step Time": 8.668709630146623} +{"Pretrain/Learning Rate": 2.5217608991813776e-06, "Pretrain/Loss": 1.9381940364837646, "Pretrain/Loss (Raw)": 1.8223820924758911, "Pretrain/Step": 8203, "Pretrain/Step Time": 8.670618234202266} +{"Pretrain/Learning Rate": 2.5180463259583344e-06, "Pretrain/Loss": 1.938280463218689, "Pretrain/Loss (Raw)": 2.0768356323242188, "Pretrain/Step": 8204, "Pretrain/Step Time": 8.669088192284107} +{"Pretrain/Learning Rate": 2.514334345460126e-06, "Pretrain/Loss": 1.9352521896362305, "Pretrain/Loss (Raw)": 1.6711937189102173, "Pretrain/Step": 8205, "Pretrain/Step Time": 8.671539455652237} +{"Pretrain/Learning Rate": 2.5106249581148406e-06, "Pretrain/Loss": 1.9369392395019531, "Pretrain/Loss (Raw)": 2.1313321590423584, "Pretrain/Step": 8206, "Pretrain/Step Time": 8.668521460145712} +{"Pretrain/Learning Rate": 2.5069181643502552e-06, "Pretrain/Loss": 1.934040904045105, "Pretrain/Loss (Raw)": 1.6533976793289185, "Pretrain/Step": 8207, "Pretrain/Step Time": 8.666577611118555} +{"Pretrain/Learning Rate": 2.503213964593862e-06, "Pretrain/Loss": 1.9361119270324707, "Pretrain/Loss (Raw)": 2.3402748107910156, "Pretrain/Step": 8208, "Pretrain/Step Time": 8.669072203338146} +{"Pretrain/Learning Rate": 2.4995123592728374e-06, "Pretrain/Loss": 1.9356993436813354, "Pretrain/Loss (Raw)": 1.9616793394088745, "Pretrain/Step": 8209, "Pretrain/Step Time": 8.668759938329458} +{"Pretrain/Learning Rate": 2.495813348814077e-06, "Pretrain/Loss": 1.935154676437378, "Pretrain/Loss (Raw)": 1.8204478025436401, "Pretrain/Step": 8210, "Pretrain/Step Time": 8.673188975080848} +{"Pretrain/Learning Rate": 2.4921169336441645e-06, "Pretrain/Loss": 1.935514211654663, "Pretrain/Loss (Raw)": 1.867052435874939, "Pretrain/Step": 8211, "Pretrain/Step Time": 8.674999486654997} +{"Pretrain/Learning Rate": 2.4884231141893864e-06, "Pretrain/Loss": 1.9340064525604248, "Pretrain/Loss (Raw)": 1.8846790790557861, "Pretrain/Step": 8212, "Pretrain/Step Time": 8.675706412643194} +{"Pretrain/Learning Rate": 2.48473189087573e-06, "Pretrain/Loss": 1.936385154724121, "Pretrain/Loss (Raw)": 2.0793874263763428, "Pretrain/Step": 8213, "Pretrain/Step Time": 8.674546035006642} +{"Pretrain/Learning Rate": 2.4810432641288933e-06, "Pretrain/Loss": 1.9373502731323242, "Pretrain/Loss (Raw)": 2.014364719390869, "Pretrain/Step": 8214, "Pretrain/Step Time": 8.665163222700357} +{"Pretrain/Learning Rate": 2.4773572343742584e-06, "Pretrain/Loss": 1.9358832836151123, "Pretrain/Loss (Raw)": 1.8634402751922607, "Pretrain/Step": 8215, "Pretrain/Step Time": 8.669723495841026} +{"Pretrain/Learning Rate": 2.473673802036916e-06, "Pretrain/Loss": 1.9378795623779297, "Pretrain/Loss (Raw)": 1.9878195524215698, "Pretrain/Step": 8216, "Pretrain/Step Time": 8.669379439204931} +{"Pretrain/Learning Rate": 2.4699929675416565e-06, "Pretrain/Loss": 1.9399518966674805, "Pretrain/Loss (Raw)": 1.9617133140563965, "Pretrain/Step": 8217, "Pretrain/Step Time": 8.67331432364881} +{"Pretrain/Learning Rate": 2.466314731312977e-06, "Pretrain/Loss": 1.9411479234695435, "Pretrain/Loss (Raw)": 2.0258848667144775, "Pretrain/Step": 8218, "Pretrain/Step Time": 8.677130471915007} +{"Pretrain/Learning Rate": 2.4626390937750624e-06, "Pretrain/Loss": 1.9413414001464844, "Pretrain/Loss (Raw)": 2.0582664012908936, "Pretrain/Step": 8219, "Pretrain/Step Time": 8.67504983022809} +{"Pretrain/Learning Rate": 2.4589660553518108e-06, "Pretrain/Loss": 1.9430677890777588, "Pretrain/Loss (Raw)": 2.209233045578003, "Pretrain/Step": 8220, "Pretrain/Step Time": 8.678074084222317} +{"Pretrain/Learning Rate": 2.4552956164668018e-06, "Pretrain/Loss": 1.9410881996154785, "Pretrain/Loss (Raw)": 1.6509678363800049, "Pretrain/Step": 8221, "Pretrain/Step Time": 8.673411194235086} +{"Pretrain/Learning Rate": 2.4516277775433443e-06, "Pretrain/Loss": 1.9382628202438354, "Pretrain/Loss (Raw)": 1.7626855373382568, "Pretrain/Step": 8222, "Pretrain/Step Time": 8.67302929982543} +{"Pretrain/Learning Rate": 2.4479625390044226e-06, "Pretrain/Loss": 1.9388840198516846, "Pretrain/Loss (Raw)": 2.009567975997925, "Pretrain/Step": 8223, "Pretrain/Step Time": 8.674641244113445} +{"Pretrain/Learning Rate": 2.444299901272723e-06, "Pretrain/Loss": 1.9360201358795166, "Pretrain/Loss (Raw)": 1.5544449090957642, "Pretrain/Step": 8224, "Pretrain/Step Time": 8.670819588005543} +{"Pretrain/Learning Rate": 2.4406398647706523e-06, "Pretrain/Loss": 1.9332258701324463, "Pretrain/Loss (Raw)": 1.6622488498687744, "Pretrain/Step": 8225, "Pretrain/Step Time": 8.67590563185513} +{"Pretrain/Learning Rate": 2.4369824299202926e-06, "Pretrain/Loss": 1.9366590976715088, "Pretrain/Loss (Raw)": 2.2361936569213867, "Pretrain/Step": 8226, "Pretrain/Step Time": 8.676004247739911} +{"Pretrain/Learning Rate": 2.433327597143442e-06, "Pretrain/Loss": 1.9380971193313599, "Pretrain/Loss (Raw)": 2.016167640686035, "Pretrain/Step": 8227, "Pretrain/Step Time": 8.672303536906838} +{"Pretrain/Learning Rate": 2.4296753668615833e-06, "Pretrain/Loss": 1.9386781454086304, "Pretrain/Loss (Raw)": 1.9489206075668335, "Pretrain/Step": 8228, "Pretrain/Step Time": 8.672946218401194} +{"Pretrain/Learning Rate": 2.4260257394959213e-06, "Pretrain/Loss": 1.939910650253296, "Pretrain/Loss (Raw)": 1.9170279502868652, "Pretrain/Step": 8229, "Pretrain/Step Time": 8.671126998960972} +{"Pretrain/Learning Rate": 2.422378715467344e-06, "Pretrain/Loss": 1.9398812055587769, "Pretrain/Loss (Raw)": 1.8307299613952637, "Pretrain/Step": 8230, "Pretrain/Step Time": 8.669288208708167} +{"Pretrain/Learning Rate": 2.4187342951964424e-06, "Pretrain/Loss": 1.944258451461792, "Pretrain/Loss (Raw)": 2.2063486576080322, "Pretrain/Step": 8231, "Pretrain/Step Time": 8.66597698815167} +{"Pretrain/Learning Rate": 2.4150924791035035e-06, "Pretrain/Loss": 1.9430197477340698, "Pretrain/Loss (Raw)": 1.8617606163024902, "Pretrain/Step": 8232, "Pretrain/Step Time": 8.666673686355352} +{"Pretrain/Learning Rate": 2.411453267608535e-06, "Pretrain/Loss": 1.9418797492980957, "Pretrain/Loss (Raw)": 1.6935112476348877, "Pretrain/Step": 8233, "Pretrain/Step Time": 8.662294516339898} +{"Pretrain/Learning Rate": 2.4078166611312044e-06, "Pretrain/Loss": 1.941881537437439, "Pretrain/Loss (Raw)": 1.966957926750183, "Pretrain/Step": 8234, "Pretrain/Step Time": 8.6639349963516} +{"Pretrain/Learning Rate": 2.40418266009092e-06, "Pretrain/Loss": 1.9444730281829834, "Pretrain/Loss (Raw)": 1.8443846702575684, "Pretrain/Step": 8235, "Pretrain/Step Time": 8.661931270733476} +{"Pretrain/Learning Rate": 2.4005512649067612e-06, "Pretrain/Loss": 1.943076252937317, "Pretrain/Loss (Raw)": 1.786232829093933, "Pretrain/Step": 8236, "Pretrain/Step Time": 8.666274758055806} +{"Pretrain/Learning Rate": 2.396922475997532e-06, "Pretrain/Loss": 1.9403455257415771, "Pretrain/Loss (Raw)": 1.7058465480804443, "Pretrain/Step": 8237, "Pretrain/Step Time": 8.666570246219635} +{"Pretrain/Learning Rate": 2.393296293781702e-06, "Pretrain/Loss": 1.943922996520996, "Pretrain/Loss (Raw)": 2.3095288276672363, "Pretrain/Step": 8238, "Pretrain/Step Time": 8.664695914834738} +{"Pretrain/Learning Rate": 2.3896727186774744e-06, "Pretrain/Loss": 1.944281816482544, "Pretrain/Loss (Raw)": 2.07562255859375, "Pretrain/Step": 8239, "Pretrain/Step Time": 8.666936803609133} +{"Pretrain/Learning Rate": 2.386051751102733e-06, "Pretrain/Loss": 1.9435253143310547, "Pretrain/Loss (Raw)": 1.7269377708435059, "Pretrain/Step": 8240, "Pretrain/Step Time": 8.664810542017221} +{"Pretrain/Learning Rate": 2.382433391475064e-06, "Pretrain/Loss": 1.943360447883606, "Pretrain/Loss (Raw)": 2.0759615898132324, "Pretrain/Step": 8241, "Pretrain/Step Time": 8.668170735239983} +{"Pretrain/Learning Rate": 2.3788176402117502e-06, "Pretrain/Loss": 1.9451589584350586, "Pretrain/Loss (Raw)": 2.003150701522827, "Pretrain/Step": 8242, "Pretrain/Step Time": 8.67034768499434} +{"Pretrain/Learning Rate": 2.3752044977297827e-06, "Pretrain/Loss": 1.9444522857666016, "Pretrain/Loss (Raw)": 1.8387221097946167, "Pretrain/Step": 8243, "Pretrain/Step Time": 8.665087215602398} +{"Pretrain/Learning Rate": 2.371593964445845e-06, "Pretrain/Loss": 1.9458279609680176, "Pretrain/Loss (Raw)": 2.0773448944091797, "Pretrain/Step": 8244, "Pretrain/Step Time": 8.660854930058122} +{"Pretrain/Learning Rate": 2.367986040776321e-06, "Pretrain/Loss": 1.9454946517944336, "Pretrain/Loss (Raw)": 1.8914339542388916, "Pretrain/Step": 8245, "Pretrain/Step Time": 8.66402580216527} +{"Pretrain/Learning Rate": 2.3643807271372886e-06, "Pretrain/Loss": 1.947811484336853, "Pretrain/Loss (Raw)": 2.358358144760132, "Pretrain/Step": 8246, "Pretrain/Step Time": 8.661717338487506} +{"Pretrain/Learning Rate": 2.360778023944535e-06, "Pretrain/Loss": 1.948355793952942, "Pretrain/Loss (Raw)": 1.9329580068588257, "Pretrain/Step": 8247, "Pretrain/Step Time": 8.659673802554607} +{"Pretrain/Learning Rate": 2.3571779316135413e-06, "Pretrain/Loss": 1.9486674070358276, "Pretrain/Loss (Raw)": 1.9115384817123413, "Pretrain/Step": 8248, "Pretrain/Step Time": 8.65860447473824} +{"Pretrain/Learning Rate": 2.3535804505594837e-06, "Pretrain/Loss": 1.945091724395752, "Pretrain/Loss (Raw)": 1.813162922859192, "Pretrain/Step": 8249, "Pretrain/Step Time": 8.659453891217709} +{"Pretrain/Learning Rate": 2.3499855811972393e-06, "Pretrain/Loss": 1.946092128753662, "Pretrain/Loss (Raw)": 1.9600919485092163, "Pretrain/Step": 8250, "Pretrain/Step Time": 8.66203659772873} +{"Pretrain/Learning Rate": 2.34639332394139e-06, "Pretrain/Loss": 1.9438196420669556, "Pretrain/Loss (Raw)": 1.9867137670516968, "Pretrain/Step": 8251, "Pretrain/Step Time": 8.667227942496538} +{"Pretrain/Learning Rate": 2.3428036792062124e-06, "Pretrain/Loss": 1.942574381828308, "Pretrain/Loss (Raw)": 1.9158307313919067, "Pretrain/Step": 8252, "Pretrain/Step Time": 8.664733938872814} +{"Pretrain/Learning Rate": 2.3392166474056758e-06, "Pretrain/Loss": 1.9434281587600708, "Pretrain/Loss (Raw)": 1.8725718259811401, "Pretrain/Step": 8253, "Pretrain/Step Time": 8.66541488096118} +{"Pretrain/Learning Rate": 2.3356322289534547e-06, "Pretrain/Loss": 1.9412171840667725, "Pretrain/Loss (Raw)": 1.7149516344070435, "Pretrain/Step": 8254, "Pretrain/Step Time": 8.668918432667851} +{"Pretrain/Learning Rate": 2.332050424262927e-06, "Pretrain/Loss": 1.939394474029541, "Pretrain/Loss (Raw)": 1.8500988483428955, "Pretrain/Step": 8255, "Pretrain/Step Time": 8.669176207855344} +{"Pretrain/Learning Rate": 2.3284712337471593e-06, "Pretrain/Loss": 1.9393714666366577, "Pretrain/Loss (Raw)": 1.9979596138000488, "Pretrain/Step": 8256, "Pretrain/Step Time": 8.667942486703396} +{"Pretrain/Learning Rate": 2.3248946578189186e-06, "Pretrain/Loss": 1.9405696392059326, "Pretrain/Loss (Raw)": 2.014857292175293, "Pretrain/Step": 8257, "Pretrain/Step Time": 8.669920602813363} +{"Pretrain/Learning Rate": 2.321320696890672e-06, "Pretrain/Loss": 1.9437921047210693, "Pretrain/Loss (Raw)": 2.073683261871338, "Pretrain/Step": 8258, "Pretrain/Step Time": 8.667297316715121} +{"Pretrain/Learning Rate": 2.317749351374593e-06, "Pretrain/Loss": 1.9436604976654053, "Pretrain/Loss (Raw)": 1.8869889974594116, "Pretrain/Step": 8259, "Pretrain/Step Time": 8.673676928505301} +{"Pretrain/Learning Rate": 2.3141806216825405e-06, "Pretrain/Loss": 1.9458401203155518, "Pretrain/Loss (Raw)": 2.0341131687164307, "Pretrain/Step": 8260, "Pretrain/Step Time": 8.666737692430615} +{"Pretrain/Learning Rate": 2.310614508226078e-06, "Pretrain/Loss": 1.94507896900177, "Pretrain/Loss (Raw)": 1.844026803970337, "Pretrain/Step": 8261, "Pretrain/Step Time": 8.666527742519975} +{"Pretrain/Learning Rate": 2.3070510114164613e-06, "Pretrain/Loss": 1.9444658756256104, "Pretrain/Loss (Raw)": 1.925133466720581, "Pretrain/Step": 8262, "Pretrain/Step Time": 8.663242891430855} +{"Pretrain/Learning Rate": 2.303490131664657e-06, "Pretrain/Loss": 1.9422203302383423, "Pretrain/Loss (Raw)": 2.0021564960479736, "Pretrain/Step": 8263, "Pretrain/Step Time": 8.665670849382877} +{"Pretrain/Learning Rate": 2.299931869381322e-06, "Pretrain/Loss": 1.943519949913025, "Pretrain/Loss (Raw)": 2.041412830352783, "Pretrain/Step": 8264, "Pretrain/Step Time": 8.665058013051748} +{"Pretrain/Learning Rate": 2.2963762249768067e-06, "Pretrain/Loss": 1.9442718029022217, "Pretrain/Loss (Raw)": 1.8425369262695312, "Pretrain/Step": 8265, "Pretrain/Step Time": 8.666950356215239} +{"Pretrain/Learning Rate": 2.2928231988611716e-06, "Pretrain/Loss": 1.94402277469635, "Pretrain/Loss (Raw)": 1.9759328365325928, "Pretrain/Step": 8266, "Pretrain/Step Time": 8.66755543090403} +{"Pretrain/Learning Rate": 2.289272791444166e-06, "Pretrain/Loss": 1.9408221244812012, "Pretrain/Loss (Raw)": 1.6095269918441772, "Pretrain/Step": 8267, "Pretrain/Step Time": 8.668150758370757} +{"Pretrain/Learning Rate": 2.285725003135239e-06, "Pretrain/Loss": 1.94258713722229, "Pretrain/Loss (Raw)": 2.0833938121795654, "Pretrain/Step": 8268, "Pretrain/Step Time": 8.66739558801055} +{"Pretrain/Learning Rate": 2.2821798343435314e-06, "Pretrain/Loss": 1.940029263496399, "Pretrain/Loss (Raw)": 1.696821928024292, "Pretrain/Step": 8269, "Pretrain/Step Time": 8.66958998888731} +{"Pretrain/Learning Rate": 2.2786372854779e-06, "Pretrain/Loss": 1.9383660554885864, "Pretrain/Loss (Raw)": 1.8688234090805054, "Pretrain/Step": 8270, "Pretrain/Step Time": 8.67362379655242} +{"Pretrain/Learning Rate": 2.2750973569468843e-06, "Pretrain/Loss": 1.9387295246124268, "Pretrain/Loss (Raw)": 2.061697244644165, "Pretrain/Step": 8271, "Pretrain/Step Time": 8.671477384865284} +{"Pretrain/Learning Rate": 2.2715600491587245e-06, "Pretrain/Loss": 1.9390426874160767, "Pretrain/Loss (Raw)": 2.0507760047912598, "Pretrain/Step": 8272, "Pretrain/Step Time": 8.671095022931695} +{"Pretrain/Learning Rate": 2.268025362521353e-06, "Pretrain/Loss": 1.9394257068634033, "Pretrain/Loss (Raw)": 2.014270067214966, "Pretrain/Step": 8273, "Pretrain/Step Time": 8.679303999990225} +{"Pretrain/Learning Rate": 2.264493297442424e-06, "Pretrain/Loss": 1.940665602684021, "Pretrain/Loss (Raw)": 2.1668479442596436, "Pretrain/Step": 8274, "Pretrain/Step Time": 8.680082239210606} +{"Pretrain/Learning Rate": 2.260963854329254e-06, "Pretrain/Loss": 1.9426417350769043, "Pretrain/Loss (Raw)": 2.031980514526367, "Pretrain/Step": 8275, "Pretrain/Step Time": 8.67653188481927} +{"Pretrain/Learning Rate": 2.2574370335888854e-06, "Pretrain/Loss": 1.9432356357574463, "Pretrain/Loss (Raw)": 1.962349534034729, "Pretrain/Step": 8276, "Pretrain/Step Time": 8.678586516529322} +{"Pretrain/Learning Rate": 2.2539128356280387e-06, "Pretrain/Loss": 1.9430582523345947, "Pretrain/Loss (Raw)": 1.801138997077942, "Pretrain/Step": 8277, "Pretrain/Step Time": 8.679245075210929} +{"Pretrain/Learning Rate": 2.2503912608531576e-06, "Pretrain/Loss": 1.9428399801254272, "Pretrain/Loss (Raw)": 1.9345815181732178, "Pretrain/Step": 8278, "Pretrain/Step Time": 8.678031116724014} +{"Pretrain/Learning Rate": 2.2468723096703447e-06, "Pretrain/Loss": 1.942658543586731, "Pretrain/Loss (Raw)": 1.9913160800933838, "Pretrain/Step": 8279, "Pretrain/Step Time": 8.679431030526757} +{"Pretrain/Learning Rate": 2.24335598248544e-06, "Pretrain/Loss": 1.9408552646636963, "Pretrain/Loss (Raw)": 1.9959237575531006, "Pretrain/Step": 8280, "Pretrain/Step Time": 8.677369616925716} +{"Pretrain/Learning Rate": 2.239842279703952e-06, "Pretrain/Loss": 1.9391047954559326, "Pretrain/Loss (Raw)": 1.6814192533493042, "Pretrain/Step": 8281, "Pretrain/Step Time": 8.678127098828554} +{"Pretrain/Learning Rate": 2.2363312017311094e-06, "Pretrain/Loss": 1.938759684562683, "Pretrain/Loss (Raw)": 1.8215090036392212, "Pretrain/Step": 8282, "Pretrain/Step Time": 8.67852807417512} +{"Pretrain/Learning Rate": 2.2328227489718106e-06, "Pretrain/Loss": 1.9378564357757568, "Pretrain/Loss (Raw)": 1.8854491710662842, "Pretrain/Step": 8283, "Pretrain/Step Time": 8.676177598536015} +{"Pretrain/Learning Rate": 2.229316921830679e-06, "Pretrain/Loss": 1.9407498836517334, "Pretrain/Loss (Raw)": 2.0868074893951416, "Pretrain/Step": 8284, "Pretrain/Step Time": 8.677679339423776} +{"Pretrain/Learning Rate": 2.2258137207120165e-06, "Pretrain/Loss": 1.9425374269485474, "Pretrain/Loss (Raw)": 2.096477746963501, "Pretrain/Step": 8285, "Pretrain/Step Time": 8.679119085893035} +{"Pretrain/Learning Rate": 2.222313146019833e-06, "Pretrain/Loss": 1.9405295848846436, "Pretrain/Loss (Raw)": 1.7923773527145386, "Pretrain/Step": 8286, "Pretrain/Step Time": 8.674101576209068} +{"Pretrain/Learning Rate": 2.2188151981578252e-06, "Pretrain/Loss": 1.9417328834533691, "Pretrain/Loss (Raw)": 2.168900728225708, "Pretrain/Step": 8287, "Pretrain/Step Time": 8.677854657173157} +{"Pretrain/Learning Rate": 2.215319877529404e-06, "Pretrain/Loss": 1.941827416419983, "Pretrain/Loss (Raw)": 1.8014613389968872, "Pretrain/Step": 8288, "Pretrain/Step Time": 8.671852285042405} +{"Pretrain/Learning Rate": 2.211827184537657e-06, "Pretrain/Loss": 1.9389002323150635, "Pretrain/Loss (Raw)": 1.7906018495559692, "Pretrain/Step": 8289, "Pretrain/Step Time": 8.671328336000443} +{"Pretrain/Learning Rate": 2.2083371195853796e-06, "Pretrain/Loss": 1.9399265050888062, "Pretrain/Loss (Raw)": 2.1345419883728027, "Pretrain/Step": 8290, "Pretrain/Step Time": 8.670861894264817} +{"Pretrain/Learning Rate": 2.204849683075061e-06, "Pretrain/Loss": 1.9380247592926025, "Pretrain/Loss (Raw)": 1.8448609113693237, "Pretrain/Step": 8291, "Pretrain/Step Time": 8.669709675014019} +{"Pretrain/Learning Rate": 2.2013648754088954e-06, "Pretrain/Loss": 1.939054012298584, "Pretrain/Loss (Raw)": 2.1051056385040283, "Pretrain/Step": 8292, "Pretrain/Step Time": 8.668307425454259} +{"Pretrain/Learning Rate": 2.1978826969887624e-06, "Pretrain/Loss": 1.9375107288360596, "Pretrain/Loss (Raw)": 1.7919306755065918, "Pretrain/Step": 8293, "Pretrain/Step Time": 8.672176921740174} +{"Pretrain/Learning Rate": 2.1944031482162425e-06, "Pretrain/Loss": 1.9377940893173218, "Pretrain/Loss (Raw)": 2.0052807331085205, "Pretrain/Step": 8294, "Pretrain/Step Time": 8.67160103470087} +{"Pretrain/Learning Rate": 2.1909262294926126e-06, "Pretrain/Loss": 1.9350025653839111, "Pretrain/Loss (Raw)": 1.7175596952438354, "Pretrain/Step": 8295, "Pretrain/Step Time": 8.67236458323896} +{"Pretrain/Learning Rate": 2.1874519412188545e-06, "Pretrain/Loss": 1.9349913597106934, "Pretrain/Loss (Raw)": 1.9502854347229004, "Pretrain/Step": 8296, "Pretrain/Step Time": 8.672344487160444} +{"Pretrain/Learning Rate": 2.1839802837956336e-06, "Pretrain/Loss": 1.9359211921691895, "Pretrain/Loss (Raw)": 2.009767532348633, "Pretrain/Step": 8297, "Pretrain/Step Time": 8.673020450398326} +{"Pretrain/Learning Rate": 2.180511257623319e-06, "Pretrain/Loss": 1.9375454187393188, "Pretrain/Loss (Raw)": 1.9831956624984741, "Pretrain/Step": 8298, "Pretrain/Step Time": 8.670173792168498} +{"Pretrain/Learning Rate": 2.1770448631019708e-06, "Pretrain/Loss": 1.935133457183838, "Pretrain/Loss (Raw)": 1.9859963655471802, "Pretrain/Step": 8299, "Pretrain/Step Time": 8.67394651286304} +{"Pretrain/Learning Rate": 2.1735811006313583e-06, "Pretrain/Loss": 1.9368082284927368, "Pretrain/Loss (Raw)": 2.0615222454071045, "Pretrain/Step": 8300, "Pretrain/Step Time": 8.675710322335362} +{"Pretrain/Learning Rate": 2.170119970610937e-06, "Pretrain/Loss": 1.9366860389709473, "Pretrain/Loss (Raw)": 1.970772385597229, "Pretrain/Step": 8301, "Pretrain/Step Time": 8.674051448702812} +{"Pretrain/Learning Rate": 2.1666614734398573e-06, "Pretrain/Loss": 1.9362610578536987, "Pretrain/Loss (Raw)": 1.765015721321106, "Pretrain/Step": 8302, "Pretrain/Step Time": 8.677218606695533} +{"Pretrain/Learning Rate": 2.163205609516966e-06, "Pretrain/Loss": 1.938403606414795, "Pretrain/Loss (Raw)": 2.045740842819214, "Pretrain/Step": 8303, "Pretrain/Step Time": 8.680278772488236} +{"Pretrain/Learning Rate": 2.1597523792408176e-06, "Pretrain/Loss": 1.9364941120147705, "Pretrain/Loss (Raw)": 1.651324987411499, "Pretrain/Step": 8304, "Pretrain/Step Time": 8.68348167464137} +{"Pretrain/Learning Rate": 2.156301783009654e-06, "Pretrain/Loss": 1.9400792121887207, "Pretrain/Loss (Raw)": 2.0737521648406982, "Pretrain/Step": 8305, "Pretrain/Step Time": 8.679259575903416} +{"Pretrain/Learning Rate": 2.1528538212214066e-06, "Pretrain/Loss": 1.9410712718963623, "Pretrain/Loss (Raw)": 2.1765449047088623, "Pretrain/Step": 8306, "Pretrain/Step Time": 8.678320417180657} +{"Pretrain/Learning Rate": 2.1494084942737193e-06, "Pretrain/Loss": 1.9404997825622559, "Pretrain/Loss (Raw)": 1.7493597269058228, "Pretrain/Step": 8307, "Pretrain/Step Time": 8.674854861572385} +{"Pretrain/Learning Rate": 2.1459658025639208e-06, "Pretrain/Loss": 1.940812110900879, "Pretrain/Loss (Raw)": 1.9053775072097778, "Pretrain/Step": 8308, "Pretrain/Step Time": 8.67255400493741} +{"Pretrain/Learning Rate": 2.142525746489038e-06, "Pretrain/Loss": 1.9441521167755127, "Pretrain/Loss (Raw)": 2.0063233375549316, "Pretrain/Step": 8309, "Pretrain/Step Time": 8.671646570786834} +{"Pretrain/Learning Rate": 2.1390883264457903e-06, "Pretrain/Loss": 1.9464547634124756, "Pretrain/Loss (Raw)": 2.082834243774414, "Pretrain/Step": 8310, "Pretrain/Step Time": 8.669782912358642} +{"Pretrain/Learning Rate": 2.135653542830604e-06, "Pretrain/Loss": 1.947384238243103, "Pretrain/Loss (Raw)": 2.037574291229248, "Pretrain/Step": 8311, "Pretrain/Step Time": 8.671693937852979} +{"Pretrain/Learning Rate": 2.132221396039591e-06, "Pretrain/Loss": 1.9478586912155151, "Pretrain/Loss (Raw)": 1.9380666017532349, "Pretrain/Step": 8312, "Pretrain/Step Time": 8.667761962860823} +{"Pretrain/Learning Rate": 2.1287918864685645e-06, "Pretrain/Loss": 1.9459582567214966, "Pretrain/Loss (Raw)": 1.7950206995010376, "Pretrain/Step": 8313, "Pretrain/Step Time": 8.668961437419057} +{"Pretrain/Learning Rate": 2.1253650145130254e-06, "Pretrain/Loss": 1.9467395544052124, "Pretrain/Loss (Raw)": 1.977345585823059, "Pretrain/Step": 8314, "Pretrain/Step Time": 8.669872503727674} +{"Pretrain/Learning Rate": 2.121940780568188e-06, "Pretrain/Loss": 1.9463601112365723, "Pretrain/Loss (Raw)": 2.0072171688079834, "Pretrain/Step": 8315, "Pretrain/Step Time": 8.667540073394775} +{"Pretrain/Learning Rate": 2.1185191850289386e-06, "Pretrain/Loss": 1.9463529586791992, "Pretrain/Loss (Raw)": 2.0734140872955322, "Pretrain/Step": 8316, "Pretrain/Step Time": 8.67240246385336} +{"Pretrain/Learning Rate": 2.115100228289882e-06, "Pretrain/Loss": 1.9450669288635254, "Pretrain/Loss (Raw)": 2.0428266525268555, "Pretrain/Step": 8317, "Pretrain/Step Time": 8.672599602490664} +{"Pretrain/Learning Rate": 2.111683910745299e-06, "Pretrain/Loss": 1.9421415328979492, "Pretrain/Loss (Raw)": 1.8764233589172363, "Pretrain/Step": 8318, "Pretrain/Step Time": 8.67480019107461} +{"Pretrain/Learning Rate": 2.108270232789192e-06, "Pretrain/Loss": 1.9444365501403809, "Pretrain/Loss (Raw)": 1.8567827939987183, "Pretrain/Step": 8319, "Pretrain/Step Time": 8.674264051020145} +{"Pretrain/Learning Rate": 2.10485919481522e-06, "Pretrain/Loss": 1.9436898231506348, "Pretrain/Loss (Raw)": 1.7417222261428833, "Pretrain/Step": 8320, "Pretrain/Step Time": 8.673986457288265} +{"Pretrain/Learning Rate": 2.101450797216775e-06, "Pretrain/Loss": 1.942102313041687, "Pretrain/Loss (Raw)": 1.9396545886993408, "Pretrain/Step": 8321, "Pretrain/Step Time": 8.671060437336564} +{"Pretrain/Learning Rate": 2.098045040386923e-06, "Pretrain/Loss": 1.9432628154754639, "Pretrain/Loss (Raw)": 2.077561140060425, "Pretrain/Step": 8322, "Pretrain/Step Time": 8.671854678541422} +{"Pretrain/Learning Rate": 2.0946419247184435e-06, "Pretrain/Loss": 1.9438695907592773, "Pretrain/Loss (Raw)": 2.0175957679748535, "Pretrain/Step": 8323, "Pretrain/Step Time": 8.665695529431105} +{"Pretrain/Learning Rate": 2.0912414506037814e-06, "Pretrain/Loss": 1.9430345296859741, "Pretrain/Loss (Raw)": 1.8798655271530151, "Pretrain/Step": 8324, "Pretrain/Step Time": 8.659960184246302} +{"Pretrain/Learning Rate": 2.087843618435109e-06, "Pretrain/Loss": 1.941483497619629, "Pretrain/Loss (Raw)": 2.071239471435547, "Pretrain/Step": 8325, "Pretrain/Step Time": 8.662502409890294} +{"Pretrain/Learning Rate": 2.0844484286042744e-06, "Pretrain/Loss": 1.945330023765564, "Pretrain/Loss (Raw)": 2.2755980491638184, "Pretrain/Step": 8326, "Pretrain/Step Time": 8.65834479033947} +{"Pretrain/Learning Rate": 2.0810558815028303e-06, "Pretrain/Loss": 1.945530891418457, "Pretrain/Loss (Raw)": 1.9873988628387451, "Pretrain/Step": 8327, "Pretrain/Step Time": 8.663339095190167} +{"Pretrain/Learning Rate": 2.077665977522017e-06, "Pretrain/Loss": 1.9443652629852295, "Pretrain/Loss (Raw)": 1.9762094020843506, "Pretrain/Step": 8328, "Pretrain/Step Time": 8.666910327970982} +{"Pretrain/Learning Rate": 2.07427871705278e-06, "Pretrain/Loss": 1.941853642463684, "Pretrain/Loss (Raw)": 1.7362802028656006, "Pretrain/Step": 8329, "Pretrain/Step Time": 8.664321802556515} +{"Pretrain/Learning Rate": 2.0708941004857485e-06, "Pretrain/Loss": 1.94386887550354, "Pretrain/Loss (Raw)": 2.0587122440338135, "Pretrain/Step": 8330, "Pretrain/Step Time": 8.664373956620693} +{"Pretrain/Learning Rate": 2.0675121282112577e-06, "Pretrain/Loss": 1.9452168941497803, "Pretrain/Loss (Raw)": 1.994930624961853, "Pretrain/Step": 8331, "Pretrain/Step Time": 8.660451145842671} +{"Pretrain/Learning Rate": 2.064132800619323e-06, "Pretrain/Loss": 1.9444890022277832, "Pretrain/Loss (Raw)": 1.9836708307266235, "Pretrain/Step": 8332, "Pretrain/Step Time": 8.664384024217725} +{"Pretrain/Learning Rate": 2.0607561180996772e-06, "Pretrain/Loss": 1.9482662677764893, "Pretrain/Loss (Raw)": 2.1546857357025146, "Pretrain/Step": 8333, "Pretrain/Step Time": 8.66299601085484} +{"Pretrain/Learning Rate": 2.0573820810417283e-06, "Pretrain/Loss": 1.9451427459716797, "Pretrain/Loss (Raw)": 1.7315051555633545, "Pretrain/Step": 8334, "Pretrain/Step Time": 8.664961913600564} +{"Pretrain/Learning Rate": 2.0540106898345874e-06, "Pretrain/Loss": 1.948477864265442, "Pretrain/Loss (Raw)": 2.0803017616271973, "Pretrain/Step": 8335, "Pretrain/Step Time": 8.66618944145739} +{"Pretrain/Learning Rate": 2.0506419448670543e-06, "Pretrain/Loss": 1.945349097251892, "Pretrain/Loss (Raw)": 1.9397873878479004, "Pretrain/Step": 8336, "Pretrain/Step Time": 8.662844881415367} +{"Pretrain/Learning Rate": 2.047275846527638e-06, "Pretrain/Loss": 1.9434101581573486, "Pretrain/Loss (Raw)": 1.7135027647018433, "Pretrain/Step": 8337, "Pretrain/Step Time": 8.667404057458043} +{"Pretrain/Learning Rate": 2.043912395204525e-06, "Pretrain/Loss": 1.9441108703613281, "Pretrain/Loss (Raw)": 1.9101405143737793, "Pretrain/Step": 8338, "Pretrain/Step Time": 8.663556147366762} +{"Pretrain/Learning Rate": 2.040551591285611e-06, "Pretrain/Loss": 1.9453203678131104, "Pretrain/Loss (Raw)": 2.021848678588867, "Pretrain/Step": 8339, "Pretrain/Step Time": 8.661122892051935} +{"Pretrain/Learning Rate": 2.0371934351584716e-06, "Pretrain/Loss": 1.9458061456680298, "Pretrain/Loss (Raw)": 1.9468731880187988, "Pretrain/Step": 8340, "Pretrain/Step Time": 8.662644071504474} +{"Pretrain/Learning Rate": 2.0338379272103915e-06, "Pretrain/Loss": 1.940643310546875, "Pretrain/Loss (Raw)": 1.4185583591461182, "Pretrain/Step": 8341, "Pretrain/Step Time": 8.66884752176702} +{"Pretrain/Learning Rate": 2.0304850678283415e-06, "Pretrain/Loss": 1.94028902053833, "Pretrain/Loss (Raw)": 1.9689991474151611, "Pretrain/Step": 8342, "Pretrain/Step Time": 8.667637750506401} +{"Pretrain/Learning Rate": 2.027134857398991e-06, "Pretrain/Loss": 1.9431869983673096, "Pretrain/Loss (Raw)": 2.234391927719116, "Pretrain/Step": 8343, "Pretrain/Step Time": 8.671225298196077} +{"Pretrain/Learning Rate": 2.023787296308696e-06, "Pretrain/Loss": 1.943408727645874, "Pretrain/Loss (Raw)": 2.016188859939575, "Pretrain/Step": 8344, "Pretrain/Step Time": 8.665191924199462} +{"Pretrain/Learning Rate": 2.0204423849435216e-06, "Pretrain/Loss": 1.9442239999771118, "Pretrain/Loss (Raw)": 2.066068410873413, "Pretrain/Step": 8345, "Pretrain/Step Time": 8.664287969470024} +{"Pretrain/Learning Rate": 2.017100123689214e-06, "Pretrain/Loss": 1.9457933902740479, "Pretrain/Loss (Raw)": 2.2267708778381348, "Pretrain/Step": 8346, "Pretrain/Step Time": 8.659099956974387} +{"Pretrain/Learning Rate": 2.013760512931215e-06, "Pretrain/Loss": 1.9442017078399658, "Pretrain/Loss (Raw)": 1.8545249700546265, "Pretrain/Step": 8347, "Pretrain/Step Time": 8.659086048603058} +{"Pretrain/Learning Rate": 2.0104235530546743e-06, "Pretrain/Loss": 1.942651629447937, "Pretrain/Loss (Raw)": 2.010836362838745, "Pretrain/Step": 8348, "Pretrain/Step Time": 8.658089373260736} +{"Pretrain/Learning Rate": 2.0070892444444185e-06, "Pretrain/Loss": 1.945271611213684, "Pretrain/Loss (Raw)": 1.9863269329071045, "Pretrain/Step": 8349, "Pretrain/Step Time": 8.661494279280305} +{"Pretrain/Learning Rate": 2.0037575874849753e-06, "Pretrain/Loss": 1.945044755935669, "Pretrain/Loss (Raw)": 1.7336297035217285, "Pretrain/Step": 8350, "Pretrain/Step Time": 8.662119306623936} +{"Pretrain/Learning Rate": 2.0004285825605677e-06, "Pretrain/Loss": 1.9444539546966553, "Pretrain/Loss (Raw)": 1.933970332145691, "Pretrain/Step": 8351, "Pretrain/Step Time": 8.65999125316739} +{"Pretrain/Learning Rate": 1.9971022300551174e-06, "Pretrain/Loss": 1.948789358139038, "Pretrain/Loss (Raw)": 2.1093616485595703, "Pretrain/Step": 8352, "Pretrain/Step Time": 8.662292366847396} +{"Pretrain/Learning Rate": 1.9937785303522303e-06, "Pretrain/Loss": 1.9532084465026855, "Pretrain/Loss (Raw)": 2.227900743484497, "Pretrain/Step": 8353, "Pretrain/Step Time": 8.658667149022222} +{"Pretrain/Learning Rate": 1.990457483835212e-06, "Pretrain/Loss": 1.9513413906097412, "Pretrain/Loss (Raw)": 1.997213363647461, "Pretrain/Step": 8354, "Pretrain/Step Time": 8.657112451270223} +{"Pretrain/Learning Rate": 1.9871390908870554e-06, "Pretrain/Loss": 1.9518930912017822, "Pretrain/Loss (Raw)": 2.086772918701172, "Pretrain/Step": 8355, "Pretrain/Step Time": 8.65959733352065} +{"Pretrain/Learning Rate": 1.9838233518904655e-06, "Pretrain/Loss": 1.9493443965911865, "Pretrain/Loss (Raw)": 1.622697114944458, "Pretrain/Step": 8356, "Pretrain/Step Time": 8.661554807797074} +{"Pretrain/Learning Rate": 1.9805102672278226e-06, "Pretrain/Loss": 1.9509575366973877, "Pretrain/Loss (Raw)": 2.1235146522521973, "Pretrain/Step": 8357, "Pretrain/Step Time": 8.662680316716433} +{"Pretrain/Learning Rate": 1.9771998372812044e-06, "Pretrain/Loss": 1.9508347511291504, "Pretrain/Loss (Raw)": 1.8150086402893066, "Pretrain/Step": 8358, "Pretrain/Step Time": 8.66694507934153} +{"Pretrain/Learning Rate": 1.9738920624323862e-06, "Pretrain/Loss": 1.9508914947509766, "Pretrain/Loss (Raw)": 2.2136077880859375, "Pretrain/Step": 8359, "Pretrain/Step Time": 8.6693701967597} +{"Pretrain/Learning Rate": 1.9705869430628465e-06, "Pretrain/Loss": 1.9511266946792603, "Pretrain/Loss (Raw)": 1.8918644189834595, "Pretrain/Step": 8360, "Pretrain/Step Time": 8.668209861963987} +{"Pretrain/Learning Rate": 1.96728447955373e-06, "Pretrain/Loss": 1.9545433521270752, "Pretrain/Loss (Raw)": 2.130833148956299, "Pretrain/Step": 8361, "Pretrain/Step Time": 8.670469999313354} +{"Pretrain/Learning Rate": 1.963984672285904e-06, "Pretrain/Loss": 1.953006625175476, "Pretrain/Loss (Raw)": 1.7702617645263672, "Pretrain/Step": 8362, "Pretrain/Step Time": 8.672349331900477} +{"Pretrain/Learning Rate": 1.960687521639912e-06, "Pretrain/Loss": 1.9536631107330322, "Pretrain/Loss (Raw)": 1.9284279346466064, "Pretrain/Step": 8363, "Pretrain/Step Time": 8.669885881245136} +{"Pretrain/Learning Rate": 1.9573930279960073e-06, "Pretrain/Loss": 1.955084204673767, "Pretrain/Loss (Raw)": 1.9681342840194702, "Pretrain/Step": 8364, "Pretrain/Step Time": 8.667663872241974} +{"Pretrain/Learning Rate": 1.954101191734112e-06, "Pretrain/Loss": 1.956565022468567, "Pretrain/Loss (Raw)": 1.8953839540481567, "Pretrain/Step": 8365, "Pretrain/Step Time": 8.668220490217209} +{"Pretrain/Learning Rate": 1.9508120132338657e-06, "Pretrain/Loss": 1.9522416591644287, "Pretrain/Loss (Raw)": 1.7561410665512085, "Pretrain/Step": 8366, "Pretrain/Step Time": 8.672698982059956} +{"Pretrain/Learning Rate": 1.9475254928745883e-06, "Pretrain/Loss": 1.9504234790802002, "Pretrain/Loss (Raw)": 1.842903733253479, "Pretrain/Step": 8367, "Pretrain/Step Time": 8.66955721564591} +{"Pretrain/Learning Rate": 1.9442416310353012e-06, "Pretrain/Loss": 1.9521311521530151, "Pretrain/Loss (Raw)": 1.945502758026123, "Pretrain/Step": 8368, "Pretrain/Step Time": 8.673027459532022} +{"Pretrain/Learning Rate": 1.940960428094704e-06, "Pretrain/Loss": 1.9537978172302246, "Pretrain/Loss (Raw)": 2.2893049716949463, "Pretrain/Step": 8369, "Pretrain/Step Time": 8.66858865506947} +{"Pretrain/Learning Rate": 1.937681884431214e-06, "Pretrain/Loss": 1.953869342803955, "Pretrain/Loss (Raw)": 2.0122904777526855, "Pretrain/Step": 8370, "Pretrain/Step Time": 8.664397493004799} +{"Pretrain/Learning Rate": 1.9344060004229225e-06, "Pretrain/Loss": 1.9548816680908203, "Pretrain/Loss (Raw)": 1.9683058261871338, "Pretrain/Step": 8371, "Pretrain/Step Time": 8.669487157836556} +{"Pretrain/Learning Rate": 1.9311327764476196e-06, "Pretrain/Loss": 1.953768014907837, "Pretrain/Loss (Raw)": 1.9348024129867554, "Pretrain/Step": 8372, "Pretrain/Step Time": 8.67630230076611} +{"Pretrain/Learning Rate": 1.927862212882783e-06, "Pretrain/Loss": 1.955191969871521, "Pretrain/Loss (Raw)": 2.0736923217773438, "Pretrain/Step": 8373, "Pretrain/Step Time": 8.67380030080676} +{"Pretrain/Learning Rate": 1.9245943101056014e-06, "Pretrain/Loss": 1.9533171653747559, "Pretrain/Loss (Raw)": 2.118391752243042, "Pretrain/Step": 8374, "Pretrain/Step Time": 8.678596585988998} +{"Pretrain/Learning Rate": 1.9213290684929386e-06, "Pretrain/Loss": 1.9546661376953125, "Pretrain/Loss (Raw)": 2.10561203956604, "Pretrain/Step": 8375, "Pretrain/Step Time": 8.675601715222001} +{"Pretrain/Learning Rate": 1.9180664884213577e-06, "Pretrain/Loss": 1.956040620803833, "Pretrain/Loss (Raw)": 2.087479591369629, "Pretrain/Step": 8376, "Pretrain/Step Time": 8.67527699843049} +{"Pretrain/Learning Rate": 1.9148065702671108e-06, "Pretrain/Loss": 1.9572312831878662, "Pretrain/Loss (Raw)": 1.965563416481018, "Pretrain/Step": 8377, "Pretrain/Step Time": 8.674161126837134} +{"Pretrain/Learning Rate": 1.9115493144061555e-06, "Pretrain/Loss": 1.9570517539978027, "Pretrain/Loss (Raw)": 1.937111735343933, "Pretrain/Step": 8378, "Pretrain/Step Time": 8.673034539446235} +{"Pretrain/Learning Rate": 1.9082947212141293e-06, "Pretrain/Loss": 1.956845998764038, "Pretrain/Loss (Raw)": 1.9603939056396484, "Pretrain/Step": 8379, "Pretrain/Step Time": 8.66975886002183} +{"Pretrain/Learning Rate": 1.9050427910663693e-06, "Pretrain/Loss": 1.9538147449493408, "Pretrain/Loss (Raw)": 1.5278221368789673, "Pretrain/Step": 8380, "Pretrain/Step Time": 8.670229360461235} +{"Pretrain/Learning Rate": 1.901793524337897e-06, "Pretrain/Loss": 1.95353102684021, "Pretrain/Loss (Raw)": 1.836255669593811, "Pretrain/Step": 8381, "Pretrain/Step Time": 8.671429699286819} +{"Pretrain/Learning Rate": 1.8985469214034407e-06, "Pretrain/Loss": 1.9556903839111328, "Pretrain/Loss (Raw)": 1.9913537502288818, "Pretrain/Step": 8382, "Pretrain/Step Time": 8.66866840608418} +{"Pretrain/Learning Rate": 1.8953029826374119e-06, "Pretrain/Loss": 1.951224446296692, "Pretrain/Loss (Raw)": 1.2784513235092163, "Pretrain/Step": 8383, "Pretrain/Step Time": 8.669090632349253} +{"Pretrain/Learning Rate": 1.8920617084139142e-06, "Pretrain/Loss": 1.9494737386703491, "Pretrain/Loss (Raw)": 1.773870587348938, "Pretrain/Step": 8384, "Pretrain/Step Time": 8.66486064530909} +{"Pretrain/Learning Rate": 1.8888230991067457e-06, "Pretrain/Loss": 1.9496164321899414, "Pretrain/Loss (Raw)": 2.0331308841705322, "Pretrain/Step": 8385, "Pretrain/Step Time": 8.663804799318314} +{"Pretrain/Learning Rate": 1.885587155089405e-06, "Pretrain/Loss": 1.9494593143463135, "Pretrain/Loss (Raw)": 2.053557872772217, "Pretrain/Step": 8386, "Pretrain/Step Time": 8.66539123468101} +{"Pretrain/Learning Rate": 1.8823538767350712e-06, "Pretrain/Loss": 1.9509695768356323, "Pretrain/Loss (Raw)": 2.080315589904785, "Pretrain/Step": 8387, "Pretrain/Step Time": 8.661238433793187} +{"Pretrain/Learning Rate": 1.8791232644166212e-06, "Pretrain/Loss": 1.9487478733062744, "Pretrain/Loss (Raw)": 1.749725341796875, "Pretrain/Step": 8388, "Pretrain/Step Time": 8.6621358320117} +{"Pretrain/Learning Rate": 1.8758953185066264e-06, "Pretrain/Loss": 1.9506521224975586, "Pretrain/Loss (Raw)": 2.0877599716186523, "Pretrain/Step": 8389, "Pretrain/Step Time": 8.666016543284059} +{"Pretrain/Learning Rate": 1.87267003937735e-06, "Pretrain/Loss": 1.953230857849121, "Pretrain/Loss (Raw)": 2.255225658416748, "Pretrain/Step": 8390, "Pretrain/Step Time": 8.663277121260762} +{"Pretrain/Learning Rate": 1.8694474274007417e-06, "Pretrain/Loss": 1.9536951780319214, "Pretrain/Loss (Raw)": 2.061586618423462, "Pretrain/Step": 8391, "Pretrain/Step Time": 8.66255315952003} +{"Pretrain/Learning Rate": 1.8662274829484488e-06, "Pretrain/Loss": 1.9534218311309814, "Pretrain/Loss (Raw)": 2.00642991065979, "Pretrain/Step": 8392, "Pretrain/Step Time": 8.6646797824651} +{"Pretrain/Learning Rate": 1.8630102063918158e-06, "Pretrain/Loss": 1.9543851613998413, "Pretrain/Loss (Raw)": 1.9658315181732178, "Pretrain/Step": 8393, "Pretrain/Step Time": 8.663793632760644} +{"Pretrain/Learning Rate": 1.859795598101871e-06, "Pretrain/Loss": 1.9549586772918701, "Pretrain/Loss (Raw)": 2.049354314804077, "Pretrain/Step": 8394, "Pretrain/Step Time": 8.669954024255276} +{"Pretrain/Learning Rate": 1.8565836584493374e-06, "Pretrain/Loss": 1.9564133882522583, "Pretrain/Loss (Raw)": 1.7957288026809692, "Pretrain/Step": 8395, "Pretrain/Step Time": 8.671706521883607} +{"Pretrain/Learning Rate": 1.8533743878046295e-06, "Pretrain/Loss": 1.9540269374847412, "Pretrain/Loss (Raw)": 1.7779346704483032, "Pretrain/Step": 8396, "Pretrain/Step Time": 8.670968633145094} +{"Pretrain/Learning Rate": 1.8501677865378597e-06, "Pretrain/Loss": 1.9540960788726807, "Pretrain/Loss (Raw)": 1.7056599855422974, "Pretrain/Step": 8397, "Pretrain/Step Time": 8.6715073492378} +{"Pretrain/Learning Rate": 1.8469638550188267e-06, "Pretrain/Loss": 1.9553494453430176, "Pretrain/Loss (Raw)": 2.029261827468872, "Pretrain/Step": 8398, "Pretrain/Step Time": 8.668721066787839} +{"Pretrain/Learning Rate": 1.8437625936170239e-06, "Pretrain/Loss": 1.9556447267532349, "Pretrain/Loss (Raw)": 2.099482774734497, "Pretrain/Step": 8399, "Pretrain/Step Time": 8.66606374271214} +{"Pretrain/Learning Rate": 1.8405640027016307e-06, "Pretrain/Loss": 1.9544694423675537, "Pretrain/Loss (Raw)": 1.900357723236084, "Pretrain/Step": 8400, "Pretrain/Step Time": 8.665877148509026} +{"Pretrain/Learning Rate": 1.8373680826415358e-06, "Pretrain/Loss": 1.9546006917953491, "Pretrain/Loss (Raw)": 2.0310542583465576, "Pretrain/Step": 8401, "Pretrain/Step Time": 8.657207218930125} +{"Pretrain/Learning Rate": 1.8341748338052882e-06, "Pretrain/Loss": 1.9537278413772583, "Pretrain/Loss (Raw)": 2.055128335952759, "Pretrain/Step": 8402, "Pretrain/Step Time": 8.659860398620367} +{"Pretrain/Learning Rate": 1.8309842565611663e-06, "Pretrain/Loss": 1.952260971069336, "Pretrain/Loss (Raw)": 1.844207763671875, "Pretrain/Step": 8403, "Pretrain/Step Time": 8.661654759198427} +{"Pretrain/Learning Rate": 1.8277963512771112e-06, "Pretrain/Loss": 1.9528417587280273, "Pretrain/Loss (Raw)": 2.036705732345581, "Pretrain/Step": 8404, "Pretrain/Step Time": 8.662123696878552} +{"Pretrain/Learning Rate": 1.824611118320782e-06, "Pretrain/Loss": 1.953583002090454, "Pretrain/Loss (Raw)": 1.896011233329773, "Pretrain/Step": 8405, "Pretrain/Step Time": 8.661573145538568} +{"Pretrain/Learning Rate": 1.8214285580594931e-06, "Pretrain/Loss": 1.9549229145050049, "Pretrain/Loss (Raw)": 2.1060922145843506, "Pretrain/Step": 8406, "Pretrain/Step Time": 8.660708535462618} +{"Pretrain/Learning Rate": 1.8182486708602898e-06, "Pretrain/Loss": 1.955359697341919, "Pretrain/Loss (Raw)": 2.047236204147339, "Pretrain/Step": 8407, "Pretrain/Step Time": 8.6580216512084} +{"Pretrain/Learning Rate": 1.8150714570898868e-06, "Pretrain/Loss": 1.955794334411621, "Pretrain/Loss (Raw)": 2.0515480041503906, "Pretrain/Step": 8408, "Pretrain/Step Time": 8.65729253180325} +{"Pretrain/Learning Rate": 1.8118969171146915e-06, "Pretrain/Loss": 1.95735764503479, "Pretrain/Loss (Raw)": 1.8815110921859741, "Pretrain/Step": 8409, "Pretrain/Step Time": 8.659822275862098} +{"Pretrain/Learning Rate": 1.8087250513008082e-06, "Pretrain/Loss": 1.9590257406234741, "Pretrain/Loss (Raw)": 2.035048246383667, "Pretrain/Step": 8410, "Pretrain/Step Time": 8.660191852599382} +{"Pretrain/Learning Rate": 1.8055558600140354e-06, "Pretrain/Loss": 1.9596927165985107, "Pretrain/Loss (Raw)": 1.9708138704299927, "Pretrain/Step": 8411, "Pretrain/Step Time": 8.663295559585094} +{"Pretrain/Learning Rate": 1.8023893436198592e-06, "Pretrain/Loss": 1.9593112468719482, "Pretrain/Loss (Raw)": 2.0379638671875, "Pretrain/Step": 8412, "Pretrain/Step Time": 8.662872051820159} +{"Pretrain/Learning Rate": 1.7992255024834509e-06, "Pretrain/Loss": 1.9584259986877441, "Pretrain/Loss (Raw)": 1.9831781387329102, "Pretrain/Step": 8413, "Pretrain/Step Time": 8.662929320707917} +{"Pretrain/Learning Rate": 1.79606433696968e-06, "Pretrain/Loss": 1.9597628116607666, "Pretrain/Loss (Raw)": 1.9634870290756226, "Pretrain/Step": 8414, "Pretrain/Step Time": 8.664143435657024} +{"Pretrain/Learning Rate": 1.792905847443116e-06, "Pretrain/Loss": 1.9584156274795532, "Pretrain/Loss (Raw)": 1.996463656425476, "Pretrain/Step": 8415, "Pretrain/Step Time": 8.6610736399889} +{"Pretrain/Learning Rate": 1.7897500342680063e-06, "Pretrain/Loss": 1.9616122245788574, "Pretrain/Loss (Raw)": 2.2106242179870605, "Pretrain/Step": 8416, "Pretrain/Step Time": 8.657654032111168} +{"Pretrain/Learning Rate": 1.7865968978082903e-06, "Pretrain/Loss": 1.9609848260879517, "Pretrain/Loss (Raw)": 1.7102930545806885, "Pretrain/Step": 8417, "Pretrain/Step Time": 8.659121591597795} +{"Pretrain/Learning Rate": 1.7834464384276022e-06, "Pretrain/Loss": 1.959897756576538, "Pretrain/Loss (Raw)": 1.9954038858413696, "Pretrain/Step": 8418, "Pretrain/Step Time": 8.659689657390118} +{"Pretrain/Learning Rate": 1.7802986564892737e-06, "Pretrain/Loss": 1.9617842435836792, "Pretrain/Loss (Raw)": 2.0863234996795654, "Pretrain/Step": 8419, "Pretrain/Step Time": 8.660698557272553} +{"Pretrain/Learning Rate": 1.7771535523563198e-06, "Pretrain/Loss": 1.9631714820861816, "Pretrain/Loss (Raw)": 2.282668352127075, "Pretrain/Step": 8420, "Pretrain/Step Time": 8.66236012428999} +{"Pretrain/Learning Rate": 1.7740111263914478e-06, "Pretrain/Loss": 1.9645178318023682, "Pretrain/Loss (Raw)": 1.9642759561538696, "Pretrain/Step": 8421, "Pretrain/Step Time": 8.661061886698008} +{"Pretrain/Learning Rate": 1.7708713789570536e-06, "Pretrain/Loss": 1.9659762382507324, "Pretrain/Loss (Raw)": 2.1919641494750977, "Pretrain/Step": 8422, "Pretrain/Step Time": 8.660489562898874} +{"Pretrain/Learning Rate": 1.767734310415234e-06, "Pretrain/Loss": 1.9682438373565674, "Pretrain/Loss (Raw)": 2.0078024864196777, "Pretrain/Step": 8423, "Pretrain/Step Time": 8.66149302944541} +{"Pretrain/Learning Rate": 1.7645999211277686e-06, "Pretrain/Loss": 1.969040870666504, "Pretrain/Loss (Raw)": 2.0523202419281006, "Pretrain/Step": 8424, "Pretrain/Step Time": 8.658824125304818} +{"Pretrain/Learning Rate": 1.7614682114561298e-06, "Pretrain/Loss": 1.9680981636047363, "Pretrain/Loss (Raw)": 1.889083743095398, "Pretrain/Step": 8425, "Pretrain/Step Time": 8.667400479316711} +{"Pretrain/Learning Rate": 1.7583391817614757e-06, "Pretrain/Loss": 1.9668517112731934, "Pretrain/Loss (Raw)": 1.823669672012329, "Pretrain/Step": 8426, "Pretrain/Step Time": 8.67149979248643} +{"Pretrain/Learning Rate": 1.7552128324046707e-06, "Pretrain/Loss": 1.9683083295822144, "Pretrain/Loss (Raw)": 2.172421932220459, "Pretrain/Step": 8427, "Pretrain/Step Time": 8.672365218400955} +{"Pretrain/Learning Rate": 1.752089163746254e-06, "Pretrain/Loss": 1.9670190811157227, "Pretrain/Loss (Raw)": 1.8965009450912476, "Pretrain/Step": 8428, "Pretrain/Step Time": 8.672490909695625} +{"Pretrain/Learning Rate": 1.7489681761464565e-06, "Pretrain/Loss": 1.9659130573272705, "Pretrain/Loss (Raw)": 1.829193115234375, "Pretrain/Step": 8429, "Pretrain/Step Time": 8.66975549608469} +{"Pretrain/Learning Rate": 1.7458498699652186e-06, "Pretrain/Loss": 1.9667012691497803, "Pretrain/Loss (Raw)": 1.865908145904541, "Pretrain/Step": 8430, "Pretrain/Step Time": 8.668688109144568} +{"Pretrain/Learning Rate": 1.7427342455621498e-06, "Pretrain/Loss": 1.9672913551330566, "Pretrain/Loss (Raw)": 2.1212897300720215, "Pretrain/Step": 8431, "Pretrain/Step Time": 8.66231295093894} +{"Pretrain/Learning Rate": 1.7396213032965597e-06, "Pretrain/Loss": 1.9703930616378784, "Pretrain/Loss (Raw)": 2.048342227935791, "Pretrain/Step": 8432, "Pretrain/Step Time": 8.660744048655033} +{"Pretrain/Learning Rate": 1.7365110435274419e-06, "Pretrain/Loss": 1.967454433441162, "Pretrain/Loss (Raw)": 1.6976006031036377, "Pretrain/Step": 8433, "Pretrain/Step Time": 8.663371523842216} +{"Pretrain/Learning Rate": 1.733403466613498e-06, "Pretrain/Loss": 1.9657273292541504, "Pretrain/Loss (Raw)": 1.9554909467697144, "Pretrain/Step": 8434, "Pretrain/Step Time": 8.664323257282376} +{"Pretrain/Learning Rate": 1.7302985729131e-06, "Pretrain/Loss": 1.9675278663635254, "Pretrain/Loss (Raw)": 1.9798141717910767, "Pretrain/Step": 8435, "Pretrain/Step Time": 8.669941456988454} +{"Pretrain/Learning Rate": 1.7271963627843223e-06, "Pretrain/Loss": 1.967005968093872, "Pretrain/Loss (Raw)": 1.8385767936706543, "Pretrain/Step": 8436, "Pretrain/Step Time": 8.666195150464773} +{"Pretrain/Learning Rate": 1.7240968365849208e-06, "Pretrain/Loss": 1.9665324687957764, "Pretrain/Loss (Raw)": 1.9456952810287476, "Pretrain/Step": 8437, "Pretrain/Step Time": 8.66853441670537} +{"Pretrain/Learning Rate": 1.7209999946723564e-06, "Pretrain/Loss": 1.9654347896575928, "Pretrain/Loss (Raw)": 1.942335844039917, "Pretrain/Step": 8438, "Pretrain/Step Time": 8.672566901892424} +{"Pretrain/Learning Rate": 1.717905837403766e-06, "Pretrain/Loss": 1.9655675888061523, "Pretrain/Loss (Raw)": 2.0545830726623535, "Pretrain/Step": 8439, "Pretrain/Step Time": 8.666701216250658} +{"Pretrain/Learning Rate": 1.7148143651359833e-06, "Pretrain/Loss": 1.96583890914917, "Pretrain/Loss (Raw)": 1.972810983657837, "Pretrain/Step": 8440, "Pretrain/Step Time": 8.667877156287432} +{"Pretrain/Learning Rate": 1.711725578225526e-06, "Pretrain/Loss": 1.9651083946228027, "Pretrain/Loss (Raw)": 1.7014929056167603, "Pretrain/Step": 8441, "Pretrain/Step Time": 8.664220014587045} +{"Pretrain/Learning Rate": 1.708639477028623e-06, "Pretrain/Loss": 1.9635076522827148, "Pretrain/Loss (Raw)": 1.772474765777588, "Pretrain/Step": 8442, "Pretrain/Step Time": 8.66300642490387} +{"Pretrain/Learning Rate": 1.705556061901159e-06, "Pretrain/Loss": 1.960729956626892, "Pretrain/Loss (Raw)": 1.6516567468643188, "Pretrain/Step": 8443, "Pretrain/Step Time": 8.662718899548054} +{"Pretrain/Learning Rate": 1.7024753331987442e-06, "Pretrain/Loss": 1.9596638679504395, "Pretrain/Loss (Raw)": 1.9369621276855469, "Pretrain/Step": 8444, "Pretrain/Step Time": 8.660162128508091} +{"Pretrain/Learning Rate": 1.699397291276647e-06, "Pretrain/Loss": 1.9560282230377197, "Pretrain/Loss (Raw)": 1.5774567127227783, "Pretrain/Step": 8445, "Pretrain/Step Time": 8.660415967926383} +{"Pretrain/Learning Rate": 1.6963219364898613e-06, "Pretrain/Loss": 1.9576098918914795, "Pretrain/Loss (Raw)": 2.078869104385376, "Pretrain/Step": 8446, "Pretrain/Step Time": 8.656448315829039} +{"Pretrain/Learning Rate": 1.6932492691930312e-06, "Pretrain/Loss": 1.956305742263794, "Pretrain/Loss (Raw)": 1.6898726224899292, "Pretrain/Step": 8447, "Pretrain/Step Time": 8.658581830561161} +{"Pretrain/Learning Rate": 1.6901792897405233e-06, "Pretrain/Loss": 1.957442283630371, "Pretrain/Loss (Raw)": 1.8871957063674927, "Pretrain/Step": 8448, "Pretrain/Step Time": 8.658765519037843} +{"Pretrain/Learning Rate": 1.6871119984863765e-06, "Pretrain/Loss": 1.9580276012420654, "Pretrain/Loss (Raw)": 2.014556407928467, "Pretrain/Step": 8449, "Pretrain/Step Time": 8.658841393887997} +{"Pretrain/Learning Rate": 1.6840473957843355e-06, "Pretrain/Loss": 1.958160161972046, "Pretrain/Loss (Raw)": 2.094553232192993, "Pretrain/Step": 8450, "Pretrain/Step Time": 8.657708404585719} +{"Pretrain/Learning Rate": 1.6809854819878096e-06, "Pretrain/Loss": 1.9560483694076538, "Pretrain/Loss (Raw)": 1.7472660541534424, "Pretrain/Step": 8451, "Pretrain/Step Time": 8.659557512030005} +{"Pretrain/Learning Rate": 1.6779262574499243e-06, "Pretrain/Loss": 1.9562972784042358, "Pretrain/Loss (Raw)": 1.911730170249939, "Pretrain/Step": 8452, "Pretrain/Step Time": 8.657250836491585} +{"Pretrain/Learning Rate": 1.674869722523481e-06, "Pretrain/Loss": 1.9554945230484009, "Pretrain/Loss (Raw)": 1.9684813022613525, "Pretrain/Step": 8453, "Pretrain/Step Time": 8.658704375848174} +{"Pretrain/Learning Rate": 1.6718158775609727e-06, "Pretrain/Loss": 1.9519339799880981, "Pretrain/Loss (Raw)": 1.8198484182357788, "Pretrain/Step": 8454, "Pretrain/Step Time": 8.658448515459895} +{"Pretrain/Learning Rate": 1.6687647229145787e-06, "Pretrain/Loss": 1.9491091966629028, "Pretrain/Loss (Raw)": 1.6258270740509033, "Pretrain/Step": 8455, "Pretrain/Step Time": 8.659660553559661} +{"Pretrain/Learning Rate": 1.6657162589361814e-06, "Pretrain/Loss": 1.9488990306854248, "Pretrain/Loss (Raw)": 1.9493064880371094, "Pretrain/Step": 8456, "Pretrain/Step Time": 8.659672668203712} +{"Pretrain/Learning Rate": 1.6626704859773413e-06, "Pretrain/Loss": 1.9500718116760254, "Pretrain/Loss (Raw)": 1.8863911628723145, "Pretrain/Step": 8457, "Pretrain/Step Time": 8.659253422170877} +{"Pretrain/Learning Rate": 1.6596274043893078e-06, "Pretrain/Loss": 1.950463056564331, "Pretrain/Loss (Raw)": 2.108809232711792, "Pretrain/Step": 8458, "Pretrain/Step Time": 8.656997330486774} +{"Pretrain/Learning Rate": 1.6565870145230228e-06, "Pretrain/Loss": 1.9510775804519653, "Pretrain/Loss (Raw)": 2.0735788345336914, "Pretrain/Step": 8459, "Pretrain/Step Time": 8.659354401752353} +{"Pretrain/Learning Rate": 1.653549316729125e-06, "Pretrain/Loss": 1.9513943195343018, "Pretrain/Loss (Raw)": 2.024214029312134, "Pretrain/Step": 8460, "Pretrain/Step Time": 8.654979839920998} +{"Pretrain/Learning Rate": 1.6505143113579314e-06, "Pretrain/Loss": 1.9501034021377563, "Pretrain/Loss (Raw)": 1.9894495010375977, "Pretrain/Step": 8461, "Pretrain/Step Time": 8.654543731361628} +{"Pretrain/Learning Rate": 1.6474819987594536e-06, "Pretrain/Loss": 1.9526060819625854, "Pretrain/Loss (Raw)": 2.051856279373169, "Pretrain/Step": 8462, "Pretrain/Step Time": 8.650521269068122} +{"Pretrain/Learning Rate": 1.64445237928339e-06, "Pretrain/Loss": 1.95003080368042, "Pretrain/Loss (Raw)": 1.7506533861160278, "Pretrain/Step": 8463, "Pretrain/Step Time": 8.654109966009855} +{"Pretrain/Learning Rate": 1.6414254532791357e-06, "Pretrain/Loss": 1.9503583908081055, "Pretrain/Loss (Raw)": 1.9817206859588623, "Pretrain/Step": 8464, "Pretrain/Step Time": 8.655997775495052} +{"Pretrain/Learning Rate": 1.6384012210957672e-06, "Pretrain/Loss": 1.9523833990097046, "Pretrain/Loss (Raw)": 1.9727070331573486, "Pretrain/Step": 8465, "Pretrain/Step Time": 8.652536919340491} +{"Pretrain/Learning Rate": 1.6353796830820529e-06, "Pretrain/Loss": 1.9543113708496094, "Pretrain/Loss (Raw)": 2.156926393508911, "Pretrain/Step": 8466, "Pretrain/Step Time": 8.649524325504899} +{"Pretrain/Learning Rate": 1.6323608395864498e-06, "Pretrain/Loss": 1.95503568649292, "Pretrain/Loss (Raw)": 2.114556312561035, "Pretrain/Step": 8467, "Pretrain/Step Time": 8.651375690475106} +{"Pretrain/Learning Rate": 1.6293446909571075e-06, "Pretrain/Loss": 1.9543311595916748, "Pretrain/Loss (Raw)": 1.8566911220550537, "Pretrain/Step": 8468, "Pretrain/Step Time": 8.64888584986329} +{"Pretrain/Learning Rate": 1.6263312375418643e-06, "Pretrain/Loss": 1.9551466703414917, "Pretrain/Loss (Raw)": 1.5229434967041016, "Pretrain/Step": 8469, "Pretrain/Step Time": 8.644723681733012} +{"Pretrain/Learning Rate": 1.6233204796882368e-06, "Pretrain/Loss": 1.9544529914855957, "Pretrain/Loss (Raw)": 1.880202054977417, "Pretrain/Step": 8470, "Pretrain/Step Time": 8.645092319697142} +{"Pretrain/Learning Rate": 1.6203124177434497e-06, "Pretrain/Loss": 1.9510266780853271, "Pretrain/Loss (Raw)": 1.7958385944366455, "Pretrain/Step": 8471, "Pretrain/Step Time": 8.638579247519374} +{"Pretrain/Learning Rate": 1.6173070520544065e-06, "Pretrain/Loss": 1.9487955570220947, "Pretrain/Loss (Raw)": 1.730601191520691, "Pretrain/Step": 8472, "Pretrain/Step Time": 8.64390205591917} +{"Pretrain/Learning Rate": 1.6143043829676934e-06, "Pretrain/Loss": 1.948026180267334, "Pretrain/Loss (Raw)": 1.967578649520874, "Pretrain/Step": 8473, "Pretrain/Step Time": 8.640725621953607} +{"Pretrain/Learning Rate": 1.611304410829595e-06, "Pretrain/Loss": 1.9447085857391357, "Pretrain/Loss (Raw)": 1.802126169204712, "Pretrain/Step": 8474, "Pretrain/Step Time": 8.644073711708188} +{"Pretrain/Learning Rate": 1.6083071359860868e-06, "Pretrain/Loss": 1.9457499980926514, "Pretrain/Loss (Raw)": 1.9878194332122803, "Pretrain/Step": 8475, "Pretrain/Step Time": 8.645342556759715} +{"Pretrain/Learning Rate": 1.6053125587828233e-06, "Pretrain/Loss": 1.944260835647583, "Pretrain/Loss (Raw)": 1.8202251195907593, "Pretrain/Step": 8476, "Pretrain/Step Time": 8.645159909501672} +{"Pretrain/Learning Rate": 1.6023206795651557e-06, "Pretrain/Loss": 1.94402277469635, "Pretrain/Loss (Raw)": 1.9558643102645874, "Pretrain/Step": 8477, "Pretrain/Step Time": 8.640542730689049} +{"Pretrain/Learning Rate": 1.5993314986781166e-06, "Pretrain/Loss": 1.9452769756317139, "Pretrain/Loss (Raw)": 1.8941624164581299, "Pretrain/Step": 8478, "Pretrain/Step Time": 8.640158111229539} +{"Pretrain/Learning Rate": 1.5963450164664385e-06, "Pretrain/Loss": 1.9447754621505737, "Pretrain/Loss (Raw)": 1.8697768449783325, "Pretrain/Step": 8479, "Pretrain/Step Time": 8.641612516716123} +{"Pretrain/Learning Rate": 1.5933612332745373e-06, "Pretrain/Loss": 1.9441919326782227, "Pretrain/Loss (Raw)": 2.034668445587158, "Pretrain/Step": 8480, "Pretrain/Step Time": 8.637773487716913} +{"Pretrain/Learning Rate": 1.5903801494465131e-06, "Pretrain/Loss": 1.9415462017059326, "Pretrain/Loss (Raw)": 1.8892446756362915, "Pretrain/Step": 8481, "Pretrain/Step Time": 8.649370031431317} +{"Pretrain/Learning Rate": 1.5874017653261574e-06, "Pretrain/Loss": 1.9418998956680298, "Pretrain/Loss (Raw)": 2.0424866676330566, "Pretrain/Step": 8482, "Pretrain/Step Time": 8.64768965356052} +{"Pretrain/Learning Rate": 1.5844260812569621e-06, "Pretrain/Loss": 1.9420210123062134, "Pretrain/Loss (Raw)": 2.1022837162017822, "Pretrain/Step": 8483, "Pretrain/Step Time": 8.645932467654347} +{"Pretrain/Learning Rate": 1.5814530975820806e-06, "Pretrain/Loss": 1.946277379989624, "Pretrain/Loss (Raw)": 2.1674976348876953, "Pretrain/Step": 8484, "Pretrain/Step Time": 8.643245410174131} +{"Pretrain/Learning Rate": 1.578482814644383e-06, "Pretrain/Loss": 1.9450116157531738, "Pretrain/Loss (Raw)": 1.9615081548690796, "Pretrain/Step": 8485, "Pretrain/Step Time": 8.642248859629035} +{"Pretrain/Learning Rate": 1.5755152327864093e-06, "Pretrain/Loss": 1.9470096826553345, "Pretrain/Loss (Raw)": 2.0707592964172363, "Pretrain/Step": 8486, "Pretrain/Step Time": 8.636341897770762} +{"Pretrain/Learning Rate": 1.572550352350405e-06, "Pretrain/Loss": 1.9442291259765625, "Pretrain/Loss (Raw)": 1.8576961755752563, "Pretrain/Step": 8487, "Pretrain/Step Time": 8.638482579961419} +{"Pretrain/Learning Rate": 1.5695881736782825e-06, "Pretrain/Loss": 1.9458351135253906, "Pretrain/Loss (Raw)": 2.097429037094116, "Pretrain/Step": 8488, "Pretrain/Step Time": 8.638363944366574} +{"Pretrain/Learning Rate": 1.5666286971116605e-06, "Pretrain/Loss": 1.944925308227539, "Pretrain/Loss (Raw)": 2.0143864154815674, "Pretrain/Step": 8489, "Pretrain/Step Time": 8.635292369872332} +{"Pretrain/Learning Rate": 1.5636719229918385e-06, "Pretrain/Loss": 1.9426889419555664, "Pretrain/Loss (Raw)": 1.483995795249939, "Pretrain/Step": 8490, "Pretrain/Step Time": 8.633849566802382} +{"Pretrain/Learning Rate": 1.5607178516598126e-06, "Pretrain/Loss": 1.9427990913391113, "Pretrain/Loss (Raw)": 1.942521572113037, "Pretrain/Step": 8491, "Pretrain/Step Time": 8.632575005292892} +{"Pretrain/Learning Rate": 1.557766483456244e-06, "Pretrain/Loss": 1.9421576261520386, "Pretrain/Loss (Raw)": 1.8860338926315308, "Pretrain/Step": 8492, "Pretrain/Step Time": 8.6323151756078} +{"Pretrain/Learning Rate": 1.5548178187215128e-06, "Pretrain/Loss": 1.943033218383789, "Pretrain/Loss (Raw)": 2.007477045059204, "Pretrain/Step": 8493, "Pretrain/Step Time": 8.632102029398084} +{"Pretrain/Learning Rate": 1.5518718577956697e-06, "Pretrain/Loss": 1.94456148147583, "Pretrain/Loss (Raw)": 1.9517335891723633, "Pretrain/Step": 8494, "Pretrain/Step Time": 8.628150111064315} +{"Pretrain/Learning Rate": 1.5489286010184539e-06, "Pretrain/Loss": 1.945300579071045, "Pretrain/Loss (Raw)": 1.937530755996704, "Pretrain/Step": 8495, "Pretrain/Step Time": 8.630056401714683} +{"Pretrain/Learning Rate": 1.545988048729291e-06, "Pretrain/Loss": 1.9446347951889038, "Pretrain/Loss (Raw)": 1.8602778911590576, "Pretrain/Step": 8496, "Pretrain/Step Time": 8.62756716646254} +{"Pretrain/Learning Rate": 1.5430502012673126e-06, "Pretrain/Loss": 1.9417457580566406, "Pretrain/Loss (Raw)": 1.9195002317428589, "Pretrain/Step": 8497, "Pretrain/Step Time": 8.631025766953826} +{"Pretrain/Learning Rate": 1.5401150589713171e-06, "Pretrain/Loss": 1.9416546821594238, "Pretrain/Loss (Raw)": 2.0006206035614014, "Pretrain/Step": 8498, "Pretrain/Step Time": 8.63325790502131} +{"Pretrain/Learning Rate": 1.5371826221797975e-06, "Pretrain/Loss": 1.9431439638137817, "Pretrain/Loss (Raw)": 2.158944606781006, "Pretrain/Step": 8499, "Pretrain/Step Time": 8.629063986241817} +{"Pretrain/Learning Rate": 1.534252891230936e-06, "Pretrain/Loss": 1.9435782432556152, "Pretrain/Loss (Raw)": 1.9903810024261475, "Pretrain/Step": 8500, "Pretrain/Step Time": 8.628169538453221} +{"Pretrain/Learning Rate": 1.5313258664626073e-06, "Pretrain/Loss": 1.943469762802124, "Pretrain/Loss (Raw)": 2.059821367263794, "Pretrain/Step": 8501, "Pretrain/Step Time": 8.629209836944938} +{"Pretrain/Learning Rate": 1.5284015482123714e-06, "Pretrain/Loss": 1.9432220458984375, "Pretrain/Loss (Raw)": 2.0866875648498535, "Pretrain/Step": 8502, "Pretrain/Step Time": 8.627102263271809} +{"Pretrain/Learning Rate": 1.5254799368174672e-06, "Pretrain/Loss": 1.9431767463684082, "Pretrain/Loss (Raw)": 2.099806308746338, "Pretrain/Step": 8503, "Pretrain/Step Time": 8.629179978743196} +{"Pretrain/Learning Rate": 1.5225610326148304e-06, "Pretrain/Loss": 1.9417611360549927, "Pretrain/Loss (Raw)": 1.9062763452529907, "Pretrain/Step": 8504, "Pretrain/Step Time": 8.629659496247768} +{"Pretrain/Learning Rate": 1.5196448359410891e-06, "Pretrain/Loss": 1.9424116611480713, "Pretrain/Loss (Raw)": 2.0488383769989014, "Pretrain/Step": 8505, "Pretrain/Step Time": 8.632015971466899} +{"Pretrain/Learning Rate": 1.5167313471325468e-06, "Pretrain/Loss": 1.9408397674560547, "Pretrain/Loss (Raw)": 1.7359066009521484, "Pretrain/Step": 8506, "Pretrain/Step Time": 8.634006030857563} +{"Pretrain/Learning Rate": 1.513820566525201e-06, "Pretrain/Loss": 1.9420497417449951, "Pretrain/Loss (Raw)": 2.1152586936950684, "Pretrain/Step": 8507, "Pretrain/Step Time": 8.634773971512914} +{"Pretrain/Learning Rate": 1.510912494454736e-06, "Pretrain/Loss": 1.9431945085525513, "Pretrain/Loss (Raw)": 1.6743626594543457, "Pretrain/Step": 8508, "Pretrain/Step Time": 8.640110068023205} +{"Pretrain/Learning Rate": 1.5080071312565308e-06, "Pretrain/Loss": 1.9459044933319092, "Pretrain/Loss (Raw)": 2.183126926422119, "Pretrain/Step": 8509, "Pretrain/Step Time": 8.638128945603967} +{"Pretrain/Learning Rate": 1.5051044772656397e-06, "Pretrain/Loss": 1.9446957111358643, "Pretrain/Loss (Raw)": 1.8366291522979736, "Pretrain/Step": 8510, "Pretrain/Step Time": 8.637090908363461} +{"Pretrain/Learning Rate": 1.5022045328168088e-06, "Pretrain/Loss": 1.949070692062378, "Pretrain/Loss (Raw)": 1.8384648561477661, "Pretrain/Step": 8511, "Pretrain/Step Time": 8.634993338957429} +{"Pretrain/Learning Rate": 1.4993072982444816e-06, "Pretrain/Loss": 1.9530197381973267, "Pretrain/Loss (Raw)": 2.279344320297241, "Pretrain/Step": 8512, "Pretrain/Step Time": 8.642160011455417} +{"Pretrain/Learning Rate": 1.4964127738827744e-06, "Pretrain/Loss": 1.9519860744476318, "Pretrain/Loss (Raw)": 1.9008125066757202, "Pretrain/Step": 8513, "Pretrain/Step Time": 8.642588324844837} +{"Pretrain/Learning Rate": 1.4935209600654977e-06, "Pretrain/Loss": 1.9503612518310547, "Pretrain/Loss (Raw)": 1.8456006050109863, "Pretrain/Step": 8514, "Pretrain/Step Time": 8.641636168584228} +{"Pretrain/Learning Rate": 1.4906318571261484e-06, "Pretrain/Loss": 1.9493660926818848, "Pretrain/Loss (Raw)": 1.9529175758361816, "Pretrain/Step": 8515, "Pretrain/Step Time": 8.642677376046777} +{"Pretrain/Learning Rate": 1.4877454653979162e-06, "Pretrain/Loss": 1.9519295692443848, "Pretrain/Loss (Raw)": 2.0778470039367676, "Pretrain/Step": 8516, "Pretrain/Step Time": 8.643257737159729} +{"Pretrain/Learning Rate": 1.4848617852136676e-06, "Pretrain/Loss": 1.9504203796386719, "Pretrain/Loss (Raw)": 1.894580602645874, "Pretrain/Step": 8517, "Pretrain/Step Time": 8.64036638662219} +{"Pretrain/Learning Rate": 1.4819808169059674e-06, "Pretrain/Loss": 1.9485654830932617, "Pretrain/Loss (Raw)": 2.017812728881836, "Pretrain/Step": 8518, "Pretrain/Step Time": 8.644159508869052} +{"Pretrain/Learning Rate": 1.4791025608070552e-06, "Pretrain/Loss": 1.9470694065093994, "Pretrain/Loss (Raw)": 1.870096206665039, "Pretrain/Step": 8519, "Pretrain/Step Time": 8.645391792058945} +{"Pretrain/Learning Rate": 1.476227017248874e-06, "Pretrain/Loss": 1.9442992210388184, "Pretrain/Loss (Raw)": 1.651833415031433, "Pretrain/Step": 8520, "Pretrain/Step Time": 8.643267471343279} +{"Pretrain/Learning Rate": 1.4733541865630418e-06, "Pretrain/Loss": 1.942580223083496, "Pretrain/Loss (Raw)": 1.7458065748214722, "Pretrain/Step": 8521, "Pretrain/Step Time": 8.644084002822638} +{"Pretrain/Learning Rate": 1.4704840690808659e-06, "Pretrain/Loss": 1.9422942399978638, "Pretrain/Loss (Raw)": 2.012746572494507, "Pretrain/Step": 8522, "Pretrain/Step Time": 8.638811757788062} +{"Pretrain/Learning Rate": 1.4676166651333367e-06, "Pretrain/Loss": 1.9450289011001587, "Pretrain/Loss (Raw)": 2.145756483078003, "Pretrain/Step": 8523, "Pretrain/Step Time": 8.63707260787487} +{"Pretrain/Learning Rate": 1.4647519750511512e-06, "Pretrain/Loss": 1.945259690284729, "Pretrain/Loss (Raw)": 1.807481288909912, "Pretrain/Step": 8524, "Pretrain/Step Time": 8.63692114688456} +{"Pretrain/Learning Rate": 1.461889999164659e-06, "Pretrain/Loss": 1.9461175203323364, "Pretrain/Loss (Raw)": 1.8154687881469727, "Pretrain/Step": 8525, "Pretrain/Step Time": 8.636422250419855} +{"Pretrain/Learning Rate": 1.4590307378039348e-06, "Pretrain/Loss": 1.9443838596343994, "Pretrain/Loss (Raw)": 1.8073378801345825, "Pretrain/Step": 8526, "Pretrain/Step Time": 8.637305811047554} +{"Pretrain/Learning Rate": 1.4561741912987093e-06, "Pretrain/Loss": 1.9426705837249756, "Pretrain/Loss (Raw)": 1.880205750465393, "Pretrain/Step": 8527, "Pretrain/Step Time": 8.639995576813817} +{"Pretrain/Learning Rate": 1.4533203599784245e-06, "Pretrain/Loss": 1.9428575038909912, "Pretrain/Loss (Raw)": 1.9242753982543945, "Pretrain/Step": 8528, "Pretrain/Step Time": 8.649596964940429} +{"Pretrain/Learning Rate": 1.4504692441721867e-06, "Pretrain/Loss": 1.942091941833496, "Pretrain/Loss (Raw)": 1.9330655336380005, "Pretrain/Step": 8529, "Pretrain/Step Time": 8.64696397446096} +{"Pretrain/Learning Rate": 1.4476208442088052e-06, "Pretrain/Loss": 1.9353229999542236, "Pretrain/Loss (Raw)": 1.188692331314087, "Pretrain/Step": 8530, "Pretrain/Step Time": 8.645038990303874} +{"Pretrain/Learning Rate": 1.4447751604167697e-06, "Pretrain/Loss": 1.9364627599716187, "Pretrain/Loss (Raw)": 1.9901015758514404, "Pretrain/Step": 8531, "Pretrain/Step Time": 8.643162973225117} +{"Pretrain/Learning Rate": 1.4419321931242624e-06, "Pretrain/Loss": 1.9342916011810303, "Pretrain/Loss (Raw)": 1.758796215057373, "Pretrain/Step": 8532, "Pretrain/Step Time": 8.646283997222781} +{"Pretrain/Learning Rate": 1.4390919426591404e-06, "Pretrain/Loss": 1.9342992305755615, "Pretrain/Loss (Raw)": 1.8969762325286865, "Pretrain/Step": 8533, "Pretrain/Step Time": 8.644838089123368} +{"Pretrain/Learning Rate": 1.4362544093489583e-06, "Pretrain/Loss": 1.933103322982788, "Pretrain/Loss (Raw)": 1.9530236721038818, "Pretrain/Step": 8534, "Pretrain/Step Time": 8.643864769488573} +{"Pretrain/Learning Rate": 1.4334195935209572e-06, "Pretrain/Loss": 1.927950143814087, "Pretrain/Loss (Raw)": 1.3876458406448364, "Pretrain/Step": 8535, "Pretrain/Step Time": 8.64381667971611} +{"Pretrain/Learning Rate": 1.4305874955020559e-06, "Pretrain/Loss": 1.9273500442504883, "Pretrain/Loss (Raw)": 1.9747233390808105, "Pretrain/Step": 8536, "Pretrain/Step Time": 8.647095572203398} +{"Pretrain/Learning Rate": 1.427758115618863e-06, "Pretrain/Loss": 1.9285684823989868, "Pretrain/Loss (Raw)": 2.037477493286133, "Pretrain/Step": 8537, "Pretrain/Step Time": 8.644693620502949} +{"Pretrain/Learning Rate": 1.4249314541976866e-06, "Pretrain/Loss": 1.9284206628799438, "Pretrain/Loss (Raw)": 2.0161192417144775, "Pretrain/Step": 8538, "Pretrain/Step Time": 8.646749844774604} +{"Pretrain/Learning Rate": 1.422107511564502e-06, "Pretrain/Loss": 1.928585410118103, "Pretrain/Loss (Raw)": 1.9919003248214722, "Pretrain/Step": 8539, "Pretrain/Step Time": 8.645208362489939} +{"Pretrain/Learning Rate": 1.4192862880449825e-06, "Pretrain/Loss": 1.9297077655792236, "Pretrain/Loss (Raw)": 2.1816213130950928, "Pretrain/Step": 8540, "Pretrain/Step Time": 8.644749460741878} +{"Pretrain/Learning Rate": 1.4164677839644813e-06, "Pretrain/Loss": 1.9281768798828125, "Pretrain/Loss (Raw)": 1.7872463464736938, "Pretrain/Step": 8541, "Pretrain/Step Time": 8.644018085673451} +{"Pretrain/Learning Rate": 1.4136519996480469e-06, "Pretrain/Loss": 1.928454875946045, "Pretrain/Loss (Raw)": 1.999047875404358, "Pretrain/Step": 8542, "Pretrain/Step Time": 8.640865564346313} +{"Pretrain/Learning Rate": 1.4108389354204055e-06, "Pretrain/Loss": 1.9266784191131592, "Pretrain/Loss (Raw)": 1.7690895795822144, "Pretrain/Step": 8543, "Pretrain/Step Time": 8.644056288525462} +{"Pretrain/Learning Rate": 1.4080285916059754e-06, "Pretrain/Loss": 1.9248790740966797, "Pretrain/Loss (Raw)": 1.9803040027618408, "Pretrain/Step": 8544, "Pretrain/Step Time": 8.64362638629973} +{"Pretrain/Learning Rate": 1.405220968528853e-06, "Pretrain/Loss": 1.926491141319275, "Pretrain/Loss (Raw)": 1.916646122932434, "Pretrain/Step": 8545, "Pretrain/Step Time": 8.644878527149558} +{"Pretrain/Learning Rate": 1.402416066512835e-06, "Pretrain/Loss": 1.929598093032837, "Pretrain/Loss (Raw)": 2.393080234527588, "Pretrain/Step": 8546, "Pretrain/Step Time": 8.643391106277704} +{"Pretrain/Learning Rate": 1.3996138858813928e-06, "Pretrain/Loss": 1.9299869537353516, "Pretrain/Loss (Raw)": 2.1361043453216553, "Pretrain/Step": 8547, "Pretrain/Step Time": 8.647337527945638} +{"Pretrain/Learning Rate": 1.396814426957685e-06, "Pretrain/Loss": 1.9273762702941895, "Pretrain/Loss (Raw)": 1.948503851890564, "Pretrain/Step": 8548, "Pretrain/Step Time": 8.643156284466386} +{"Pretrain/Learning Rate": 1.394017690064553e-06, "Pretrain/Loss": 1.9263386726379395, "Pretrain/Loss (Raw)": 1.8314472436904907, "Pretrain/Step": 8549, "Pretrain/Step Time": 8.6408506706357} +{"Pretrain/Learning Rate": 1.3912236755245416e-06, "Pretrain/Loss": 1.92398202419281, "Pretrain/Loss (Raw)": 1.8903274536132812, "Pretrain/Step": 8550, "Pretrain/Step Time": 8.643089415505528} +{"Pretrain/Learning Rate": 1.3884323836598655e-06, "Pretrain/Loss": 1.9240349531173706, "Pretrain/Loss (Raw)": 2.0145797729492188, "Pretrain/Step": 8551, "Pretrain/Step Time": 8.644202552735806} +{"Pretrain/Learning Rate": 1.3856438147924229e-06, "Pretrain/Loss": 1.9218952655792236, "Pretrain/Loss (Raw)": 1.778436303138733, "Pretrain/Step": 8552, "Pretrain/Step Time": 8.643869519233704} +{"Pretrain/Learning Rate": 1.3828579692438142e-06, "Pretrain/Loss": 1.920729637145996, "Pretrain/Loss (Raw)": 1.7398940324783325, "Pretrain/Step": 8553, "Pretrain/Step Time": 8.633724473416805} +{"Pretrain/Learning Rate": 1.3800748473353137e-06, "Pretrain/Loss": 1.919992208480835, "Pretrain/Loss (Raw)": 1.729257345199585, "Pretrain/Step": 8554, "Pretrain/Step Time": 8.632236579433084} +{"Pretrain/Learning Rate": 1.377294449387881e-06, "Pretrain/Loss": 1.918154001235962, "Pretrain/Loss (Raw)": 1.9371401071548462, "Pretrain/Step": 8555, "Pretrain/Step Time": 8.62991545163095} +{"Pretrain/Learning Rate": 1.3745167757221622e-06, "Pretrain/Loss": 1.9170403480529785, "Pretrain/Loss (Raw)": 1.7539424896240234, "Pretrain/Step": 8556, "Pretrain/Step Time": 8.626858655363321} +{"Pretrain/Learning Rate": 1.3717418266585014e-06, "Pretrain/Loss": 1.9193856716156006, "Pretrain/Loss (Raw)": 2.1294121742248535, "Pretrain/Step": 8557, "Pretrain/Step Time": 8.630920266732574} +{"Pretrain/Learning Rate": 1.3689696025169118e-06, "Pretrain/Loss": 1.9192101955413818, "Pretrain/Loss (Raw)": 1.8434447050094604, "Pretrain/Step": 8558, "Pretrain/Step Time": 8.63700052537024} +{"Pretrain/Learning Rate": 1.366200103617099e-06, "Pretrain/Loss": 1.9156240224838257, "Pretrain/Loss (Raw)": 1.6622554063796997, "Pretrain/Step": 8559, "Pretrain/Step Time": 8.637279426679015} +{"Pretrain/Learning Rate": 1.3634333302784546e-06, "Pretrain/Loss": 1.914910078048706, "Pretrain/Loss (Raw)": 1.9569565057754517, "Pretrain/Step": 8560, "Pretrain/Step Time": 8.64411317743361} +{"Pretrain/Learning Rate": 1.3606692828200623e-06, "Pretrain/Loss": 1.9172682762145996, "Pretrain/Loss (Raw)": 1.9994474649429321, "Pretrain/Step": 8561, "Pretrain/Step Time": 8.644700957462192} +{"Pretrain/Learning Rate": 1.3579079615606781e-06, "Pretrain/Loss": 1.9168442487716675, "Pretrain/Loss (Raw)": 1.9012236595153809, "Pretrain/Step": 8562, "Pretrain/Step Time": 8.64044825360179} +{"Pretrain/Learning Rate": 1.355149366818756e-06, "Pretrain/Loss": 1.9163475036621094, "Pretrain/Loss (Raw)": 1.9162300825119019, "Pretrain/Step": 8563, "Pretrain/Step Time": 8.636322317644954} +{"Pretrain/Learning Rate": 1.3523934989124214e-06, "Pretrain/Loss": 1.9193155765533447, "Pretrain/Loss (Raw)": 2.21848201751709, "Pretrain/Step": 8564, "Pretrain/Step Time": 8.637793900445104} +{"Pretrain/Learning Rate": 1.3496403581595042e-06, "Pretrain/Loss": 1.9204192161560059, "Pretrain/Loss (Raw)": 2.0869557857513428, "Pretrain/Step": 8565, "Pretrain/Step Time": 8.639332573860884} +{"Pretrain/Learning Rate": 1.3468899448775023e-06, "Pretrain/Loss": 1.9196685552597046, "Pretrain/Loss (Raw)": 1.8462620973587036, "Pretrain/Step": 8566, "Pretrain/Step Time": 8.63919191621244} +{"Pretrain/Learning Rate": 1.3441422593836128e-06, "Pretrain/Loss": 1.9205272197723389, "Pretrain/Loss (Raw)": 2.164491653442383, "Pretrain/Step": 8567, "Pretrain/Step Time": 8.643100595101714} +{"Pretrain/Learning Rate": 1.3413973019947013e-06, "Pretrain/Loss": 1.919911503791809, "Pretrain/Loss (Raw)": 1.8940048217773438, "Pretrain/Step": 8568, "Pretrain/Step Time": 8.644133936613798} +{"Pretrain/Learning Rate": 1.3386550730273452e-06, "Pretrain/Loss": 1.9222464561462402, "Pretrain/Loss (Raw)": 2.0003626346588135, "Pretrain/Step": 8569, "Pretrain/Step Time": 8.646506190299988} +{"Pretrain/Learning Rate": 1.3359155727977745e-06, "Pretrain/Loss": 1.9246879816055298, "Pretrain/Loss (Raw)": 2.0849881172180176, "Pretrain/Step": 8570, "Pretrain/Step Time": 8.643678586930037} +{"Pretrain/Learning Rate": 1.3331788016219315e-06, "Pretrain/Loss": 1.9265432357788086, "Pretrain/Loss (Raw)": 1.8891327381134033, "Pretrain/Step": 8571, "Pretrain/Step Time": 8.65046419762075} +{"Pretrain/Learning Rate": 1.3304447598154274e-06, "Pretrain/Loss": 1.926223874092102, "Pretrain/Loss (Raw)": 1.8960726261138916, "Pretrain/Step": 8572, "Pretrain/Step Time": 8.64771980047226} +{"Pretrain/Learning Rate": 1.3277134476935766e-06, "Pretrain/Loss": 1.926456332206726, "Pretrain/Loss (Raw)": 1.6072183847427368, "Pretrain/Step": 8573, "Pretrain/Step Time": 8.647803794592619} +{"Pretrain/Learning Rate": 1.324984865571352e-06, "Pretrain/Loss": 1.9251506328582764, "Pretrain/Loss (Raw)": 1.9117262363433838, "Pretrain/Step": 8574, "Pretrain/Step Time": 8.653998686000705} +{"Pretrain/Learning Rate": 1.3222590137634328e-06, "Pretrain/Loss": 1.9249836206436157, "Pretrain/Loss (Raw)": 1.6685079336166382, "Pretrain/Step": 8575, "Pretrain/Step Time": 8.653394471853971} +{"Pretrain/Learning Rate": 1.319535892584181e-06, "Pretrain/Loss": 1.9261701107025146, "Pretrain/Loss (Raw)": 2.039076805114746, "Pretrain/Step": 8576, "Pretrain/Step Time": 8.653895167633891} +{"Pretrain/Learning Rate": 1.3168155023476348e-06, "Pretrain/Loss": 1.9252517223358154, "Pretrain/Loss (Raw)": 1.8969935178756714, "Pretrain/Step": 8577, "Pretrain/Step Time": 8.651008723303676} +{"Pretrain/Learning Rate": 1.3140978433675206e-06, "Pretrain/Loss": 1.9208037853240967, "Pretrain/Loss (Raw)": 1.5252240896224976, "Pretrain/Step": 8578, "Pretrain/Step Time": 8.653297524899244} +{"Pretrain/Learning Rate": 1.3113829159572572e-06, "Pretrain/Loss": 1.9225132465362549, "Pretrain/Loss (Raw)": 1.9660677909851074, "Pretrain/Step": 8579, "Pretrain/Step Time": 8.651040818542242} +{"Pretrain/Learning Rate": 1.3086707204299414e-06, "Pretrain/Loss": 1.9212960004806519, "Pretrain/Loss (Raw)": 1.7559239864349365, "Pretrain/Step": 8580, "Pretrain/Step Time": 8.65520247258246} +{"Pretrain/Learning Rate": 1.3059612570983537e-06, "Pretrain/Loss": 1.9206974506378174, "Pretrain/Loss (Raw)": 1.891866683959961, "Pretrain/Step": 8581, "Pretrain/Step Time": 8.660327387973666} +{"Pretrain/Learning Rate": 1.3032545262749635e-06, "Pretrain/Loss": 1.9173134565353394, "Pretrain/Loss (Raw)": 1.3867043256759644, "Pretrain/Step": 8582, "Pretrain/Step Time": 8.662339577451348} +{"Pretrain/Learning Rate": 1.3005505282719238e-06, "Pretrain/Loss": 1.919824481010437, "Pretrain/Loss (Raw)": 1.9472343921661377, "Pretrain/Step": 8583, "Pretrain/Step Time": 8.656078880652785} +{"Pretrain/Learning Rate": 1.297849263401074e-06, "Pretrain/Loss": 1.9196841716766357, "Pretrain/Loss (Raw)": 1.9313398599624634, "Pretrain/Step": 8584, "Pretrain/Step Time": 8.654342744499445} +{"Pretrain/Learning Rate": 1.2951507319739375e-06, "Pretrain/Loss": 1.9222722053527832, "Pretrain/Loss (Raw)": 2.217651128768921, "Pretrain/Step": 8585, "Pretrain/Step Time": 8.655993102118373} +{"Pretrain/Learning Rate": 1.2924549343017122e-06, "Pretrain/Loss": 1.9217804670333862, "Pretrain/Loss (Raw)": 2.0458784103393555, "Pretrain/Step": 8586, "Pretrain/Step Time": 8.65667220018804} +{"Pretrain/Learning Rate": 1.289761870695305e-06, "Pretrain/Loss": 1.9219645261764526, "Pretrain/Loss (Raw)": 2.097140073776245, "Pretrain/Step": 8587, "Pretrain/Step Time": 8.656409114599228} +{"Pretrain/Learning Rate": 1.2870715414652817e-06, "Pretrain/Loss": 1.9193276166915894, "Pretrain/Loss (Raw)": 1.6866908073425293, "Pretrain/Step": 8588, "Pretrain/Step Time": 8.661445258185267} +{"Pretrain/Learning Rate": 1.2843839469219104e-06, "Pretrain/Loss": 1.9177582263946533, "Pretrain/Loss (Raw)": 1.7885733842849731, "Pretrain/Step": 8589, "Pretrain/Step Time": 8.661997150629759} +{"Pretrain/Learning Rate": 1.2816990873751267e-06, "Pretrain/Loss": 1.914962887763977, "Pretrain/Loss (Raw)": 1.6940442323684692, "Pretrain/Step": 8590, "Pretrain/Step Time": 8.664878021925688} +{"Pretrain/Learning Rate": 1.2790169631345744e-06, "Pretrain/Loss": 1.9180099964141846, "Pretrain/Loss (Raw)": 2.1406891345977783, "Pretrain/Step": 8591, "Pretrain/Step Time": 8.6617486551404} +{"Pretrain/Learning Rate": 1.2763375745095645e-06, "Pretrain/Loss": 1.917952299118042, "Pretrain/Loss (Raw)": 1.9743319749832153, "Pretrain/Step": 8592, "Pretrain/Step Time": 8.665542218834162} +{"Pretrain/Learning Rate": 1.2736609218090888e-06, "Pretrain/Loss": 1.9168477058410645, "Pretrain/Loss (Raw)": 1.8313158750534058, "Pretrain/Step": 8593, "Pretrain/Step Time": 8.664186496287584} +{"Pretrain/Learning Rate": 1.2709870053418421e-06, "Pretrain/Loss": 1.9141154289245605, "Pretrain/Loss (Raw)": 1.807202935218811, "Pretrain/Step": 8594, "Pretrain/Step Time": 8.665611354634166} +{"Pretrain/Learning Rate": 1.2683158254161887e-06, "Pretrain/Loss": 1.9136993885040283, "Pretrain/Loss (Raw)": 2.0612998008728027, "Pretrain/Step": 8595, "Pretrain/Step Time": 8.66233996488154} +{"Pretrain/Learning Rate": 1.2656473823401821e-06, "Pretrain/Loss": 1.9134684801101685, "Pretrain/Loss (Raw)": 1.8271405696868896, "Pretrain/Step": 8596, "Pretrain/Step Time": 8.663324357941747} +{"Pretrain/Learning Rate": 1.2629816764215542e-06, "Pretrain/Loss": 1.9161231517791748, "Pretrain/Loss (Raw)": 1.862727403640747, "Pretrain/Step": 8597, "Pretrain/Step Time": 8.66304006241262} +{"Pretrain/Learning Rate": 1.2603187079677392e-06, "Pretrain/Loss": 1.9175645112991333, "Pretrain/Loss (Raw)": 2.064706802368164, "Pretrain/Step": 8598, "Pretrain/Step Time": 8.662354739382863} +{"Pretrain/Learning Rate": 1.2576584772858307e-06, "Pretrain/Loss": 1.9193997383117676, "Pretrain/Loss (Raw)": 2.0307559967041016, "Pretrain/Step": 8599, "Pretrain/Step Time": 8.66703063249588} +{"Pretrain/Learning Rate": 1.2550009846826277e-06, "Pretrain/Loss": 1.9230133295059204, "Pretrain/Loss (Raw)": 2.193127393722534, "Pretrain/Step": 8600, "Pretrain/Step Time": 8.664716113358736} +{"Pretrain/Learning Rate": 1.2523462304645961e-06, "Pretrain/Loss": 1.9209399223327637, "Pretrain/Loss (Raw)": 1.702185869216919, "Pretrain/Step": 8601, "Pretrain/Step Time": 8.664836924523115} +{"Pretrain/Learning Rate": 1.2496942149379048e-06, "Pretrain/Loss": 1.922461986541748, "Pretrain/Loss (Raw)": 1.996941089630127, "Pretrain/Step": 8602, "Pretrain/Step Time": 8.664409605786204} +{"Pretrain/Learning Rate": 1.2470449384083927e-06, "Pretrain/Loss": 1.9212068319320679, "Pretrain/Loss (Raw)": 1.827165961265564, "Pretrain/Step": 8603, "Pretrain/Step Time": 8.663769153878093} +{"Pretrain/Learning Rate": 1.2443984011815845e-06, "Pretrain/Loss": 1.9225609302520752, "Pretrain/Loss (Raw)": 1.9935626983642578, "Pretrain/Step": 8604, "Pretrain/Step Time": 8.665230503305793} +{"Pretrain/Learning Rate": 1.2417546035626864e-06, "Pretrain/Loss": 1.9234669208526611, "Pretrain/Loss (Raw)": 2.071807622909546, "Pretrain/Step": 8605, "Pretrain/Step Time": 8.669942392036319} +{"Pretrain/Learning Rate": 1.2391135458566072e-06, "Pretrain/Loss": 1.9232702255249023, "Pretrain/Loss (Raw)": 1.8690016269683838, "Pretrain/Step": 8606, "Pretrain/Step Time": 8.669455932453275} +{"Pretrain/Learning Rate": 1.236475228367917e-06, "Pretrain/Loss": 1.9232122898101807, "Pretrain/Loss (Raw)": 1.8623580932617188, "Pretrain/Step": 8607, "Pretrain/Step Time": 8.66764166019857} +{"Pretrain/Learning Rate": 1.2338396514008839e-06, "Pretrain/Loss": 1.9237489700317383, "Pretrain/Loss (Raw)": 2.1033642292022705, "Pretrain/Step": 8608, "Pretrain/Step Time": 8.668554874137044} +{"Pretrain/Learning Rate": 1.2312068152594447e-06, "Pretrain/Loss": 1.9241541624069214, "Pretrain/Loss (Raw)": 1.9410992860794067, "Pretrain/Step": 8609, "Pretrain/Step Time": 8.661134988069534} +{"Pretrain/Learning Rate": 1.228576720247246e-06, "Pretrain/Loss": 1.924526333808899, "Pretrain/Loss (Raw)": 2.090132713317871, "Pretrain/Step": 8610, "Pretrain/Step Time": 8.664152167737484} +{"Pretrain/Learning Rate": 1.2259493666675891e-06, "Pretrain/Loss": 1.9243806600570679, "Pretrain/Loss (Raw)": 2.0836479663848877, "Pretrain/Step": 8611, "Pretrain/Step Time": 8.664270063862205} +{"Pretrain/Learning Rate": 1.2233247548234795e-06, "Pretrain/Loss": 1.9217253923416138, "Pretrain/Loss (Raw)": 1.8276114463806152, "Pretrain/Step": 8612, "Pretrain/Step Time": 8.66566687822342} +{"Pretrain/Learning Rate": 1.2207028850175967e-06, "Pretrain/Loss": 1.92084538936615, "Pretrain/Loss (Raw)": 1.848865032196045, "Pretrain/Step": 8613, "Pretrain/Step Time": 8.66914357803762} +{"Pretrain/Learning Rate": 1.2180837575523158e-06, "Pretrain/Loss": 1.9200115203857422, "Pretrain/Loss (Raw)": 1.9640270471572876, "Pretrain/Step": 8614, "Pretrain/Step Time": 8.669649291783571} +{"Pretrain/Learning Rate": 1.2154673727296728e-06, "Pretrain/Loss": 1.9208751916885376, "Pretrain/Loss (Raw)": 1.9682508707046509, "Pretrain/Step": 8615, "Pretrain/Step Time": 8.672995818778872} +{"Pretrain/Learning Rate": 1.21285373085141e-06, "Pretrain/Loss": 1.917945146560669, "Pretrain/Loss (Raw)": 1.722365379333496, "Pretrain/Step": 8616, "Pretrain/Step Time": 8.668747298419476} +{"Pretrain/Learning Rate": 1.2102428322189468e-06, "Pretrain/Loss": 1.9167499542236328, "Pretrain/Loss (Raw)": 1.8614169359207153, "Pretrain/Step": 8617, "Pretrain/Step Time": 8.667902676388621} +{"Pretrain/Learning Rate": 1.207634677133379e-06, "Pretrain/Loss": 1.9198453426361084, "Pretrain/Loss (Raw)": 1.8802016973495483, "Pretrain/Step": 8618, "Pretrain/Step Time": 8.669663229957223} +{"Pretrain/Learning Rate": 1.205029265895491e-06, "Pretrain/Loss": 1.9198006391525269, "Pretrain/Loss (Raw)": 1.9368046522140503, "Pretrain/Step": 8619, "Pretrain/Step Time": 8.672498013824224} +{"Pretrain/Learning Rate": 1.2024265988057588e-06, "Pretrain/Loss": 1.9180359840393066, "Pretrain/Loss (Raw)": 1.6601403951644897, "Pretrain/Step": 8620, "Pretrain/Step Time": 8.679758226498961} +{"Pretrain/Learning Rate": 1.1998266761643256e-06, "Pretrain/Loss": 1.9186899662017822, "Pretrain/Loss (Raw)": 2.0911903381347656, "Pretrain/Step": 8621, "Pretrain/Step Time": 8.676261665299535} +{"Pretrain/Learning Rate": 1.1972294982710326e-06, "Pretrain/Loss": 1.9199504852294922, "Pretrain/Loss (Raw)": 2.113086700439453, "Pretrain/Step": 8622, "Pretrain/Step Time": 8.677554178982973} +{"Pretrain/Learning Rate": 1.1946350654253924e-06, "Pretrain/Loss": 1.9191393852233887, "Pretrain/Loss (Raw)": 1.8337196111679077, "Pretrain/Step": 8623, "Pretrain/Step Time": 8.677534842863679} +{"Pretrain/Learning Rate": 1.192043377926616e-06, "Pretrain/Loss": 1.9206111431121826, "Pretrain/Loss (Raw)": 2.0486600399017334, "Pretrain/Step": 8624, "Pretrain/Step Time": 8.672479813918471} +{"Pretrain/Learning Rate": 1.189454436073581e-06, "Pretrain/Loss": 1.9200819730758667, "Pretrain/Loss (Raw)": 1.851761817932129, "Pretrain/Step": 8625, "Pretrain/Step Time": 8.672647219151258} +{"Pretrain/Learning Rate": 1.1868682401648595e-06, "Pretrain/Loss": 1.920647144317627, "Pretrain/Loss (Raw)": 2.0729660987854004, "Pretrain/Step": 8626, "Pretrain/Step Time": 8.671430073678493} +{"Pretrain/Learning Rate": 1.184284790498702e-06, "Pretrain/Loss": 1.9191080331802368, "Pretrain/Loss (Raw)": 1.9619414806365967, "Pretrain/Step": 8627, "Pretrain/Step Time": 8.670432602986693} +{"Pretrain/Learning Rate": 1.1817040873730506e-06, "Pretrain/Loss": 1.919684886932373, "Pretrain/Loss (Raw)": 2.0642049312591553, "Pretrain/Step": 8628, "Pretrain/Step Time": 8.66560940258205} +{"Pretrain/Learning Rate": 1.1791261310855172e-06, "Pretrain/Loss": 1.918792963027954, "Pretrain/Loss (Raw)": 1.9456565380096436, "Pretrain/Step": 8629, "Pretrain/Step Time": 8.664258774369955} +{"Pretrain/Learning Rate": 1.1765509219334058e-06, "Pretrain/Loss": 1.9166442155838013, "Pretrain/Loss (Raw)": 1.811646580696106, "Pretrain/Step": 8630, "Pretrain/Step Time": 8.665868420153856} +{"Pretrain/Learning Rate": 1.1739784602136983e-06, "Pretrain/Loss": 1.9133577346801758, "Pretrain/Loss (Raw)": 1.6791483163833618, "Pretrain/Step": 8631, "Pretrain/Step Time": 8.669063927605748} +{"Pretrain/Learning Rate": 1.171408746223071e-06, "Pretrain/Loss": 1.914649486541748, "Pretrain/Loss (Raw)": 2.0716116428375244, "Pretrain/Step": 8632, "Pretrain/Step Time": 8.673725459724665} +{"Pretrain/Learning Rate": 1.1688417802578706e-06, "Pretrain/Loss": 1.9135375022888184, "Pretrain/Loss (Raw)": 1.9065124988555908, "Pretrain/Step": 8633, "Pretrain/Step Time": 8.66862159408629} +{"Pretrain/Learning Rate": 1.1662775626141293e-06, "Pretrain/Loss": 1.915041208267212, "Pretrain/Loss (Raw)": 1.9283720254898071, "Pretrain/Step": 8634, "Pretrain/Step Time": 8.66608682833612} +{"Pretrain/Learning Rate": 1.1637160935875717e-06, "Pretrain/Loss": 1.915088415145874, "Pretrain/Loss (Raw)": 2.121307373046875, "Pretrain/Step": 8635, "Pretrain/Step Time": 8.666470058262348} +{"Pretrain/Learning Rate": 1.1611573734735925e-06, "Pretrain/Loss": 1.91670823097229, "Pretrain/Loss (Raw)": 1.881695032119751, "Pretrain/Step": 8636, "Pretrain/Step Time": 8.664385812357068} +{"Pretrain/Learning Rate": 1.1586014025672775e-06, "Pretrain/Loss": 1.9160842895507812, "Pretrain/Loss (Raw)": 2.103257417678833, "Pretrain/Step": 8637, "Pretrain/Step Time": 8.66912654787302} +{"Pretrain/Learning Rate": 1.1560481811633912e-06, "Pretrain/Loss": 1.91630220413208, "Pretrain/Loss (Raw)": 1.8645228147506714, "Pretrain/Step": 8638, "Pretrain/Step Time": 8.668192371726036} +{"Pretrain/Learning Rate": 1.1534977095563892e-06, "Pretrain/Loss": 1.9171717166900635, "Pretrain/Loss (Raw)": 1.9497758150100708, "Pretrain/Step": 8639, "Pretrain/Step Time": 8.667095987126231} +{"Pretrain/Learning Rate": 1.1509499880403979e-06, "Pretrain/Loss": 1.9134491682052612, "Pretrain/Loss (Raw)": 1.8028484582901, "Pretrain/Step": 8640, "Pretrain/Step Time": 8.659847835078835} +{"Pretrain/Learning Rate": 1.1484050169092347e-06, "Pretrain/Loss": 1.9137732982635498, "Pretrain/Loss (Raw)": 1.9423099756240845, "Pretrain/Step": 8641, "Pretrain/Step Time": 8.666437709704041} +{"Pretrain/Learning Rate": 1.1458627964563928e-06, "Pretrain/Loss": 1.9155452251434326, "Pretrain/Loss (Raw)": 2.0724122524261475, "Pretrain/Step": 8642, "Pretrain/Step Time": 8.666039308533072} +{"Pretrain/Learning Rate": 1.1433233269750627e-06, "Pretrain/Loss": 1.915726661682129, "Pretrain/Loss (Raw)": 1.9761333465576172, "Pretrain/Step": 8643, "Pretrain/Step Time": 8.662173260003328} +{"Pretrain/Learning Rate": 1.1407866087581043e-06, "Pretrain/Loss": 1.916195273399353, "Pretrain/Loss (Raw)": 2.1378228664398193, "Pretrain/Step": 8644, "Pretrain/Step Time": 8.663504840806127} +{"Pretrain/Learning Rate": 1.1382526420980588e-06, "Pretrain/Loss": 1.9169230461120605, "Pretrain/Loss (Raw)": 1.9877547025680542, "Pretrain/Step": 8645, "Pretrain/Step Time": 8.66304192878306} +{"Pretrain/Learning Rate": 1.135721427287159e-06, "Pretrain/Loss": 1.9170455932617188, "Pretrain/Loss (Raw)": 2.033480405807495, "Pretrain/Step": 8646, "Pretrain/Step Time": 8.661703210324049} +{"Pretrain/Learning Rate": 1.1331929646173162e-06, "Pretrain/Loss": 1.9171746969223022, "Pretrain/Loss (Raw)": 1.886625051498413, "Pretrain/Step": 8647, "Pretrain/Step Time": 8.6585658993572} +{"Pretrain/Learning Rate": 1.1306672543801273e-06, "Pretrain/Loss": 1.9169328212738037, "Pretrain/Loss (Raw)": 1.6208597421646118, "Pretrain/Step": 8648, "Pretrain/Step Time": 8.662529626861215} +{"Pretrain/Learning Rate": 1.1281442968668648e-06, "Pretrain/Loss": 1.918359637260437, "Pretrain/Loss (Raw)": 1.928452968597412, "Pretrain/Step": 8649, "Pretrain/Step Time": 8.661079121753573} +{"Pretrain/Learning Rate": 1.125624092368488e-06, "Pretrain/Loss": 1.918940782546997, "Pretrain/Loss (Raw)": 2.087136745452881, "Pretrain/Step": 8650, "Pretrain/Step Time": 8.666111780330539} +{"Pretrain/Learning Rate": 1.1231066411756475e-06, "Pretrain/Loss": 1.918937087059021, "Pretrain/Loss (Raw)": 2.1452906131744385, "Pretrain/Step": 8651, "Pretrain/Step Time": 8.666533136740327} +{"Pretrain/Learning Rate": 1.1205919435786554e-06, "Pretrain/Loss": 1.9186487197875977, "Pretrain/Loss (Raw)": 1.7705696821212769, "Pretrain/Step": 8652, "Pretrain/Step Time": 8.669406782835722} +{"Pretrain/Learning Rate": 1.1180799998675245e-06, "Pretrain/Loss": 1.9204790592193604, "Pretrain/Loss (Raw)": 2.049750328063965, "Pretrain/Step": 8653, "Pretrain/Step Time": 8.666728338226676} +{"Pretrain/Learning Rate": 1.1155708103319395e-06, "Pretrain/Loss": 1.9222474098205566, "Pretrain/Loss (Raw)": 2.0336830615997314, "Pretrain/Step": 8654, "Pretrain/Step Time": 8.666730381548405} +{"Pretrain/Learning Rate": 1.1130643752612858e-06, "Pretrain/Loss": 1.9235734939575195, "Pretrain/Loss (Raw)": 2.0499470233917236, "Pretrain/Step": 8655, "Pretrain/Step Time": 8.667683636769652} +{"Pretrain/Learning Rate": 1.1105606949445984e-06, "Pretrain/Loss": 1.9224934577941895, "Pretrain/Loss (Raw)": 1.7860301733016968, "Pretrain/Step": 8656, "Pretrain/Step Time": 8.65784771554172} +{"Pretrain/Learning Rate": 1.1080597696706247e-06, "Pretrain/Loss": 1.9228246212005615, "Pretrain/Loss (Raw)": 1.9754480123519897, "Pretrain/Step": 8657, "Pretrain/Step Time": 8.665018497034907} +{"Pretrain/Learning Rate": 1.1055615997277806e-06, "Pretrain/Loss": 1.9284757375717163, "Pretrain/Loss (Raw)": 1.9120385646820068, "Pretrain/Step": 8658, "Pretrain/Step Time": 8.666137116029859} +{"Pretrain/Learning Rate": 1.1030661854041695e-06, "Pretrain/Loss": 1.9282640218734741, "Pretrain/Loss (Raw)": 1.9630041122436523, "Pretrain/Step": 8659, "Pretrain/Step Time": 8.665031442418694} +{"Pretrain/Learning Rate": 1.1005735269875695e-06, "Pretrain/Loss": 1.9272958040237427, "Pretrain/Loss (Raw)": 1.6348662376403809, "Pretrain/Step": 8660, "Pretrain/Step Time": 8.66267722286284} +{"Pretrain/Learning Rate": 1.0980836247654501e-06, "Pretrain/Loss": 1.9272782802581787, "Pretrain/Loss (Raw)": 1.8947337865829468, "Pretrain/Step": 8661, "Pretrain/Step Time": 8.663733871653676} +{"Pretrain/Learning Rate": 1.0955964790249546e-06, "Pretrain/Loss": 1.9274990558624268, "Pretrain/Loss (Raw)": 1.9812806844711304, "Pretrain/Step": 8662, "Pretrain/Step Time": 8.662837378680706} +{"Pretrain/Learning Rate": 1.0931120900529169e-06, "Pretrain/Loss": 1.931861400604248, "Pretrain/Loss (Raw)": 1.9460195302963257, "Pretrain/Step": 8663, "Pretrain/Step Time": 8.66607160679996} +{"Pretrain/Learning Rate": 1.0906304581358411e-06, "Pretrain/Loss": 1.9310929775238037, "Pretrain/Loss (Raw)": 1.87636137008667, "Pretrain/Step": 8664, "Pretrain/Step Time": 8.663909828290343} +{"Pretrain/Learning Rate": 1.0881515835599293e-06, "Pretrain/Loss": 1.9316215515136719, "Pretrain/Loss (Raw)": 2.105137586593628, "Pretrain/Step": 8665, "Pretrain/Step Time": 8.66277820058167} +{"Pretrain/Learning Rate": 1.0856754666110553e-06, "Pretrain/Loss": 1.930822730064392, "Pretrain/Loss (Raw)": 1.913870930671692, "Pretrain/Step": 8666, "Pretrain/Step Time": 8.666857002303004} +{"Pretrain/Learning Rate": 1.0832021075747711e-06, "Pretrain/Loss": 1.9289586544036865, "Pretrain/Loss (Raw)": 1.7533202171325684, "Pretrain/Step": 8667, "Pretrain/Step Time": 8.664073316380382} +{"Pretrain/Learning Rate": 1.0807315067363184e-06, "Pretrain/Loss": 1.9272949695587158, "Pretrain/Loss (Raw)": 1.9686418771743774, "Pretrain/Step": 8668, "Pretrain/Step Time": 8.667772149667144} +{"Pretrain/Learning Rate": 1.0782636643806215e-06, "Pretrain/Loss": 1.9283701181411743, "Pretrain/Loss (Raw)": 1.9248769283294678, "Pretrain/Step": 8669, "Pretrain/Step Time": 8.664509166032076} +{"Pretrain/Learning Rate": 1.0757985807922838e-06, "Pretrain/Loss": 1.9280109405517578, "Pretrain/Loss (Raw)": 1.953066110610962, "Pretrain/Step": 8670, "Pretrain/Step Time": 8.670029925182462} +{"Pretrain/Learning Rate": 1.073336256255586e-06, "Pretrain/Loss": 1.9295926094055176, "Pretrain/Loss (Raw)": 1.9715461730957031, "Pretrain/Step": 8671, "Pretrain/Step Time": 8.668649358674884} +{"Pretrain/Learning Rate": 1.0708766910544954e-06, "Pretrain/Loss": 1.9314231872558594, "Pretrain/Loss (Raw)": 2.2146263122558594, "Pretrain/Step": 8672, "Pretrain/Step Time": 8.666487418115139} +{"Pretrain/Learning Rate": 1.0684198854726656e-06, "Pretrain/Loss": 1.9318392276763916, "Pretrain/Loss (Raw)": 1.969889760017395, "Pretrain/Step": 8673, "Pretrain/Step Time": 8.665585048496723} +{"Pretrain/Learning Rate": 1.065965839793423e-06, "Pretrain/Loss": 1.9249876737594604, "Pretrain/Loss (Raw)": 1.5160824060440063, "Pretrain/Step": 8674, "Pretrain/Step Time": 8.668007735162973} +{"Pretrain/Learning Rate": 1.0635145542997772e-06, "Pretrain/Loss": 1.9183180332183838, "Pretrain/Loss (Raw)": 1.2824070453643799, "Pretrain/Step": 8675, "Pretrain/Step Time": 8.66497209481895} +{"Pretrain/Learning Rate": 1.0610660292744296e-06, "Pretrain/Loss": 1.917220115661621, "Pretrain/Loss (Raw)": 1.8079649209976196, "Pretrain/Step": 8676, "Pretrain/Step Time": 8.667390406131744} +{"Pretrain/Learning Rate": 1.0586202649997517e-06, "Pretrain/Loss": 1.918989896774292, "Pretrain/Loss (Raw)": 2.0579726696014404, "Pretrain/Step": 8677, "Pretrain/Step Time": 8.666086791083217} +{"Pretrain/Learning Rate": 1.0561772617578014e-06, "Pretrain/Loss": 1.9189616441726685, "Pretrain/Loss (Raw)": 1.8867148160934448, "Pretrain/Step": 8678, "Pretrain/Step Time": 8.664267618209124} +{"Pretrain/Learning Rate": 1.0537370198303116e-06, "Pretrain/Loss": 1.917824387550354, "Pretrain/Loss (Raw)": 1.8690110445022583, "Pretrain/Step": 8679, "Pretrain/Step Time": 8.662789022549987} +{"Pretrain/Learning Rate": 1.0512995394987096e-06, "Pretrain/Loss": 1.9233722686767578, "Pretrain/Loss (Raw)": 2.488553524017334, "Pretrain/Step": 8680, "Pretrain/Step Time": 8.66360860131681} +{"Pretrain/Learning Rate": 1.048864821044096e-06, "Pretrain/Loss": 1.9251370429992676, "Pretrain/Loss (Raw)": 1.965786337852478, "Pretrain/Step": 8681, "Pretrain/Step Time": 8.66702894307673} +{"Pretrain/Learning Rate": 1.0464328647472515e-06, "Pretrain/Loss": 1.925997018814087, "Pretrain/Loss (Raw)": 1.8393436670303345, "Pretrain/Step": 8682, "Pretrain/Step Time": 8.662705194205046} +{"Pretrain/Learning Rate": 1.0440036708886407e-06, "Pretrain/Loss": 1.9251959323883057, "Pretrain/Loss (Raw)": 1.8346024751663208, "Pretrain/Step": 8683, "Pretrain/Step Time": 8.664223674684763} +{"Pretrain/Learning Rate": 1.0415772397484119e-06, "Pretrain/Loss": 1.927398443222046, "Pretrain/Loss (Raw)": 2.035862922668457, "Pretrain/Step": 8684, "Pretrain/Step Time": 8.667459031566978} +{"Pretrain/Learning Rate": 1.0391535716063938e-06, "Pretrain/Loss": 1.9275469779968262, "Pretrain/Loss (Raw)": 2.148416519165039, "Pretrain/Step": 8685, "Pretrain/Step Time": 8.66499305702746} +{"Pretrain/Learning Rate": 1.0367326667420907e-06, "Pretrain/Loss": 1.9292757511138916, "Pretrain/Loss (Raw)": 2.06473970413208, "Pretrain/Step": 8686, "Pretrain/Step Time": 8.657513324171305} +{"Pretrain/Learning Rate": 1.0343145254346931e-06, "Pretrain/Loss": 1.9301199913024902, "Pretrain/Loss (Raw)": 1.7703028917312622, "Pretrain/Step": 8687, "Pretrain/Step Time": 8.65910354629159} +{"Pretrain/Learning Rate": 1.031899147963078e-06, "Pretrain/Loss": 1.9298149347305298, "Pretrain/Loss (Raw)": 1.917915940284729, "Pretrain/Step": 8688, "Pretrain/Step Time": 8.651596305891871} +{"Pretrain/Learning Rate": 1.0294865346057947e-06, "Pretrain/Loss": 1.9273607730865479, "Pretrain/Loss (Raw)": 1.6853079795837402, "Pretrain/Step": 8689, "Pretrain/Step Time": 8.650442799553275} +{"Pretrain/Learning Rate": 1.0270766856410764e-06, "Pretrain/Loss": 1.9289958477020264, "Pretrain/Loss (Raw)": 2.110527992248535, "Pretrain/Step": 8690, "Pretrain/Step Time": 8.656627522781491} +{"Pretrain/Learning Rate": 1.0246696013468338e-06, "Pretrain/Loss": 1.9308390617370605, "Pretrain/Loss (Raw)": 2.152158498764038, "Pretrain/Step": 8691, "Pretrain/Step Time": 8.656854003667831} +{"Pretrain/Learning Rate": 1.0222652820006785e-06, "Pretrain/Loss": 1.9271225929260254, "Pretrain/Loss (Raw)": 1.742763638496399, "Pretrain/Step": 8692, "Pretrain/Step Time": 8.658232672140002} +{"Pretrain/Learning Rate": 1.019863727879869e-06, "Pretrain/Loss": 1.9263060092926025, "Pretrain/Loss (Raw)": 1.9824298620224, "Pretrain/Step": 8693, "Pretrain/Step Time": 8.655181864276528} +{"Pretrain/Learning Rate": 1.0174649392613755e-06, "Pretrain/Loss": 1.92783784866333, "Pretrain/Loss (Raw)": 2.0423500537872314, "Pretrain/Step": 8694, "Pretrain/Step Time": 8.651097647845745} +{"Pretrain/Learning Rate": 1.0150689164218325e-06, "Pretrain/Loss": 1.9242832660675049, "Pretrain/Loss (Raw)": 1.7094941139221191, "Pretrain/Step": 8695, "Pretrain/Step Time": 8.650792380794883} +{"Pretrain/Learning Rate": 1.0126756596375686e-06, "Pretrain/Loss": 1.9239978790283203, "Pretrain/Loss (Raw)": 1.8574789762496948, "Pretrain/Step": 8696, "Pretrain/Step Time": 8.654149709269404} +{"Pretrain/Learning Rate": 1.0102851691845716e-06, "Pretrain/Loss": 1.9241501092910767, "Pretrain/Loss (Raw)": 2.019847869873047, "Pretrain/Step": 8697, "Pretrain/Step Time": 8.65415988303721} +{"Pretrain/Learning Rate": 1.0078974453385375e-06, "Pretrain/Loss": 1.9223321676254272, "Pretrain/Loss (Raw)": 1.8522900342941284, "Pretrain/Step": 8698, "Pretrain/Step Time": 8.653246073052287} +{"Pretrain/Learning Rate": 1.0055124883748213e-06, "Pretrain/Loss": 1.9222564697265625, "Pretrain/Loss (Raw)": 1.8794372081756592, "Pretrain/Step": 8699, "Pretrain/Step Time": 8.648593755438924} +{"Pretrain/Learning Rate": 1.0031302985684777e-06, "Pretrain/Loss": 1.9226337671279907, "Pretrain/Loss (Raw)": 1.9443753957748413, "Pretrain/Step": 8700, "Pretrain/Step Time": 8.652911510318518} +{"Pretrain/Learning Rate": 1.0007508761942176e-06, "Pretrain/Loss": 1.9253690242767334, "Pretrain/Loss (Raw)": 1.957324504852295, "Pretrain/Step": 8701, "Pretrain/Step Time": 8.650193367153406} +{"Pretrain/Learning Rate": 9.983742215264575e-07, "Pretrain/Loss": 1.925070881843567, "Pretrain/Loss (Raw)": 1.873580813407898, "Pretrain/Step": 8702, "Pretrain/Step Time": 8.648535808548331} +{"Pretrain/Learning Rate": 9.96000334839281e-07, "Pretrain/Loss": 1.9276206493377686, "Pretrain/Loss (Raw)": 1.9948656558990479, "Pretrain/Step": 8703, "Pretrain/Step Time": 8.646221252158284} +{"Pretrain/Learning Rate": 9.93629216406458e-07, "Pretrain/Loss": 1.9270045757293701, "Pretrain/Loss (Raw)": 1.9602253437042236, "Pretrain/Step": 8704, "Pretrain/Step Time": 8.645903887227178} +{"Pretrain/Learning Rate": 9.91260866501431e-07, "Pretrain/Loss": 1.9278385639190674, "Pretrain/Loss (Raw)": 2.0037360191345215, "Pretrain/Step": 8705, "Pretrain/Step Time": 8.648776473477483} +{"Pretrain/Learning Rate": 9.888952853973371e-07, "Pretrain/Loss": 1.9313839673995972, "Pretrain/Loss (Raw)": 1.979047417640686, "Pretrain/Step": 8706, "Pretrain/Step Time": 8.652171675115824} +{"Pretrain/Learning Rate": 9.86532473366983e-07, "Pretrain/Loss": 1.9281582832336426, "Pretrain/Loss (Raw)": 1.553162932395935, "Pretrain/Step": 8707, "Pretrain/Step Time": 8.651292007416487} +{"Pretrain/Learning Rate": 9.841724306828587e-07, "Pretrain/Loss": 1.930936336517334, "Pretrain/Loss (Raw)": 2.1115264892578125, "Pretrain/Step": 8708, "Pretrain/Step Time": 8.64960004761815} +{"Pretrain/Learning Rate": 9.818151576171358e-07, "Pretrain/Loss": 1.933218240737915, "Pretrain/Loss (Raw)": 2.1839544773101807, "Pretrain/Step": 8709, "Pretrain/Step Time": 8.644414892420173} +{"Pretrain/Learning Rate": 9.794606544416662e-07, "Pretrain/Loss": 1.9377373456954956, "Pretrain/Loss (Raw)": 1.9651508331298828, "Pretrain/Step": 8710, "Pretrain/Step Time": 8.642956491559744} +{"Pretrain/Learning Rate": 9.771089214279827e-07, "Pretrain/Loss": 1.9373011589050293, "Pretrain/Loss (Raw)": 1.8913915157318115, "Pretrain/Step": 8711, "Pretrain/Step Time": 8.645685520023108} +{"Pretrain/Learning Rate": 9.74759958847299e-07, "Pretrain/Loss": 1.938890814781189, "Pretrain/Loss (Raw)": 2.1348257064819336, "Pretrain/Step": 8712, "Pretrain/Step Time": 8.649865884333849} +{"Pretrain/Learning Rate": 9.724137669705036e-07, "Pretrain/Loss": 1.937196135520935, "Pretrain/Loss (Raw)": 2.000729560852051, "Pretrain/Step": 8713, "Pretrain/Step Time": 8.65270883217454} +{"Pretrain/Learning Rate": 9.700703460681803e-07, "Pretrain/Loss": 1.9338459968566895, "Pretrain/Loss (Raw)": 1.6170625686645508, "Pretrain/Step": 8714, "Pretrain/Step Time": 8.652745736762881} +{"Pretrain/Learning Rate": 9.677296964105742e-07, "Pretrain/Loss": 1.933408498764038, "Pretrain/Loss (Raw)": 2.041147232055664, "Pretrain/Step": 8715, "Pretrain/Step Time": 8.65171723626554} +{"Pretrain/Learning Rate": 9.653918182676218e-07, "Pretrain/Loss": 1.9354803562164307, "Pretrain/Loss (Raw)": 1.9518839120864868, "Pretrain/Step": 8716, "Pretrain/Step Time": 8.647348219528794} +{"Pretrain/Learning Rate": 9.630567119089412e-07, "Pretrain/Loss": 1.9371895790100098, "Pretrain/Loss (Raw)": 2.0073435306549072, "Pretrain/Step": 8717, "Pretrain/Step Time": 8.650694089010358} +{"Pretrain/Learning Rate": 9.607243776038278e-07, "Pretrain/Loss": 1.9398967027664185, "Pretrain/Loss (Raw)": 2.0405640602111816, "Pretrain/Step": 8718, "Pretrain/Step Time": 8.650506179779768} +{"Pretrain/Learning Rate": 9.583948156212552e-07, "Pretrain/Loss": 1.9396411180496216, "Pretrain/Loss (Raw)": 2.1079771518707275, "Pretrain/Step": 8719, "Pretrain/Step Time": 8.65226880647242} +{"Pretrain/Learning Rate": 9.560680262298783e-07, "Pretrain/Loss": 1.9392412900924683, "Pretrain/Loss (Raw)": 1.9231542348861694, "Pretrain/Step": 8720, "Pretrain/Step Time": 8.64926009438932} +{"Pretrain/Learning Rate": 9.537440096980377e-07, "Pretrain/Loss": 1.9397339820861816, "Pretrain/Loss (Raw)": 1.894362449645996, "Pretrain/Step": 8721, "Pretrain/Step Time": 8.653489459306002} +{"Pretrain/Learning Rate": 9.514227662937469e-07, "Pretrain/Loss": 1.9400758743286133, "Pretrain/Loss (Raw)": 1.850982427597046, "Pretrain/Step": 8722, "Pretrain/Step Time": 8.654193559661508} +{"Pretrain/Learning Rate": 9.49104296284703e-07, "Pretrain/Loss": 1.9393980503082275, "Pretrain/Loss (Raw)": 1.9745428562164307, "Pretrain/Step": 8723, "Pretrain/Step Time": 8.655382756143808} +{"Pretrain/Learning Rate": 9.467885999382809e-07, "Pretrain/Loss": 1.9398796558380127, "Pretrain/Loss (Raw)": 1.8887925148010254, "Pretrain/Step": 8724, "Pretrain/Step Time": 8.653663260862231} +{"Pretrain/Learning Rate": 9.444756775215446e-07, "Pretrain/Loss": 1.940899133682251, "Pretrain/Loss (Raw)": 1.9931974411010742, "Pretrain/Step": 8725, "Pretrain/Step Time": 8.65163460560143} +{"Pretrain/Learning Rate": 9.421655293012227e-07, "Pretrain/Loss": 1.940949559211731, "Pretrain/Loss (Raw)": 2.071171760559082, "Pretrain/Step": 8726, "Pretrain/Step Time": 8.658889785408974} +{"Pretrain/Learning Rate": 9.398581555437408e-07, "Pretrain/Loss": 1.9391075372695923, "Pretrain/Loss (Raw)": 1.7949780225753784, "Pretrain/Step": 8727, "Pretrain/Step Time": 8.657500822097063} +{"Pretrain/Learning Rate": 9.375535565151861e-07, "Pretrain/Loss": 1.937575101852417, "Pretrain/Loss (Raw)": 1.9969806671142578, "Pretrain/Step": 8728, "Pretrain/Step Time": 8.66239352338016} +{"Pretrain/Learning Rate": 9.352517324813431e-07, "Pretrain/Loss": 1.9406951665878296, "Pretrain/Loss (Raw)": 2.1015560626983643, "Pretrain/Step": 8729, "Pretrain/Step Time": 8.665977561846375} +{"Pretrain/Learning Rate": 9.329526837076691e-07, "Pretrain/Loss": 1.93766450881958, "Pretrain/Loss (Raw)": 1.609009861946106, "Pretrain/Step": 8730, "Pretrain/Step Time": 8.66503481566906} +{"Pretrain/Learning Rate": 9.306564104592963e-07, "Pretrain/Loss": 1.938913106918335, "Pretrain/Loss (Raw)": 1.9869880676269531, "Pretrain/Step": 8731, "Pretrain/Step Time": 8.662857364863157} +{"Pretrain/Learning Rate": 9.283629130010463e-07, "Pretrain/Loss": 1.9375100135803223, "Pretrain/Loss (Raw)": 1.8139597177505493, "Pretrain/Step": 8732, "Pretrain/Step Time": 8.66208947636187} +{"Pretrain/Learning Rate": 9.260721915974158e-07, "Pretrain/Loss": 1.933873176574707, "Pretrain/Loss (Raw)": 1.6063084602355957, "Pretrain/Step": 8733, "Pretrain/Step Time": 8.659887559711933} +{"Pretrain/Learning Rate": 9.237842465125768e-07, "Pretrain/Loss": 1.9339067935943604, "Pretrain/Loss (Raw)": 1.8732961416244507, "Pretrain/Step": 8734, "Pretrain/Step Time": 8.660533433780074} +{"Pretrain/Learning Rate": 9.214990780103932e-07, "Pretrain/Loss": 1.9341011047363281, "Pretrain/Loss (Raw)": 1.8872312307357788, "Pretrain/Step": 8735, "Pretrain/Step Time": 8.659309772774577} +{"Pretrain/Learning Rate": 9.192166863543933e-07, "Pretrain/Loss": 1.932870626449585, "Pretrain/Loss (Raw)": 1.9458461999893188, "Pretrain/Step": 8736, "Pretrain/Step Time": 8.665338017046452} +{"Pretrain/Learning Rate": 9.169370718078024e-07, "Pretrain/Loss": 1.9343643188476562, "Pretrain/Loss (Raw)": 2.1322898864746094, "Pretrain/Step": 8737, "Pretrain/Step Time": 8.65941433236003} +{"Pretrain/Learning Rate": 9.146602346335075e-07, "Pretrain/Loss": 1.9330623149871826, "Pretrain/Loss (Raw)": 1.923497200012207, "Pretrain/Step": 8738, "Pretrain/Step Time": 8.66082294844091} +{"Pretrain/Learning Rate": 9.123861750940904e-07, "Pretrain/Loss": 1.9310736656188965, "Pretrain/Loss (Raw)": 1.829089641571045, "Pretrain/Step": 8739, "Pretrain/Step Time": 8.663717549294233} +{"Pretrain/Learning Rate": 9.101148934518022e-07, "Pretrain/Loss": 1.933107852935791, "Pretrain/Loss (Raw)": 2.087989330291748, "Pretrain/Step": 8740, "Pretrain/Step Time": 8.659498568624258} +{"Pretrain/Learning Rate": 9.078463899685835e-07, "Pretrain/Loss": 1.9350647926330566, "Pretrain/Loss (Raw)": 2.0993518829345703, "Pretrain/Step": 8741, "Pretrain/Step Time": 8.6569768730551} +{"Pretrain/Learning Rate": 9.055806649060416e-07, "Pretrain/Loss": 1.9353934526443481, "Pretrain/Loss (Raw)": 2.006096601486206, "Pretrain/Step": 8742, "Pretrain/Step Time": 8.662438308820128} +{"Pretrain/Learning Rate": 9.033177185254732e-07, "Pretrain/Loss": 1.934967279434204, "Pretrain/Loss (Raw)": 1.9136953353881836, "Pretrain/Step": 8743, "Pretrain/Step Time": 8.659326113760471} +{"Pretrain/Learning Rate": 9.010575510878555e-07, "Pretrain/Loss": 1.937788963317871, "Pretrain/Loss (Raw)": 2.083552837371826, "Pretrain/Step": 8744, "Pretrain/Step Time": 8.66221010312438} +{"Pretrain/Learning Rate": 8.988001628538411e-07, "Pretrain/Loss": 1.938137173652649, "Pretrain/Loss (Raw)": 1.9059853553771973, "Pretrain/Step": 8745, "Pretrain/Step Time": 8.665111409500241} +{"Pretrain/Learning Rate": 8.965455540837553e-07, "Pretrain/Loss": 1.9379500150680542, "Pretrain/Loss (Raw)": 1.8562415838241577, "Pretrain/Step": 8746, "Pretrain/Step Time": 8.659888682886958} +{"Pretrain/Learning Rate": 8.942937250376176e-07, "Pretrain/Loss": 1.938069224357605, "Pretrain/Loss (Raw)": 1.9520597457885742, "Pretrain/Step": 8747, "Pretrain/Step Time": 8.65960517525673} +{"Pretrain/Learning Rate": 8.920446759751177e-07, "Pretrain/Loss": 1.9385738372802734, "Pretrain/Loss (Raw)": 1.724744200706482, "Pretrain/Step": 8748, "Pretrain/Step Time": 8.652472205460072} +{"Pretrain/Learning Rate": 8.897984071556259e-07, "Pretrain/Loss": 1.936476707458496, "Pretrain/Loss (Raw)": 1.8227355480194092, "Pretrain/Step": 8749, "Pretrain/Step Time": 8.657933695241809} +{"Pretrain/Learning Rate": 8.875549188381904e-07, "Pretrain/Loss": 1.9356787204742432, "Pretrain/Loss (Raw)": 2.0109665393829346, "Pretrain/Step": 8750, "Pretrain/Step Time": 8.656987650319934} +{"Pretrain/Learning Rate": 8.85314211281546e-07, "Pretrain/Loss": 1.9367945194244385, "Pretrain/Loss (Raw)": 1.9765288829803467, "Pretrain/Step": 8751, "Pretrain/Step Time": 8.6546101719141} +{"Pretrain/Learning Rate": 8.830762847440998e-07, "Pretrain/Loss": 1.9370651245117188, "Pretrain/Loss (Raw)": 2.083306074142456, "Pretrain/Step": 8752, "Pretrain/Step Time": 8.660406116396189} +{"Pretrain/Learning Rate": 8.808411394839372e-07, "Pretrain/Loss": 1.9354274272918701, "Pretrain/Loss (Raw)": 1.6421347856521606, "Pretrain/Step": 8753, "Pretrain/Step Time": 8.66036937944591} +{"Pretrain/Learning Rate": 8.786087757588269e-07, "Pretrain/Loss": 1.9351527690887451, "Pretrain/Loss (Raw)": 2.037808418273926, "Pretrain/Step": 8754, "Pretrain/Step Time": 8.66066037863493} +{"Pretrain/Learning Rate": 8.763791938262184e-07, "Pretrain/Loss": 1.935225486755371, "Pretrain/Loss (Raw)": 1.9712446928024292, "Pretrain/Step": 8755, "Pretrain/Step Time": 8.665189230814576} +{"Pretrain/Learning Rate": 8.741523939432339e-07, "Pretrain/Loss": 1.9368095397949219, "Pretrain/Loss (Raw)": 2.2669806480407715, "Pretrain/Step": 8756, "Pretrain/Step Time": 8.664462707936764} +{"Pretrain/Learning Rate": 8.719283763666792e-07, "Pretrain/Loss": 1.937002182006836, "Pretrain/Loss (Raw)": 1.970288634300232, "Pretrain/Step": 8757, "Pretrain/Step Time": 8.664458263665438} +{"Pretrain/Learning Rate": 8.697071413530433e-07, "Pretrain/Loss": 1.939689040184021, "Pretrain/Loss (Raw)": 2.155580759048462, "Pretrain/Step": 8758, "Pretrain/Step Time": 8.669380517676473} +{"Pretrain/Learning Rate": 8.674886891584827e-07, "Pretrain/Loss": 1.9422798156738281, "Pretrain/Loss (Raw)": 2.0107550621032715, "Pretrain/Step": 8759, "Pretrain/Step Time": 8.670392552390695} +{"Pretrain/Learning Rate": 8.652730200388426e-07, "Pretrain/Loss": 1.9424443244934082, "Pretrain/Loss (Raw)": 2.092684268951416, "Pretrain/Step": 8760, "Pretrain/Step Time": 8.66697215102613} +{"Pretrain/Learning Rate": 8.630601342496436e-07, "Pretrain/Loss": 1.9434510469436646, "Pretrain/Loss (Raw)": 2.035358428955078, "Pretrain/Step": 8761, "Pretrain/Step Time": 8.670792577788234} +{"Pretrain/Learning Rate": 8.608500320460899e-07, "Pretrain/Loss": 1.9446280002593994, "Pretrain/Loss (Raw)": 2.0790367126464844, "Pretrain/Step": 8762, "Pretrain/Step Time": 8.669375825673342} +{"Pretrain/Learning Rate": 8.586427136830555e-07, "Pretrain/Loss": 1.9436702728271484, "Pretrain/Loss (Raw)": 1.9987064599990845, "Pretrain/Step": 8763, "Pretrain/Step Time": 8.668444922193885} +{"Pretrain/Learning Rate": 8.564381794151033e-07, "Pretrain/Loss": 1.9448994398117065, "Pretrain/Loss (Raw)": 2.0390381813049316, "Pretrain/Step": 8764, "Pretrain/Step Time": 8.667258199304342} +{"Pretrain/Learning Rate": 8.542364294964633e-07, "Pretrain/Loss": 1.9413961172103882, "Pretrain/Loss (Raw)": 1.6548126935958862, "Pretrain/Step": 8765, "Pretrain/Step Time": 8.665598699823022} +{"Pretrain/Learning Rate": 8.52037464181063e-07, "Pretrain/Loss": 1.9407405853271484, "Pretrain/Loss (Raw)": 1.7806403636932373, "Pretrain/Step": 8766, "Pretrain/Step Time": 8.666764099150896} +{"Pretrain/Learning Rate": 8.498412837224884e-07, "Pretrain/Loss": 1.9395043849945068, "Pretrain/Loss (Raw)": 1.791525959968567, "Pretrain/Step": 8767, "Pretrain/Step Time": 8.670157777145505} +{"Pretrain/Learning Rate": 8.476478883740175e-07, "Pretrain/Loss": 1.941503643989563, "Pretrain/Loss (Raw)": 2.0587522983551025, "Pretrain/Step": 8768, "Pretrain/Step Time": 8.670439455658197} +{"Pretrain/Learning Rate": 8.454572783885978e-07, "Pretrain/Loss": 1.9418532848358154, "Pretrain/Loss (Raw)": 1.9870598316192627, "Pretrain/Step": 8769, "Pretrain/Step Time": 8.66239375807345} +{"Pretrain/Learning Rate": 8.43269454018869e-07, "Pretrain/Loss": 1.940680742263794, "Pretrain/Loss (Raw)": 1.9223260879516602, "Pretrain/Step": 8770, "Pretrain/Step Time": 8.664760755375028} +{"Pretrain/Learning Rate": 8.410844155171376e-07, "Pretrain/Loss": 1.939476490020752, "Pretrain/Loss (Raw)": 1.8220016956329346, "Pretrain/Step": 8771, "Pretrain/Step Time": 8.668070184066892} +{"Pretrain/Learning Rate": 8.389021631353911e-07, "Pretrain/Loss": 1.9370369911193848, "Pretrain/Loss (Raw)": 1.8255724906921387, "Pretrain/Step": 8772, "Pretrain/Step Time": 8.665401447564363} +{"Pretrain/Learning Rate": 8.367226971252945e-07, "Pretrain/Loss": 1.9363762140274048, "Pretrain/Loss (Raw)": 1.9031696319580078, "Pretrain/Step": 8773, "Pretrain/Step Time": 8.668901761993766} +{"Pretrain/Learning Rate": 8.345460177381998e-07, "Pretrain/Loss": 1.9359465837478638, "Pretrain/Loss (Raw)": 1.9784904718399048, "Pretrain/Step": 8774, "Pretrain/Step Time": 8.672331439331174} +{"Pretrain/Learning Rate": 8.323721252251309e-07, "Pretrain/Loss": 1.9369821548461914, "Pretrain/Loss (Raw)": 2.0191662311553955, "Pretrain/Step": 8775, "Pretrain/Step Time": 8.675464445725083} +{"Pretrain/Learning Rate": 8.302010198367904e-07, "Pretrain/Loss": 1.9407932758331299, "Pretrain/Loss (Raw)": 2.1086959838867188, "Pretrain/Step": 8776, "Pretrain/Step Time": 8.670641737058759} +{"Pretrain/Learning Rate": 8.280327018235556e-07, "Pretrain/Loss": 1.941153883934021, "Pretrain/Loss (Raw)": 1.9745960235595703, "Pretrain/Step": 8777, "Pretrain/Step Time": 8.672498475760221} +{"Pretrain/Learning Rate": 8.258671714354987e-07, "Pretrain/Loss": 1.9390640258789062, "Pretrain/Loss (Raw)": 1.8196399211883545, "Pretrain/Step": 8778, "Pretrain/Step Time": 8.664711939170957} +{"Pretrain/Learning Rate": 8.23704428922345e-07, "Pretrain/Loss": 1.9360462427139282, "Pretrain/Loss (Raw)": 1.7590198516845703, "Pretrain/Step": 8779, "Pretrain/Step Time": 8.665779884904623} +{"Pretrain/Learning Rate": 8.215444745335227e-07, "Pretrain/Loss": 1.937806487083435, "Pretrain/Loss (Raw)": 1.9958728551864624, "Pretrain/Step": 8780, "Pretrain/Step Time": 8.665610639378428} +{"Pretrain/Learning Rate": 8.193873085181214e-07, "Pretrain/Loss": 1.9370369911193848, "Pretrain/Loss (Raw)": 1.9512569904327393, "Pretrain/Step": 8781, "Pretrain/Step Time": 8.665638756006956} +{"Pretrain/Learning Rate": 8.172329311249255e-07, "Pretrain/Loss": 1.9355692863464355, "Pretrain/Loss (Raw)": 1.8458164930343628, "Pretrain/Step": 8782, "Pretrain/Step Time": 8.66758707165718} +{"Pretrain/Learning Rate": 8.150813426023751e-07, "Pretrain/Loss": 1.936154842376709, "Pretrain/Loss (Raw)": 2.12489652633667, "Pretrain/Step": 8783, "Pretrain/Step Time": 8.666879322379827} +{"Pretrain/Learning Rate": 8.129325431986079e-07, "Pretrain/Loss": 1.937137246131897, "Pretrain/Loss (Raw)": 1.9117767810821533, "Pretrain/Step": 8784, "Pretrain/Step Time": 8.665299978107214} +{"Pretrain/Learning Rate": 8.107865331614339e-07, "Pretrain/Loss": 1.9370296001434326, "Pretrain/Loss (Raw)": 1.9616684913635254, "Pretrain/Step": 8785, "Pretrain/Step Time": 8.65980408154428} +{"Pretrain/Learning Rate": 8.086433127383413e-07, "Pretrain/Loss": 1.936279058456421, "Pretrain/Loss (Raw)": 1.815972089767456, "Pretrain/Step": 8786, "Pretrain/Step Time": 8.656695764511824} +{"Pretrain/Learning Rate": 8.065028821764909e-07, "Pretrain/Loss": 1.9369937181472778, "Pretrain/Loss (Raw)": 2.0544843673706055, "Pretrain/Step": 8787, "Pretrain/Step Time": 8.658571882173419} +{"Pretrain/Learning Rate": 8.043652417227349e-07, "Pretrain/Loss": 1.9392454624176025, "Pretrain/Loss (Raw)": 1.9230897426605225, "Pretrain/Step": 8788, "Pretrain/Step Time": 8.661615597084165} +{"Pretrain/Learning Rate": 8.022303916235929e-07, "Pretrain/Loss": 1.9394187927246094, "Pretrain/Loss (Raw)": 1.9169251918792725, "Pretrain/Step": 8789, "Pretrain/Step Time": 8.661133635789156} +{"Pretrain/Learning Rate": 8.000983321252681e-07, "Pretrain/Loss": 1.9410107135772705, "Pretrain/Loss (Raw)": 2.1850368976593018, "Pretrain/Step": 8790, "Pretrain/Step Time": 8.664850484579802} +{"Pretrain/Learning Rate": 7.979690634736304e-07, "Pretrain/Loss": 1.9417142868041992, "Pretrain/Loss (Raw)": 2.036080837249756, "Pretrain/Step": 8791, "Pretrain/Step Time": 8.661038916558027} +{"Pretrain/Learning Rate": 7.958425859142498e-07, "Pretrain/Loss": 1.942457675933838, "Pretrain/Loss (Raw)": 1.97152578830719, "Pretrain/Step": 8792, "Pretrain/Step Time": 8.661339730024338} +{"Pretrain/Learning Rate": 7.937188996923556e-07, "Pretrain/Loss": 1.9408142566680908, "Pretrain/Loss (Raw)": 1.8947694301605225, "Pretrain/Step": 8793, "Pretrain/Step Time": 8.662642318755388} +{"Pretrain/Learning Rate": 7.915980050528599e-07, "Pretrain/Loss": 1.9414918422698975, "Pretrain/Loss (Raw)": 2.0005996227264404, "Pretrain/Step": 8794, "Pretrain/Step Time": 8.657255133613944} +{"Pretrain/Learning Rate": 7.894799022403532e-07, "Pretrain/Loss": 1.9442397356033325, "Pretrain/Loss (Raw)": 2.105053186416626, "Pretrain/Step": 8795, "Pretrain/Step Time": 8.660687554627657} +{"Pretrain/Learning Rate": 7.873645914991123e-07, "Pretrain/Loss": 1.9443769454956055, "Pretrain/Loss (Raw)": 1.9861927032470703, "Pretrain/Step": 8796, "Pretrain/Step Time": 8.658311549574137} +{"Pretrain/Learning Rate": 7.852520730730812e-07, "Pretrain/Loss": 1.9462264776229858, "Pretrain/Loss (Raw)": 2.161633253097534, "Pretrain/Step": 8797, "Pretrain/Step Time": 8.659816624596715} +{"Pretrain/Learning Rate": 7.831423472058785e-07, "Pretrain/Loss": 1.9467822313308716, "Pretrain/Loss (Raw)": 2.024195909500122, "Pretrain/Step": 8798, "Pretrain/Step Time": 8.658108038827777} +{"Pretrain/Learning Rate": 7.810354141408211e-07, "Pretrain/Loss": 1.946685791015625, "Pretrain/Loss (Raw)": 1.9592078924179077, "Pretrain/Step": 8799, "Pretrain/Step Time": 8.6547576431185} +{"Pretrain/Learning Rate": 7.789312741208809e-07, "Pretrain/Loss": 1.9446589946746826, "Pretrain/Loss (Raw)": 1.9551838636398315, "Pretrain/Step": 8800, "Pretrain/Step Time": 8.65743782185018} +{"Pretrain/Learning Rate": 7.768299273887198e-07, "Pretrain/Loss": 1.9450089931488037, "Pretrain/Loss (Raw)": 2.0146987438201904, "Pretrain/Step": 8801, "Pretrain/Step Time": 8.654368149116635} +{"Pretrain/Learning Rate": 7.747313741866713e-07, "Pretrain/Loss": 1.9480006694793701, "Pretrain/Loss (Raw)": 1.8990062475204468, "Pretrain/Step": 8802, "Pretrain/Step Time": 8.656892210245132} +{"Pretrain/Learning Rate": 7.726356147567559e-07, "Pretrain/Loss": 1.9525213241577148, "Pretrain/Loss (Raw)": 1.861061692237854, "Pretrain/Step": 8803, "Pretrain/Step Time": 8.656699024140835} +{"Pretrain/Learning Rate": 7.705426493406665e-07, "Pretrain/Loss": 1.9546234607696533, "Pretrain/Loss (Raw)": 2.0770392417907715, "Pretrain/Step": 8804, "Pretrain/Step Time": 8.65746158733964} +{"Pretrain/Learning Rate": 7.684524781797708e-07, "Pretrain/Loss": 1.9540175199508667, "Pretrain/Loss (Raw)": 1.9804109334945679, "Pretrain/Step": 8805, "Pretrain/Step Time": 8.659677350893617} +{"Pretrain/Learning Rate": 7.663651015151152e-07, "Pretrain/Loss": 1.9536776542663574, "Pretrain/Loss (Raw)": 1.8432197570800781, "Pretrain/Step": 8806, "Pretrain/Step Time": 8.660825101658702} +{"Pretrain/Learning Rate": 7.64280519587432e-07, "Pretrain/Loss": 1.953392744064331, "Pretrain/Loss (Raw)": 1.8325419425964355, "Pretrain/Step": 8807, "Pretrain/Step Time": 8.66389925032854} +{"Pretrain/Learning Rate": 7.621987326371205e-07, "Pretrain/Loss": 1.9483742713928223, "Pretrain/Loss (Raw)": 1.8461737632751465, "Pretrain/Step": 8808, "Pretrain/Step Time": 8.66045904532075} +{"Pretrain/Learning Rate": 7.601197409042665e-07, "Pretrain/Loss": 1.947822093963623, "Pretrain/Loss (Raw)": 1.8951228857040405, "Pretrain/Step": 8809, "Pretrain/Step Time": 8.659470377489924} +{"Pretrain/Learning Rate": 7.5804354462862e-07, "Pretrain/Loss": 1.9484953880310059, "Pretrain/Loss (Raw)": 1.9255276918411255, "Pretrain/Step": 8810, "Pretrain/Step Time": 8.66184350848198} +{"Pretrain/Learning Rate": 7.55970144049628e-07, "Pretrain/Loss": 1.9497960805892944, "Pretrain/Loss (Raw)": 2.001079559326172, "Pretrain/Step": 8811, "Pretrain/Step Time": 8.661710539832711} +{"Pretrain/Learning Rate": 7.538995394063996e-07, "Pretrain/Loss": 1.9509387016296387, "Pretrain/Loss (Raw)": 2.182116746902466, "Pretrain/Step": 8812, "Pretrain/Step Time": 8.660185562446713} +{"Pretrain/Learning Rate": 7.518317309377298e-07, "Pretrain/Loss": 1.9484567642211914, "Pretrain/Loss (Raw)": 1.8307286500930786, "Pretrain/Step": 8813, "Pretrain/Step Time": 8.665164537727833} +{"Pretrain/Learning Rate": 7.497667188820834e-07, "Pretrain/Loss": 1.9477418661117554, "Pretrain/Loss (Raw)": 1.9732320308685303, "Pretrain/Step": 8814, "Pretrain/Step Time": 8.667663158848882} +{"Pretrain/Learning Rate": 7.477045034776087e-07, "Pretrain/Loss": 1.950183629989624, "Pretrain/Loss (Raw)": 2.0828475952148438, "Pretrain/Step": 8815, "Pretrain/Step Time": 8.66847525537014} +{"Pretrain/Learning Rate": 7.45645084962135e-07, "Pretrain/Loss": 1.9498929977416992, "Pretrain/Loss (Raw)": 1.8807251453399658, "Pretrain/Step": 8816, "Pretrain/Step Time": 8.667960686609149} +{"Pretrain/Learning Rate": 7.435884635731582e-07, "Pretrain/Loss": 1.9498461484909058, "Pretrain/Loss (Raw)": 1.6793080568313599, "Pretrain/Step": 8817, "Pretrain/Step Time": 8.668443411588669} +{"Pretrain/Learning Rate": 7.415346395478584e-07, "Pretrain/Loss": 1.9499101638793945, "Pretrain/Loss (Raw)": 2.1187100410461426, "Pretrain/Step": 8818, "Pretrain/Step Time": 8.662568926811218} +{"Pretrain/Learning Rate": 7.394836131230987e-07, "Pretrain/Loss": 1.947559118270874, "Pretrain/Loss (Raw)": 1.851226568222046, "Pretrain/Step": 8819, "Pretrain/Step Time": 8.663691399618983} +{"Pretrain/Learning Rate": 7.37435384535401e-07, "Pretrain/Loss": 1.9493441581726074, "Pretrain/Loss (Raw)": 1.9712622165679932, "Pretrain/Step": 8820, "Pretrain/Step Time": 8.663158858194947} +{"Pretrain/Learning Rate": 7.353899540209902e-07, "Pretrain/Loss": 1.9497616291046143, "Pretrain/Loss (Raw)": 2.0358633995056152, "Pretrain/Step": 8821, "Pretrain/Step Time": 8.667303765192628} +{"Pretrain/Learning Rate": 7.333473218157416e-07, "Pretrain/Loss": 1.949308156967163, "Pretrain/Loss (Raw)": 1.984300971031189, "Pretrain/Step": 8822, "Pretrain/Step Time": 8.667226951569319} +{"Pretrain/Learning Rate": 7.313074881552362e-07, "Pretrain/Loss": 1.9509775638580322, "Pretrain/Loss (Raw)": 1.92317533493042, "Pretrain/Step": 8823, "Pretrain/Step Time": 8.665905006229877} +{"Pretrain/Learning Rate": 7.292704532747024e-07, "Pretrain/Loss": 1.9502437114715576, "Pretrain/Loss (Raw)": 1.7635530233383179, "Pretrain/Step": 8824, "Pretrain/Step Time": 8.659654911607504} +{"Pretrain/Learning Rate": 7.272362174090691e-07, "Pretrain/Loss": 1.9476828575134277, "Pretrain/Loss (Raw)": 1.692055106163025, "Pretrain/Step": 8825, "Pretrain/Step Time": 8.66139587201178} +{"Pretrain/Learning Rate": 7.252047807929347e-07, "Pretrain/Loss": 1.9470651149749756, "Pretrain/Loss (Raw)": 1.77321457862854, "Pretrain/Step": 8826, "Pretrain/Step Time": 8.665888734161854} +{"Pretrain/Learning Rate": 7.2317614366057e-07, "Pretrain/Loss": 1.9476830959320068, "Pretrain/Loss (Raw)": 1.9585464000701904, "Pretrain/Step": 8827, "Pretrain/Step Time": 8.668200425803661} +{"Pretrain/Learning Rate": 7.211503062459268e-07, "Pretrain/Loss": 1.9481399059295654, "Pretrain/Loss (Raw)": 2.002847194671631, "Pretrain/Step": 8828, "Pretrain/Step Time": 8.669130891561508} +{"Pretrain/Learning Rate": 7.191272687826378e-07, "Pretrain/Loss": 1.9486280679702759, "Pretrain/Loss (Raw)": 2.019805908203125, "Pretrain/Step": 8829, "Pretrain/Step Time": 8.669781874865294} +{"Pretrain/Learning Rate": 7.17107031504008e-07, "Pretrain/Loss": 1.9500839710235596, "Pretrain/Loss (Raw)": 2.059931993484497, "Pretrain/Step": 8830, "Pretrain/Step Time": 8.666976768523455} +{"Pretrain/Learning Rate": 7.150895946430203e-07, "Pretrain/Loss": 1.9487321376800537, "Pretrain/Loss (Raw)": 1.8218340873718262, "Pretrain/Step": 8831, "Pretrain/Step Time": 8.669043788686395} +{"Pretrain/Learning Rate": 7.130749584323304e-07, "Pretrain/Loss": 1.948686122894287, "Pretrain/Loss (Raw)": 1.954332947731018, "Pretrain/Step": 8832, "Pretrain/Step Time": 8.671981891617179} +{"Pretrain/Learning Rate": 7.110631231042858e-07, "Pretrain/Loss": 1.9491157531738281, "Pretrain/Loss (Raw)": 2.0587353706359863, "Pretrain/Step": 8833, "Pretrain/Step Time": 8.669495694339275} +{"Pretrain/Learning Rate": 7.090540888908925e-07, "Pretrain/Loss": 1.9494284391403198, "Pretrain/Loss (Raw)": 2.019064426422119, "Pretrain/Step": 8834, "Pretrain/Step Time": 8.664952093735337} +{"Pretrain/Learning Rate": 7.070478560238458e-07, "Pretrain/Loss": 1.9537590742111206, "Pretrain/Loss (Raw)": 2.1074862480163574, "Pretrain/Step": 8835, "Pretrain/Step Time": 8.669963728636503} +{"Pretrain/Learning Rate": 7.050444247345078e-07, "Pretrain/Loss": 1.949316382408142, "Pretrain/Loss (Raw)": 1.542870044708252, "Pretrain/Step": 8836, "Pretrain/Step Time": 8.673685429617763} +{"Pretrain/Learning Rate": 7.030437952539326e-07, "Pretrain/Loss": 1.948190450668335, "Pretrain/Loss (Raw)": 2.0398361682891846, "Pretrain/Step": 8837, "Pretrain/Step Time": 8.675391798838973} +{"Pretrain/Learning Rate": 7.010459678128384e-07, "Pretrain/Loss": 1.9477695226669312, "Pretrain/Loss (Raw)": 1.9112604856491089, "Pretrain/Step": 8838, "Pretrain/Step Time": 8.67734383046627} +{"Pretrain/Learning Rate": 6.990509426416186e-07, "Pretrain/Loss": 1.9486186504364014, "Pretrain/Loss (Raw)": 2.0000922679901123, "Pretrain/Step": 8839, "Pretrain/Step Time": 8.678786186501384} +{"Pretrain/Learning Rate": 6.970587199703588e-07, "Pretrain/Loss": 1.9474515914916992, "Pretrain/Loss (Raw)": 1.9854297637939453, "Pretrain/Step": 8840, "Pretrain/Step Time": 8.676881080493331} +{"Pretrain/Learning Rate": 6.950693000288055e-07, "Pretrain/Loss": 1.9440743923187256, "Pretrain/Loss (Raw)": 1.5684467554092407, "Pretrain/Step": 8841, "Pretrain/Step Time": 8.671725863590837} +{"Pretrain/Learning Rate": 6.930826830463922e-07, "Pretrain/Loss": 1.9453117847442627, "Pretrain/Loss (Raw)": 1.7754558324813843, "Pretrain/Step": 8842, "Pretrain/Step Time": 8.672319946810603} +{"Pretrain/Learning Rate": 6.910988692522158e-07, "Pretrain/Loss": 1.943955659866333, "Pretrain/Loss (Raw)": 1.8675616979599, "Pretrain/Step": 8843, "Pretrain/Step Time": 8.679612809792161} +{"Pretrain/Learning Rate": 6.891178588750686e-07, "Pretrain/Loss": 1.945474624633789, "Pretrain/Loss (Raw)": 2.1463239192962646, "Pretrain/Step": 8844, "Pretrain/Step Time": 8.679116709157825} +{"Pretrain/Learning Rate": 6.871396521434065e-07, "Pretrain/Loss": 1.9454736709594727, "Pretrain/Loss (Raw)": 2.007215738296509, "Pretrain/Step": 8845, "Pretrain/Step Time": 8.674989901483059} +{"Pretrain/Learning Rate": 6.851642492853666e-07, "Pretrain/Loss": 1.9457041025161743, "Pretrain/Loss (Raw)": 2.07004714012146, "Pretrain/Step": 8846, "Pretrain/Step Time": 8.674044877290726} +{"Pretrain/Learning Rate": 6.831916505287555e-07, "Pretrain/Loss": 1.944846510887146, "Pretrain/Loss (Raw)": 1.9982208013534546, "Pretrain/Step": 8847, "Pretrain/Step Time": 8.671755464747548} +{"Pretrain/Learning Rate": 6.812218561010719e-07, "Pretrain/Loss": 1.9434177875518799, "Pretrain/Loss (Raw)": 1.7402770519256592, "Pretrain/Step": 8848, "Pretrain/Step Time": 8.67141443490982} +{"Pretrain/Learning Rate": 6.792548662294785e-07, "Pretrain/Loss": 1.94390070438385, "Pretrain/Loss (Raw)": 1.9561737775802612, "Pretrain/Step": 8849, "Pretrain/Step Time": 8.667165925726295} +{"Pretrain/Learning Rate": 6.772906811408159e-07, "Pretrain/Loss": 1.9449173212051392, "Pretrain/Loss (Raw)": 1.9810912609100342, "Pretrain/Step": 8850, "Pretrain/Step Time": 8.667535584419966} +{"Pretrain/Learning Rate": 6.75329301061603e-07, "Pretrain/Loss": 1.9467658996582031, "Pretrain/Loss (Raw)": 2.2111799716949463, "Pretrain/Step": 8851, "Pretrain/Step Time": 8.671373164281249} +{"Pretrain/Learning Rate": 6.733707262180394e-07, "Pretrain/Loss": 1.9483888149261475, "Pretrain/Loss (Raw)": 2.096520185470581, "Pretrain/Step": 8852, "Pretrain/Step Time": 8.675172293558717} +{"Pretrain/Learning Rate": 6.714149568359945e-07, "Pretrain/Loss": 1.9467805624008179, "Pretrain/Loss (Raw)": 1.7873398065567017, "Pretrain/Step": 8853, "Pretrain/Step Time": 8.677345996722579} +{"Pretrain/Learning Rate": 6.694619931410156e-07, "Pretrain/Loss": 1.9470709562301636, "Pretrain/Loss (Raw)": 2.1083340644836426, "Pretrain/Step": 8854, "Pretrain/Step Time": 8.668381612747908} +{"Pretrain/Learning Rate": 6.675118353583254e-07, "Pretrain/Loss": 1.946089506149292, "Pretrain/Loss (Raw)": 1.6693601608276367, "Pretrain/Step": 8855, "Pretrain/Step Time": 8.667416486889124} +{"Pretrain/Learning Rate": 6.655644837128328e-07, "Pretrain/Loss": 1.9446916580200195, "Pretrain/Loss (Raw)": 1.8180726766586304, "Pretrain/Step": 8856, "Pretrain/Step Time": 8.659574491903186} +{"Pretrain/Learning Rate": 6.636199384291137e-07, "Pretrain/Loss": 1.9441214799880981, "Pretrain/Loss (Raw)": 2.0285489559173584, "Pretrain/Step": 8857, "Pretrain/Step Time": 8.657251564785838} +{"Pretrain/Learning Rate": 6.616781997314164e-07, "Pretrain/Loss": 1.9473037719726562, "Pretrain/Loss (Raw)": 2.0163381099700928, "Pretrain/Step": 8858, "Pretrain/Step Time": 8.663314944133162} +{"Pretrain/Learning Rate": 6.597392678436731e-07, "Pretrain/Loss": 1.944272518157959, "Pretrain/Loss (Raw)": 1.599005103111267, "Pretrain/Step": 8859, "Pretrain/Step Time": 8.665939249098301} +{"Pretrain/Learning Rate": 6.578031429894993e-07, "Pretrain/Loss": 1.9464428424835205, "Pretrain/Loss (Raw)": 2.0917487144470215, "Pretrain/Step": 8860, "Pretrain/Step Time": 8.666141260415316} +{"Pretrain/Learning Rate": 6.558698253921664e-07, "Pretrain/Loss": 1.9456948041915894, "Pretrain/Loss (Raw)": 1.5105652809143066, "Pretrain/Step": 8861, "Pretrain/Step Time": 8.663329431787133} +{"Pretrain/Learning Rate": 6.539393152746404e-07, "Pretrain/Loss": 1.9447872638702393, "Pretrain/Loss (Raw)": 1.7571274042129517, "Pretrain/Step": 8862, "Pretrain/Step Time": 8.662901908159256} +{"Pretrain/Learning Rate": 6.520116128595516e-07, "Pretrain/Loss": 1.9465694427490234, "Pretrain/Loss (Raw)": 2.115358591079712, "Pretrain/Step": 8863, "Pretrain/Step Time": 8.665167111903429} +{"Pretrain/Learning Rate": 6.500867183692195e-07, "Pretrain/Loss": 1.94480562210083, "Pretrain/Loss (Raw)": 1.7200645208358765, "Pretrain/Step": 8864, "Pretrain/Step Time": 8.659524697810411} +{"Pretrain/Learning Rate": 6.481646320256246e-07, "Pretrain/Loss": 1.9426275491714478, "Pretrain/Loss (Raw)": 1.8535112142562866, "Pretrain/Step": 8865, "Pretrain/Step Time": 8.661428168416023} +{"Pretrain/Learning Rate": 6.462453540504343e-07, "Pretrain/Loss": 1.943526268005371, "Pretrain/Loss (Raw)": 2.038529872894287, "Pretrain/Step": 8866, "Pretrain/Step Time": 8.6606505792588} +{"Pretrain/Learning Rate": 6.443288846649881e-07, "Pretrain/Loss": 1.9446816444396973, "Pretrain/Loss (Raw)": 1.9769688844680786, "Pretrain/Step": 8867, "Pretrain/Step Time": 8.661797000095248} +{"Pretrain/Learning Rate": 6.424152240903065e-07, "Pretrain/Loss": 1.9448988437652588, "Pretrain/Loss (Raw)": 2.1158013343811035, "Pretrain/Step": 8868, "Pretrain/Step Time": 8.662195704877377} +{"Pretrain/Learning Rate": 6.405043725470738e-07, "Pretrain/Loss": 1.943824052810669, "Pretrain/Loss (Raw)": 1.9617736339569092, "Pretrain/Step": 8869, "Pretrain/Step Time": 8.663773966953158} +{"Pretrain/Learning Rate": 6.385963302556641e-07, "Pretrain/Loss": 1.9435386657714844, "Pretrain/Loss (Raw)": 1.9695638418197632, "Pretrain/Step": 8870, "Pretrain/Step Time": 8.658192124217749} +{"Pretrain/Learning Rate": 6.366910974361206e-07, "Pretrain/Loss": 1.9449433088302612, "Pretrain/Loss (Raw)": 2.0934994220733643, "Pretrain/Step": 8871, "Pretrain/Step Time": 8.653602067381144} +{"Pretrain/Learning Rate": 6.347886743081649e-07, "Pretrain/Loss": 1.945660948753357, "Pretrain/Loss (Raw)": 2.175414800643921, "Pretrain/Step": 8872, "Pretrain/Step Time": 8.655999476090074} +{"Pretrain/Learning Rate": 6.328890610911881e-07, "Pretrain/Loss": 1.9445297718048096, "Pretrain/Loss (Raw)": 1.7611863613128662, "Pretrain/Step": 8873, "Pretrain/Step Time": 8.658766459673643} +{"Pretrain/Learning Rate": 6.309922580042676e-07, "Pretrain/Loss": 1.9466066360473633, "Pretrain/Loss (Raw)": 2.1220717430114746, "Pretrain/Step": 8874, "Pretrain/Step Time": 8.664767013862729} +{"Pretrain/Learning Rate": 6.290982652661509e-07, "Pretrain/Loss": 1.9463090896606445, "Pretrain/Loss (Raw)": 1.9139764308929443, "Pretrain/Step": 8875, "Pretrain/Step Time": 8.664313647896051} +{"Pretrain/Learning Rate": 6.272070830952631e-07, "Pretrain/Loss": 1.948935866355896, "Pretrain/Loss (Raw)": 2.0609793663024902, "Pretrain/Step": 8876, "Pretrain/Step Time": 8.663405872881413} +{"Pretrain/Learning Rate": 6.253187117096992e-07, "Pretrain/Loss": 1.9496058225631714, "Pretrain/Loss (Raw)": 1.9084855318069458, "Pretrain/Step": 8877, "Pretrain/Step Time": 8.661891367286444} +{"Pretrain/Learning Rate": 6.234331513272435e-07, "Pretrain/Loss": 1.9493191242218018, "Pretrain/Loss (Raw)": 1.9742674827575684, "Pretrain/Step": 8878, "Pretrain/Step Time": 8.664422687143087} +{"Pretrain/Learning Rate": 6.215504021653412e-07, "Pretrain/Loss": 1.948900818824768, "Pretrain/Loss (Raw)": 1.9229830503463745, "Pretrain/Step": 8879, "Pretrain/Step Time": 8.663369016721845} +{"Pretrain/Learning Rate": 6.196704644411189e-07, "Pretrain/Loss": 1.947981834411621, "Pretrain/Loss (Raw)": 1.9656683206558228, "Pretrain/Step": 8880, "Pretrain/Step Time": 8.662737276405096} +{"Pretrain/Learning Rate": 6.177933383713835e-07, "Pretrain/Loss": 1.950589895248413, "Pretrain/Loss (Raw)": 1.975990653038025, "Pretrain/Step": 8881, "Pretrain/Step Time": 8.660556934773922} +{"Pretrain/Learning Rate": 6.159190241726148e-07, "Pretrain/Loss": 1.9480507373809814, "Pretrain/Loss (Raw)": 1.712782621383667, "Pretrain/Step": 8882, "Pretrain/Step Time": 8.660298550501466} +{"Pretrain/Learning Rate": 6.140475220609676e-07, "Pretrain/Loss": 1.946916103363037, "Pretrain/Loss (Raw)": 1.8260273933410645, "Pretrain/Step": 8883, "Pretrain/Step Time": 8.658639699220657} +{"Pretrain/Learning Rate": 6.121788322522637e-07, "Pretrain/Loss": 1.9423835277557373, "Pretrain/Loss (Raw)": 1.6867996454238892, "Pretrain/Step": 8884, "Pretrain/Step Time": 8.666046755388379} +{"Pretrain/Learning Rate": 6.103129549620223e-07, "Pretrain/Loss": 1.9401404857635498, "Pretrain/Loss (Raw)": 1.6831777095794678, "Pretrain/Step": 8885, "Pretrain/Step Time": 8.665570609271526} +{"Pretrain/Learning Rate": 6.084498904054187e-07, "Pretrain/Loss": 1.9386006593704224, "Pretrain/Loss (Raw)": 1.9584840536117554, "Pretrain/Step": 8886, "Pretrain/Step Time": 8.659906629472971} +{"Pretrain/Learning Rate": 6.065896387973086e-07, "Pretrain/Loss": 1.9385831356048584, "Pretrain/Loss (Raw)": 2.0085084438323975, "Pretrain/Step": 8887, "Pretrain/Step Time": 8.653571974486113} +{"Pretrain/Learning Rate": 6.04732200352226e-07, "Pretrain/Loss": 1.939421534538269, "Pretrain/Loss (Raw)": 2.200004816055298, "Pretrain/Step": 8888, "Pretrain/Step Time": 8.651753166690469} +{"Pretrain/Learning Rate": 6.028775752843801e-07, "Pretrain/Loss": 1.9365302324295044, "Pretrain/Loss (Raw)": 1.6652752161026, "Pretrain/Step": 8889, "Pretrain/Step Time": 8.652703138068318} +{"Pretrain/Learning Rate": 6.010257638076583e-07, "Pretrain/Loss": 1.936476230621338, "Pretrain/Loss (Raw)": 2.0721092224121094, "Pretrain/Step": 8890, "Pretrain/Step Time": 8.654028186574578} +{"Pretrain/Learning Rate": 5.991767661356145e-07, "Pretrain/Loss": 1.9372962713241577, "Pretrain/Loss (Raw)": 2.1036739349365234, "Pretrain/Step": 8891, "Pretrain/Step Time": 8.656073672696948} +{"Pretrain/Learning Rate": 5.973305824814867e-07, "Pretrain/Loss": 1.9376250505447388, "Pretrain/Loss (Raw)": 2.0811305046081543, "Pretrain/Step": 8892, "Pretrain/Step Time": 8.65755731612444} +{"Pretrain/Learning Rate": 5.954872130581851e-07, "Pretrain/Loss": 1.9403787851333618, "Pretrain/Loss (Raw)": 2.0072977542877197, "Pretrain/Step": 8893, "Pretrain/Step Time": 8.657581822946668} +{"Pretrain/Learning Rate": 5.936466580782979e-07, "Pretrain/Loss": 1.940952181816101, "Pretrain/Loss (Raw)": 1.8540256023406982, "Pretrain/Step": 8894, "Pretrain/Step Time": 8.654628533869982} +{"Pretrain/Learning Rate": 5.918089177540858e-07, "Pretrain/Loss": 1.942850947380066, "Pretrain/Loss (Raw)": 2.034557819366455, "Pretrain/Step": 8895, "Pretrain/Step Time": 8.654425885528326} +{"Pretrain/Learning Rate": 5.899739922974795e-07, "Pretrain/Loss": 1.9436063766479492, "Pretrain/Loss (Raw)": 2.1554558277130127, "Pretrain/Step": 8896, "Pretrain/Step Time": 8.65591823682189} +{"Pretrain/Learning Rate": 5.881418819200985e-07, "Pretrain/Loss": 1.9437041282653809, "Pretrain/Loss (Raw)": 1.9995728731155396, "Pretrain/Step": 8897, "Pretrain/Step Time": 8.661713767796755} +{"Pretrain/Learning Rate": 5.863125868332292e-07, "Pretrain/Loss": 1.9435142278671265, "Pretrain/Loss (Raw)": 1.8980293273925781, "Pretrain/Step": 8898, "Pretrain/Step Time": 8.662382861599326} +{"Pretrain/Learning Rate": 5.844861072478336e-07, "Pretrain/Loss": 1.9441003799438477, "Pretrain/Loss (Raw)": 1.8970263004302979, "Pretrain/Step": 8899, "Pretrain/Step Time": 8.660261558368802} +{"Pretrain/Learning Rate": 5.826624433745486e-07, "Pretrain/Loss": 1.9462634325027466, "Pretrain/Loss (Raw)": 2.1024365425109863, "Pretrain/Step": 8900, "Pretrain/Step Time": 8.660429103299975} +{"Pretrain/Learning Rate": 5.808415954236924e-07, "Pretrain/Loss": 1.9472966194152832, "Pretrain/Loss (Raw)": 2.035412311553955, "Pretrain/Step": 8901, "Pretrain/Step Time": 8.658334970474243} +{"Pretrain/Learning Rate": 5.790235636052438e-07, "Pretrain/Loss": 1.9470245838165283, "Pretrain/Loss (Raw)": 1.943682074546814, "Pretrain/Step": 8902, "Pretrain/Step Time": 8.653599144890904} +{"Pretrain/Learning Rate": 5.772083481288771e-07, "Pretrain/Loss": 1.9478968381881714, "Pretrain/Loss (Raw)": 2.1308040618896484, "Pretrain/Step": 8903, "Pretrain/Step Time": 8.654826318845153} +{"Pretrain/Learning Rate": 5.753959492039246e-07, "Pretrain/Loss": 1.9452471733093262, "Pretrain/Loss (Raw)": 1.7695512771606445, "Pretrain/Step": 8904, "Pretrain/Step Time": 8.65769524872303} +{"Pretrain/Learning Rate": 5.73586367039411e-07, "Pretrain/Loss": 1.945624828338623, "Pretrain/Loss (Raw)": 2.022918462753296, "Pretrain/Step": 8905, "Pretrain/Step Time": 8.659877797588706} +{"Pretrain/Learning Rate": 5.717796018440108e-07, "Pretrain/Loss": 1.9466443061828613, "Pretrain/Loss (Raw)": 1.95013427734375, "Pretrain/Step": 8906, "Pretrain/Step Time": 8.662327706813812} +{"Pretrain/Learning Rate": 5.69975653826102e-07, "Pretrain/Loss": 1.9488338232040405, "Pretrain/Loss (Raw)": 2.039278984069824, "Pretrain/Step": 8907, "Pretrain/Step Time": 8.657584266737103} +{"Pretrain/Learning Rate": 5.681745231937124e-07, "Pretrain/Loss": 1.9498932361602783, "Pretrain/Loss (Raw)": 2.131479024887085, "Pretrain/Step": 8908, "Pretrain/Step Time": 8.656771443784237} +{"Pretrain/Learning Rate": 5.663762101545706e-07, "Pretrain/Loss": 1.9494831562042236, "Pretrain/Loss (Raw)": 1.8987751007080078, "Pretrain/Step": 8909, "Pretrain/Step Time": 8.657876949757338} +{"Pretrain/Learning Rate": 5.645807149160548e-07, "Pretrain/Loss": 1.9505560398101807, "Pretrain/Loss (Raw)": 1.9831384420394897, "Pretrain/Step": 8910, "Pretrain/Step Time": 8.656761314719915} +{"Pretrain/Learning Rate": 5.627880376852357e-07, "Pretrain/Loss": 1.9502027034759521, "Pretrain/Loss (Raw)": 2.07966685295105, "Pretrain/Step": 8911, "Pretrain/Step Time": 8.65849032625556} +{"Pretrain/Learning Rate": 5.609981786688534e-07, "Pretrain/Loss": 1.9498584270477295, "Pretrain/Loss (Raw)": 1.8677090406417847, "Pretrain/Step": 8912, "Pretrain/Step Time": 8.661151137202978} +{"Pretrain/Learning Rate": 5.592111380733206e-07, "Pretrain/Loss": 1.9470776319503784, "Pretrain/Loss (Raw)": 1.6057345867156982, "Pretrain/Step": 8913, "Pretrain/Step Time": 8.664025152102113} +{"Pretrain/Learning Rate": 5.574269161047252e-07, "Pretrain/Loss": 1.949008822441101, "Pretrain/Loss (Raw)": 2.063173294067383, "Pretrain/Step": 8914, "Pretrain/Step Time": 8.666615031659603} +{"Pretrain/Learning Rate": 5.556455129688387e-07, "Pretrain/Loss": 1.9480855464935303, "Pretrain/Loss (Raw)": 1.9362980127334595, "Pretrain/Step": 8915, "Pretrain/Step Time": 8.668201951310039} +{"Pretrain/Learning Rate": 5.538669288710968e-07, "Pretrain/Loss": 1.9482269287109375, "Pretrain/Loss (Raw)": 1.9411898851394653, "Pretrain/Step": 8916, "Pretrain/Step Time": 8.663824580609798} +{"Pretrain/Learning Rate": 5.520911640166132e-07, "Pretrain/Loss": 1.9475581645965576, "Pretrain/Loss (Raw)": 1.8313212394714355, "Pretrain/Step": 8917, "Pretrain/Step Time": 8.671248750761151} +{"Pretrain/Learning Rate": 5.503182186101796e-07, "Pretrain/Loss": 1.9423270225524902, "Pretrain/Loss (Raw)": 1.5154513120651245, "Pretrain/Step": 8918, "Pretrain/Step Time": 8.66812583245337} +{"Pretrain/Learning Rate": 5.485480928562603e-07, "Pretrain/Loss": 1.9442341327667236, "Pretrain/Loss (Raw)": 2.2801918983459473, "Pretrain/Step": 8919, "Pretrain/Step Time": 8.675230653956532} +{"Pretrain/Learning Rate": 5.467807869589919e-07, "Pretrain/Loss": 1.9441004991531372, "Pretrain/Loss (Raw)": 1.9544177055358887, "Pretrain/Step": 8920, "Pretrain/Step Time": 8.673209903761744} +{"Pretrain/Learning Rate": 5.45016301122192e-07, "Pretrain/Loss": 1.9446868896484375, "Pretrain/Loss (Raw)": 1.9698234796524048, "Pretrain/Step": 8921, "Pretrain/Step Time": 8.677111681550741} +{"Pretrain/Learning Rate": 5.432546355493479e-07, "Pretrain/Loss": 1.9439653158187866, "Pretrain/Loss (Raw)": 1.9082366228103638, "Pretrain/Step": 8922, "Pretrain/Step Time": 8.673923410475254} +{"Pretrain/Learning Rate": 5.414957904436219e-07, "Pretrain/Loss": 1.9433050155639648, "Pretrain/Loss (Raw)": 2.0205447673797607, "Pretrain/Step": 8923, "Pretrain/Step Time": 8.674499675631523} +{"Pretrain/Learning Rate": 5.397397660078573e-07, "Pretrain/Loss": 1.9405784606933594, "Pretrain/Loss (Raw)": 1.6371917724609375, "Pretrain/Step": 8924, "Pretrain/Step Time": 8.673173010349274} +{"Pretrain/Learning Rate": 5.37986562444559e-07, "Pretrain/Loss": 1.9397921562194824, "Pretrain/Loss (Raw)": 2.0609827041625977, "Pretrain/Step": 8925, "Pretrain/Step Time": 8.677546430379152} +{"Pretrain/Learning Rate": 5.362361799559207e-07, "Pretrain/Loss": 1.9371984004974365, "Pretrain/Loss (Raw)": 1.692206859588623, "Pretrain/Step": 8926, "Pretrain/Step Time": 8.674190817400813} +{"Pretrain/Learning Rate": 5.344886187438031e-07, "Pretrain/Loss": 1.9354612827301025, "Pretrain/Loss (Raw)": 1.7368428707122803, "Pretrain/Step": 8927, "Pretrain/Step Time": 8.67889915779233} +{"Pretrain/Learning Rate": 5.327438790097449e-07, "Pretrain/Loss": 1.9350719451904297, "Pretrain/Loss (Raw)": 1.9053484201431274, "Pretrain/Step": 8928, "Pretrain/Step Time": 8.682155691087246} +{"Pretrain/Learning Rate": 5.310019609549521e-07, "Pretrain/Loss": 1.9359335899353027, "Pretrain/Loss (Raw)": 2.1249828338623047, "Pretrain/Step": 8929, "Pretrain/Step Time": 8.6847885530442} +{"Pretrain/Learning Rate": 5.292628647803194e-07, "Pretrain/Loss": 1.936338186264038, "Pretrain/Loss (Raw)": 1.9508036375045776, "Pretrain/Step": 8930, "Pretrain/Step Time": 8.679305294528604} +{"Pretrain/Learning Rate": 5.27526590686403e-07, "Pretrain/Loss": 1.9375965595245361, "Pretrain/Loss (Raw)": 2.0221235752105713, "Pretrain/Step": 8931, "Pretrain/Step Time": 8.680278912186623} +{"Pretrain/Learning Rate": 5.257931388734344e-07, "Pretrain/Loss": 1.9375005960464478, "Pretrain/Loss (Raw)": 2.0647714138031006, "Pretrain/Step": 8932, "Pretrain/Step Time": 8.676911886781454} +{"Pretrain/Learning Rate": 5.240625095413287e-07, "Pretrain/Loss": 1.9372992515563965, "Pretrain/Loss (Raw)": 1.954635739326477, "Pretrain/Step": 8933, "Pretrain/Step Time": 8.678374502807856} +{"Pretrain/Learning Rate": 5.223347028896708e-07, "Pretrain/Loss": 1.9402046203613281, "Pretrain/Loss (Raw)": 2.215102195739746, "Pretrain/Step": 8934, "Pretrain/Step Time": 8.676081765443087} +{"Pretrain/Learning Rate": 5.206097191177151e-07, "Pretrain/Loss": 1.9412740468978882, "Pretrain/Loss (Raw)": 1.9694331884384155, "Pretrain/Step": 8935, "Pretrain/Step Time": 8.67322612926364} +{"Pretrain/Learning Rate": 5.188875584243996e-07, "Pretrain/Loss": 1.943314552307129, "Pretrain/Loss (Raw)": 2.1073546409606934, "Pretrain/Step": 8936, "Pretrain/Step Time": 8.676837142556906} +{"Pretrain/Learning Rate": 5.171682210083268e-07, "Pretrain/Loss": 1.9469504356384277, "Pretrain/Loss (Raw)": 2.3605058193206787, "Pretrain/Step": 8937, "Pretrain/Step Time": 8.675021639093757} +{"Pretrain/Learning Rate": 5.15451707067785e-07, "Pretrain/Loss": 1.9483110904693604, "Pretrain/Loss (Raw)": 2.0997066497802734, "Pretrain/Step": 8938, "Pretrain/Step Time": 8.674833629280329} +{"Pretrain/Learning Rate": 5.137380168007244e-07, "Pretrain/Loss": 1.9470793008804321, "Pretrain/Loss (Raw)": 1.8434109687805176, "Pretrain/Step": 8939, "Pretrain/Step Time": 8.67269722558558} +{"Pretrain/Learning Rate": 5.120271504047813e-07, "Pretrain/Loss": 1.9452919960021973, "Pretrain/Loss (Raw)": 1.9533302783966064, "Pretrain/Step": 8940, "Pretrain/Step Time": 8.672115365043283} +{"Pretrain/Learning Rate": 5.103191080772535e-07, "Pretrain/Loss": 1.9458777904510498, "Pretrain/Loss (Raw)": 1.9057233333587646, "Pretrain/Step": 8941, "Pretrain/Step Time": 8.665564253926277} +{"Pretrain/Learning Rate": 5.086138900151333e-07, "Pretrain/Loss": 1.9444880485534668, "Pretrain/Loss (Raw)": 1.7953460216522217, "Pretrain/Step": 8942, "Pretrain/Step Time": 8.663640627637506} +{"Pretrain/Learning Rate": 5.069114964150606e-07, "Pretrain/Loss": 1.9430354833602905, "Pretrain/Loss (Raw)": 1.8969111442565918, "Pretrain/Step": 8943, "Pretrain/Step Time": 8.662941461429} +{"Pretrain/Learning Rate": 5.052119274733702e-07, "Pretrain/Loss": 1.944077968597412, "Pretrain/Loss (Raw)": 2.0141682624816895, "Pretrain/Step": 8944, "Pretrain/Step Time": 8.666832340881228} +{"Pretrain/Learning Rate": 5.035151833860635e-07, "Pretrain/Loss": 1.9468228816986084, "Pretrain/Loss (Raw)": 2.0306556224823, "Pretrain/Step": 8945, "Pretrain/Step Time": 8.66668226197362} +{"Pretrain/Learning Rate": 5.018212643488202e-07, "Pretrain/Loss": 1.9469523429870605, "Pretrain/Loss (Raw)": 2.13527774810791, "Pretrain/Step": 8946, "Pretrain/Step Time": 8.669303795322776} +{"Pretrain/Learning Rate": 5.001301705569838e-07, "Pretrain/Loss": 1.9473320245742798, "Pretrain/Loss (Raw)": 1.8998297452926636, "Pretrain/Step": 8947, "Pretrain/Step Time": 8.670322682708502} +{"Pretrain/Learning Rate": 4.984419022055848e-07, "Pretrain/Loss": 1.9460505247116089, "Pretrain/Loss (Raw)": 1.8072214126586914, "Pretrain/Step": 8948, "Pretrain/Step Time": 8.668587073683739} +{"Pretrain/Learning Rate": 4.967564594893198e-07, "Pretrain/Loss": 1.9453449249267578, "Pretrain/Loss (Raw)": 1.9455465078353882, "Pretrain/Step": 8949, "Pretrain/Step Time": 8.667651092633605} +{"Pretrain/Learning Rate": 4.95073842602567e-07, "Pretrain/Loss": 1.9448649883270264, "Pretrain/Loss (Raw)": 1.9228709936141968, "Pretrain/Step": 8950, "Pretrain/Step Time": 8.671035796403885} +{"Pretrain/Learning Rate": 4.933940517393626e-07, "Pretrain/Loss": 1.9451565742492676, "Pretrain/Loss (Raw)": 1.9605015516281128, "Pretrain/Step": 8951, "Pretrain/Step Time": 8.66896728053689} +{"Pretrain/Learning Rate": 4.917170870934407e-07, "Pretrain/Loss": 1.944946527481079, "Pretrain/Loss (Raw)": 1.7366780042648315, "Pretrain/Step": 8952, "Pretrain/Step Time": 8.677166394889355} +{"Pretrain/Learning Rate": 4.900429488581909e-07, "Pretrain/Loss": 1.946617841720581, "Pretrain/Loss (Raw)": 1.9059666395187378, "Pretrain/Step": 8953, "Pretrain/Step Time": 8.67455230653286} +{"Pretrain/Learning Rate": 4.883716372266811e-07, "Pretrain/Loss": 1.9466392993927002, "Pretrain/Loss (Raw)": 1.775967001914978, "Pretrain/Step": 8954, "Pretrain/Step Time": 8.672255329787731} +{"Pretrain/Learning Rate": 4.867031523916571e-07, "Pretrain/Loss": 1.9468555450439453, "Pretrain/Loss (Raw)": 1.9862210750579834, "Pretrain/Step": 8955, "Pretrain/Step Time": 8.666366782039404} +{"Pretrain/Learning Rate": 4.850374945455344e-07, "Pretrain/Loss": 1.9478509426116943, "Pretrain/Loss (Raw)": 2.1302716732025146, "Pretrain/Step": 8956, "Pretrain/Step Time": 8.66189681366086} +{"Pretrain/Learning Rate": 4.833746638804093e-07, "Pretrain/Loss": 1.945961833000183, "Pretrain/Loss (Raw)": 1.7779935598373413, "Pretrain/Step": 8957, "Pretrain/Step Time": 8.664106480777264} +{"Pretrain/Learning Rate": 4.817146605880424e-07, "Pretrain/Loss": 1.945336103439331, "Pretrain/Loss (Raw)": 1.9798462390899658, "Pretrain/Step": 8958, "Pretrain/Step Time": 8.665495127439499} +{"Pretrain/Learning Rate": 4.800574848598749e-07, "Pretrain/Loss": 1.9459309577941895, "Pretrain/Loss (Raw)": 1.8979688882827759, "Pretrain/Step": 8959, "Pretrain/Step Time": 8.663772564381361} +{"Pretrain/Learning Rate": 4.784031368870206e-07, "Pretrain/Loss": 1.945496916770935, "Pretrain/Loss (Raw)": 1.8987724781036377, "Pretrain/Step": 8960, "Pretrain/Step Time": 8.660877699032426} +{"Pretrain/Learning Rate": 4.7675161686026595e-07, "Pretrain/Loss": 1.9456629753112793, "Pretrain/Loss (Raw)": 2.079993963241577, "Pretrain/Step": 8961, "Pretrain/Step Time": 8.659896476194263} +{"Pretrain/Learning Rate": 4.751029249700695e-07, "Pretrain/Loss": 1.9464131593704224, "Pretrain/Loss (Raw)": 2.1150848865509033, "Pretrain/Step": 8962, "Pretrain/Step Time": 8.66289472207427} +{"Pretrain/Learning Rate": 4.734570614065709e-07, "Pretrain/Loss": 1.9445061683654785, "Pretrain/Loss (Raw)": 1.8634041547775269, "Pretrain/Step": 8963, "Pretrain/Step Time": 8.659057242795825} +{"Pretrain/Learning Rate": 4.718140263595794e-07, "Pretrain/Loss": 1.9494664669036865, "Pretrain/Loss (Raw)": 2.1777589321136475, "Pretrain/Step": 8964, "Pretrain/Step Time": 8.65597665682435} +{"Pretrain/Learning Rate": 4.701738200185712e-07, "Pretrain/Loss": 1.9497345685958862, "Pretrain/Loss (Raw)": 2.074171781539917, "Pretrain/Step": 8965, "Pretrain/Step Time": 8.651013556867838} +{"Pretrain/Learning Rate": 4.6853644257270624e-07, "Pretrain/Loss": 1.9497957229614258, "Pretrain/Loss (Raw)": 1.9190855026245117, "Pretrain/Step": 8966, "Pretrain/Step Time": 8.650814656168222} +{"Pretrain/Learning Rate": 4.6690189421081943e-07, "Pretrain/Loss": 1.9485116004943848, "Pretrain/Loss (Raw)": 1.8357197046279907, "Pretrain/Step": 8967, "Pretrain/Step Time": 8.649966645985842} +{"Pretrain/Learning Rate": 4.6527017512140723e-07, "Pretrain/Loss": 1.9459106922149658, "Pretrain/Loss (Raw)": 1.652524709701538, "Pretrain/Step": 8968, "Pretrain/Step Time": 8.65430723130703} +{"Pretrain/Learning Rate": 4.6364128549264976e-07, "Pretrain/Loss": 1.9491006135940552, "Pretrain/Loss (Raw)": 1.9767425060272217, "Pretrain/Step": 8969, "Pretrain/Step Time": 8.652536571025848} +{"Pretrain/Learning Rate": 4.6201522551239664e-07, "Pretrain/Loss": 1.9476374387741089, "Pretrain/Loss (Raw)": 1.5881766080856323, "Pretrain/Step": 8970, "Pretrain/Step Time": 8.653447875753045} +{"Pretrain/Learning Rate": 4.603919953681757e-07, "Pretrain/Loss": 1.9476772546768188, "Pretrain/Loss (Raw)": 1.8726587295532227, "Pretrain/Step": 8971, "Pretrain/Step Time": 8.64505710825324} +{"Pretrain/Learning Rate": 4.587715952471872e-07, "Pretrain/Loss": 1.9463952779769897, "Pretrain/Loss (Raw)": 1.9822345972061157, "Pretrain/Step": 8972, "Pretrain/Step Time": 8.648045651614666} +{"Pretrain/Learning Rate": 4.5715402533629826e-07, "Pretrain/Loss": 1.9486756324768066, "Pretrain/Loss (Raw)": 2.299093008041382, "Pretrain/Step": 8973, "Pretrain/Step Time": 8.652425318956375} +{"Pretrain/Learning Rate": 4.5553928582205417e-07, "Pretrain/Loss": 1.9471718072891235, "Pretrain/Loss (Raw)": 1.8775614500045776, "Pretrain/Step": 8974, "Pretrain/Step Time": 8.650608712807298} +{"Pretrain/Learning Rate": 4.539273768906782e-07, "Pretrain/Loss": 1.9463937282562256, "Pretrain/Loss (Raw)": 1.8986268043518066, "Pretrain/Step": 8975, "Pretrain/Step Time": 8.652886509895325} +{"Pretrain/Learning Rate": 4.523182987280633e-07, "Pretrain/Loss": 1.9463584423065186, "Pretrain/Loss (Raw)": 1.7357693910598755, "Pretrain/Step": 8976, "Pretrain/Step Time": 8.653447778895497} +{"Pretrain/Learning Rate": 4.507120515197749e-07, "Pretrain/Loss": 1.9427683353424072, "Pretrain/Loss (Raw)": 1.4966193437576294, "Pretrain/Step": 8977, "Pretrain/Step Time": 8.654131142422557} +{"Pretrain/Learning Rate": 4.49108635451051e-07, "Pretrain/Loss": 1.944411039352417, "Pretrain/Loss (Raw)": 2.191368579864502, "Pretrain/Step": 8978, "Pretrain/Step Time": 8.656609220430255} +{"Pretrain/Learning Rate": 4.475080507068102e-07, "Pretrain/Loss": 1.9437320232391357, "Pretrain/Loss (Raw)": 2.124255418777466, "Pretrain/Step": 8979, "Pretrain/Step Time": 8.65790369361639} +{"Pretrain/Learning Rate": 4.4591029747163283e-07, "Pretrain/Loss": 1.9424428939819336, "Pretrain/Loss (Raw)": 1.9315166473388672, "Pretrain/Step": 8980, "Pretrain/Step Time": 8.654389584437013} +{"Pretrain/Learning Rate": 4.443153759297852e-07, "Pretrain/Loss": 1.9440555572509766, "Pretrain/Loss (Raw)": 1.9937783479690552, "Pretrain/Step": 8981, "Pretrain/Step Time": 8.654727371409535} +{"Pretrain/Learning Rate": 4.427232862651953e-07, "Pretrain/Loss": 1.943402647972107, "Pretrain/Loss (Raw)": 2.0247559547424316, "Pretrain/Step": 8982, "Pretrain/Step Time": 8.657254992052913} +{"Pretrain/Learning Rate": 4.4113402866147734e-07, "Pretrain/Loss": 1.9454419612884521, "Pretrain/Loss (Raw)": 1.9303957223892212, "Pretrain/Step": 8983, "Pretrain/Step Time": 8.661392388865352} +{"Pretrain/Learning Rate": 4.395476033019069e-07, "Pretrain/Loss": 1.9479767084121704, "Pretrain/Loss (Raw)": 2.1425070762634277, "Pretrain/Step": 8984, "Pretrain/Step Time": 8.665124401450157} +{"Pretrain/Learning Rate": 4.3796401036944043e-07, "Pretrain/Loss": 1.94734787940979, "Pretrain/Loss (Raw)": 1.9480664730072021, "Pretrain/Step": 8985, "Pretrain/Step Time": 8.664415394887328} +{"Pretrain/Learning Rate": 4.3638325004670135e-07, "Pretrain/Loss": 1.948447585105896, "Pretrain/Loss (Raw)": 2.157099962234497, "Pretrain/Step": 8986, "Pretrain/Step Time": 8.659788681194186} +{"Pretrain/Learning Rate": 4.3480532251599647e-07, "Pretrain/Loss": 1.9511384963989258, "Pretrain/Loss (Raw)": 1.943433403968811, "Pretrain/Step": 8987, "Pretrain/Step Time": 8.65715529769659} +{"Pretrain/Learning Rate": 4.3323022795929425e-07, "Pretrain/Loss": 1.9507536888122559, "Pretrain/Loss (Raw)": 2.0425100326538086, "Pretrain/Step": 8988, "Pretrain/Step Time": 8.656087769195437} +{"Pretrain/Learning Rate": 4.316579665582465e-07, "Pretrain/Loss": 1.9544545412063599, "Pretrain/Loss (Raw)": 1.9842545986175537, "Pretrain/Step": 8989, "Pretrain/Step Time": 8.65772831439972} +{"Pretrain/Learning Rate": 4.300885384941694e-07, "Pretrain/Loss": 1.955318570137024, "Pretrain/Loss (Raw)": 1.8677270412445068, "Pretrain/Step": 8990, "Pretrain/Step Time": 8.657058231532574} +{"Pretrain/Learning Rate": 4.285219439480653e-07, "Pretrain/Loss": 1.9541029930114746, "Pretrain/Loss (Raw)": 1.9597653150558472, "Pretrain/Step": 8991, "Pretrain/Step Time": 8.658199053257704} +{"Pretrain/Learning Rate": 4.2695818310058975e-07, "Pretrain/Loss": 1.9567103385925293, "Pretrain/Loss (Raw)": 2.0538058280944824, "Pretrain/Step": 8992, "Pretrain/Step Time": 8.65715099684894} +{"Pretrain/Learning Rate": 4.253972561320901e-07, "Pretrain/Loss": 1.9585518836975098, "Pretrain/Loss (Raw)": 2.0892374515533447, "Pretrain/Step": 8993, "Pretrain/Step Time": 8.657346855849028} +{"Pretrain/Learning Rate": 4.23839163222578e-07, "Pretrain/Loss": 1.9567410945892334, "Pretrain/Loss (Raw)": 1.806754231452942, "Pretrain/Step": 8994, "Pretrain/Step Time": 8.661456398665905} +{"Pretrain/Learning Rate": 4.222839045517402e-07, "Pretrain/Loss": 1.9563837051391602, "Pretrain/Loss (Raw)": 1.9312236309051514, "Pretrain/Step": 8995, "Pretrain/Step Time": 8.661956259980798} +{"Pretrain/Learning Rate": 4.2073148029893593e-07, "Pretrain/Loss": 1.9567420482635498, "Pretrain/Loss (Raw)": 2.1616621017456055, "Pretrain/Step": 8996, "Pretrain/Step Time": 8.66059359535575} +{"Pretrain/Learning Rate": 4.191818906431999e-07, "Pretrain/Loss": 1.9575707912445068, "Pretrain/Loss (Raw)": 2.067854404449463, "Pretrain/Step": 8997, "Pretrain/Step Time": 8.660629592835903} +{"Pretrain/Learning Rate": 4.176351357632363e-07, "Pretrain/Loss": 1.9569250345230103, "Pretrain/Loss (Raw)": 1.8869116306304932, "Pretrain/Step": 8998, "Pretrain/Step Time": 8.66289153881371} +{"Pretrain/Learning Rate": 4.160912158374247e-07, "Pretrain/Loss": 1.9568475484848022, "Pretrain/Loss (Raw)": 2.083577871322632, "Pretrain/Step": 8999, "Pretrain/Step Time": 8.667964190244675} +{"Pretrain/Learning Rate": 4.1455013104381714e-07, "Pretrain/Loss": 1.9530075788497925, "Pretrain/Loss (Raw)": 1.6838892698287964, "Pretrain/Step": 9000, "Pretrain/Step Time": 8.668960850685835} +{"Pretrain/Learning Rate": 4.1301188156013803e-07, "Pretrain/Loss": 1.9547914266586304, "Pretrain/Loss (Raw)": 1.9895246028900146, "Pretrain/Step": 9001, "Pretrain/Step Time": 8.668181685730815} +{"Pretrain/Learning Rate": 4.1147646756378997e-07, "Pretrain/Loss": 1.9539334774017334, "Pretrain/Loss (Raw)": 2.012247085571289, "Pretrain/Step": 9002, "Pretrain/Step Time": 8.666403582319617} +{"Pretrain/Learning Rate": 4.099438892318369e-07, "Pretrain/Loss": 1.95351243019104, "Pretrain/Loss (Raw)": 1.8600993156433105, "Pretrain/Step": 9003, "Pretrain/Step Time": 8.665723592042923} +{"Pretrain/Learning Rate": 4.084141467410263e-07, "Pretrain/Loss": 1.9539833068847656, "Pretrain/Loss (Raw)": 2.121246814727783, "Pretrain/Step": 9004, "Pretrain/Step Time": 8.665296778082848} +{"Pretrain/Learning Rate": 4.0688724026777814e-07, "Pretrain/Loss": 1.9548777341842651, "Pretrain/Loss (Raw)": 2.022960662841797, "Pretrain/Step": 9005, "Pretrain/Step Time": 8.662341697141528} +{"Pretrain/Learning Rate": 4.0536316998817937e-07, "Pretrain/Loss": 1.9560359716415405, "Pretrain/Loss (Raw)": 2.1225264072418213, "Pretrain/Step": 9006, "Pretrain/Step Time": 8.665131157264113} +{"Pretrain/Learning Rate": 4.038419360779921e-07, "Pretrain/Loss": 1.9549853801727295, "Pretrain/Loss (Raw)": 1.7885016202926636, "Pretrain/Step": 9007, "Pretrain/Step Time": 8.668193735182285} +{"Pretrain/Learning Rate": 4.023235387126567e-07, "Pretrain/Loss": 1.9558730125427246, "Pretrain/Loss (Raw)": 2.079289674758911, "Pretrain/Step": 9008, "Pretrain/Step Time": 8.66949756257236} +{"Pretrain/Learning Rate": 4.008079780672774e-07, "Pretrain/Loss": 1.9566658735275269, "Pretrain/Loss (Raw)": 2.0774762630462646, "Pretrain/Step": 9009, "Pretrain/Step Time": 8.669440392404795} +{"Pretrain/Learning Rate": 3.992952543166367e-07, "Pretrain/Loss": 1.9577491283416748, "Pretrain/Loss (Raw)": 1.851453423500061, "Pretrain/Step": 9010, "Pretrain/Step Time": 8.674164604395628} +{"Pretrain/Learning Rate": 3.977853676351867e-07, "Pretrain/Loss": 1.958315372467041, "Pretrain/Loss (Raw)": 1.8985027074813843, "Pretrain/Step": 9011, "Pretrain/Step Time": 8.671245329082012} +{"Pretrain/Learning Rate": 3.9627831819706305e-07, "Pretrain/Loss": 1.961106538772583, "Pretrain/Loss (Raw)": 2.0440659523010254, "Pretrain/Step": 9012, "Pretrain/Step Time": 8.665530601516366} +{"Pretrain/Learning Rate": 3.947741061760574e-07, "Pretrain/Loss": 1.9659059047698975, "Pretrain/Loss (Raw)": 2.297494888305664, "Pretrain/Step": 9013, "Pretrain/Step Time": 8.662622336298227} +{"Pretrain/Learning Rate": 3.932727317456475e-07, "Pretrain/Loss": 1.9673470258712769, "Pretrain/Loss (Raw)": 2.1429443359375, "Pretrain/Step": 9014, "Pretrain/Step Time": 8.668196860700846} +{"Pretrain/Learning Rate": 3.9177419507897274e-07, "Pretrain/Loss": 1.9644012451171875, "Pretrain/Loss (Raw)": 1.6314620971679688, "Pretrain/Step": 9015, "Pretrain/Step Time": 8.671337010338902} +{"Pretrain/Learning Rate": 3.902784963488587e-07, "Pretrain/Loss": 1.9628722667694092, "Pretrain/Loss (Raw)": 2.004276752471924, "Pretrain/Step": 9016, "Pretrain/Step Time": 8.671456079930067} +{"Pretrain/Learning Rate": 3.887856357277925e-07, "Pretrain/Loss": 1.9650510549545288, "Pretrain/Loss (Raw)": 1.944167137145996, "Pretrain/Step": 9017, "Pretrain/Step Time": 8.6697543784976} +{"Pretrain/Learning Rate": 3.872956133879391e-07, "Pretrain/Loss": 1.9646368026733398, "Pretrain/Loss (Raw)": 2.019073963165283, "Pretrain/Step": 9018, "Pretrain/Step Time": 8.667521202936769} +{"Pretrain/Learning Rate": 3.858084295011333e-07, "Pretrain/Loss": 1.9630098342895508, "Pretrain/Loss (Raw)": 1.8954455852508545, "Pretrain/Step": 9019, "Pretrain/Step Time": 8.665995987132192} +{"Pretrain/Learning Rate": 3.843240842388879e-07, "Pretrain/Loss": 1.9570300579071045, "Pretrain/Loss (Raw)": 1.315700888633728, "Pretrain/Step": 9020, "Pretrain/Step Time": 8.664047215133905} +{"Pretrain/Learning Rate": 3.8284257777237984e-07, "Pretrain/Loss": 1.9545676708221436, "Pretrain/Loss (Raw)": 1.6921162605285645, "Pretrain/Step": 9021, "Pretrain/Step Time": 8.663811212405562} +{"Pretrain/Learning Rate": 3.8136391027246696e-07, "Pretrain/Loss": 1.9554862976074219, "Pretrain/Loss (Raw)": 1.9716157913208008, "Pretrain/Step": 9022, "Pretrain/Step Time": 8.668004535138607} +{"Pretrain/Learning Rate": 3.7988808190967116e-07, "Pretrain/Loss": 1.9548989534378052, "Pretrain/Loss (Raw)": 1.9593764543533325, "Pretrain/Step": 9023, "Pretrain/Step Time": 8.666038136929274} +{"Pretrain/Learning Rate": 3.7841509285420076e-07, "Pretrain/Loss": 1.952156901359558, "Pretrain/Loss (Raw)": 1.804461121559143, "Pretrain/Step": 9024, "Pretrain/Step Time": 8.667072504758835} +{"Pretrain/Learning Rate": 3.769449432759198e-07, "Pretrain/Loss": 1.9484293460845947, "Pretrain/Loss (Raw)": 1.5224478244781494, "Pretrain/Step": 9025, "Pretrain/Step Time": 8.665816500782967} +{"Pretrain/Learning Rate": 3.7547763334437603e-07, "Pretrain/Loss": 1.9484686851501465, "Pretrain/Loss (Raw)": 1.903065800666809, "Pretrain/Step": 9026, "Pretrain/Step Time": 8.661857046186924} +{"Pretrain/Learning Rate": 3.740131632287841e-07, "Pretrain/Loss": 1.9484138488769531, "Pretrain/Loss (Raw)": 1.890011191368103, "Pretrain/Step": 9027, "Pretrain/Step Time": 8.666797686368227} +{"Pretrain/Learning Rate": 3.725515330980395e-07, "Pretrain/Loss": 1.947563648223877, "Pretrain/Loss (Raw)": 1.9936119318008423, "Pretrain/Step": 9028, "Pretrain/Step Time": 8.669134549796581} +{"Pretrain/Learning Rate": 3.71092743120699e-07, "Pretrain/Loss": 1.9462366104125977, "Pretrain/Loss (Raw)": 1.8655496835708618, "Pretrain/Step": 9029, "Pretrain/Step Time": 8.673380844295025} +{"Pretrain/Learning Rate": 3.6963679346499746e-07, "Pretrain/Loss": 1.9463064670562744, "Pretrain/Loss (Raw)": 1.9526280164718628, "Pretrain/Step": 9030, "Pretrain/Step Time": 8.67089557275176} +{"Pretrain/Learning Rate": 3.681836842988423e-07, "Pretrain/Loss": 1.9448039531707764, "Pretrain/Loss (Raw)": 1.938483476638794, "Pretrain/Step": 9031, "Pretrain/Step Time": 8.668556144461036} +{"Pretrain/Learning Rate": 3.6673341578981614e-07, "Pretrain/Loss": 1.9442552328109741, "Pretrain/Loss (Raw)": 1.6993062496185303, "Pretrain/Step": 9032, "Pretrain/Step Time": 8.663814762607217} +{"Pretrain/Learning Rate": 3.6528598810516567e-07, "Pretrain/Loss": 1.9447262287139893, "Pretrain/Loss (Raw)": 2.0831997394561768, "Pretrain/Step": 9033, "Pretrain/Step Time": 8.662986999377608} +{"Pretrain/Learning Rate": 3.6384140141181853e-07, "Pretrain/Loss": 1.9424084424972534, "Pretrain/Loss (Raw)": 1.653454303741455, "Pretrain/Step": 9034, "Pretrain/Step Time": 8.66152318380773} +{"Pretrain/Learning Rate": 3.6239965587637203e-07, "Pretrain/Loss": 1.9428398609161377, "Pretrain/Loss (Raw)": 2.094521999359131, "Pretrain/Step": 9035, "Pretrain/Step Time": 8.66601774096489} +{"Pretrain/Learning Rate": 3.609607516650931e-07, "Pretrain/Loss": 1.9395854473114014, "Pretrain/Loss (Raw)": 1.7149062156677246, "Pretrain/Step": 9036, "Pretrain/Step Time": 8.667588580399752} +{"Pretrain/Learning Rate": 3.5952468894392133e-07, "Pretrain/Loss": 1.9394354820251465, "Pretrain/Loss (Raw)": 1.8795793056488037, "Pretrain/Step": 9037, "Pretrain/Step Time": 8.665975537151098} +{"Pretrain/Learning Rate": 3.5809146787847415e-07, "Pretrain/Loss": 1.9393947124481201, "Pretrain/Loss (Raw)": 1.9779185056686401, "Pretrain/Step": 9038, "Pretrain/Step Time": 8.667165139690042} +{"Pretrain/Learning Rate": 3.5666108863403327e-07, "Pretrain/Loss": 1.937021017074585, "Pretrain/Loss (Raw)": 1.7758408784866333, "Pretrain/Step": 9039, "Pretrain/Step Time": 8.663320956751704} +{"Pretrain/Learning Rate": 3.552335513755611e-07, "Pretrain/Loss": 1.9370704889297485, "Pretrain/Loss (Raw)": 1.8740357160568237, "Pretrain/Step": 9040, "Pretrain/Step Time": 8.66381562128663} +{"Pretrain/Learning Rate": 3.538088562676817e-07, "Pretrain/Loss": 1.9432659149169922, "Pretrain/Loss (Raw)": 2.3987555503845215, "Pretrain/Step": 9041, "Pretrain/Step Time": 8.660803196951747} +{"Pretrain/Learning Rate": 3.523870034747051e-07, "Pretrain/Loss": 1.9426661729812622, "Pretrain/Loss (Raw)": 1.9863944053649902, "Pretrain/Step": 9042, "Pretrain/Step Time": 8.659000117331743} +{"Pretrain/Learning Rate": 3.50967993160603e-07, "Pretrain/Loss": 1.9419282674789429, "Pretrain/Loss (Raw)": 1.8418502807617188, "Pretrain/Step": 9043, "Pretrain/Step Time": 8.661327321082354} +{"Pretrain/Learning Rate": 3.4955182548901955e-07, "Pretrain/Loss": 1.941914677619934, "Pretrain/Loss (Raw)": 1.9394491910934448, "Pretrain/Step": 9044, "Pretrain/Step Time": 8.661254880949855} +{"Pretrain/Learning Rate": 3.4813850062327956e-07, "Pretrain/Loss": 1.9420394897460938, "Pretrain/Loss (Raw)": 1.8472900390625, "Pretrain/Step": 9045, "Pretrain/Step Time": 8.65664646960795} +{"Pretrain/Learning Rate": 3.467280187263694e-07, "Pretrain/Loss": 1.9454448223114014, "Pretrain/Loss (Raw)": 1.951330542564392, "Pretrain/Step": 9046, "Pretrain/Step Time": 8.654567470774055} +{"Pretrain/Learning Rate": 3.4532037996095334e-07, "Pretrain/Loss": 1.9428659677505493, "Pretrain/Loss (Raw)": 1.9501113891601562, "Pretrain/Step": 9047, "Pretrain/Step Time": 8.649061745032668} +{"Pretrain/Learning Rate": 3.4391558448936825e-07, "Pretrain/Loss": 1.9425315856933594, "Pretrain/Loss (Raw)": 1.911617398262024, "Pretrain/Step": 9048, "Pretrain/Step Time": 8.649514997377992} +{"Pretrain/Learning Rate": 3.4251363247362054e-07, "Pretrain/Loss": 1.9427964687347412, "Pretrain/Loss (Raw)": 2.0037314891815186, "Pretrain/Step": 9049, "Pretrain/Step Time": 8.644548194482923} +{"Pretrain/Learning Rate": 3.4111452407539214e-07, "Pretrain/Loss": 1.943354845046997, "Pretrain/Loss (Raw)": 1.9796923398971558, "Pretrain/Step": 9050, "Pretrain/Step Time": 8.647189758718014} +{"Pretrain/Learning Rate": 3.397182594560344e-07, "Pretrain/Loss": 1.9435358047485352, "Pretrain/Loss (Raw)": 2.0437123775482178, "Pretrain/Step": 9051, "Pretrain/Step Time": 8.650275770574808} +{"Pretrain/Learning Rate": 3.3832483877656584e-07, "Pretrain/Loss": 1.9438365697860718, "Pretrain/Loss (Raw)": 1.6757007837295532, "Pretrain/Step": 9052, "Pretrain/Step Time": 8.650958308950067} +{"Pretrain/Learning Rate": 3.369342621976884e-07, "Pretrain/Loss": 1.940260887145996, "Pretrain/Loss (Raw)": 1.6032872200012207, "Pretrain/Step": 9053, "Pretrain/Step Time": 8.645418269559741} +{"Pretrain/Learning Rate": 3.355465298797711e-07, "Pretrain/Loss": 1.942354679107666, "Pretrain/Loss (Raw)": 1.9602254629135132, "Pretrain/Step": 9054, "Pretrain/Step Time": 8.64580725133419} +{"Pretrain/Learning Rate": 3.3416164198284694e-07, "Pretrain/Loss": 1.9438445568084717, "Pretrain/Loss (Raw)": 1.92753267288208, "Pretrain/Step": 9055, "Pretrain/Step Time": 8.64581036195159} +{"Pretrain/Learning Rate": 3.327795986666327e-07, "Pretrain/Loss": 1.945512056350708, "Pretrain/Loss (Raw)": 2.118803024291992, "Pretrain/Step": 9056, "Pretrain/Step Time": 8.64409046806395} +{"Pretrain/Learning Rate": 3.3140040009051186e-07, "Pretrain/Loss": 1.9425233602523804, "Pretrain/Loss (Raw)": 1.7424150705337524, "Pretrain/Step": 9057, "Pretrain/Step Time": 8.641593990847468} +{"Pretrain/Learning Rate": 3.300240464135379e-07, "Pretrain/Loss": 1.9403090476989746, "Pretrain/Loss (Raw)": 1.6673883199691772, "Pretrain/Step": 9058, "Pretrain/Step Time": 8.641860013827682} +{"Pretrain/Learning Rate": 3.286505377944393e-07, "Pretrain/Loss": 1.9402588605880737, "Pretrain/Loss (Raw)": 2.015681266784668, "Pretrain/Step": 9059, "Pretrain/Step Time": 8.645427467301488} +{"Pretrain/Learning Rate": 3.2727987439161724e-07, "Pretrain/Loss": 1.939751386642456, "Pretrain/Loss (Raw)": 1.9998215436935425, "Pretrain/Step": 9060, "Pretrain/Step Time": 8.649607161059976} +{"Pretrain/Learning Rate": 3.2591205636313957e-07, "Pretrain/Loss": 1.9420249462127686, "Pretrain/Loss (Raw)": 2.245650291442871, "Pretrain/Step": 9061, "Pretrain/Step Time": 8.646959545090795} +{"Pretrain/Learning Rate": 3.2454708386675525e-07, "Pretrain/Loss": 1.9394906759262085, "Pretrain/Loss (Raw)": 1.8907142877578735, "Pretrain/Step": 9062, "Pretrain/Step Time": 8.646592194214463} +{"Pretrain/Learning Rate": 3.2318495705987437e-07, "Pretrain/Loss": 1.940420150756836, "Pretrain/Loss (Raw)": 2.088413953781128, "Pretrain/Step": 9063, "Pretrain/Step Time": 8.649516759440303} +{"Pretrain/Learning Rate": 3.218256760995825e-07, "Pretrain/Loss": 1.9372239112854004, "Pretrain/Loss (Raw)": 1.6982362270355225, "Pretrain/Step": 9064, "Pretrain/Step Time": 8.651211723685265} +{"Pretrain/Learning Rate": 3.20469241142643e-07, "Pretrain/Loss": 1.9318902492523193, "Pretrain/Loss (Raw)": 1.6777929067611694, "Pretrain/Step": 9065, "Pretrain/Step Time": 8.65033140964806} +{"Pretrain/Learning Rate": 3.1911565234548633e-07, "Pretrain/Loss": 1.931086540222168, "Pretrain/Loss (Raw)": 1.9968254566192627, "Pretrain/Step": 9066, "Pretrain/Step Time": 8.653182053938508} +{"Pretrain/Learning Rate": 3.177649098642099e-07, "Pretrain/Loss": 1.9304454326629639, "Pretrain/Loss (Raw)": 1.7613396644592285, "Pretrain/Step": 9067, "Pretrain/Step Time": 8.65905318595469} +{"Pretrain/Learning Rate": 3.1641701385459186e-07, "Pretrain/Loss": 1.928871512413025, "Pretrain/Loss (Raw)": 1.7518900632858276, "Pretrain/Step": 9068, "Pretrain/Step Time": 8.658755891025066} +{"Pretrain/Learning Rate": 3.150719644720773e-07, "Pretrain/Loss": 1.9292893409729004, "Pretrain/Loss (Raw)": 1.9591926336288452, "Pretrain/Step": 9069, "Pretrain/Step Time": 8.65966858714819} +{"Pretrain/Learning Rate": 3.1372976187178105e-07, "Pretrain/Loss": 1.9277405738830566, "Pretrain/Loss (Raw)": 1.5971158742904663, "Pretrain/Step": 9070, "Pretrain/Step Time": 8.660104103386402} +{"Pretrain/Learning Rate": 3.123904062084959e-07, "Pretrain/Loss": 1.9292902946472168, "Pretrain/Loss (Raw)": 2.0952749252319336, "Pretrain/Step": 9071, "Pretrain/Step Time": 8.658705838024616} +{"Pretrain/Learning Rate": 3.110538976366789e-07, "Pretrain/Loss": 1.9284241199493408, "Pretrain/Loss (Raw)": 1.9032853841781616, "Pretrain/Step": 9072, "Pretrain/Step Time": 8.66004372946918} +{"Pretrain/Learning Rate": 3.0972023631046786e-07, "Pretrain/Loss": 1.9271682500839233, "Pretrain/Loss (Raw)": 1.869912028312683, "Pretrain/Step": 9073, "Pretrain/Step Time": 8.658297566697001} +{"Pretrain/Learning Rate": 3.083894223836592e-07, "Pretrain/Loss": 1.926044225692749, "Pretrain/Loss (Raw)": 1.9913954734802246, "Pretrain/Step": 9074, "Pretrain/Step Time": 8.657404469326138} +{"Pretrain/Learning Rate": 3.070614560097357e-07, "Pretrain/Loss": 1.9271717071533203, "Pretrain/Loss (Raw)": 2.0441384315490723, "Pretrain/Step": 9075, "Pretrain/Step Time": 8.658358097076416} +{"Pretrain/Learning Rate": 3.0573633734184146e-07, "Pretrain/Loss": 1.9266972541809082, "Pretrain/Loss (Raw)": 1.7465049028396606, "Pretrain/Step": 9076, "Pretrain/Step Time": 8.660684380680323} +{"Pretrain/Learning Rate": 3.044140665327988e-07, "Pretrain/Loss": 1.9261503219604492, "Pretrain/Loss (Raw)": 1.8755533695220947, "Pretrain/Step": 9077, "Pretrain/Step Time": 8.659523153677583} +{"Pretrain/Learning Rate": 3.0309464373509125e-07, "Pretrain/Loss": 1.9261562824249268, "Pretrain/Loss (Raw)": 1.9236317873001099, "Pretrain/Step": 9078, "Pretrain/Step Time": 8.655885433778167} +{"Pretrain/Learning Rate": 3.017780691008859e-07, "Pretrain/Loss": 1.9255328178405762, "Pretrain/Loss (Raw)": 1.8806995153427124, "Pretrain/Step": 9079, "Pretrain/Step Time": 8.662181735038757} +{"Pretrain/Learning Rate": 3.00464342782017e-07, "Pretrain/Loss": 1.9267661571502686, "Pretrain/Loss (Raw)": 1.8945502042770386, "Pretrain/Step": 9080, "Pretrain/Step Time": 8.657140742987394} +{"Pretrain/Learning Rate": 2.9915346492998817e-07, "Pretrain/Loss": 1.9282089471817017, "Pretrain/Loss (Raw)": 2.090629816055298, "Pretrain/Step": 9081, "Pretrain/Step Time": 8.658129638060927} +{"Pretrain/Learning Rate": 2.9784543569597314e-07, "Pretrain/Loss": 1.9267733097076416, "Pretrain/Loss (Raw)": 1.592214822769165, "Pretrain/Step": 9082, "Pretrain/Step Time": 8.65775098837912} +{"Pretrain/Learning Rate": 2.9654025523082607e-07, "Pretrain/Loss": 1.9266636371612549, "Pretrain/Loss (Raw)": 1.9721803665161133, "Pretrain/Step": 9083, "Pretrain/Step Time": 8.665088277310133} +{"Pretrain/Learning Rate": 2.9523792368506275e-07, "Pretrain/Loss": 1.9246606826782227, "Pretrain/Loss (Raw)": 1.8738961219787598, "Pretrain/Step": 9084, "Pretrain/Step Time": 8.665208708494902} +{"Pretrain/Learning Rate": 2.9393844120887415e-07, "Pretrain/Loss": 1.9255168437957764, "Pretrain/Loss (Raw)": 1.887576937675476, "Pretrain/Step": 9085, "Pretrain/Step Time": 8.662363570183516} +{"Pretrain/Learning Rate": 2.926418079521237e-07, "Pretrain/Loss": 1.925760269165039, "Pretrain/Loss (Raw)": 2.0110085010528564, "Pretrain/Step": 9086, "Pretrain/Step Time": 8.662764897570014} +{"Pretrain/Learning Rate": 2.913480240643446e-07, "Pretrain/Loss": 1.9263627529144287, "Pretrain/Loss (Raw)": 1.9750856161117554, "Pretrain/Step": 9087, "Pretrain/Step Time": 8.668124260380864} +{"Pretrain/Learning Rate": 2.900570896947424e-07, "Pretrain/Loss": 1.926253318786621, "Pretrain/Loss (Raw)": 1.8847535848617554, "Pretrain/Step": 9088, "Pretrain/Step Time": 8.668214375153184} +{"Pretrain/Learning Rate": 2.8876900499219263e-07, "Pretrain/Loss": 1.9218299388885498, "Pretrain/Loss (Raw)": 1.5138139724731445, "Pretrain/Step": 9089, "Pretrain/Step Time": 8.668259471654892} +{"Pretrain/Learning Rate": 2.8748377010524574e-07, "Pretrain/Loss": 1.9216911792755127, "Pretrain/Loss (Raw)": 2.0973150730133057, "Pretrain/Step": 9090, "Pretrain/Step Time": 8.664640652015805} +{"Pretrain/Learning Rate": 2.8620138518211934e-07, "Pretrain/Loss": 1.9223215579986572, "Pretrain/Loss (Raw)": 1.9440889358520508, "Pretrain/Step": 9091, "Pretrain/Step Time": 8.66567206569016} +{"Pretrain/Learning Rate": 2.849218503707035e-07, "Pretrain/Loss": 1.9193609952926636, "Pretrain/Loss (Raw)": 1.7988159656524658, "Pretrain/Step": 9092, "Pretrain/Step Time": 8.664652045816183} +{"Pretrain/Learning Rate": 2.836451658185607e-07, "Pretrain/Loss": 1.9155192375183105, "Pretrain/Loss (Raw)": 1.5824307203292847, "Pretrain/Step": 9093, "Pretrain/Step Time": 8.669899864122272} +{"Pretrain/Learning Rate": 2.82371331672926e-07, "Pretrain/Loss": 1.9172887802124023, "Pretrain/Loss (Raw)": 2.1455764770507812, "Pretrain/Step": 9094, "Pretrain/Step Time": 8.666740447282791} +{"Pretrain/Learning Rate": 2.8110034808070396e-07, "Pretrain/Loss": 1.9183484315872192, "Pretrain/Loss (Raw)": 1.9713525772094727, "Pretrain/Step": 9095, "Pretrain/Step Time": 8.667338812723756} +{"Pretrain/Learning Rate": 2.7983221518846634e-07, "Pretrain/Loss": 1.9172148704528809, "Pretrain/Loss (Raw)": 1.5074485540390015, "Pretrain/Step": 9096, "Pretrain/Step Time": 8.660129042342305} +{"Pretrain/Learning Rate": 2.7856693314246287e-07, "Pretrain/Loss": 1.916366696357727, "Pretrain/Loss (Raw)": 1.8681690692901611, "Pretrain/Step": 9097, "Pretrain/Step Time": 8.66167325899005} +{"Pretrain/Learning Rate": 2.773045020886156e-07, "Pretrain/Loss": 1.9196438789367676, "Pretrain/Loss (Raw)": 2.007645845413208, "Pretrain/Step": 9098, "Pretrain/Step Time": 8.665949515998363} +{"Pretrain/Learning Rate": 2.760449221725081e-07, "Pretrain/Loss": 1.9198483228683472, "Pretrain/Loss (Raw)": 1.898830533027649, "Pretrain/Step": 9099, "Pretrain/Step Time": 8.668226264417171} +{"Pretrain/Learning Rate": 2.74788193539402e-07, "Pretrain/Loss": 1.917129397392273, "Pretrain/Loss (Raw)": 1.634221076965332, "Pretrain/Step": 9100, "Pretrain/Step Time": 8.66642146371305} +{"Pretrain/Learning Rate": 2.7353431633423134e-07, "Pretrain/Loss": 1.9144384860992432, "Pretrain/Loss (Raw)": 1.9546526670455933, "Pretrain/Step": 9101, "Pretrain/Step Time": 8.663736898452044} +{"Pretrain/Learning Rate": 2.722832907015971e-07, "Pretrain/Loss": 1.9152846336364746, "Pretrain/Loss (Raw)": 1.9858596324920654, "Pretrain/Step": 9102, "Pretrain/Step Time": 8.664059868082404} +{"Pretrain/Learning Rate": 2.710351167857783e-07, "Pretrain/Loss": 1.9140148162841797, "Pretrain/Loss (Raw)": 1.7360880374908447, "Pretrain/Step": 9103, "Pretrain/Step Time": 8.662861658260226} +{"Pretrain/Learning Rate": 2.6978979473071264e-07, "Pretrain/Loss": 1.9151031970977783, "Pretrain/Loss (Raw)": 1.8750934600830078, "Pretrain/Step": 9104, "Pretrain/Step Time": 8.662927120923996} +{"Pretrain/Learning Rate": 2.6854732468002133e-07, "Pretrain/Loss": 1.918825387954712, "Pretrain/Loss (Raw)": 1.9730671644210815, "Pretrain/Step": 9105, "Pretrain/Step Time": 8.665003003552556} +{"Pretrain/Learning Rate": 2.6730770677699245e-07, "Pretrain/Loss": 1.9170048236846924, "Pretrain/Loss (Raw)": 1.9583256244659424, "Pretrain/Step": 9106, "Pretrain/Step Time": 8.664491534233093} +{"Pretrain/Learning Rate": 2.6607094116458123e-07, "Pretrain/Loss": 1.915311336517334, "Pretrain/Loss (Raw)": 1.907480001449585, "Pretrain/Step": 9107, "Pretrain/Step Time": 8.658020362257957} +{"Pretrain/Learning Rate": 2.6483702798542066e-07, "Pretrain/Loss": 1.915273666381836, "Pretrain/Loss (Raw)": 1.9267033338546753, "Pretrain/Step": 9108, "Pretrain/Step Time": 8.65713156759739} +{"Pretrain/Learning Rate": 2.636059673818081e-07, "Pretrain/Loss": 1.915432333946228, "Pretrain/Loss (Raw)": 2.014086961746216, "Pretrain/Step": 9109, "Pretrain/Step Time": 8.657047929242253} +{"Pretrain/Learning Rate": 2.623777594957216e-07, "Pretrain/Loss": 1.9161465167999268, "Pretrain/Loss (Raw)": 2.116166114807129, "Pretrain/Step": 9110, "Pretrain/Step Time": 8.657677663490176} +{"Pretrain/Learning Rate": 2.6115240446879517e-07, "Pretrain/Loss": 1.9170055389404297, "Pretrain/Loss (Raw)": 2.040339231491089, "Pretrain/Step": 9111, "Pretrain/Step Time": 8.656638270244002} +{"Pretrain/Learning Rate": 2.599299024423491e-07, "Pretrain/Loss": 1.9154160022735596, "Pretrain/Loss (Raw)": 1.9390628337860107, "Pretrain/Step": 9112, "Pretrain/Step Time": 8.654667533934116} +{"Pretrain/Learning Rate": 2.587102535573621e-07, "Pretrain/Loss": 1.9150753021240234, "Pretrain/Loss (Raw)": 1.9044526815414429, "Pretrain/Step": 9113, "Pretrain/Step Time": 8.655763952061534} +{"Pretrain/Learning Rate": 2.5749345795449687e-07, "Pretrain/Loss": 1.9129829406738281, "Pretrain/Loss (Raw)": 1.8892908096313477, "Pretrain/Step": 9114, "Pretrain/Step Time": 8.662661636248231} +{"Pretrain/Learning Rate": 2.562795157740744e-07, "Pretrain/Loss": 1.9115636348724365, "Pretrain/Loss (Raw)": 1.7617576122283936, "Pretrain/Step": 9115, "Pretrain/Step Time": 8.66273770481348} +{"Pretrain/Learning Rate": 2.5506842715609656e-07, "Pretrain/Loss": 1.9099812507629395, "Pretrain/Loss (Raw)": 1.8399558067321777, "Pretrain/Step": 9116, "Pretrain/Step Time": 8.664497803896666} +{"Pretrain/Learning Rate": 2.5386019224022673e-07, "Pretrain/Loss": 1.9104483127593994, "Pretrain/Loss (Raw)": 2.044041156768799, "Pretrain/Step": 9117, "Pretrain/Step Time": 8.664966627955437} +{"Pretrain/Learning Rate": 2.526548111658117e-07, "Pretrain/Loss": 1.9089274406433105, "Pretrain/Loss (Raw)": 1.6730492115020752, "Pretrain/Step": 9118, "Pretrain/Step Time": 8.66623967513442} +{"Pretrain/Learning Rate": 2.514522840718542e-07, "Pretrain/Loss": 1.9097316265106201, "Pretrain/Loss (Raw)": 2.0627076625823975, "Pretrain/Step": 9119, "Pretrain/Step Time": 8.664120396599174} +{"Pretrain/Learning Rate": 2.502526110970377e-07, "Pretrain/Loss": 1.9093279838562012, "Pretrain/Loss (Raw)": 2.0021543502807617, "Pretrain/Step": 9120, "Pretrain/Step Time": 8.67011491023004} +{"Pretrain/Learning Rate": 2.490557923797154e-07, "Pretrain/Loss": 1.9074971675872803, "Pretrain/Loss (Raw)": 1.854873776435852, "Pretrain/Step": 9121, "Pretrain/Step Time": 8.670340597629547} +{"Pretrain/Learning Rate": 2.478618280579104e-07, "Pretrain/Loss": 1.9093114137649536, "Pretrain/Loss (Raw)": 2.0389792919158936, "Pretrain/Step": 9122, "Pretrain/Step Time": 8.664622884243727} +{"Pretrain/Learning Rate": 2.466707182693151e-07, "Pretrain/Loss": 1.908848524093628, "Pretrain/Loss (Raw)": 1.871975302696228, "Pretrain/Step": 9123, "Pretrain/Step Time": 8.661800500005484} +{"Pretrain/Learning Rate": 2.45482463151292e-07, "Pretrain/Loss": 1.9060425758361816, "Pretrain/Loss (Raw)": 1.8024910688400269, "Pretrain/Step": 9124, "Pretrain/Step Time": 8.667332725599408} +{"Pretrain/Learning Rate": 2.442970628408814e-07, "Pretrain/Loss": 1.9049463272094727, "Pretrain/Loss (Raw)": 1.9275506734848022, "Pretrain/Step": 9125, "Pretrain/Step Time": 8.66521792858839} +{"Pretrain/Learning Rate": 2.4311451747478233e-07, "Pretrain/Loss": 1.9030745029449463, "Pretrain/Loss (Raw)": 1.6473206281661987, "Pretrain/Step": 9126, "Pretrain/Step Time": 8.666094334796071} +{"Pretrain/Learning Rate": 2.4193482718937733e-07, "Pretrain/Loss": 1.9019674062728882, "Pretrain/Loss (Raw)": 1.941854476928711, "Pretrain/Step": 9127, "Pretrain/Step Time": 8.660869123414159} +{"Pretrain/Learning Rate": 2.4075799212071317e-07, "Pretrain/Loss": 1.9018521308898926, "Pretrain/Loss (Raw)": 1.6691455841064453, "Pretrain/Step": 9128, "Pretrain/Step Time": 8.662296051159501} +{"Pretrain/Learning Rate": 2.395840124045062e-07, "Pretrain/Loss": 1.9018915891647339, "Pretrain/Loss (Raw)": 1.994569182395935, "Pretrain/Step": 9129, "Pretrain/Step Time": 8.663527814671397} +{"Pretrain/Learning Rate": 2.384128881761455e-07, "Pretrain/Loss": 1.9020214080810547, "Pretrain/Loss (Raw)": 2.028858184814453, "Pretrain/Step": 9130, "Pretrain/Step Time": 8.661795493215322} +{"Pretrain/Learning Rate": 2.3724461957068956e-07, "Pretrain/Loss": 1.9037129878997803, "Pretrain/Loss (Raw)": 2.0766313076019287, "Pretrain/Step": 9131, "Pretrain/Step Time": 8.661173358559608} +{"Pretrain/Learning Rate": 2.360792067228723e-07, "Pretrain/Loss": 1.9020488262176514, "Pretrain/Loss (Raw)": 1.9082237482070923, "Pretrain/Step": 9132, "Pretrain/Step Time": 8.662279911339283} +{"Pretrain/Learning Rate": 2.349166497670918e-07, "Pretrain/Loss": 1.9016331434249878, "Pretrain/Loss (Raw)": 1.9697537422180176, "Pretrain/Step": 9133, "Pretrain/Step Time": 8.66411111317575} +{"Pretrain/Learning Rate": 2.337569488374186e-07, "Pretrain/Loss": 1.9011222124099731, "Pretrain/Loss (Raw)": 2.057131767272949, "Pretrain/Step": 9134, "Pretrain/Step Time": 8.658036073669791} +{"Pretrain/Learning Rate": 2.3260010406759846e-07, "Pretrain/Loss": 1.902437448501587, "Pretrain/Loss (Raw)": 1.956852912902832, "Pretrain/Step": 9135, "Pretrain/Step Time": 8.658532479777932} +{"Pretrain/Learning Rate": 2.3144611559104134e-07, "Pretrain/Loss": 1.9016159772872925, "Pretrain/Loss (Raw)": 1.9741463661193848, "Pretrain/Step": 9136, "Pretrain/Step Time": 8.654888151213527} +{"Pretrain/Learning Rate": 2.3029498354083245e-07, "Pretrain/Loss": 1.900524377822876, "Pretrain/Loss (Raw)": 1.9377294778823853, "Pretrain/Step": 9137, "Pretrain/Step Time": 8.659555757418275} +{"Pretrain/Learning Rate": 2.2914670804972394e-07, "Pretrain/Loss": 1.900671124458313, "Pretrain/Loss (Raw)": 1.8702442646026611, "Pretrain/Step": 9138, "Pretrain/Step Time": 8.655299229547381} +{"Pretrain/Learning Rate": 2.2800128925014042e-07, "Pretrain/Loss": 1.9013688564300537, "Pretrain/Loss (Raw)": 1.9878209829330444, "Pretrain/Step": 9139, "Pretrain/Step Time": 8.660676369443536} +{"Pretrain/Learning Rate": 2.26858727274179e-07, "Pretrain/Loss": 1.9005191326141357, "Pretrain/Loss (Raw)": 1.9352871179580688, "Pretrain/Step": 9140, "Pretrain/Step Time": 8.658484211191535} +{"Pretrain/Learning Rate": 2.2571902225360374e-07, "Pretrain/Loss": 1.8975121974945068, "Pretrain/Loss (Raw)": 1.9126126766204834, "Pretrain/Step": 9141, "Pretrain/Step Time": 8.660479750484228} +{"Pretrain/Learning Rate": 2.2458217431984842e-07, "Pretrain/Loss": 1.8954635858535767, "Pretrain/Loss (Raw)": 1.880729079246521, "Pretrain/Step": 9142, "Pretrain/Step Time": 8.658846609294415} +{"Pretrain/Learning Rate": 2.2344818360402476e-07, "Pretrain/Loss": 1.8981608152389526, "Pretrain/Loss (Raw)": 1.976707100868225, "Pretrain/Step": 9143, "Pretrain/Step Time": 8.658415814861655} +{"Pretrain/Learning Rate": 2.2231705023690875e-07, "Pretrain/Loss": 1.898658275604248, "Pretrain/Loss (Raw)": 2.067955732345581, "Pretrain/Step": 9144, "Pretrain/Step Time": 8.665429707616568} +{"Pretrain/Learning Rate": 2.2118877434894325e-07, "Pretrain/Loss": 1.901167869567871, "Pretrain/Loss (Raw)": 2.2654006481170654, "Pretrain/Step": 9145, "Pretrain/Step Time": 8.667906800284982} +{"Pretrain/Learning Rate": 2.2006335607025196e-07, "Pretrain/Loss": 1.899361252784729, "Pretrain/Loss (Raw)": 1.7878272533416748, "Pretrain/Step": 9146, "Pretrain/Step Time": 8.669859882444143} +{"Pretrain/Learning Rate": 2.1894079553062276e-07, "Pretrain/Loss": 1.8998050689697266, "Pretrain/Loss (Raw)": 1.952242374420166, "Pretrain/Step": 9147, "Pretrain/Step Time": 8.670081578195095} +{"Pretrain/Learning Rate": 2.1782109285951034e-07, "Pretrain/Loss": 1.905096411705017, "Pretrain/Loss (Raw)": 1.9929918050765991, "Pretrain/Step": 9148, "Pretrain/Step Time": 8.665044268593192} +{"Pretrain/Learning Rate": 2.167042481860504e-07, "Pretrain/Loss": 1.9068124294281006, "Pretrain/Loss (Raw)": 1.9117733240127563, "Pretrain/Step": 9149, "Pretrain/Step Time": 8.663560451939702} +{"Pretrain/Learning Rate": 2.1559026163903427e-07, "Pretrain/Loss": 1.9051804542541504, "Pretrain/Loss (Raw)": 1.7627168893814087, "Pretrain/Step": 9150, "Pretrain/Step Time": 8.662776125594974} +{"Pretrain/Learning Rate": 2.1447913334694258e-07, "Pretrain/Loss": 1.9029814004898071, "Pretrain/Loss (Raw)": 1.677891492843628, "Pretrain/Step": 9151, "Pretrain/Step Time": 8.663952132686973} +{"Pretrain/Learning Rate": 2.1337086343790613e-07, "Pretrain/Loss": 1.9022471904754639, "Pretrain/Loss (Raw)": 1.7104984521865845, "Pretrain/Step": 9152, "Pretrain/Step Time": 8.660794280469418} +{"Pretrain/Learning Rate": 2.1226545203974212e-07, "Pretrain/Loss": 1.905418872833252, "Pretrain/Loss (Raw)": 1.9284127950668335, "Pretrain/Step": 9153, "Pretrain/Step Time": 8.656008066609502} +{"Pretrain/Learning Rate": 2.1116289927992917e-07, "Pretrain/Loss": 1.9044406414031982, "Pretrain/Loss (Raw)": 1.7778481245040894, "Pretrain/Step": 9154, "Pretrain/Step Time": 8.663087792694569} +{"Pretrain/Learning Rate": 2.1006320528562107e-07, "Pretrain/Loss": 1.9048086404800415, "Pretrain/Loss (Raw)": 1.9371291399002075, "Pretrain/Step": 9155, "Pretrain/Step Time": 8.658913787454367} +{"Pretrain/Learning Rate": 2.0896637018363863e-07, "Pretrain/Loss": 1.9047247171401978, "Pretrain/Loss (Raw)": 1.9828625917434692, "Pretrain/Step": 9156, "Pretrain/Step Time": 8.657669872045517} +{"Pretrain/Learning Rate": 2.0787239410047232e-07, "Pretrain/Loss": 1.9059422016143799, "Pretrain/Loss (Raw)": 2.021397352218628, "Pretrain/Step": 9157, "Pretrain/Step Time": 8.65381783619523} +{"Pretrain/Learning Rate": 2.0678127716228236e-07, "Pretrain/Loss": 1.9062269926071167, "Pretrain/Loss (Raw)": 1.9890801906585693, "Pretrain/Step": 9158, "Pretrain/Step Time": 8.655033117160201} +{"Pretrain/Learning Rate": 2.056930194949097e-07, "Pretrain/Loss": 1.9071590900421143, "Pretrain/Loss (Raw)": 2.0577900409698486, "Pretrain/Step": 9159, "Pretrain/Step Time": 8.654858464375138} +{"Pretrain/Learning Rate": 2.0460762122385125e-07, "Pretrain/Loss": 1.9084839820861816, "Pretrain/Loss (Raw)": 1.8688783645629883, "Pretrain/Step": 9160, "Pretrain/Step Time": 8.658874850720167} +{"Pretrain/Learning Rate": 2.035250824742818e-07, "Pretrain/Loss": 1.908311128616333, "Pretrain/Loss (Raw)": 2.0610952377319336, "Pretrain/Step": 9161, "Pretrain/Step Time": 8.658629346638918} +{"Pretrain/Learning Rate": 2.02445403371046e-07, "Pretrain/Loss": 1.9116488695144653, "Pretrain/Loss (Raw)": 2.080683946609497, "Pretrain/Step": 9162, "Pretrain/Step Time": 8.661814427003264} +{"Pretrain/Learning Rate": 2.0136858403865534e-07, "Pretrain/Loss": 1.9106900691986084, "Pretrain/Loss (Raw)": 1.97179114818573, "Pretrain/Step": 9163, "Pretrain/Step Time": 8.661667466163635} +{"Pretrain/Learning Rate": 2.00294624601291e-07, "Pretrain/Loss": 1.913817048072815, "Pretrain/Loss (Raw)": 2.115147352218628, "Pretrain/Step": 9164, "Pretrain/Step Time": 8.65796790830791} +{"Pretrain/Learning Rate": 1.9922352518281505e-07, "Pretrain/Loss": 1.915886402130127, "Pretrain/Loss (Raw)": 2.144453525543213, "Pretrain/Step": 9165, "Pretrain/Step Time": 8.659126747399569} +{"Pretrain/Learning Rate": 1.9815528590674537e-07, "Pretrain/Loss": 1.9156029224395752, "Pretrain/Loss (Raw)": 1.9416496753692627, "Pretrain/Step": 9166, "Pretrain/Step Time": 8.655074382200837} +{"Pretrain/Learning Rate": 1.9708990689627783e-07, "Pretrain/Loss": 1.915950059890747, "Pretrain/Loss (Raw)": 1.8202660083770752, "Pretrain/Step": 9167, "Pretrain/Step Time": 8.657931458204985} +{"Pretrain/Learning Rate": 1.9602738827427802e-07, "Pretrain/Loss": 1.918203592300415, "Pretrain/Loss (Raw)": 2.1624886989593506, "Pretrain/Step": 9168, "Pretrain/Step Time": 8.657096646726131} +{"Pretrain/Learning Rate": 1.9496773016327852e-07, "Pretrain/Loss": 1.9134087562561035, "Pretrain/Loss (Raw)": 1.7850117683410645, "Pretrain/Step": 9169, "Pretrain/Step Time": 8.662466660141945} +{"Pretrain/Learning Rate": 1.9391093268548988e-07, "Pretrain/Loss": 1.9138489961624146, "Pretrain/Loss (Raw)": 2.0427541732788086, "Pretrain/Step": 9170, "Pretrain/Step Time": 8.661250928416848} +{"Pretrain/Learning Rate": 1.9285699596277852e-07, "Pretrain/Loss": 1.9151043891906738, "Pretrain/Loss (Raw)": 2.002544403076172, "Pretrain/Step": 9171, "Pretrain/Step Time": 8.656864693388343} +{"Pretrain/Learning Rate": 1.918059201166944e-07, "Pretrain/Loss": 1.9168052673339844, "Pretrain/Loss (Raw)": 2.157153367996216, "Pretrain/Step": 9172, "Pretrain/Step Time": 8.664090491831303} +{"Pretrain/Learning Rate": 1.9075770526845172e-07, "Pretrain/Loss": 1.9178428649902344, "Pretrain/Loss (Raw)": 1.980102300643921, "Pretrain/Step": 9173, "Pretrain/Step Time": 8.659414798021317} +{"Pretrain/Learning Rate": 1.8971235153893708e-07, "Pretrain/Loss": 1.919319748878479, "Pretrain/Loss (Raw)": 2.140378475189209, "Pretrain/Step": 9174, "Pretrain/Step Time": 8.661985935643315} +{"Pretrain/Learning Rate": 1.8866985904870127e-07, "Pretrain/Loss": 1.9216296672821045, "Pretrain/Loss (Raw)": 2.2457776069641113, "Pretrain/Step": 9175, "Pretrain/Step Time": 8.66104089282453} +{"Pretrain/Learning Rate": 1.8763022791797314e-07, "Pretrain/Loss": 1.92215895652771, "Pretrain/Loss (Raw)": 1.9793660640716553, "Pretrain/Step": 9176, "Pretrain/Step Time": 8.667201738804579} +{"Pretrain/Learning Rate": 1.8659345826664844e-07, "Pretrain/Loss": 1.922061562538147, "Pretrain/Loss (Raw)": 1.9912630319595337, "Pretrain/Step": 9177, "Pretrain/Step Time": 8.66827050037682} +{"Pretrain/Learning Rate": 1.8555955021428984e-07, "Pretrain/Loss": 1.9219714403152466, "Pretrain/Loss (Raw)": 1.9681626558303833, "Pretrain/Step": 9178, "Pretrain/Step Time": 8.668919138610363} +{"Pretrain/Learning Rate": 1.8452850388013255e-07, "Pretrain/Loss": 1.9226963520050049, "Pretrain/Loss (Raw)": 2.136488437652588, "Pretrain/Step": 9179, "Pretrain/Step Time": 8.663114238530397} +{"Pretrain/Learning Rate": 1.8350031938308144e-07, "Pretrain/Loss": 1.9224956035614014, "Pretrain/Loss (Raw)": 1.65001380443573, "Pretrain/Step": 9180, "Pretrain/Step Time": 8.663881236687303} +{"Pretrain/Learning Rate": 1.8247499684171666e-07, "Pretrain/Loss": 1.9262824058532715, "Pretrain/Loss (Raw)": 2.087984800338745, "Pretrain/Step": 9181, "Pretrain/Step Time": 8.665950622409582} +{"Pretrain/Learning Rate": 1.8145253637427695e-07, "Pretrain/Loss": 1.927736759185791, "Pretrain/Loss (Raw)": 2.1464052200317383, "Pretrain/Step": 9182, "Pretrain/Step Time": 8.666671570390463} +{"Pretrain/Learning Rate": 1.8043293809867635e-07, "Pretrain/Loss": 1.929086446762085, "Pretrain/Loss (Raw)": 2.1002895832061768, "Pretrain/Step": 9183, "Pretrain/Step Time": 8.66448606364429} +{"Pretrain/Learning Rate": 1.7941620213250688e-07, "Pretrain/Loss": 1.9271968603134155, "Pretrain/Loss (Raw)": 1.8769261837005615, "Pretrain/Step": 9184, "Pretrain/Step Time": 8.66375520825386} +{"Pretrain/Learning Rate": 1.7840232859301919e-07, "Pretrain/Loss": 1.9299672842025757, "Pretrain/Loss (Raw)": 2.0970258712768555, "Pretrain/Step": 9185, "Pretrain/Step Time": 8.669135143980384} +{"Pretrain/Learning Rate": 1.7739131759713924e-07, "Pretrain/Loss": 1.931506633758545, "Pretrain/Loss (Raw)": 1.864426851272583, "Pretrain/Step": 9186, "Pretrain/Step Time": 8.67031741887331} +{"Pretrain/Learning Rate": 1.7638316926145702e-07, "Pretrain/Loss": 1.9310798645019531, "Pretrain/Loss (Raw)": 1.9610596895217896, "Pretrain/Step": 9187, "Pretrain/Step Time": 8.668015107512474} +{"Pretrain/Learning Rate": 1.7537788370224351e-07, "Pretrain/Loss": 1.9327659606933594, "Pretrain/Loss (Raw)": 2.2156527042388916, "Pretrain/Step": 9188, "Pretrain/Step Time": 8.665119661018252} +{"Pretrain/Learning Rate": 1.7437546103542814e-07, "Pretrain/Loss": 1.9259870052337646, "Pretrain/Loss (Raw)": 1.3779268264770508, "Pretrain/Step": 9189, "Pretrain/Step Time": 8.668170429766178} +{"Pretrain/Learning Rate": 1.7337590137661842e-07, "Pretrain/Loss": 1.9276273250579834, "Pretrain/Loss (Raw)": 2.1006722450256348, "Pretrain/Step": 9190, "Pretrain/Step Time": 8.673087513074279} +{"Pretrain/Learning Rate": 1.7237920484108327e-07, "Pretrain/Loss": 1.9274331331253052, "Pretrain/Loss (Raw)": 2.0635640621185303, "Pretrain/Step": 9191, "Pretrain/Step Time": 8.66635861620307} +{"Pretrain/Learning Rate": 1.7138537154377243e-07, "Pretrain/Loss": 1.929234504699707, "Pretrain/Loss (Raw)": 1.928808331489563, "Pretrain/Step": 9192, "Pretrain/Step Time": 8.665399769321084} +{"Pretrain/Learning Rate": 1.70394401599297e-07, "Pretrain/Loss": 1.930769443511963, "Pretrain/Loss (Raw)": 1.8742681741714478, "Pretrain/Step": 9193, "Pretrain/Step Time": 8.665070036426187} +{"Pretrain/Learning Rate": 1.6940629512194052e-07, "Pretrain/Loss": 1.9293134212493896, "Pretrain/Loss (Raw)": 1.8104485273361206, "Pretrain/Step": 9194, "Pretrain/Step Time": 8.662216108292341} +{"Pretrain/Learning Rate": 1.6842105222565352e-07, "Pretrain/Loss": 1.9306352138519287, "Pretrain/Loss (Raw)": 1.930525779724121, "Pretrain/Step": 9195, "Pretrain/Step Time": 8.66004135645926} +{"Pretrain/Learning Rate": 1.6743867302406458e-07, "Pretrain/Loss": 1.9304695129394531, "Pretrain/Loss (Raw)": 1.7307014465332031, "Pretrain/Step": 9196, "Pretrain/Step Time": 8.660478616133332} +{"Pretrain/Learning Rate": 1.6645915763045804e-07, "Pretrain/Loss": 1.9296894073486328, "Pretrain/Loss (Raw)": 1.8593313694000244, "Pretrain/Step": 9197, "Pretrain/Step Time": 8.660571817308664} +{"Pretrain/Learning Rate": 1.654825061578047e-07, "Pretrain/Loss": 1.9320766925811768, "Pretrain/Loss (Raw)": 1.9026962518692017, "Pretrain/Step": 9198, "Pretrain/Step Time": 8.661143120378256} +{"Pretrain/Learning Rate": 1.6450871871873108e-07, "Pretrain/Loss": 1.9321677684783936, "Pretrain/Loss (Raw)": 2.1069321632385254, "Pretrain/Step": 9199, "Pretrain/Step Time": 8.658963261172175} +{"Pretrain/Learning Rate": 1.6353779542554182e-07, "Pretrain/Loss": 1.9320534467697144, "Pretrain/Loss (Raw)": 1.8886346817016602, "Pretrain/Step": 9200, "Pretrain/Step Time": 8.656061945483088} +{"Pretrain/Learning Rate": 1.6256973639020569e-07, "Pretrain/Loss": 1.9319615364074707, "Pretrain/Loss (Raw)": 1.8581414222717285, "Pretrain/Step": 9201, "Pretrain/Step Time": 8.662052122876048} +{"Pretrain/Learning Rate": 1.6160454172436667e-07, "Pretrain/Loss": 1.9313836097717285, "Pretrain/Loss (Raw)": 1.9174350500106812, "Pretrain/Step": 9202, "Pretrain/Step Time": 8.664473935961723} +{"Pretrain/Learning Rate": 1.60642211539333e-07, "Pretrain/Loss": 1.9306139945983887, "Pretrain/Loss (Raw)": 1.9456170797348022, "Pretrain/Step": 9203, "Pretrain/Step Time": 8.662217622622848} +{"Pretrain/Learning Rate": 1.5968274594608812e-07, "Pretrain/Loss": 1.9308454990386963, "Pretrain/Loss (Raw)": 1.776162028312683, "Pretrain/Step": 9204, "Pretrain/Step Time": 8.661362681537867} +{"Pretrain/Learning Rate": 1.587261450552796e-07, "Pretrain/Loss": 1.9315330982208252, "Pretrain/Loss (Raw)": 1.9635523557662964, "Pretrain/Step": 9205, "Pretrain/Step Time": 8.658404590561986} +{"Pretrain/Learning Rate": 1.5777240897722757e-07, "Pretrain/Loss": 1.929012417793274, "Pretrain/Loss (Raw)": 1.6009783744812012, "Pretrain/Step": 9206, "Pretrain/Step Time": 8.667273472994566} +{"Pretrain/Learning Rate": 1.5682153782192177e-07, "Pretrain/Loss": 1.9291516542434692, "Pretrain/Loss (Raw)": 1.8985326290130615, "Pretrain/Step": 9207, "Pretrain/Step Time": 8.660685669630766} +{"Pretrain/Learning Rate": 1.5587353169902175e-07, "Pretrain/Loss": 1.9281346797943115, "Pretrain/Loss (Raw)": 1.7643674612045288, "Pretrain/Step": 9208, "Pretrain/Step Time": 8.659661984071136} +{"Pretrain/Learning Rate": 1.5492839071785392e-07, "Pretrain/Loss": 1.9261538982391357, "Pretrain/Loss (Raw)": 1.8370909690856934, "Pretrain/Step": 9209, "Pretrain/Step Time": 8.664509722962976} +{"Pretrain/Learning Rate": 1.5398611498742e-07, "Pretrain/Loss": 1.929795503616333, "Pretrain/Loss (Raw)": 2.058347702026367, "Pretrain/Step": 9210, "Pretrain/Step Time": 8.667375817894936} +{"Pretrain/Learning Rate": 1.5304670461638582e-07, "Pretrain/Loss": 1.9287033081054688, "Pretrain/Loss (Raw)": 1.832367181777954, "Pretrain/Step": 9211, "Pretrain/Step Time": 8.661941265687346} +{"Pretrain/Learning Rate": 1.521101597130842e-07, "Pretrain/Loss": 1.9273180961608887, "Pretrain/Loss (Raw)": 1.6966049671173096, "Pretrain/Step": 9212, "Pretrain/Step Time": 8.660567004233599} +{"Pretrain/Learning Rate": 1.5117648038553144e-07, "Pretrain/Loss": 1.9284392595291138, "Pretrain/Loss (Raw)": 2.031076669692993, "Pretrain/Step": 9213, "Pretrain/Step Time": 8.65994269773364} +{"Pretrain/Learning Rate": 1.502456667413943e-07, "Pretrain/Loss": 1.928619623184204, "Pretrain/Loss (Raw)": 2.0341074466705322, "Pretrain/Step": 9214, "Pretrain/Step Time": 8.658670397475362} +{"Pretrain/Learning Rate": 1.493177188880257e-07, "Pretrain/Loss": 1.927351951599121, "Pretrain/Loss (Raw)": 1.8128024339675903, "Pretrain/Step": 9215, "Pretrain/Step Time": 8.654403071850538} +{"Pretrain/Learning Rate": 1.4839263693243732e-07, "Pretrain/Loss": 1.9289820194244385, "Pretrain/Loss (Raw)": 2.0934152603149414, "Pretrain/Step": 9216, "Pretrain/Step Time": 8.657423792406917} +{"Pretrain/Learning Rate": 1.4747042098131326e-07, "Pretrain/Loss": 1.932200312614441, "Pretrain/Loss (Raw)": 1.9257538318634033, "Pretrain/Step": 9217, "Pretrain/Step Time": 8.663973432034254} +{"Pretrain/Learning Rate": 1.4655107114101007e-07, "Pretrain/Loss": 1.9299607276916504, "Pretrain/Loss (Raw)": 1.810653567314148, "Pretrain/Step": 9218, "Pretrain/Step Time": 8.663932660594583} +{"Pretrain/Learning Rate": 1.4563458751755132e-07, "Pretrain/Loss": 1.92899489402771, "Pretrain/Loss (Raw)": 1.8204460144042969, "Pretrain/Step": 9219, "Pretrain/Step Time": 8.662455704063177} +{"Pretrain/Learning Rate": 1.4472097021662745e-07, "Pretrain/Loss": 1.9307353496551514, "Pretrain/Loss (Raw)": 2.021608829498291, "Pretrain/Step": 9220, "Pretrain/Step Time": 8.665479011833668} +{"Pretrain/Learning Rate": 1.4381021934360417e-07, "Pretrain/Loss": 1.9337910413742065, "Pretrain/Loss (Raw)": 1.9735521078109741, "Pretrain/Step": 9221, "Pretrain/Step Time": 8.664920937269926} +{"Pretrain/Learning Rate": 1.4290233500351414e-07, "Pretrain/Loss": 1.9323453903198242, "Pretrain/Loss (Raw)": 1.9605259895324707, "Pretrain/Step": 9222, "Pretrain/Step Time": 8.66926352120936} +{"Pretrain/Learning Rate": 1.4199731730105693e-07, "Pretrain/Loss": 1.9328176975250244, "Pretrain/Loss (Raw)": 2.0318214893341064, "Pretrain/Step": 9223, "Pretrain/Step Time": 8.670066056773067} +{"Pretrain/Learning Rate": 1.4109516634060182e-07, "Pretrain/Loss": 1.9360214471817017, "Pretrain/Loss (Raw)": 1.9175224304199219, "Pretrain/Step": 9224, "Pretrain/Step Time": 8.67034330777824} +{"Pretrain/Learning Rate": 1.401958822261934e-07, "Pretrain/Loss": 1.9346144199371338, "Pretrain/Loss (Raw)": 1.6880747079849243, "Pretrain/Step": 9225, "Pretrain/Step Time": 8.670792486518621} +{"Pretrain/Learning Rate": 1.3929946506153758e-07, "Pretrain/Loss": 1.9335095882415771, "Pretrain/Loss (Raw)": 1.8662288188934326, "Pretrain/Step": 9226, "Pretrain/Step Time": 8.666215995326638} +{"Pretrain/Learning Rate": 1.3840591495001554e-07, "Pretrain/Loss": 1.9347665309906006, "Pretrain/Loss (Raw)": 2.059727668762207, "Pretrain/Step": 9227, "Pretrain/Step Time": 8.666547529399395} +{"Pretrain/Learning Rate": 1.375152319946754e-07, "Pretrain/Loss": 1.942145586013794, "Pretrain/Loss (Raw)": 2.5787229537963867, "Pretrain/Step": 9228, "Pretrain/Step Time": 8.668157692998648} +{"Pretrain/Learning Rate": 1.3662741629823506e-07, "Pretrain/Loss": 1.9419828653335571, "Pretrain/Loss (Raw)": 1.9338349103927612, "Pretrain/Step": 9229, "Pretrain/Step Time": 8.66637190245092} +{"Pretrain/Learning Rate": 1.357424679630792e-07, "Pretrain/Loss": 1.9393701553344727, "Pretrain/Loss (Raw)": 1.65142822265625, "Pretrain/Step": 9230, "Pretrain/Step Time": 8.667417900636792} +{"Pretrain/Learning Rate": 1.348603870912679e-07, "Pretrain/Loss": 1.9403526782989502, "Pretrain/Loss (Raw)": 1.8618404865264893, "Pretrain/Step": 9231, "Pretrain/Step Time": 8.666446102783084} +{"Pretrain/Learning Rate": 1.3398117378452534e-07, "Pretrain/Loss": 1.9418238401412964, "Pretrain/Loss (Raw)": 2.0634162425994873, "Pretrain/Step": 9232, "Pretrain/Step Time": 8.667523100972176} +{"Pretrain/Learning Rate": 1.331048281442454e-07, "Pretrain/Loss": 1.9393725395202637, "Pretrain/Loss (Raw)": 1.6593022346496582, "Pretrain/Step": 9233, "Pretrain/Step Time": 8.667930498719215} +{"Pretrain/Learning Rate": 1.322313502714917e-07, "Pretrain/Loss": 1.9379082918167114, "Pretrain/Loss (Raw)": 1.770885944366455, "Pretrain/Step": 9234, "Pretrain/Step Time": 8.665596451610327} +{"Pretrain/Learning Rate": 1.3136074026700307e-07, "Pretrain/Loss": 1.937628984451294, "Pretrain/Loss (Raw)": 1.8717323541641235, "Pretrain/Step": 9235, "Pretrain/Step Time": 8.664970610290766} +{"Pretrain/Learning Rate": 1.30492998231177e-07, "Pretrain/Loss": 1.9371095895767212, "Pretrain/Loss (Raw)": 1.8602312803268433, "Pretrain/Step": 9236, "Pretrain/Step Time": 8.665105665102601} +{"Pretrain/Learning Rate": 1.296281242640862e-07, "Pretrain/Loss": 1.9369069337844849, "Pretrain/Loss (Raw)": 1.9881426095962524, "Pretrain/Step": 9237, "Pretrain/Step Time": 8.667014550417662} +{"Pretrain/Learning Rate": 1.2876611846547593e-07, "Pretrain/Loss": 1.9362883567810059, "Pretrain/Loss (Raw)": 2.0369811058044434, "Pretrain/Step": 9238, "Pretrain/Step Time": 8.665449801832438} +{"Pretrain/Learning Rate": 1.2790698093474995e-07, "Pretrain/Loss": 1.937631607055664, "Pretrain/Loss (Raw)": 2.2122769355773926, "Pretrain/Step": 9239, "Pretrain/Step Time": 8.665336608886719} +{"Pretrain/Learning Rate": 1.270507117709957e-07, "Pretrain/Loss": 1.9373877048492432, "Pretrain/Loss (Raw)": 1.9078460931777954, "Pretrain/Step": 9240, "Pretrain/Step Time": 8.665164502337575} +{"Pretrain/Learning Rate": 1.2619731107295917e-07, "Pretrain/Loss": 1.9369022846221924, "Pretrain/Loss (Raw)": 1.8423148393630981, "Pretrain/Step": 9241, "Pretrain/Step Time": 8.668176732957363} +{"Pretrain/Learning Rate": 1.2534677893905334e-07, "Pretrain/Loss": 1.9380946159362793, "Pretrain/Loss (Raw)": 2.041916847229004, "Pretrain/Step": 9242, "Pretrain/Step Time": 8.66156492382288} +{"Pretrain/Learning Rate": 1.244991154673747e-07, "Pretrain/Loss": 1.9400923252105713, "Pretrain/Loss (Raw)": 2.0174739360809326, "Pretrain/Step": 9243, "Pretrain/Step Time": 8.66442539356649} +{"Pretrain/Learning Rate": 1.2365432075567007e-07, "Pretrain/Loss": 1.93961501121521, "Pretrain/Loss (Raw)": 1.7788585424423218, "Pretrain/Step": 9244, "Pretrain/Step Time": 8.6600351780653} +{"Pretrain/Learning Rate": 1.228123949013754e-07, "Pretrain/Loss": 1.9398670196533203, "Pretrain/Loss (Raw)": 2.076282262802124, "Pretrain/Step": 9245, "Pretrain/Step Time": 8.659940717741847} +{"Pretrain/Learning Rate": 1.2197333800157973e-07, "Pretrain/Loss": 1.942601203918457, "Pretrain/Loss (Raw)": 2.0230348110198975, "Pretrain/Step": 9246, "Pretrain/Step Time": 8.658097574487329} +{"Pretrain/Learning Rate": 1.2113715015304728e-07, "Pretrain/Loss": 1.9408657550811768, "Pretrain/Loss (Raw)": 1.840553641319275, "Pretrain/Step": 9247, "Pretrain/Step Time": 8.662544848397374} +{"Pretrain/Learning Rate": 1.2030383145221203e-07, "Pretrain/Loss": 1.9399633407592773, "Pretrain/Loss (Raw)": 1.8866575956344604, "Pretrain/Step": 9248, "Pretrain/Step Time": 8.658138068392873} +{"Pretrain/Learning Rate": 1.1947338199517489e-07, "Pretrain/Loss": 1.9391590356826782, "Pretrain/Loss (Raw)": 1.7519301176071167, "Pretrain/Step": 9249, "Pretrain/Step Time": 8.660030014812946} +{"Pretrain/Learning Rate": 1.1864580187770647e-07, "Pretrain/Loss": 1.939208745956421, "Pretrain/Loss (Raw)": 2.045332908630371, "Pretrain/Step": 9250, "Pretrain/Step Time": 8.658736672252417} +{"Pretrain/Learning Rate": 1.1782109119524986e-07, "Pretrain/Loss": 1.9410456418991089, "Pretrain/Loss (Raw)": 2.1070973873138428, "Pretrain/Step": 9251, "Pretrain/Step Time": 8.657892828807235} +{"Pretrain/Learning Rate": 1.169992500429179e-07, "Pretrain/Loss": 1.9401999711990356, "Pretrain/Loss (Raw)": 1.6942580938339233, "Pretrain/Step": 9252, "Pretrain/Step Time": 8.65779379196465} +{"Pretrain/Learning Rate": 1.1618027851548197e-07, "Pretrain/Loss": 1.9411258697509766, "Pretrain/Loss (Raw)": 2.046049118041992, "Pretrain/Step": 9253, "Pretrain/Step Time": 8.661911457777023} +{"Pretrain/Learning Rate": 1.1536417670739152e-07, "Pretrain/Loss": 1.9423415660858154, "Pretrain/Loss (Raw)": 1.8029338121414185, "Pretrain/Step": 9254, "Pretrain/Step Time": 8.663301946595311} +{"Pretrain/Learning Rate": 1.1455094471276573e-07, "Pretrain/Loss": 1.9439882040023804, "Pretrain/Loss (Raw)": 2.1526238918304443, "Pretrain/Step": 9255, "Pretrain/Step Time": 8.669701954349875} +{"Pretrain/Learning Rate": 1.1374058262539067e-07, "Pretrain/Loss": 1.9467679262161255, "Pretrain/Loss (Raw)": 2.024956226348877, "Pretrain/Step": 9256, "Pretrain/Step Time": 8.662350490689278} +{"Pretrain/Learning Rate": 1.1293309053871659e-07, "Pretrain/Loss": 1.9477260112762451, "Pretrain/Loss (Raw)": 2.117205858230591, "Pretrain/Step": 9257, "Pretrain/Step Time": 8.658705899491906} +{"Pretrain/Learning Rate": 1.1212846854587177e-07, "Pretrain/Loss": 1.9474411010742188, "Pretrain/Loss (Raw)": 1.9923949241638184, "Pretrain/Step": 9258, "Pretrain/Step Time": 8.66162853129208} +{"Pretrain/Learning Rate": 1.113267167396459e-07, "Pretrain/Loss": 1.949115514755249, "Pretrain/Loss (Raw)": 2.290952205657959, "Pretrain/Step": 9259, "Pretrain/Step Time": 8.663807727396488} +{"Pretrain/Learning Rate": 1.1052783521250387e-07, "Pretrain/Loss": 1.947676658630371, "Pretrain/Loss (Raw)": 1.7240381240844727, "Pretrain/Step": 9260, "Pretrain/Step Time": 8.66328115016222} +{"Pretrain/Learning Rate": 1.0973182405657479e-07, "Pretrain/Loss": 1.9478771686553955, "Pretrain/Loss (Raw)": 1.995423436164856, "Pretrain/Step": 9261, "Pretrain/Step Time": 8.665107944980264} +{"Pretrain/Learning Rate": 1.089386833636602e-07, "Pretrain/Loss": 1.947110652923584, "Pretrain/Loss (Raw)": 1.95902419090271, "Pretrain/Step": 9262, "Pretrain/Step Time": 8.666571829468012} +{"Pretrain/Learning Rate": 1.0814841322522585e-07, "Pretrain/Loss": 1.9471774101257324, "Pretrain/Loss (Raw)": 1.965384602546692, "Pretrain/Step": 9263, "Pretrain/Step Time": 8.669576935470104} +{"Pretrain/Learning Rate": 1.0736101373240992e-07, "Pretrain/Loss": 1.9473081827163696, "Pretrain/Loss (Raw)": 1.9908932447433472, "Pretrain/Step": 9264, "Pretrain/Step Time": 8.671600533649325} +{"Pretrain/Learning Rate": 1.0657648497601757e-07, "Pretrain/Loss": 1.9470670223236084, "Pretrain/Loss (Raw)": 1.9068779945373535, "Pretrain/Step": 9265, "Pretrain/Step Time": 8.666738599538803} +{"Pretrain/Learning Rate": 1.0579482704653199e-07, "Pretrain/Loss": 1.945648431777954, "Pretrain/Loss (Raw)": 1.6886450052261353, "Pretrain/Step": 9266, "Pretrain/Step Time": 8.66705035045743} +{"Pretrain/Learning Rate": 1.0501604003408938e-07, "Pretrain/Loss": 1.9450174570083618, "Pretrain/Loss (Raw)": 1.9070597887039185, "Pretrain/Step": 9267, "Pretrain/Step Time": 8.671099128201604} +{"Pretrain/Learning Rate": 1.042401240285068e-07, "Pretrain/Loss": 1.9453208446502686, "Pretrain/Loss (Raw)": 1.9741244316101074, "Pretrain/Step": 9268, "Pretrain/Step Time": 8.674839412793517} +{"Pretrain/Learning Rate": 1.0346707911926268e-07, "Pretrain/Loss": 1.9470405578613281, "Pretrain/Loss (Raw)": 2.1327481269836426, "Pretrain/Step": 9269, "Pretrain/Step Time": 8.680838635191321} +{"Pretrain/Learning Rate": 1.0269690539551625e-07, "Pretrain/Loss": 1.9451720714569092, "Pretrain/Loss (Raw)": 1.6415425539016724, "Pretrain/Step": 9270, "Pretrain/Step Time": 8.67570641823113} +{"Pretrain/Learning Rate": 1.0192960294607978e-07, "Pretrain/Loss": 1.9454160928726196, "Pretrain/Loss (Raw)": 2.007951021194458, "Pretrain/Step": 9271, "Pretrain/Step Time": 8.672083020210266} +{"Pretrain/Learning Rate": 1.011651718594464e-07, "Pretrain/Loss": 1.9437568187713623, "Pretrain/Loss (Raw)": 1.8555710315704346, "Pretrain/Step": 9272, "Pretrain/Step Time": 8.671015430241823} +{"Pretrain/Learning Rate": 1.0040361222377059e-07, "Pretrain/Loss": 1.94132661819458, "Pretrain/Loss (Raw)": 1.9543243646621704, "Pretrain/Step": 9273, "Pretrain/Step Time": 8.66870448552072} +{"Pretrain/Learning Rate": 9.964492412688209e-08, "Pretrain/Loss": 1.9444584846496582, "Pretrain/Loss (Raw)": 2.188713788986206, "Pretrain/Step": 9274, "Pretrain/Step Time": 8.666484387591481} +{"Pretrain/Learning Rate": 9.88891076562748e-08, "Pretrain/Loss": 1.9427974224090576, "Pretrain/Loss (Raw)": 1.7396351099014282, "Pretrain/Step": 9275, "Pretrain/Step Time": 8.666676118969917} +{"Pretrain/Learning Rate": 9.813616289911509e-08, "Pretrain/Loss": 1.9420740604400635, "Pretrain/Loss (Raw)": 1.900389313697815, "Pretrain/Step": 9276, "Pretrain/Step Time": 8.667919246479869} +{"Pretrain/Learning Rate": 9.738608994223352e-08, "Pretrain/Loss": 1.9410895109176636, "Pretrain/Loss (Raw)": 1.7857600450515747, "Pretrain/Step": 9277, "Pretrain/Step Time": 8.669737664982677} +{"Pretrain/Learning Rate": 9.663888887213313e-08, "Pretrain/Loss": 1.9434078931808472, "Pretrain/Loss (Raw)": 2.0594570636749268, "Pretrain/Step": 9278, "Pretrain/Step Time": 8.665049780160189} +{"Pretrain/Learning Rate": 9.589455977498385e-08, "Pretrain/Loss": 1.945358395576477, "Pretrain/Loss (Raw)": 1.9275556802749634, "Pretrain/Step": 9279, "Pretrain/Step Time": 8.668914726004004} +{"Pretrain/Learning Rate": 9.515310273662814e-08, "Pretrain/Loss": 1.9464203119277954, "Pretrain/Loss (Raw)": 1.8464279174804688, "Pretrain/Step": 9280, "Pretrain/Step Time": 8.67318775691092} +{"Pretrain/Learning Rate": 9.441451784256706e-08, "Pretrain/Loss": 1.947777509689331, "Pretrain/Loss (Raw)": 2.1021299362182617, "Pretrain/Step": 9281, "Pretrain/Step Time": 8.676457360386848} +{"Pretrain/Learning Rate": 9.3678805177988e-08, "Pretrain/Loss": 1.9499976634979248, "Pretrain/Loss (Raw)": 2.0620243549346924, "Pretrain/Step": 9282, "Pretrain/Step Time": 8.670140517875552} +{"Pretrain/Learning Rate": 9.294596482772866e-08, "Pretrain/Loss": 1.9508200883865356, "Pretrain/Loss (Raw)": 2.0424060821533203, "Pretrain/Step": 9283, "Pretrain/Step Time": 8.670971980318427} +{"Pretrain/Learning Rate": 9.221599687630755e-08, "Pretrain/Loss": 1.9505295753479004, "Pretrain/Loss (Raw)": 1.9456615447998047, "Pretrain/Step": 9284, "Pretrain/Step Time": 8.670215554535389} +{"Pretrain/Learning Rate": 9.148890140790733e-08, "Pretrain/Loss": 1.9502842426300049, "Pretrain/Loss (Raw)": 1.9900180101394653, "Pretrain/Step": 9285, "Pretrain/Step Time": 8.66946766525507} +{"Pretrain/Learning Rate": 9.076467850638037e-08, "Pretrain/Loss": 1.95039701461792, "Pretrain/Loss (Raw)": 2.003511428833008, "Pretrain/Step": 9286, "Pretrain/Step Time": 8.669846344739199} +{"Pretrain/Learning Rate": 9.004332825524597e-08, "Pretrain/Loss": 1.9515154361724854, "Pretrain/Loss (Raw)": 2.2009499073028564, "Pretrain/Step": 9287, "Pretrain/Step Time": 8.670573726296425} +{"Pretrain/Learning Rate": 8.932485073769592e-08, "Pretrain/Loss": 1.950816035270691, "Pretrain/Loss (Raw)": 1.7793484926223755, "Pretrain/Step": 9288, "Pretrain/Step Time": 8.672835489735007} +{"Pretrain/Learning Rate": 8.860924603658338e-08, "Pretrain/Loss": 1.950343370437622, "Pretrain/Loss (Raw)": 2.000602960586548, "Pretrain/Step": 9289, "Pretrain/Step Time": 8.669486405327916} +{"Pretrain/Learning Rate": 8.789651423444234e-08, "Pretrain/Loss": 1.9517582654953003, "Pretrain/Loss (Raw)": 2.261789560317993, "Pretrain/Step": 9290, "Pretrain/Step Time": 8.66456582956016} +{"Pretrain/Learning Rate": 8.718665541346261e-08, "Pretrain/Loss": 1.9521241188049316, "Pretrain/Loss (Raw)": 2.018627882003784, "Pretrain/Step": 9291, "Pretrain/Step Time": 8.662937575951219} +{"Pretrain/Learning Rate": 8.647966965551202e-08, "Pretrain/Loss": 1.9505033493041992, "Pretrain/Loss (Raw)": 1.9076594114303589, "Pretrain/Step": 9292, "Pretrain/Step Time": 8.666807459667325} +{"Pretrain/Learning Rate": 8.577555704212259e-08, "Pretrain/Loss": 1.9505192041397095, "Pretrain/Loss (Raw)": 2.1464955806732178, "Pretrain/Step": 9293, "Pretrain/Step Time": 8.666056526824832} +{"Pretrain/Learning Rate": 8.507431765449603e-08, "Pretrain/Loss": 1.951133370399475, "Pretrain/Loss (Raw)": 2.02026629447937, "Pretrain/Step": 9294, "Pretrain/Step Time": 8.667376672849059} +{"Pretrain/Learning Rate": 8.437595157350098e-08, "Pretrain/Loss": 1.952989101409912, "Pretrain/Loss (Raw)": 2.0577926635742188, "Pretrain/Step": 9295, "Pretrain/Step Time": 8.669505605474114} +{"Pretrain/Learning Rate": 8.368045887967858e-08, "Pretrain/Loss": 1.951024055480957, "Pretrain/Loss (Raw)": 1.9109705686569214, "Pretrain/Step": 9296, "Pretrain/Step Time": 8.670002728700638} +{"Pretrain/Learning Rate": 8.298783965323409e-08, "Pretrain/Loss": 1.954010009765625, "Pretrain/Loss (Raw)": 2.167207717895508, "Pretrain/Step": 9297, "Pretrain/Step Time": 8.66398848965764} +{"Pretrain/Learning Rate": 8.22980939740453e-08, "Pretrain/Loss": 1.954047679901123, "Pretrain/Loss (Raw)": 2.047581672668457, "Pretrain/Step": 9298, "Pretrain/Step Time": 8.667538333684206} +{"Pretrain/Learning Rate": 8.161122192165693e-08, "Pretrain/Loss": 1.9505170583724976, "Pretrain/Loss (Raw)": 1.5506219863891602, "Pretrain/Step": 9299, "Pretrain/Step Time": 8.667806450277567} +{"Pretrain/Learning Rate": 8.092722357528059e-08, "Pretrain/Loss": 1.9484684467315674, "Pretrain/Loss (Raw)": 1.8949273824691772, "Pretrain/Step": 9300, "Pretrain/Step Time": 8.66304619051516} +{"Pretrain/Learning Rate": 8.024609901380042e-08, "Pretrain/Loss": 1.9506546258926392, "Pretrain/Loss (Raw)": 2.2599313259124756, "Pretrain/Step": 9301, "Pretrain/Step Time": 8.663116056472063} +{"Pretrain/Learning Rate": 7.956784831576469e-08, "Pretrain/Loss": 1.9511243104934692, "Pretrain/Loss (Raw)": 2.200505495071411, "Pretrain/Step": 9302, "Pretrain/Step Time": 8.661372711881995} +{"Pretrain/Learning Rate": 7.889247155939417e-08, "Pretrain/Loss": 1.9473034143447876, "Pretrain/Loss (Raw)": 1.7567020654678345, "Pretrain/Step": 9303, "Pretrain/Step Time": 8.663829401135445} +{"Pretrain/Learning Rate": 7.821996882257654e-08, "Pretrain/Loss": 1.9410319328308105, "Pretrain/Loss (Raw)": 1.1766153573989868, "Pretrain/Step": 9304, "Pretrain/Step Time": 8.658145161345601} +{"Pretrain/Learning Rate": 7.755034018286644e-08, "Pretrain/Loss": 1.9402996301651, "Pretrain/Loss (Raw)": 1.8975235223770142, "Pretrain/Step": 9305, "Pretrain/Step Time": 8.656156986951828} +{"Pretrain/Learning Rate": 7.688358571748821e-08, "Pretrain/Loss": 1.9400286674499512, "Pretrain/Loss (Raw)": 1.9334852695465088, "Pretrain/Step": 9306, "Pretrain/Step Time": 8.655413696542382} +{"Pretrain/Learning Rate": 7.621970550333868e-08, "Pretrain/Loss": 1.940026044845581, "Pretrain/Loss (Raw)": 2.1361582279205322, "Pretrain/Step": 9307, "Pretrain/Step Time": 8.65617647767067} +{"Pretrain/Learning Rate": 7.555869961697881e-08, "Pretrain/Loss": 1.941879391670227, "Pretrain/Loss (Raw)": 1.8872231245040894, "Pretrain/Step": 9308, "Pretrain/Step Time": 8.656497817486525} +{"Pretrain/Learning Rate": 7.490056813463375e-08, "Pretrain/Loss": 1.9424734115600586, "Pretrain/Loss (Raw)": 2.164029121398926, "Pretrain/Step": 9309, "Pretrain/Step Time": 8.6552924066782} +{"Pretrain/Learning Rate": 7.424531113220945e-08, "Pretrain/Loss": 1.9402153491973877, "Pretrain/Loss (Raw)": 1.857390284538269, "Pretrain/Step": 9310, "Pretrain/Step Time": 8.6592349242419} +{"Pretrain/Learning Rate": 7.359292868526769e-08, "Pretrain/Loss": 1.93842613697052, "Pretrain/Loss (Raw)": 1.8712522983551025, "Pretrain/Step": 9311, "Pretrain/Step Time": 8.65864272415638} +{"Pretrain/Learning Rate": 7.294342086904827e-08, "Pretrain/Loss": 1.9376477003097534, "Pretrain/Loss (Raw)": 1.7772883176803589, "Pretrain/Step": 9312, "Pretrain/Step Time": 8.666721912100911} +{"Pretrain/Learning Rate": 7.229678775845238e-08, "Pretrain/Loss": 1.9374291896820068, "Pretrain/Loss (Raw)": 2.0690629482269287, "Pretrain/Step": 9313, "Pretrain/Step Time": 8.663234408944845} +{"Pretrain/Learning Rate": 7.165302942805374e-08, "Pretrain/Loss": 1.9382439851760864, "Pretrain/Loss (Raw)": 1.9687190055847168, "Pretrain/Step": 9314, "Pretrain/Step Time": 8.665324384346604} +{"Pretrain/Learning Rate": 7.101214595209571e-08, "Pretrain/Loss": 1.9381163120269775, "Pretrain/Loss (Raw)": 1.9447156190872192, "Pretrain/Step": 9315, "Pretrain/Step Time": 8.666119810193777} +{"Pretrain/Learning Rate": 7.037413740448306e-08, "Pretrain/Loss": 1.934185266494751, "Pretrain/Loss (Raw)": 1.7124680280685425, "Pretrain/Step": 9316, "Pretrain/Step Time": 8.665401773527265} +{"Pretrain/Learning Rate": 6.973900385880138e-08, "Pretrain/Loss": 1.937767744064331, "Pretrain/Loss (Raw)": 1.8364906311035156, "Pretrain/Step": 9317, "Pretrain/Step Time": 8.6648602578789} +{"Pretrain/Learning Rate": 6.910674538828931e-08, "Pretrain/Loss": 1.9378774166107178, "Pretrain/Loss (Raw)": 2.1147067546844482, "Pretrain/Step": 9318, "Pretrain/Step Time": 8.660175615921617} +{"Pretrain/Learning Rate": 6.847736206586908e-08, "Pretrain/Loss": 1.9377433061599731, "Pretrain/Loss (Raw)": 2.046400785446167, "Pretrain/Step": 9319, "Pretrain/Step Time": 8.663632586598396} +{"Pretrain/Learning Rate": 6.785085396411872e-08, "Pretrain/Loss": 1.9392271041870117, "Pretrain/Loss (Raw)": 2.118725061416626, "Pretrain/Step": 9320, "Pretrain/Step Time": 8.664040362462401} +{"Pretrain/Learning Rate": 6.722722115529156e-08, "Pretrain/Loss": 1.9375874996185303, "Pretrain/Loss (Raw)": 1.6644072532653809, "Pretrain/Step": 9321, "Pretrain/Step Time": 8.666072769090533} +{"Pretrain/Learning Rate": 6.660646371130785e-08, "Pretrain/Loss": 1.9405202865600586, "Pretrain/Loss (Raw)": 2.1858487129211426, "Pretrain/Step": 9322, "Pretrain/Step Time": 8.666026689112186} +{"Pretrain/Learning Rate": 6.598858170375755e-08, "Pretrain/Loss": 1.935626745223999, "Pretrain/Loss (Raw)": 1.3041611909866333, "Pretrain/Step": 9323, "Pretrain/Step Time": 8.664783377200365} +{"Pretrain/Learning Rate": 6.537357520389753e-08, "Pretrain/Loss": 1.9387255907058716, "Pretrain/Loss (Raw)": 2.127336025238037, "Pretrain/Step": 9324, "Pretrain/Step Time": 8.666285444051027} +{"Pretrain/Learning Rate": 6.476144428265163e-08, "Pretrain/Loss": 1.9399700164794922, "Pretrain/Loss (Raw)": 2.0186355113983154, "Pretrain/Step": 9325, "Pretrain/Step Time": 8.666458444669843} +{"Pretrain/Learning Rate": 6.415218901061614e-08, "Pretrain/Loss": 1.9413485527038574, "Pretrain/Loss (Raw)": 2.079141139984131, "Pretrain/Step": 9326, "Pretrain/Step Time": 8.66941369138658} +{"Pretrain/Learning Rate": 6.354580945805156e-08, "Pretrain/Loss": 1.9394885301589966, "Pretrain/Loss (Raw)": 1.8688554763793945, "Pretrain/Step": 9327, "Pretrain/Step Time": 8.6710198931396} +{"Pretrain/Learning Rate": 6.294230569488802e-08, "Pretrain/Loss": 1.9399354457855225, "Pretrain/Loss (Raw)": 1.9458352327346802, "Pretrain/Step": 9328, "Pretrain/Step Time": 8.67414808832109} +{"Pretrain/Learning Rate": 6.234167779072542e-08, "Pretrain/Loss": 1.9388766288757324, "Pretrain/Loss (Raw)": 1.7225983142852783, "Pretrain/Step": 9329, "Pretrain/Step Time": 8.670329866930842} +{"Pretrain/Learning Rate": 6.174392581483057e-08, "Pretrain/Loss": 1.9388632774353027, "Pretrain/Loss (Raw)": 1.9157402515411377, "Pretrain/Step": 9330, "Pretrain/Step Time": 8.669034382328391} +{"Pretrain/Learning Rate": 6.114904983613722e-08, "Pretrain/Loss": 1.9407689571380615, "Pretrain/Loss (Raw)": 2.189546823501587, "Pretrain/Step": 9331, "Pretrain/Step Time": 8.67722698673606} +{"Pretrain/Learning Rate": 6.055704992325162e-08, "Pretrain/Loss": 1.9429779052734375, "Pretrain/Loss (Raw)": 2.058906078338623, "Pretrain/Step": 9332, "Pretrain/Step Time": 8.675549704581499} +{"Pretrain/Learning Rate": 5.99679261444469e-08, "Pretrain/Loss": 1.9443280696868896, "Pretrain/Loss (Raw)": 2.1363778114318848, "Pretrain/Step": 9333, "Pretrain/Step Time": 8.677424475550652} +{"Pretrain/Learning Rate": 5.938167856766319e-08, "Pretrain/Loss": 1.9468129873275757, "Pretrain/Loss (Raw)": 1.9190477132797241, "Pretrain/Step": 9334, "Pretrain/Step Time": 8.669047826901078} +{"Pretrain/Learning Rate": 5.87983072605075e-08, "Pretrain/Loss": 1.9462958574295044, "Pretrain/Loss (Raw)": 1.832328200340271, "Pretrain/Step": 9335, "Pretrain/Step Time": 8.673189176246524} +{"Pretrain/Learning Rate": 5.821781229025658e-08, "Pretrain/Loss": 1.9450548887252808, "Pretrain/Loss (Raw)": 1.6055258512496948, "Pretrain/Step": 9336, "Pretrain/Step Time": 8.671848302707076} +{"Pretrain/Learning Rate": 5.764019372385687e-08, "Pretrain/Loss": 1.9459221363067627, "Pretrain/Loss (Raw)": 1.948095679283142, "Pretrain/Step": 9337, "Pretrain/Step Time": 8.666299832984805} +{"Pretrain/Learning Rate": 5.706545162792454e-08, "Pretrain/Loss": 1.946661114692688, "Pretrain/Loss (Raw)": 2.152942657470703, "Pretrain/Step": 9338, "Pretrain/Step Time": 8.663419065997005} +{"Pretrain/Learning Rate": 5.649358606873989e-08, "Pretrain/Loss": 1.9486618041992188, "Pretrain/Loss (Raw)": 2.0884547233581543, "Pretrain/Step": 9339, "Pretrain/Step Time": 8.665631894022226} +{"Pretrain/Learning Rate": 5.5924597112250176e-08, "Pretrain/Loss": 1.9475562572479248, "Pretrain/Loss (Raw)": 1.5550973415374756, "Pretrain/Step": 9340, "Pretrain/Step Time": 8.670898042619228} +{"Pretrain/Learning Rate": 5.5358484824077905e-08, "Pretrain/Loss": 1.9478414058685303, "Pretrain/Loss (Raw)": 2.067574977874756, "Pretrain/Step": 9341, "Pretrain/Step Time": 8.672118591144681} +{"Pretrain/Learning Rate": 5.479524926950696e-08, "Pretrain/Loss": 1.94638192653656, "Pretrain/Loss (Raw)": 1.8473060131072998, "Pretrain/Step": 9342, "Pretrain/Step Time": 8.673109237104654} +{"Pretrain/Learning Rate": 5.4234890513490954e-08, "Pretrain/Loss": 1.9471944570541382, "Pretrain/Loss (Raw)": 1.9167975187301636, "Pretrain/Step": 9343, "Pretrain/Step Time": 8.676236366853118} +{"Pretrain/Learning Rate": 5.367740862065873e-08, "Pretrain/Loss": 1.9458632469177246, "Pretrain/Loss (Raw)": 1.9230153560638428, "Pretrain/Step": 9344, "Pretrain/Step Time": 8.678788581863046} +{"Pretrain/Learning Rate": 5.3122803655300533e-08, "Pretrain/Loss": 1.9463591575622559, "Pretrain/Loss (Raw)": 1.9892313480377197, "Pretrain/Step": 9345, "Pretrain/Step Time": 8.672452261671424} +{"Pretrain/Learning Rate": 5.257107568137076e-08, "Pretrain/Loss": 1.946777582168579, "Pretrain/Loss (Raw)": 1.8642157316207886, "Pretrain/Step": 9346, "Pretrain/Step Time": 8.673905761912465} +{"Pretrain/Learning Rate": 5.2022224762501845e-08, "Pretrain/Loss": 1.945507287979126, "Pretrain/Loss (Raw)": 1.6578419208526611, "Pretrain/Step": 9347, "Pretrain/Step Time": 8.676769264042377} +{"Pretrain/Learning Rate": 5.147625096199038e-08, "Pretrain/Loss": 1.9448200464248657, "Pretrain/Loss (Raw)": 1.9336483478546143, "Pretrain/Step": 9348, "Pretrain/Step Time": 8.674496803432703} +{"Pretrain/Learning Rate": 5.0933154342797105e-08, "Pretrain/Loss": 1.9427639245986938, "Pretrain/Loss (Raw)": 1.7103707790374756, "Pretrain/Step": 9349, "Pretrain/Step Time": 8.669880710542202} +{"Pretrain/Learning Rate": 5.039293496755526e-08, "Pretrain/Loss": 1.9426666498184204, "Pretrain/Loss (Raw)": 1.9480806589126587, "Pretrain/Step": 9350, "Pretrain/Step Time": 8.666997192427516} +{"Pretrain/Learning Rate": 4.9855592898567784e-08, "Pretrain/Loss": 1.9416416883468628, "Pretrain/Loss (Raw)": 1.9006129503250122, "Pretrain/Step": 9351, "Pretrain/Step Time": 8.66480128839612} +{"Pretrain/Learning Rate": 4.9321128197804543e-08, "Pretrain/Loss": 1.9419097900390625, "Pretrain/Loss (Raw)": 1.9518336057662964, "Pretrain/Step": 9352, "Pretrain/Step Time": 8.666930502280593} +{"Pretrain/Learning Rate": 4.8789540926896806e-08, "Pretrain/Loss": 1.944661021232605, "Pretrain/Loss (Raw)": 2.040238857269287, "Pretrain/Step": 9353, "Pretrain/Step Time": 8.670550243929029} +{"Pretrain/Learning Rate": 4.826083114715385e-08, "Pretrain/Loss": 1.9445934295654297, "Pretrain/Loss (Raw)": 1.8575791120529175, "Pretrain/Step": 9354, "Pretrain/Step Time": 8.669469939544797} +{"Pretrain/Learning Rate": 4.7734998919549135e-08, "Pretrain/Loss": 1.9438135623931885, "Pretrain/Loss (Raw)": 1.9599063396453857, "Pretrain/Step": 9355, "Pretrain/Step Time": 8.667780239135027} +{"Pretrain/Learning Rate": 4.7212044304723035e-08, "Pretrain/Loss": 1.9351601600646973, "Pretrain/Loss (Raw)": 1.4710835218429565, "Pretrain/Step": 9356, "Pretrain/Step Time": 8.664555080235004} +{"Pretrain/Learning Rate": 4.6691967362985645e-08, "Pretrain/Loss": 1.9360439777374268, "Pretrain/Loss (Raw)": 2.046973943710327, "Pretrain/Step": 9357, "Pretrain/Step Time": 8.668330922722816} +{"Pretrain/Learning Rate": 4.6174768154316764e-08, "Pretrain/Loss": 1.9384726285934448, "Pretrain/Loss (Raw)": 1.9622927904129028, "Pretrain/Step": 9358, "Pretrain/Step Time": 8.669607158750296} +{"Pretrain/Learning Rate": 4.566044673835479e-08, "Pretrain/Loss": 1.937493085861206, "Pretrain/Loss (Raw)": 1.7364554405212402, "Pretrain/Step": 9359, "Pretrain/Step Time": 8.672449136152864} +{"Pretrain/Learning Rate": 4.514900317442172e-08, "Pretrain/Loss": 1.9360909461975098, "Pretrain/Loss (Raw)": 1.8839261531829834, "Pretrain/Step": 9360, "Pretrain/Step Time": 8.66833002306521} +{"Pretrain/Learning Rate": 4.464043752149816e-08, "Pretrain/Loss": 1.9373937845230103, "Pretrain/Loss (Raw)": 1.826083779335022, "Pretrain/Step": 9361, "Pretrain/Step Time": 8.666990797966719} +{"Pretrain/Learning Rate": 4.413474983823163e-08, "Pretrain/Loss": 1.9396432638168335, "Pretrain/Loss (Raw)": 2.0588252544403076, "Pretrain/Step": 9362, "Pretrain/Step Time": 8.665378574281931} +{"Pretrain/Learning Rate": 4.363194018293937e-08, "Pretrain/Loss": 1.940291166305542, "Pretrain/Loss (Raw)": 1.9546637535095215, "Pretrain/Step": 9363, "Pretrain/Step Time": 8.674007629975677} +{"Pretrain/Learning Rate": 4.313200861361388e-08, "Pretrain/Loss": 1.9433234930038452, "Pretrain/Loss (Raw)": 2.248366355895996, "Pretrain/Step": 9364, "Pretrain/Step Time": 8.673246966674924} +{"Pretrain/Learning Rate": 4.2634955187900727e-08, "Pretrain/Loss": 1.9426699876785278, "Pretrain/Loss (Raw)": 1.9044848680496216, "Pretrain/Step": 9365, "Pretrain/Step Time": 8.673929646611214} +{"Pretrain/Learning Rate": 4.2140779963131815e-08, "Pretrain/Loss": 1.9424033164978027, "Pretrain/Loss (Raw)": 2.002850294113159, "Pretrain/Step": 9366, "Pretrain/Step Time": 8.675994226709008} +{"Pretrain/Learning Rate": 4.164948299629212e-08, "Pretrain/Loss": 1.9362609386444092, "Pretrain/Loss (Raw)": 1.4260531663894653, "Pretrain/Step": 9367, "Pretrain/Step Time": 8.672801034525037} +{"Pretrain/Learning Rate": 4.1161064344041875e-08, "Pretrain/Loss": 1.9375741481781006, "Pretrain/Loss (Raw)": 2.0759377479553223, "Pretrain/Step": 9368, "Pretrain/Step Time": 8.672616019845009} +{"Pretrain/Learning Rate": 4.0675524062708245e-08, "Pretrain/Loss": 1.9364010095596313, "Pretrain/Loss (Raw)": 1.6921470165252686, "Pretrain/Step": 9369, "Pretrain/Step Time": 8.673844009637833} +{"Pretrain/Learning Rate": 4.019286220828255e-08, "Pretrain/Loss": 1.9359955787658691, "Pretrain/Loss (Raw)": 1.990036964416504, "Pretrain/Step": 9370, "Pretrain/Step Time": 8.674675066024065} +{"Pretrain/Learning Rate": 3.971307883643416e-08, "Pretrain/Loss": 1.9366780519485474, "Pretrain/Loss (Raw)": 2.1048190593719482, "Pretrain/Step": 9371, "Pretrain/Step Time": 8.674156179651618} +{"Pretrain/Learning Rate": 3.923617400248825e-08, "Pretrain/Loss": 1.9375402927398682, "Pretrain/Loss (Raw)": 1.889228105545044, "Pretrain/Step": 9372, "Pretrain/Step Time": 8.677450761198997} +{"Pretrain/Learning Rate": 3.876214776144527e-08, "Pretrain/Loss": 1.9374148845672607, "Pretrain/Loss (Raw)": 2.0602376461029053, "Pretrain/Step": 9373, "Pretrain/Step Time": 8.682875061407685} +{"Pretrain/Learning Rate": 3.8291000167972604e-08, "Pretrain/Loss": 1.9362014532089233, "Pretrain/Loss (Raw)": 1.8677018880844116, "Pretrain/Step": 9374, "Pretrain/Step Time": 8.68241978995502} +{"Pretrain/Learning Rate": 3.782273127640734e-08, "Pretrain/Loss": 1.9381980895996094, "Pretrain/Loss (Raw)": 2.0961296558380127, "Pretrain/Step": 9375, "Pretrain/Step Time": 8.67754514887929} +{"Pretrain/Learning Rate": 3.735734114074796e-08, "Pretrain/Loss": 1.937983512878418, "Pretrain/Loss (Raw)": 1.8591853380203247, "Pretrain/Step": 9376, "Pretrain/Step Time": 8.680527007207274} +{"Pretrain/Learning Rate": 3.6894829814668185e-08, "Pretrain/Loss": 1.9398374557495117, "Pretrain/Loss (Raw)": 1.9892393350601196, "Pretrain/Step": 9377, "Pretrain/Step Time": 8.679575312882662} +{"Pretrain/Learning Rate": 3.643519735150869e-08, "Pretrain/Loss": 1.9393389225006104, "Pretrain/Loss (Raw)": 1.981520414352417, "Pretrain/Step": 9378, "Pretrain/Step Time": 8.684030843898654} +{"Pretrain/Learning Rate": 3.5978443804274286e-08, "Pretrain/Loss": 1.9376952648162842, "Pretrain/Loss (Raw)": 1.896714687347412, "Pretrain/Step": 9379, "Pretrain/Step Time": 8.684908019378781} +{"Pretrain/Learning Rate": 3.552456922563674e-08, "Pretrain/Loss": 1.9389405250549316, "Pretrain/Loss (Raw)": 1.8536561727523804, "Pretrain/Step": 9380, "Pretrain/Step Time": 8.681246269494295} +{"Pretrain/Learning Rate": 3.5073573667945836e-08, "Pretrain/Loss": 1.9381672143936157, "Pretrain/Loss (Raw)": 1.9470504522323608, "Pretrain/Step": 9381, "Pretrain/Step Time": 8.676959041506052} +{"Pretrain/Learning Rate": 3.46254571832072e-08, "Pretrain/Loss": 1.9394100904464722, "Pretrain/Loss (Raw)": 1.962022066116333, "Pretrain/Step": 9382, "Pretrain/Step Time": 8.671425128355622} +{"Pretrain/Learning Rate": 3.418021982310171e-08, "Pretrain/Loss": 1.9361997842788696, "Pretrain/Loss (Raw)": 1.7417136430740356, "Pretrain/Step": 9383, "Pretrain/Step Time": 8.666547445580363} +{"Pretrain/Learning Rate": 3.3737861638977184e-08, "Pretrain/Loss": 1.9374017715454102, "Pretrain/Loss (Raw)": 2.178804397583008, "Pretrain/Step": 9384, "Pretrain/Step Time": 8.668568067252636} +{"Pretrain/Learning Rate": 3.3298382681845595e-08, "Pretrain/Loss": 1.9350794553756714, "Pretrain/Loss (Raw)": 1.819946527481079, "Pretrain/Step": 9385, "Pretrain/Step Time": 8.668645430356264} +{"Pretrain/Learning Rate": 3.28617830023914e-08, "Pretrain/Loss": 1.9358713626861572, "Pretrain/Loss (Raw)": 2.0937790870666504, "Pretrain/Step": 9386, "Pretrain/Step Time": 8.664934556931257} +{"Pretrain/Learning Rate": 3.242806265096876e-08, "Pretrain/Loss": 1.9352326393127441, "Pretrain/Loss (Raw)": 2.209182024002075, "Pretrain/Step": 9387, "Pretrain/Step Time": 8.664410077035427} +{"Pretrain/Learning Rate": 3.199722167759045e-08, "Pretrain/Loss": 1.9359042644500732, "Pretrain/Loss (Raw)": 1.810016393661499, "Pretrain/Step": 9388, "Pretrain/Step Time": 8.665171928703785} +{"Pretrain/Learning Rate": 3.15692601319445e-08, "Pretrain/Loss": 1.9359538555145264, "Pretrain/Loss (Raw)": 2.001760959625244, "Pretrain/Step": 9389, "Pretrain/Step Time": 8.662393692880869} +{"Pretrain/Learning Rate": 3.114417806338865e-08, "Pretrain/Loss": 1.934090495109558, "Pretrain/Loss (Raw)": 1.720507025718689, "Pretrain/Step": 9390, "Pretrain/Step Time": 8.663251504302025} +{"Pretrain/Learning Rate": 3.072197552094203e-08, "Pretrain/Loss": 1.9309251308441162, "Pretrain/Loss (Raw)": 1.5602120161056519, "Pretrain/Step": 9391, "Pretrain/Step Time": 8.660352490842342} +{"Pretrain/Learning Rate": 3.0302652553296226e-08, "Pretrain/Loss": 1.9301509857177734, "Pretrain/Loss (Raw)": 1.8918135166168213, "Pretrain/Step": 9392, "Pretrain/Step Time": 8.656812006607652} +{"Pretrain/Learning Rate": 2.98862092088098e-08, "Pretrain/Loss": 1.9291203022003174, "Pretrain/Loss (Raw)": 1.7749415636062622, "Pretrain/Step": 9393, "Pretrain/Step Time": 8.660865610465407} +{"Pretrain/Learning Rate": 2.947264553551099e-08, "Pretrain/Loss": 1.9286036491394043, "Pretrain/Loss (Raw)": 1.6225348711013794, "Pretrain/Step": 9394, "Pretrain/Step Time": 8.659166287630796} +{"Pretrain/Learning Rate": 2.9061961581089424e-08, "Pretrain/Loss": 1.9290599822998047, "Pretrain/Loss (Raw)": 1.9654631614685059, "Pretrain/Step": 9395, "Pretrain/Step Time": 8.656839882954955} +{"Pretrain/Learning Rate": 2.8654157392909997e-08, "Pretrain/Loss": 1.9292964935302734, "Pretrain/Loss (Raw)": 2.004385232925415, "Pretrain/Step": 9396, "Pretrain/Step Time": 8.65280925296247} +{"Pretrain/Learning Rate": 2.824923301800175e-08, "Pretrain/Loss": 1.9269185066223145, "Pretrain/Loss (Raw)": 1.828369379043579, "Pretrain/Step": 9397, "Pretrain/Step Time": 8.646615946665406} +{"Pretrain/Learning Rate": 2.7847188503063447e-08, "Pretrain/Loss": 1.926725149154663, "Pretrain/Loss (Raw)": 1.6167997121810913, "Pretrain/Step": 9398, "Pretrain/Step Time": 8.648259254172444} +{"Pretrain/Learning Rate": 2.7448023894457997e-08, "Pretrain/Loss": 1.9251580238342285, "Pretrain/Loss (Raw)": 1.8073481321334839, "Pretrain/Step": 9399, "Pretrain/Step Time": 8.649020250886679} +{"Pretrain/Learning Rate": 2.7051739238223572e-08, "Pretrain/Loss": 1.9246203899383545, "Pretrain/Loss (Raw)": 1.7867697477340698, "Pretrain/Step": 9400, "Pretrain/Step Time": 8.643522961065173} +{"Pretrain/Learning Rate": 2.6658334580056954e-08, "Pretrain/Loss": 1.9232486486434937, "Pretrain/Loss (Raw)": 1.7787290811538696, "Pretrain/Step": 9401, "Pretrain/Step Time": 8.646190764382482} +{"Pretrain/Learning Rate": 2.626780996533018e-08, "Pretrain/Loss": 1.922255039215088, "Pretrain/Loss (Raw)": 2.0615363121032715, "Pretrain/Step": 9402, "Pretrain/Step Time": 8.64466061256826} +{"Pretrain/Learning Rate": 2.588016543907945e-08, "Pretrain/Loss": 1.9248377084732056, "Pretrain/Loss (Raw)": 2.07020902633667, "Pretrain/Step": 9403, "Pretrain/Step Time": 8.649469470605254} +{"Pretrain/Learning Rate": 2.549540104601067e-08, "Pretrain/Loss": 1.9267972707748413, "Pretrain/Loss (Raw)": 2.151228427886963, "Pretrain/Step": 9404, "Pretrain/Step Time": 8.653634747490287} +{"Pretrain/Learning Rate": 2.5113516830493898e-08, "Pretrain/Loss": 1.9278106689453125, "Pretrain/Loss (Raw)": 1.9154707193374634, "Pretrain/Step": 9405, "Pretrain/Step Time": 8.652879614382982} +{"Pretrain/Learning Rate": 2.4734512836574465e-08, "Pretrain/Loss": 1.9261229038238525, "Pretrain/Loss (Raw)": 1.8434245586395264, "Pretrain/Step": 9406, "Pretrain/Step Time": 8.658944442868233} +{"Pretrain/Learning Rate": 2.4358389107956292e-08, "Pretrain/Loss": 1.9246466159820557, "Pretrain/Loss (Raw)": 1.7385740280151367, "Pretrain/Step": 9407, "Pretrain/Step Time": 8.65418898127973} +{"Pretrain/Learning Rate": 2.3985145688018575e-08, "Pretrain/Loss": 1.9252395629882812, "Pretrain/Loss (Raw)": 1.9223322868347168, "Pretrain/Step": 9408, "Pretrain/Step Time": 8.651865284889936} +{"Pretrain/Learning Rate": 2.361478261980743e-08, "Pretrain/Loss": 1.9243783950805664, "Pretrain/Loss (Raw)": 1.9918959140777588, "Pretrain/Step": 9409, "Pretrain/Step Time": 8.65087658725679} +{"Pretrain/Learning Rate": 2.324729994602759e-08, "Pretrain/Loss": 1.9241652488708496, "Pretrain/Loss (Raw)": 2.034757614135742, "Pretrain/Step": 9410, "Pretrain/Step Time": 8.652272157371044} +{"Pretrain/Learning Rate": 2.288269770906737e-08, "Pretrain/Loss": 1.9240360260009766, "Pretrain/Loss (Raw)": 2.0258584022521973, "Pretrain/Step": 9411, "Pretrain/Step Time": 8.656151123344898} +{"Pretrain/Learning Rate": 2.2520975950968137e-08, "Pretrain/Loss": 1.9252926111221313, "Pretrain/Loss (Raw)": 2.1065025329589844, "Pretrain/Step": 9412, "Pretrain/Step Time": 8.655560404062271} +{"Pretrain/Learning Rate": 2.2162134713446524e-08, "Pretrain/Loss": 1.9273717403411865, "Pretrain/Loss (Raw)": 2.2561445236206055, "Pretrain/Step": 9413, "Pretrain/Step Time": 8.65388268046081} +{"Pretrain/Learning Rate": 2.1806174037888872e-08, "Pretrain/Loss": 1.9274382591247559, "Pretrain/Loss (Raw)": 2.012035369873047, "Pretrain/Step": 9414, "Pretrain/Step Time": 8.653534166514874} +{"Pretrain/Learning Rate": 2.1453093965342896e-08, "Pretrain/Loss": 1.9235050678253174, "Pretrain/Loss (Raw)": 1.6974812746047974, "Pretrain/Step": 9415, "Pretrain/Step Time": 8.659985406324267} +{"Pretrain/Learning Rate": 2.110289453653158e-08, "Pretrain/Loss": 1.9245636463165283, "Pretrain/Loss (Raw)": 1.9148595333099365, "Pretrain/Step": 9416, "Pretrain/Step Time": 8.657545506954193} +{"Pretrain/Learning Rate": 2.0755575791836513e-08, "Pretrain/Loss": 1.9250080585479736, "Pretrain/Loss (Raw)": 2.0574843883514404, "Pretrain/Step": 9417, "Pretrain/Step Time": 8.661492047831416} +{"Pretrain/Learning Rate": 2.041113777131731e-08, "Pretrain/Loss": 1.9230928421020508, "Pretrain/Loss (Raw)": 2.0166356563568115, "Pretrain/Step": 9418, "Pretrain/Step Time": 8.666452454403043} +{"Pretrain/Learning Rate": 2.0069580514689435e-08, "Pretrain/Loss": 1.9233070611953735, "Pretrain/Loss (Raw)": 2.0460572242736816, "Pretrain/Step": 9419, "Pretrain/Step Time": 8.669044213369489} +{"Pretrain/Learning Rate": 1.9730904061349143e-08, "Pretrain/Loss": 1.9237512350082397, "Pretrain/Loss (Raw)": 1.96451997756958, "Pretrain/Step": 9420, "Pretrain/Step Time": 8.666626354679465} +{"Pretrain/Learning Rate": 1.939510845035131e-08, "Pretrain/Loss": 1.921576976776123, "Pretrain/Loss (Raw)": 1.868178367614746, "Pretrain/Step": 9421, "Pretrain/Step Time": 8.66694294475019} +{"Pretrain/Learning Rate": 1.9062193720423284e-08, "Pretrain/Loss": 1.9219834804534912, "Pretrain/Loss (Raw)": 2.072295904159546, "Pretrain/Step": 9422, "Pretrain/Step Time": 8.667487129569054} +{"Pretrain/Learning Rate": 1.8732159909956583e-08, "Pretrain/Loss": 1.9206151962280273, "Pretrain/Loss (Raw)": 1.8826645612716675, "Pretrain/Step": 9423, "Pretrain/Step Time": 8.670831732451916} +{"Pretrain/Learning Rate": 1.8405007057012425e-08, "Pretrain/Loss": 1.9226415157318115, "Pretrain/Loss (Raw)": 2.1703433990478516, "Pretrain/Step": 9424, "Pretrain/Step Time": 8.669987577944994} +{"Pretrain/Learning Rate": 1.8080735199318966e-08, "Pretrain/Loss": 1.9188848733901978, "Pretrain/Loss (Raw)": 1.6863467693328857, "Pretrain/Step": 9425, "Pretrain/Step Time": 8.672422099858522} +{"Pretrain/Learning Rate": 1.775934437427684e-08, "Pretrain/Loss": 1.9181021451950073, "Pretrain/Loss (Raw)": 1.9473963975906372, "Pretrain/Step": 9426, "Pretrain/Step Time": 8.672495217993855} +{"Pretrain/Learning Rate": 1.7440834618945302e-08, "Pretrain/Loss": 1.919490098953247, "Pretrain/Loss (Raw)": 1.7282767295837402, "Pretrain/Step": 9427, "Pretrain/Step Time": 8.67117389664054} +{"Pretrain/Learning Rate": 1.7125205970058843e-08, "Pretrain/Loss": 1.9182097911834717, "Pretrain/Loss (Raw)": 1.7310535907745361, "Pretrain/Step": 9428, "Pretrain/Step Time": 8.669817999005318} +{"Pretrain/Learning Rate": 1.681245846401336e-08, "Pretrain/Loss": 1.9176323413848877, "Pretrain/Loss (Raw)": 2.186018466949463, "Pretrain/Step": 9429, "Pretrain/Step Time": 8.67007590457797} +{"Pretrain/Learning Rate": 1.650259213688554e-08, "Pretrain/Loss": 1.914726972579956, "Pretrain/Loss (Raw)": 1.8286166191101074, "Pretrain/Step": 9430, "Pretrain/Step Time": 8.673445725813508} +{"Pretrain/Learning Rate": 1.6195607024399593e-08, "Pretrain/Loss": 1.9172993898391724, "Pretrain/Loss (Raw)": 2.085972547531128, "Pretrain/Step": 9431, "Pretrain/Step Time": 8.672207647934556} +{"Pretrain/Learning Rate": 1.5891503161968857e-08, "Pretrain/Loss": 1.9204920530319214, "Pretrain/Loss (Raw)": 1.5852816104888916, "Pretrain/Step": 9432, "Pretrain/Step Time": 8.673208110034466} +{"Pretrain/Learning Rate": 1.559028058465417e-08, "Pretrain/Loss": 1.921399474143982, "Pretrain/Loss (Raw)": 2.013655662536621, "Pretrain/Step": 9433, "Pretrain/Step Time": 8.672740308567882} +{"Pretrain/Learning Rate": 1.5291939327202742e-08, "Pretrain/Loss": 1.9199128150939941, "Pretrain/Loss (Raw)": 1.7431938648223877, "Pretrain/Step": 9434, "Pretrain/Step Time": 8.673381755128503} +{"Pretrain/Learning Rate": 1.499647942401483e-08, "Pretrain/Loss": 1.91880464553833, "Pretrain/Loss (Raw)": 1.9943194389343262, "Pretrain/Step": 9435, "Pretrain/Step Time": 8.678478067740798} +{"Pretrain/Learning Rate": 1.4703900909165957e-08, "Pretrain/Loss": 1.9149646759033203, "Pretrain/Loss (Raw)": 1.3957042694091797, "Pretrain/Step": 9436, "Pretrain/Step Time": 8.676564807072282} +{"Pretrain/Learning Rate": 1.4414203816398574e-08, "Pretrain/Loss": 1.912785530090332, "Pretrain/Loss (Raw)": 1.885097861289978, "Pretrain/Step": 9437, "Pretrain/Step Time": 8.684092490002513} +{"Pretrain/Learning Rate": 1.4127388179119294e-08, "Pretrain/Loss": 1.9152508974075317, "Pretrain/Loss (Raw)": 2.1729655265808105, "Pretrain/Step": 9438, "Pretrain/Step Time": 8.680206056684256} +{"Pretrain/Learning Rate": 1.3843454030409986e-08, "Pretrain/Loss": 1.9165213108062744, "Pretrain/Loss (Raw)": 2.033858060836792, "Pretrain/Step": 9439, "Pretrain/Step Time": 8.686447061598301} +{"Pretrain/Learning Rate": 1.3562401403008352e-08, "Pretrain/Loss": 1.9152568578720093, "Pretrain/Loss (Raw)": 1.6154426336288452, "Pretrain/Step": 9440, "Pretrain/Step Time": 8.676919348537922} +{"Pretrain/Learning Rate": 1.3284230329332902e-08, "Pretrain/Loss": 1.9156869649887085, "Pretrain/Loss (Raw)": 2.124112367630005, "Pretrain/Step": 9441, "Pretrain/Step Time": 8.676452539861202} +{"Pretrain/Learning Rate": 1.3008940841460759e-08, "Pretrain/Loss": 1.9154300689697266, "Pretrain/Loss (Raw)": 1.9358309507369995, "Pretrain/Step": 9442, "Pretrain/Step Time": 8.67636775225401} +{"Pretrain/Learning Rate": 1.2736532971141523e-08, "Pretrain/Loss": 1.9155263900756836, "Pretrain/Loss (Raw)": 1.9570549726486206, "Pretrain/Step": 9443, "Pretrain/Step Time": 8.673725282773376} +{"Pretrain/Learning Rate": 1.2467006749788956e-08, "Pretrain/Loss": 1.9168479442596436, "Pretrain/Loss (Raw)": 1.8816308975219727, "Pretrain/Step": 9444, "Pretrain/Step Time": 8.67477754689753} +{"Pretrain/Learning Rate": 1.2200362208483751e-08, "Pretrain/Loss": 1.9196962118148804, "Pretrain/Loss (Raw)": 2.2010626792907715, "Pretrain/Step": 9445, "Pretrain/Step Time": 8.671284755691886} +{"Pretrain/Learning Rate": 1.1936599377981861e-08, "Pretrain/Loss": 1.9199647903442383, "Pretrain/Loss (Raw)": 2.1490864753723145, "Pretrain/Step": 9446, "Pretrain/Step Time": 8.677382631227374} +{"Pretrain/Learning Rate": 1.1675718288697845e-08, "Pretrain/Loss": 1.9176353216171265, "Pretrain/Loss (Raw)": 1.7482295036315918, "Pretrain/Step": 9447, "Pretrain/Step Time": 8.673327336087823} +{"Pretrain/Learning Rate": 1.1417718970718749e-08, "Pretrain/Loss": 1.916785717010498, "Pretrain/Loss (Raw)": 2.0099728107452393, "Pretrain/Step": 9448, "Pretrain/Step Time": 8.67310287989676} +{"Pretrain/Learning Rate": 1.1162601453798549e-08, "Pretrain/Loss": 1.918475866317749, "Pretrain/Loss (Raw)": 1.8807498216629028, "Pretrain/Step": 9449, "Pretrain/Step Time": 8.670712811872363} +{"Pretrain/Learning Rate": 1.0910365767358155e-08, "Pretrain/Loss": 1.916490077972412, "Pretrain/Loss (Raw)": 1.9316704273223877, "Pretrain/Step": 9450, "Pretrain/Step Time": 8.671341344714165} +{"Pretrain/Learning Rate": 1.0661011940488186e-08, "Pretrain/Loss": 1.9227559566497803, "Pretrain/Loss (Raw)": 2.106182098388672, "Pretrain/Step": 9451, "Pretrain/Step Time": 8.667076202109456} +{"Pretrain/Learning Rate": 1.0414540001943418e-08, "Pretrain/Loss": 1.9216961860656738, "Pretrain/Loss (Raw)": 1.9916847944259644, "Pretrain/Step": 9452, "Pretrain/Step Time": 8.670404143631458} +{"Pretrain/Learning Rate": 1.017094998014556e-08, "Pretrain/Loss": 1.9221928119659424, "Pretrain/Loss (Raw)": 2.0822131633758545, "Pretrain/Step": 9453, "Pretrain/Step Time": 8.669920045882463} +{"Pretrain/Learning Rate": 9.93024190319436e-09, "Pretrain/Loss": 1.919216513633728, "Pretrain/Loss (Raw)": 1.6981778144836426, "Pretrain/Step": 9454, "Pretrain/Step Time": 8.667416838929057} +{"Pretrain/Learning Rate": 9.692415798842614e-09, "Pretrain/Loss": 1.9218370914459229, "Pretrain/Loss (Raw)": 2.204284429550171, "Pretrain/Step": 9455, "Pretrain/Step Time": 8.66516412422061} +{"Pretrain/Learning Rate": 9.457471694518383e-09, "Pretrain/Loss": 1.9216923713684082, "Pretrain/Loss (Raw)": 1.9273124933242798, "Pretrain/Step": 9456, "Pretrain/Step Time": 8.665708236396313} +{"Pretrain/Learning Rate": 9.225409617319436e-09, "Pretrain/Loss": 1.92244291305542, "Pretrain/Loss (Raw)": 1.8186792135238647, "Pretrain/Step": 9457, "Pretrain/Step Time": 8.663441022858024} +{"Pretrain/Learning Rate": 8.996229594007699e-09, "Pretrain/Loss": 1.922269582748413, "Pretrain/Loss (Raw)": 1.8935374021530151, "Pretrain/Step": 9458, "Pretrain/Step Time": 8.665176512673497} +{"Pretrain/Learning Rate": 8.769931651009255e-09, "Pretrain/Loss": 1.9200667142868042, "Pretrain/Loss (Raw)": 1.9075846672058105, "Pretrain/Step": 9459, "Pretrain/Step Time": 8.654605789110065} +{"Pretrain/Learning Rate": 8.546515814425449e-09, "Pretrain/Loss": 1.9190263748168945, "Pretrain/Loss (Raw)": 1.925750970840454, "Pretrain/Step": 9460, "Pretrain/Step Time": 8.655212434008718} +{"Pretrain/Learning Rate": 8.325982110024554e-09, "Pretrain/Loss": 1.915806531906128, "Pretrain/Loss (Raw)": 1.7242438793182373, "Pretrain/Step": 9461, "Pretrain/Step Time": 8.654764611274004} +{"Pretrain/Learning Rate": 8.108330563233458e-09, "Pretrain/Loss": 1.914840579032898, "Pretrain/Loss (Raw)": 1.7953931093215942, "Pretrain/Step": 9462, "Pretrain/Step Time": 8.658872600644827} +{"Pretrain/Learning Rate": 7.893561199154297e-09, "Pretrain/Loss": 1.9162521362304688, "Pretrain/Loss (Raw)": 2.0129966735839844, "Pretrain/Step": 9463, "Pretrain/Step Time": 8.660575609654188} +{"Pretrain/Learning Rate": 7.681674042558928e-09, "Pretrain/Loss": 1.9180502891540527, "Pretrain/Loss (Raw)": 1.835689902305603, "Pretrain/Step": 9464, "Pretrain/Step Time": 8.663383800536394} +{"Pretrain/Learning Rate": 7.472669117877807e-09, "Pretrain/Loss": 1.918180227279663, "Pretrain/Loss (Raw)": 1.9647451639175415, "Pretrain/Step": 9465, "Pretrain/Step Time": 8.666482225060463} +{"Pretrain/Learning Rate": 7.266546449219424e-09, "Pretrain/Loss": 1.9156618118286133, "Pretrain/Loss (Raw)": 1.8305776119232178, "Pretrain/Step": 9466, "Pretrain/Step Time": 8.665317753329873} +{"Pretrain/Learning Rate": 7.0633060603508825e-09, "Pretrain/Loss": 1.9139107465744019, "Pretrain/Loss (Raw)": 1.864315152168274, "Pretrain/Step": 9467, "Pretrain/Step Time": 8.665983352810144} +{"Pretrain/Learning Rate": 6.862947974711764e-09, "Pretrain/Loss": 1.9173593521118164, "Pretrain/Loss (Raw)": 1.996518611907959, "Pretrain/Step": 9468, "Pretrain/Step Time": 8.661075146868825} +{"Pretrain/Learning Rate": 6.665472215411361e-09, "Pretrain/Loss": 1.9160118103027344, "Pretrain/Loss (Raw)": 1.8950990438461304, "Pretrain/Step": 9469, "Pretrain/Step Time": 8.66485303454101} +{"Pretrain/Learning Rate": 6.470878805220348e-09, "Pretrain/Loss": 1.9182090759277344, "Pretrain/Loss (Raw)": 2.1285550594329834, "Pretrain/Step": 9470, "Pretrain/Step Time": 8.665085539221764} +{"Pretrain/Learning Rate": 6.279167766579108e-09, "Pretrain/Loss": 1.9199355840682983, "Pretrain/Loss (Raw)": 2.1377837657928467, "Pretrain/Step": 9471, "Pretrain/Step Time": 8.661037601530552} +{"Pretrain/Learning Rate": 6.090339121600508e-09, "Pretrain/Loss": 1.9203987121582031, "Pretrain/Loss (Raw)": 1.9823089838027954, "Pretrain/Step": 9472, "Pretrain/Step Time": 8.656727828085423} +{"Pretrain/Learning Rate": 5.904392892058796e-09, "Pretrain/Loss": 1.9223201274871826, "Pretrain/Loss (Raw)": 2.2351746559143066, "Pretrain/Step": 9473, "Pretrain/Step Time": 8.657802326604724} +{"Pretrain/Learning Rate": 5.721329099400707e-09, "Pretrain/Loss": 1.924102544784546, "Pretrain/Loss (Raw)": 2.0923550128936768, "Pretrain/Step": 9474, "Pretrain/Step Time": 8.656385984271765} +{"Pretrain/Learning Rate": 5.54114776473158e-09, "Pretrain/Loss": 1.9256902933120728, "Pretrain/Loss (Raw)": 1.86106538772583, "Pretrain/Step": 9475, "Pretrain/Step Time": 8.651474002748728} +{"Pretrain/Learning Rate": 5.363848908837565e-09, "Pretrain/Loss": 1.9260320663452148, "Pretrain/Loss (Raw)": 1.9774104356765747, "Pretrain/Step": 9476, "Pretrain/Step Time": 8.653192730620503} +{"Pretrain/Learning Rate": 5.1894325521634205e-09, "Pretrain/Loss": 1.9279440641403198, "Pretrain/Loss (Raw)": 1.9551019668579102, "Pretrain/Step": 9477, "Pretrain/Step Time": 8.655399892479181} +{"Pretrain/Learning Rate": 5.01789871482361e-09, "Pretrain/Loss": 1.928792953491211, "Pretrain/Loss (Raw)": 2.0567402839660645, "Pretrain/Step": 9478, "Pretrain/Step Time": 8.656977623701096} +{"Pretrain/Learning Rate": 4.849247416599534e-09, "Pretrain/Loss": 1.926342487335205, "Pretrain/Loss (Raw)": 1.5869313478469849, "Pretrain/Step": 9479, "Pretrain/Step Time": 8.666290145367384} +{"Pretrain/Learning Rate": 4.683478676939523e-09, "Pretrain/Loss": 1.926957130432129, "Pretrain/Loss (Raw)": 2.0305235385894775, "Pretrain/Step": 9480, "Pretrain/Step Time": 8.663345076143742} +{"Pretrain/Learning Rate": 4.520592514964395e-09, "Pretrain/Loss": 1.9271514415740967, "Pretrain/Loss (Raw)": 2.0651068687438965, "Pretrain/Step": 9481, "Pretrain/Step Time": 8.658988805487752} +{"Pretrain/Learning Rate": 4.360588949456345e-09, "Pretrain/Loss": 1.9298629760742188, "Pretrain/Loss (Raw)": 2.2046592235565186, "Pretrain/Step": 9482, "Pretrain/Step Time": 8.66183233819902} +{"Pretrain/Learning Rate": 4.203467998867283e-09, "Pretrain/Loss": 1.930018663406372, "Pretrain/Loss (Raw)": 1.9798245429992676, "Pretrain/Step": 9483, "Pretrain/Step Time": 8.662490265443921} +{"Pretrain/Learning Rate": 4.049229681321598e-09, "Pretrain/Loss": 1.9338384866714478, "Pretrain/Loss (Raw)": 1.9600321054458618, "Pretrain/Step": 9484, "Pretrain/Step Time": 8.660794161260128} +{"Pretrain/Learning Rate": 3.897874014599512e-09, "Pretrain/Loss": 1.9347270727157593, "Pretrain/Loss (Raw)": 2.1607165336608887, "Pretrain/Step": 9485, "Pretrain/Step Time": 8.66355107538402} +{"Pretrain/Learning Rate": 3.749401016162058e-09, "Pretrain/Loss": 1.9348914623260498, "Pretrain/Loss (Raw)": 1.9833300113677979, "Pretrain/Step": 9486, "Pretrain/Step Time": 8.662144863978028} +{"Pretrain/Learning Rate": 3.603810703131649e-09, "Pretrain/Loss": 1.9357218742370605, "Pretrain/Loss (Raw)": 1.8427461385726929, "Pretrain/Step": 9487, "Pretrain/Step Time": 8.661405457183719} +{"Pretrain/Learning Rate": 3.4611030922948595e-09, "Pretrain/Loss": 1.936415672302246, "Pretrain/Loss (Raw)": 1.9727178812026978, "Pretrain/Step": 9488, "Pretrain/Step Time": 8.662237647920847} +{"Pretrain/Learning Rate": 3.3212782001107444e-09, "Pretrain/Loss": 1.936554193496704, "Pretrain/Loss (Raw)": 1.843824863433838, "Pretrain/Step": 9489, "Pretrain/Step Time": 8.660223925486207} +{"Pretrain/Learning Rate": 3.1843360427052937e-09, "Pretrain/Loss": 1.9366135597229004, "Pretrain/Loss (Raw)": 2.0664424896240234, "Pretrain/Step": 9490, "Pretrain/Step Time": 8.664704328402877} +{"Pretrain/Learning Rate": 3.0502766358714297e-09, "Pretrain/Loss": 1.9351918697357178, "Pretrain/Loss (Raw)": 1.7726651430130005, "Pretrain/Step": 9491, "Pretrain/Step Time": 8.659808341413736} +{"Pretrain/Learning Rate": 2.919099995069008e-09, "Pretrain/Loss": 1.9320495128631592, "Pretrain/Loss (Raw)": 1.846146583557129, "Pretrain/Step": 9492, "Pretrain/Step Time": 8.660993378609419} +{"Pretrain/Learning Rate": 2.790806135427593e-09, "Pretrain/Loss": 1.9288545846939087, "Pretrain/Loss (Raw)": 1.495540738105774, "Pretrain/Step": 9493, "Pretrain/Step Time": 8.661411179229617} +{"Pretrain/Learning Rate": 2.665395071740906e-09, "Pretrain/Loss": 1.9273910522460938, "Pretrain/Loss (Raw)": 1.8155298233032227, "Pretrain/Step": 9494, "Pretrain/Step Time": 8.659714149311185} +{"Pretrain/Learning Rate": 2.5428668184696024e-09, "Pretrain/Loss": 1.9301599264144897, "Pretrain/Loss (Raw)": 1.7804566621780396, "Pretrain/Step": 9495, "Pretrain/Step Time": 8.661727957427502} +{"Pretrain/Learning Rate": 2.423221389749597e-09, "Pretrain/Loss": 1.9297101497650146, "Pretrain/Loss (Raw)": 2.0183780193328857, "Pretrain/Step": 9496, "Pretrain/Step Time": 8.665296375751495} +{"Pretrain/Learning Rate": 2.306458799372635e-09, "Pretrain/Loss": 1.9332772493362427, "Pretrain/Loss (Raw)": 2.1487221717834473, "Pretrain/Step": 9497, "Pretrain/Step Time": 8.65983820706606} +{"Pretrain/Learning Rate": 2.192579060811273e-09, "Pretrain/Loss": 1.9302719831466675, "Pretrain/Loss (Raw)": 1.6053693294525146, "Pretrain/Step": 9498, "Pretrain/Step Time": 8.659553388133645} +{"Pretrain/Learning Rate": 2.081582187193898e-09, "Pretrain/Loss": 1.9303321838378906, "Pretrain/Loss (Raw)": 2.11250901222229, "Pretrain/Step": 9499, "Pretrain/Step Time": 8.65866052173078} +{"Pretrain/Learning Rate": 1.9734681913213815e-09, "Pretrain/Loss": 1.9320194721221924, "Pretrain/Loss (Raw)": 2.1052191257476807, "Pretrain/Step": 9500, "Pretrain/Step Time": 8.659347610548139} +{"Pretrain/Learning Rate": 1.868237085664304e-09, "Pretrain/Loss": 1.9323046207427979, "Pretrain/Loss (Raw)": 2.0967397689819336, "Pretrain/Step": 9501, "Pretrain/Step Time": 8.654005974531174} +{"Pretrain/Learning Rate": 1.7658888823574027e-09, "Pretrain/Loss": 1.932084560394287, "Pretrain/Loss (Raw)": 1.8395156860351562, "Pretrain/Step": 9502, "Pretrain/Step Time": 8.657017661258578} +{"Pretrain/Learning Rate": 1.6664235932051243e-09, "Pretrain/Loss": 1.929793119430542, "Pretrain/Loss (Raw)": 1.802843451499939, "Pretrain/Step": 9503, "Pretrain/Step Time": 8.65745928324759} +{"Pretrain/Learning Rate": 1.5698412296760723e-09, "Pretrain/Loss": 1.9300408363342285, "Pretrain/Loss (Raw)": 1.8908843994140625, "Pretrain/Step": 9504, "Pretrain/Step Time": 8.652905900031328} +{"Pretrain/Learning Rate": 1.4761418029085593e-09, "Pretrain/Loss": 1.9305014610290527, "Pretrain/Loss (Raw)": 2.0481951236724854, "Pretrain/Step": 9505, "Pretrain/Step Time": 8.648565825074911} +{"Pretrain/Learning Rate": 1.3853253237078311e-09, "Pretrain/Loss": 1.9318742752075195, "Pretrain/Loss (Raw)": 2.1572587490081787, "Pretrain/Step": 9506, "Pretrain/Step Time": 8.64806029573083} +{"Pretrain/Learning Rate": 1.2973918025516174e-09, "Pretrain/Loss": 1.9295709133148193, "Pretrain/Loss (Raw)": 1.6018702983856201, "Pretrain/Step": 9507, "Pretrain/Step Time": 8.651933355256915} +{"Pretrain/Learning Rate": 1.2123412495762544e-09, "Pretrain/Loss": 1.9300146102905273, "Pretrain/Loss (Raw)": 1.9104523658752441, "Pretrain/Step": 9508, "Pretrain/Step Time": 8.656873445957899} +{"Pretrain/Learning Rate": 1.1301736745905623e-09, "Pretrain/Loss": 1.92905855178833, "Pretrain/Loss (Raw)": 1.8246777057647705, "Pretrain/Step": 9509, "Pretrain/Step Time": 8.660776009783149} +{"Pretrain/Learning Rate": 1.050889087075846e-09, "Pretrain/Loss": 1.929186224937439, "Pretrain/Loss (Raw)": 1.9783623218536377, "Pretrain/Step": 9510, "Pretrain/Step Time": 8.662621485069394} +{"Pretrain/Learning Rate": 9.744874961664652e-10, "Pretrain/Loss": 1.9315886497497559, "Pretrain/Loss (Raw)": 2.0492055416107178, "Pretrain/Step": 9511, "Pretrain/Step Time": 8.665150890126824} +{"Pretrain/Learning Rate": 9.00968910683142e-10, "Pretrain/Loss": 1.9279121160507202, "Pretrain/Loss (Raw)": 1.7082271575927734, "Pretrain/Step": 9512, "Pretrain/Step Time": 8.664559479802847} +{"Pretrain/Learning Rate": 8.303333390968782e-10, "Pretrain/Loss": 1.9293663501739502, "Pretrain/Loss (Raw)": 2.006093740463257, "Pretrain/Step": 9513, "Pretrain/Step Time": 8.666883831843734} +{"Pretrain/Learning Rate": 7.625807895567106e-10, "Pretrain/Loss": 1.928581714630127, "Pretrain/Loss (Raw)": 1.9933465719223022, "Pretrain/Step": 9514, "Pretrain/Step Time": 8.67088676057756} +{"Pretrain/Learning Rate": 6.977112698758337e-10, "Pretrain/Loss": 1.9260118007659912, "Pretrain/Loss (Raw)": 1.8802094459533691, "Pretrain/Step": 9515, "Pretrain/Step Time": 8.668888350948691} +{"Pretrain/Learning Rate": 6.357247875371508e-10, "Pretrain/Loss": 1.9249267578125, "Pretrain/Loss (Raw)": 1.6711386442184448, "Pretrain/Step": 9516, "Pretrain/Step Time": 8.667395481839776} +{"Pretrain/Learning Rate": 5.766213496877226e-10, "Pretrain/Loss": 1.9235562086105347, "Pretrain/Loss (Raw)": 1.8263403177261353, "Pretrain/Step": 9517, "Pretrain/Step Time": 8.675237132236362} +{"Pretrain/Learning Rate": 5.20400963141543e-10, "Pretrain/Loss": 1.925534963607788, "Pretrain/Loss (Raw)": 1.9737865924835205, "Pretrain/Step": 9518, "Pretrain/Step Time": 8.675208060070872} +{"Pretrain/Learning Rate": 4.670636343850899e-10, "Pretrain/Loss": 1.9285473823547363, "Pretrain/Loss (Raw)": 1.9458000659942627, "Pretrain/Step": 9519, "Pretrain/Step Time": 8.673470193520188} +{"Pretrain/Learning Rate": 4.1660936956899874e-10, "Pretrain/Loss": 1.9300808906555176, "Pretrain/Loss (Raw)": 2.088103771209717, "Pretrain/Step": 9520, "Pretrain/Step Time": 8.674163771793246} +{"Pretrain/Learning Rate": 3.6903817451083846e-10, "Pretrain/Loss": 1.9323241710662842, "Pretrain/Loss (Raw)": 2.0620832443237305, "Pretrain/Step": 9521, "Pretrain/Step Time": 8.671726351603866} +{"Pretrain/Learning Rate": 3.2435005469788615e-10, "Pretrain/Loss": 1.9357895851135254, "Pretrain/Loss (Raw)": 2.066091775894165, "Pretrain/Step": 9522, "Pretrain/Step Time": 8.674301406368613} +{"Pretrain/Learning Rate": 2.825450152815767e-10, "Pretrain/Loss": 1.9352614879608154, "Pretrain/Loss (Raw)": 1.8978784084320068, "Pretrain/Step": 9523, "Pretrain/Step Time": 8.670138763263822} +{"Pretrain/Learning Rate": 2.436230610858292e-10, "Pretrain/Loss": 1.9356728792190552, "Pretrain/Loss (Raw)": 2.0570404529571533, "Pretrain/Step": 9524, "Pretrain/Step Time": 8.672268802300096} +{"Pretrain/Learning Rate": 2.075841965987202e-10, "Pretrain/Loss": 1.9341168403625488, "Pretrain/Loss (Raw)": 1.6291974782943726, "Pretrain/Step": 9525, "Pretrain/Step Time": 8.674556389451027} +{"Pretrain/Learning Rate": 1.7442842597525933e-10, "Pretrain/Loss": 1.937131404876709, "Pretrain/Loss (Raw)": 2.002668857574463, "Pretrain/Step": 9526, "Pretrain/Step Time": 8.67533086054027} +{"Pretrain/Learning Rate": 1.4415575304016494e-10, "Pretrain/Loss": 1.9358916282653809, "Pretrain/Loss (Raw)": 1.6486494541168213, "Pretrain/Step": 9527, "Pretrain/Step Time": 8.678495993837714} +{"Pretrain/Learning Rate": 1.1676618128231288e-10, "Pretrain/Loss": 1.9344353675842285, "Pretrain/Loss (Raw)": 1.6003843545913696, "Pretrain/Step": 9528, "Pretrain/Step Time": 8.677532020956278} +{"Pretrain/Learning Rate": 9.225971386583876e-11, "Pretrain/Loss": 1.937182903289795, "Pretrain/Loss (Raw)": 2.1304068565368652, "Pretrain/Step": 9529, "Pretrain/Step Time": 8.676140487194061} +{"Pretrain/Learning Rate": 7.063635361070908e-11, "Pretrain/Loss": 1.9365878105163574, "Pretrain/Loss (Raw)": 1.985351324081421, "Pretrain/Step": 9530, "Pretrain/Step Time": 8.68055696412921} +{"Pretrain/Learning Rate": 5.189610301492564e-11, "Pretrain/Loss": 1.9367854595184326, "Pretrain/Loss (Raw)": 2.0955169200897217, "Pretrain/Step": 9531, "Pretrain/Step Time": 8.674986051395535} +{"Pretrain/Learning Rate": 3.6038964235096675e-11, "Pretrain/Loss": 1.9346436262130737, "Pretrain/Loss (Raw)": 1.877066731452942, "Pretrain/Step": 9532, "Pretrain/Step Time": 8.675460040569305} +{"Pretrain/Learning Rate": 2.3064939105865713e-11, "Pretrain/Loss": 1.9344931840896606, "Pretrain/Loss (Raw)": 1.896211862564087, "Pretrain/Step": 9533, "Pretrain/Step Time": 8.676393447443843} +{"Pretrain/Learning Rate": 1.2974029120482733e-11, "Pretrain/Loss": 1.9347400665283203, "Pretrain/Loss (Raw)": 1.875044584274292, "Pretrain/Step": 9534, "Pretrain/Step Time": 8.67728285305202} +{"Pretrain/Learning Rate": 5.766235441906353e-12, "Pretrain/Loss": 1.9357835054397583, "Pretrain/Loss (Raw)": 1.8721203804016113, "Pretrain/Step": 9535, "Pretrain/Step Time": 8.675424484536052} +{"Pretrain/Learning Rate": 1.4415589028038411e-12, "Pretrain/Loss": 1.9365795850753784, "Pretrain/Loss (Raw)": 2.02423095703125, "Pretrain/Step": 9536, "Pretrain/Step Time": 8.674195971339941} +{"Pretrain/Learning Rate": 0.0, "Pretrain/Loss": 1.9364045858383179, "Pretrain/Loss (Raw)": 1.969498634338379, "Pretrain/Step": 9537, "Pretrain/Step Time": 8.674963986501098} diff --git a/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/run-metrics.jsonl b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/run-metrics.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d08f6491f9013b4c7990cfc9345da9eff04187e1 --- /dev/null +++ b/obelics+phi3-3b-continue-training-dfn-run1+stage-pretrain+x7/run-metrics.jsonl @@ -0,0 +1 @@ +{"hparams": {"dataset": {"align_stage_components": ["download/llava-laion-cc-sbu-558k/chat.json", "download/llava-laion-cc-sbu-558k"], "dataset_id": "obelics", "dataset_resampled": true, "dataset_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/datacomp/datacomp_hq_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/OBELICS/obelics_dfn_single_pkl:/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/data/synthdog-en/synthdog_single_pkl/", "finetune_stage_components": ["/mnt/raid5/weizhi/llava/llava_v1_5_mix665k.json", "/mnt/raid5/weizhi/llava/data"], "max_num_images": 6, "min_num_images": 1, "train_num_samples": 2441407, "type": "obelics", "workers": 4}, "model": {"align_epochs": 1, "align_global_batch_size": 256, "align_learning_rate": 0.001, "align_lr_scheduler_type": "linear-warmup+cosine-decay", "align_max_grad_norm": 1.0, "align_max_steps": null, "align_per_device_batch_size": 16, "align_train_strategy": "fsdp-shard-grad-op", "align_warmup_ratio": 0.03, "align_weight_decay": 0.0, "arch_specifier": "no-align+avgpool", "enable_gradient_checkpointing": true, "enable_mixed_precision_training": true, "finetune_epochs": 1, "finetune_global_batch_size": 128, "finetune_learning_rate": 2e-05, "finetune_lr_scheduler_type": "linear-warmup+cosine-decay", "finetune_max_grad_norm": 1.0, "finetune_max_steps": null, "finetune_per_device_batch_size": 16, "finetune_train_strategy": "fsdp-full-shard", "finetune_warmup_ratio": 0.03, "finetune_weight_decay": 0.1, "image_resize_strategy": "resize-naive", "llm_backbone_id": "phi3-3b", "llm_max_length": 4096, "model_id": "phi3-3b-continue-training-dfn", "pretrain_epochs": 1, "pretrain_global_batch_size": 256, "pretrain_learning_rate": 5e-05, "pretrain_lr_scheduler_type": "linear-warmup+cosine-decay", "pretrain_max_grad_norm": 1.0, "pretrain_max_steps": 9537, "pretrain_per_device_batch_size": 8, "pretrain_train_strategy": "fsdp-full-shard", "pretrain_warmup_ratio": 0.03, "pretrain_weight_decay": 0.01, "reduce_in_full_precision": false, "type": "one-stage+7b", "vision_backbone_id": "siglip-vit-so400m-384px"}, "mount_path": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/models", "pretrained_checkpoint": null, "run_id": "obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7", "run_root_dir": "/fsx-Training/shopqa-training-fsx-prod-us-east-1/home/wzwang/checkpoints", "seed": 7, "stage": "pretrain", "trackers": ["jsonl", "wandb"], "wandb_entity": null, "wandb_project": "mmpretrain"}, "run_id": "obelics+phi3-3b-continue-training-dfn+stage-pretrain+x7"}